Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

PMM-12805 Collstats, indexstats iterate only over collections, not views. #790

Merged
merged 25 commits into from
Feb 9, 2024
Merged
Show file tree
Hide file tree
Changes from 19 commits
Commits
Show all changes
25 commits
Select commit Hold shift + click to select a range
ac586c7
PMM-12805 Func to list collections without views.
JiriCtvrtka Jan 31, 2024
4656b4f
PMM-12805 Filter for real collections.
JiriCtvrtka Jan 31, 2024
1f02217
PMM-12805 Remove print.
JiriCtvrtka Jan 31, 2024
e76cf31
PMM-12805 Remove comment.
JiriCtvrtka Jan 31, 2024
1d88101
Merge branch 'main' into PMM-12805-view-error
JiriCtvrtka Jan 31, 2024
257c3b5
PMM-12805 Format.
JiriCtvrtka Jan 31, 2024
2189b78
PMM-12805 Lint.
JiriCtvrtka Jan 31, 2024
7e90ef4
PMM-12805 Lint.
JiriCtvrtka Jan 31, 2024
107f41f
PMM-12805 Required changes.
JiriCtvrtka Feb 6, 2024
4afd507
PMM-12805 Lint.
JiriCtvrtka Feb 6, 2024
cc39990
PMM-12805 Fix test.
JiriCtvrtka Feb 6, 2024
e52fb67
PMM-12805 Change in logic.
JiriCtvrtka Feb 6, 2024
43ab368
PMM-12805 Better name for func.
JiriCtvrtka Feb 6, 2024
648f754
PMM-12805 Refactor to get collections with/without views.
JiriCtvrtka Feb 6, 2024
b48fdd7
Update exporter/common.go
JiriCtvrtka Feb 6, 2024
dcaa9dd
PMM-12805 Fix tests after refactor.
JiriCtvrtka Feb 6, 2024
6a01aa1
PMM-12805 Fix.
JiriCtvrtka Feb 6, 2024
5c694dd
PMM-12805 Better naming.
JiriCtvrtka Feb 6, 2024
67297ab
PMM-12805 Better naming for converted map.
JiriCtvrtka Feb 6, 2024
cc2a079
Update exporter/common_test.go
JiriCtvrtka Feb 7, 2024
f2cd323
PMM-12805 Small change to check exact error message.
JiriCtvrtka Feb 7, 2024
20242d8
PMM-12805 Fix for empty namaspace.
JiriCtvrtka Feb 8, 2024
5ba2cb9
PMM-12805 Fix for namespaces.
JiriCtvrtka Feb 8, 2024
7d03f95
PMM-12805 Skip not complete namespaces.
JiriCtvrtka Feb 9, 2024
e97c9cb
PMM-12805 Better performance for discovery mode.
JiriCtvrtka Feb 9, 2024
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
26 changes: 11 additions & 15 deletions exporter/collstats_collector.go
Original file line number Diff line number Diff line change
Expand Up @@ -61,20 +61,27 @@ func (d *collstatsCollector) Collect(ch chan<- prometheus.Metric) {
func (d *collstatsCollector) collect(ch chan<- prometheus.Metric) {
defer measureCollectTime(ch, "mongodb", "collstats")()

collections := d.collections

client := d.base.client
logger := d.base.logger

collections, err := checkNamespacesForViews(d.ctx, client, d.collections)
if err != nil {
logger.Errorf("cannot list collections: %s", err.Error())

return
}

if d.discoveringMode {
namespaces, err := listAllCollections(d.ctx, client, d.collections, systemDBs)
onlyCollectionsNamespaces, err := listAllCollections(d.ctx, client, d.collections, systemDBs, true)
if err != nil {
logger.Errorf("cannot auto discover databases and collections: %s", err.Error())

return
}

collections = fromMapToSlice(namespaces)
for collectionNamespace := range onlyCollectionsNamespaces {
collections = append(collections, collectionNamespace)
}
}

for _, dbCollection := range collections {
Expand Down Expand Up @@ -134,15 +141,4 @@ func (d *collstatsCollector) collect(ch chan<- prometheus.Metric) {
}
}

func fromMapToSlice(databases map[string][]string) []string {
var collections []string
for db, cols := range databases {
for _, value := range cols {
collections = append(collections, db+"."+value)
}
}

return collections
}

var _ prometheus.Collector = (*collstatsCollector)(nil)
38 changes: 34 additions & 4 deletions exporter/common.go
Original file line number Diff line number Diff line change
Expand Up @@ -17,6 +17,7 @@ package exporter

import (
"context"
"fmt"
"sort"
"strings"

Expand All @@ -30,7 +31,7 @@ import (

var systemDBs = []string{"admin", "config", "local"} //nolint:gochecknoglobals

func listCollections(ctx context.Context, client *mongo.Client, database string, filterInNamespaces []string) ([]string, error) {
func listCollections(ctx context.Context, client *mongo.Client, database string, filterInNamespaces []string, skipViews bool) ([]string, error) {
filter := bson.D{} // Default=empty -> list all collections

// if there is a filter with the list of collections we want, create a filter like
Expand All @@ -57,6 +58,10 @@ func listCollections(ctx context.Context, client *mongo.Client, database string,
}
}

if skipViews {
filter = append(filter, primitive.E{Key: "type", Value: "collection"})
}

collections, err := client.Database(database).ListCollectionNames(ctx, filter)
if err != nil {
return nil, errors.Wrap(err, "cannot get the list of collections for discovery")
Expand Down Expand Up @@ -153,7 +158,32 @@ func unique(slice []string) []string {
return list
}

func listAllCollections(ctx context.Context, client *mongo.Client, filterInNamespaces []string, excludeDBs []string) (map[string][]string, error) {
func checkNamespacesForViews(ctx context.Context, client *mongo.Client, collections []string) ([]string, error) {
onlyCollectionsNamespaces, err := listAllCollections(ctx, client, nil, nil, true)
if err != nil {
return nil, err
}

namespaces := make(map[string]struct{})
for db, collections := range onlyCollectionsNamespaces {
for _, collection := range collections {
namespaces[fmt.Sprintf("%s.%s", db, collection)] = struct{}{}
}
}

filteredCollections := []string{}
for _, collection := range collections {
if _, ok := namespaces[collection]; !ok {
return nil, errors.Errorf("namespace %s is a view and cannot be used for collstats/indexstats", collection)
}

filteredCollections = append(filteredCollections, collection)
}

return filteredCollections, nil
}

func listAllCollections(ctx context.Context, client *mongo.Client, filterInNamespaces []string, excludeDBs []string, skipViews bool) (map[string][]string, error) {
namespaces := make(map[string][]string)

dbs, err := databases(ctx, client, filterInNamespaces, excludeDBs)
Expand All @@ -177,7 +207,7 @@ func listAllCollections(ctx context.Context, client *mongo.Client, filterInNames
continue
}

colls, err := listCollections(ctx, client, db, []string{namespace})
colls, err := listCollections(ctx, client, db, []string{namespace}, skipViews)
if err != nil {
return nil, errors.Wrapf(err, "cannot list the collections for %q", db)
}
Expand Down Expand Up @@ -209,7 +239,7 @@ func nonSystemCollectionsCount(ctx context.Context, client *mongo.Client, includ
var count int

for _, dbname := range databases {
colls, err := listCollections(ctx, client, dbname, filterInCollections)
colls, err := listCollections(ctx, client, dbname, filterInCollections, true)
if err != nil {
return 0, errors.Wrap(err, "cannot get collections count")
}
Expand Down
49 changes: 43 additions & 6 deletions exporter/common_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -32,6 +32,7 @@ import (
var (
testDBs = []string{"testdb01", "testdb02"}
testColls = []string{"col01", "col02", "colxx", "colyy"}
testViews = []string{"view01", "view02"}
)

func setupDB(ctx context.Context, t *testing.T, client *mongo.Client) {
Expand All @@ -45,6 +46,10 @@ func setupDB(ctx context.Context, t *testing.T, client *mongo.Client) {
}
}
}
for _, view := range testViews {
err := client.Database(testDBs[0]).CreateView(ctx, view, testColls[0], mongo.Pipeline{})
assert.NoError(t, err)
}
}

func cleanupDB(ctx context.Context, client *mongo.Client) {
Expand Down Expand Up @@ -105,7 +110,7 @@ func TestListCollections(t *testing.T) {
t.Run("Filter in databases", func(t *testing.T) {
want := []string{"col01", "col02", "colxx"}
inNameSpaces := []string{testDBs[0] + ".col0", testDBs[0] + ".colx"}
colls, err := listCollections(ctx, client, testDBs[0], inNameSpaces)
colls, err := listCollections(ctx, client, testDBs[0], inNameSpaces, true)
sort.Strings(colls)

assert.NoError(t, err)
Expand All @@ -115,30 +120,40 @@ func TestListCollections(t *testing.T) {
t.Run("With namespaces list", func(t *testing.T) {
// Advanced filtering test
wantNS := map[string][]string{
"testdb01": {"col01", "col02", "colxx", "colyy"},
"testdb01": {"col01", "col02", "colxx", "colyy", "system.views"},
"testdb02": {"col01", "col02"},
}
// List all collections in testdb01 (inDBs[0]) but only col01 and col02 from testdb02.
filterInNameSpaces := []string{testDBs[0], testDBs[1] + ".col01", testDBs[1] + ".col02"}
namespaces, err := listAllCollections(ctx, client, filterInNameSpaces, systemDBs)
namespaces, err := listAllCollections(ctx, client, filterInNameSpaces, systemDBs, true)
assert.NoError(t, err)
assert.Equal(t, wantNS, namespaces)
})

t.Run("Empty namespaces list", func(t *testing.T) {
wantNS := map[string][]string{
"testdb01": {"col01", "col02", "colxx", "colyy"},
"testdb01": {"col01", "col02", "colxx", "colyy", "system.views"},
"testdb02": {"col01", "col02", "colxx", "colyy"},
}
namespaces, err := listAllCollections(ctx, client, nil, systemDBs, true)
assert.NoError(t, err)
assert.Equal(t, wantNS, namespaces)
})

t.Run("Collections with views", func(t *testing.T) {
wantNS := map[string][]string{
"testdb01": {"col01", "col02", "colxx", "colyy", "system.views", "view01", "view02"},
"testdb02": {"col01", "col02", "colxx", "colyy"},
}
namespaces, err := listAllCollections(ctx, client, nil, systemDBs)
namespaces, err := listAllCollections(ctx, client, nil, systemDBs, false)
assert.NoError(t, err)
assert.Equal(t, wantNS, namespaces)
})

t.Run("Count basic", func(t *testing.T) {
count, err := nonSystemCollectionsCount(ctx, client, nil, nil)
assert.NoError(t, err)
assert.Equal(t, 8, count)
assert.Equal(t, 9, count)
})

t.Run("Filtered count", func(t *testing.T) {
Expand Down Expand Up @@ -172,3 +187,25 @@ func TestSplitNamespace(t *testing.T) {
assert.Equal(t, tc.wantCollection, coll)
}
}

//nolint:paralleltest
func TestCheckNamespacesForViews(t *testing.T) {
ctx, cancel := context.WithTimeout(context.Background(), 3*time.Second)
defer cancel()

client := tu.DefaultTestClient(ctx, t)

setupDB(ctx, t, client)
defer cleanupDB(ctx, client)

t.Run("Views in provided collection list (should fail)", func(t *testing.T) {
_, err := checkNamespacesForViews(ctx, client, []string{"testdb01.col01", "testdb01.system.views", "testdb01.view01"})
assert.Error(t, err, "namespace testdb01.view01 is view and annot be used for collstats/indexstats")
JiriCtvrtka marked this conversation as resolved.
Show resolved Hide resolved
})

t.Run("No Views in provided collection list", func(t *testing.T) {
filtered, err := checkNamespacesForViews(ctx, client, []string{"testdb01.col01", "testdb01.system.views"})
assert.NoError(t, err)
assert.Equal(t, []string{"testdb01.col01", "testdb01.system.views"}, filtered)
})
}
19 changes: 13 additions & 6 deletions exporter/indexstats_collector.go
Original file line number Diff line number Diff line change
Expand Up @@ -62,20 +62,27 @@ func (d *indexstatsCollector) Collect(ch chan<- prometheus.Metric) {
func (d *indexstatsCollector) collect(ch chan<- prometheus.Metric) {
defer measureCollectTime(ch, "mongodb", "indexstats")()

collections := d.collections

logger := d.base.logger
client := d.base.client
logger := d.base.logger

collections, err := checkNamespacesForViews(d.ctx, client, d.collections)
if err != nil {
logger.Errorf("cannot list collections: %s", err.Error())

return
}

if d.discoveringMode {
namespaces, err := listAllCollections(d.ctx, client, d.collections, systemDBs)
onlyCollectionsNamespaces, err := listAllCollections(d.ctx, client, d.collections, systemDBs, true)
if err != nil {
logger.Errorf("cannot auto discover databases and collections")
logger.Errorf("cannot auto discover databases and collections: %s", err.Error())

return
}

collections = fromMapToSlice(namespaces)
for collectionNamespace := range onlyCollectionsNamespaces {
collections = append(collections, collectionNamespace)
}
}

for _, dbCollection := range collections {
Expand Down