REP-6634 Add time-series support (#140)

FGasper · web-flow · commit 439fc9db2fa5 · 2025-09-22T15:29:34.000-04:00
This changeset adds basic time-series support.

Because of the verifier’s `_id` dependency, this verifies buckets rather than logical measurements. This in turn requires that the migration copy time-series collections via buckets as well, since a logical replication would not preserve artifacts like bucket `_id`, and possibly not even the grouping of measurements.

Because verification happens at the bucket level, details in mismatch reports are not very useful for time-series: they reference bucket-level fields that the logical API doesn’t expose.

This works with per-shard verification (i.e., it can verify with or without a view). It _does not_ currently support namespace filtering.
diff --git a/README.md b/README.md
@@ -357,8 +357,16 @@ Additionally, because the amount of data sent to migration-verifier doesn’t ac
 
 - If the server’s memory usage rises after generation 0, try reducing `recheckMaxSizeMB`. This will shrink the queries that the verifier sends, which in turn should reduce the server’s memory usage. (The number of actual queries sent will rise, of course.)
 
+## Time-Series Collections
+
+Because the verifier compares documents by `_id`, it cannot compare logical time-series measurements (i.e., the data that users actually insert). Instead it compares the server’s internal time-series “buckets”. Unfortunately, this makes mismatch details essentially useless for time-series collections, since they describe the internal buckets, which users generally don’t see.
+
+It also requires that migrations replicate the raw buckets rather than the logical measurements. This is because a logical migration would cause `_id` mismatches between source & destination buckets. A user application wouldn’t care (since it never sees the buckets’ `_id`s), but verification does.
+
+NB: Given bucket documents’ size, hashed document comparison can be especially useful with time-series.
+
 # Limitations
 
-- The verifier’s iterative process can handle data changes while it is running, until you hit the writesOff endpoint.  However, it cannot handle DDL commands.  If the verifier receives a DDL change stream event, the verification will fail.
+- The verifier’s iterative process can handle data changes while it is running, until you hit the writesOff endpoint.  However, it cannot handle DDL commands.  If the verifier receives a DDL change stream event from the source, the verification will fail permanently.
 
-- The verifier crashes if it tries to compare time-series collections. The error will include a phrase like “Collection has nil UUID (most probably is a view)” and also mention “timeseries”.
+- The verifier cannot verify time-series collections under namespace filtering.
diff --git a/internal/verifier/change_stream.go b/internal/verifier/change_stream.go
@@ -622,7 +622,12 @@ func (csr *ChangeStreamReader) createChangeStream(
 		SetMaxAwaitTime(maxChangeStreamAwaitTime)
 
 	if csr.clusterInfo.VersionArray[0] >= 6 {
-		opts = opts.SetCustomPipeline(bson.M{"showExpandedEvents": true})
+		opts = opts.SetCustomPipeline(
+			bson.M{
+				"showSystemEvents":   true,
+				"showExpandedEvents": true,
+			},
+		)
 	}
 
 	savedResumeToken, err := csr.loadChangeStreamResumeToken(ctx)
diff --git a/internal/verifier/check.go b/internal/verifier/check.go
@@ -202,13 +202,13 @@ func (verifier *Verifier) CheckDriver(ctx context.Context, filter bson.D, testCh
 		err = verifier.verificationDatabase().Drop(ctx)
 		if err != nil {
 			verifier.mux.Unlock()
-			return err
+			return errors.Wrap(err, "dropping metadata")
 		}
 	} else {
 		genOpt, err := verifier.readGeneration(ctx)
 		if err != nil {
 			verifier.mux.Unlock()
-			return err
+			return errors.Wrap(err, "reading generation from metadata")
 		}
 
 		if gen, has := genOpt.Get(); has {
@@ -221,6 +221,8 @@ func (verifier *Verifier) CheckDriver(ctx context.Context, filter bson.D, testCh
 		}
 	}
 
+	verifier.logger.Info().Msg("Starting change streams.")
+
 	// Now that we’ve initialized verifier.generation we can
 	// start the change stream readers.
 	verifier.initializeChangeStreamReaders()
@@ -230,7 +232,7 @@ func (verifier *Verifier) CheckDriver(ctx context.Context, filter bson.D, testCh
 		func(ctx context.Context, _ *retry.FuncInfo) error {
 			err = verifier.AddMetaIndexes(ctx)
 			if err != nil {
-				return err
+				return errors.Wrap(err, "adding metadata indexes")
 			}
 
 			err = verifier.doInMetaTransaction(
@@ -457,7 +459,7 @@ func (verifier *Verifier) CreateInitialTasksIfNeeded(ctx context.Context) error
 	}
 	isPrimary, err := verifier.CreatePrimaryTaskIfNeeded(ctx)
 	if err != nil {
-		return err
+		return errors.Wrap(err, "creating primary task")
 	}
 	if !isPrimary {
 		verifier.logger.Info().Msg("Primary task already existed; skipping setup")
@@ -466,7 +468,7 @@ func (verifier *Verifier) CreateInitialTasksIfNeeded(ctx context.Context) error
 	if verifier.verifyAll {
 		err := verifier.setupAllNamespaceList(ctx)
 		if err != nil {
-			return err
+			return errors.Wrap(err, "creating namespace list")
 		}
 	}
 	for _, src := range verifier.srcNamespaces {
diff --git a/internal/verifier/list_namespaces.go b/internal/verifier/list_namespaces.go
@@ -5,6 +5,7 @@ import (
 
 	"github.com/10gen/migration-verifier/internal/logger"
 	"github.com/10gen/migration-verifier/internal/util"
+	"github.com/10gen/migration-verifier/mmongo"
 	"github.com/10gen/migration-verifier/mslices"
 	"go.mongodb.org/mongo-driver/bson"
 	"go.mongodb.org/mongo-driver/mongo"
@@ -27,8 +28,12 @@ var (
 	ExcludedSystemCollPrefix = "system."
 )
 
-// Lists all the user collections on a cluster.  Unlike mongosync, we don't use the internal $listCatalog, since we need to
-// work on old versions without that command.  This means this does not run with read concern majority.
+// ListAllUserNamespaces lists all the user collections on a cluster,
+// in addition to time-series “system.buckets.*” collections.
+//
+// Unlike mongosync, we don't use the internal $listCatalog, since we need to
+// work on old versions without that command. Thus, this does *NOT* run with
+// majority read concern.
 func ListAllUserNamespaces(
 	ctx context.Context,
 	logger *logger.Logger,
@@ -62,10 +67,17 @@ func ListAllUserNamespaces(
 	for _, dbName := range dbNames {
 		db := client.Database(dbName)
 
-		filter := util.ExcludePrefixesQuery(
-			"name",
-			mslices.Of(ExcludedSystemCollPrefix),
-		)
+		filter := bson.D{
+			{"$or", []bson.D{
+				util.ExcludePrefixesQuery(
+					"name",
+					mslices.Of(ExcludedSystemCollPrefix),
+				),
+				{
+					{"$expr", mmongo.StartsWithAgg("$name", timeseriesBucketsPrefix)},
+				},
+			}},
+		}
 
 		specifications, err := db.ListCollectionSpecifications(ctx, filter, options.ListCollections().SetNameOnly(true))
 		if err != nil {
diff --git a/internal/verifier/migration_verifier.go b/internal/verifier/migration_verifier.go
@@ -822,8 +822,20 @@ func (verifier *Verifier) compareCollectionSpecifications(
 		}
 	}
 
-	// Don't compare view data; they have no data of their own.
-	canCompareData := srcSpec.Type != "view"
+	canCompareData := false
+
+	switch srcSpec.Type {
+	case "collection":
+		canCompareData = true
+	case "view":
+	case "timeseries":
+		if !verifier.verifyAll {
+			return nil, false, fmt.Errorf("cannot verify time-series collection (%#q) under namespace filtering", srcNs)
+		}
+	default:
+		return nil, false, fmt.Errorf("unrecognized collection type (spec: %+v)", srcSpec)
+	}
+
 	// Do not compare data between capped and uncapped collections because the partitioning is different.
 	canCompareData = canCompareData && srcSpec.Options.Lookup("capped").Equal(dstSpec.Options.Lookup("capped"))
 
diff --git a/internal/verifier/timeseries.go b/internal/verifier/timeseries.go
@@ -0,0 +1,3 @@
+package verifier
+
+const timeseriesBucketsPrefix = "system.buckets."
diff --git a/internal/verifier/timeseries_test.go b/internal/verifier/timeseries_test.go

Original file line number	Diff line number	Diff line change
`@@ -202,13 +202,13 @@ func (verifier *Verifier) CheckDriver(ctx context.Context, filter bson.D, testCh`
`202`	`202`	`err = verifier.verificationDatabase().Drop(ctx)`
`203`	`203`	`if err != nil {`
`204`	`204`	`verifier.mux.Unlock()`
`205`		`- return err`
	`205`	`+ return errors.Wrap(err, "dropping metadata")`
`206`	`206`	`}`
`207`	`207`	`} else {`
`208`	`208`	`genOpt, err := verifier.readGeneration(ctx)`
`209`	`209`	`if err != nil {`
`210`	`210`	`verifier.mux.Unlock()`
`211`		`- return err`
	`211`	`+ return errors.Wrap(err, "reading generation from metadata")`
`212`	`212`	`}`
`213`	`213`
`214`	`214`	`if gen, has := genOpt.Get(); has {`
`@@ -221,6 +221,8 @@ func (verifier *Verifier) CheckDriver(ctx context.Context, filter bson.D, testCh`
`221`	`221`	`}`
`222`	`222`	`}`
`223`	`223`
	`224`	`+ verifier.logger.Info().Msg("Starting change streams.")`
	`225`	`+`
`224`	`226`	`// Now that we’ve initialized verifier.generation we can`
`225`	`227`	`// start the change stream readers.`
`226`	`228`	`verifier.initializeChangeStreamReaders()`
`@@ -230,7 +232,7 @@ func (verifier *Verifier) CheckDriver(ctx context.Context, filter bson.D, testCh`
`230`	`232`	`func(ctx context.Context, _ *retry.FuncInfo) error {`
`231`	`233`	`err = verifier.AddMetaIndexes(ctx)`
`232`	`234`	`if err != nil {`
`233`		`- return err`
	`235`	`+ return errors.Wrap(err, "adding metadata indexes")`
`234`	`236`	`}`
`235`	`237`
`236`	`238`	`err = verifier.doInMetaTransaction(`
`@@ -457,7 +459,7 @@ func (verifier *Verifier) CreateInitialTasksIfNeeded(ctx context.Context) error`
`457`	`459`	`}`
`458`	`460`	`isPrimary, err := verifier.CreatePrimaryTaskIfNeeded(ctx)`
`459`	`461`	`if err != nil {`
`460`		`- return err`
	`462`	`+ return errors.Wrap(err, "creating primary task")`
`461`	`463`	`}`
`462`	`464`	`if !isPrimary {`
`463`	`465`	`verifier.logger.Info().Msg("Primary task already existed; skipping setup")`
`@@ -466,7 +468,7 @@ func (verifier *Verifier) CreateInitialTasksIfNeeded(ctx context.Context) error`
`466`	`468`	`if verifier.verifyAll {`
`467`	`469`	`err := verifier.setupAllNamespaceList(ctx)`
`468`	`470`	`if err != nil {`
`469`		`- return err`
	`471`	`+ return errors.Wrap(err, "creating namespace list")`
`470`	`472`	`}`
`471`	`473`	`}`
`472`	`474`	`for _, src := range verifier.srcNamespaces {`
Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,3 @@`
	`1`	`+package verifier`
	`2`	`+`
	`3`	`+const timeseriesBucketsPrefix = "system.buckets."`