12 changes: 12 additions & 0 deletions internal/util/clusterinfo.go
@@ -19,6 +19,18 @@ type ClusterInfo struct {
Topology ClusterTopology
}

// ClusterHasBSONSize indicates whether a cluster with the given
// major & minor version numbers supports the $bsonSize aggregation
// operator. ($bsonSize was introduced in MongoDB 4.4.)
func ClusterHasBSONSize(va [2]int) bool {
major := va[0]

if major == 4 {
return va[1] >= 4
}

return major > 4
}
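
// Illustrative only (not part of this change): how the check resolves for a
// few representative version arrays, given that $bsonSize first shipped in
// server 4.4:
//
//	ClusterHasBSONSize([2]int{3, 6}) // false
//	ClusterHasBSONSize([2]int{4, 2}) // false
//	ClusterHasBSONSize([2]int{4, 4}) // true
//	ClusterHasBSONSize([2]int{5, 0}) // true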

const (
TopologySharded ClusterTopology = "sharded"
TopologyReplset ClusterTopology = "replset"
226 changes: 226 additions & 0 deletions internal/verifier/change_reader.go
@@ -0,0 +1,226 @@
package verifier

import (
"context"
"time"

"github.com/10gen/migration-verifier/history"
"github.com/10gen/migration-verifier/internal/logger"
"github.com/10gen/migration-verifier/internal/util"
"github.com/10gen/migration-verifier/msync"
"github.com/10gen/migration-verifier/option"
"github.com/pkg/errors"
"github.com/rs/zerolog"
"github.com/samber/lo"
"go.mongodb.org/mongo-driver/v2/bson"
"go.mongodb.org/mongo-driver/v2/mongo"
"go.mongodb.org/mongo-driver/v2/mongo/options"
"golang.org/x/sync/errgroup"
)

type ddlEventHandling string

const (
// The faux size we ascribe to delete events, whose payloads don’t
// include the deleted document.
fauxDocSizeForDeleteEvents = 1024

// The number of batches we’ll hold in memory at once.
batchChanBufferSize = 100

onDDLEventAllow ddlEventHandling = "allow"

changeReaderCollectionName = "changeReader"
)

// changeReader is the common interface for source- and destination-cluster
// change event readers.
type changeReader interface {
getWhichCluster() whichCluster
getReadChannel() <-chan changeEventBatch
getError() *util.Eventual[error]
getStartTimestamp() option.Option[bson.Timestamp]
getEventsPerSecond() option.Option[float64]
getLag() option.Option[time.Duration]
getBufferSaturation() float64
setWritesOff(bson.Timestamp)
start(context.Context, *errgroup.Group) error
done() <-chan struct{}
persistResumeToken(context.Context, bson.Raw) error
isRunning() bool
String() string
}
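
// Illustrative sketch (hypothetical, not part of this change): a concrete
// reader would embed ChangeReaderCommon for the shared plumbing and supply
// the cluster-specific behavior itself, e.g.:
//
//	type sourceChangeStreamReader struct {
//	    ChangeReaderCommon
//	}
//
//	func (r *sourceChangeStreamReader) start(ctx context.Context, eg *errgroup.Group) error {
//	    // Open the change stream, then have eg run a goroutine that pumps
//	    // batches into changeEventBatchChan until writesOffTs is set.
//	    ...
//	}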

// ChangeReaderCommon holds the state and behavior shared by changeReader
// implementations.
type ChangeReaderCommon struct {
readerType whichCluster

lastChangeEventTime *bson.Timestamp
logger *logger.Logger
namespaces []string

metaDB *mongo.Database
watcherClient *mongo.Client
clusterInfo util.ClusterInfo

resumeTokenTSExtractor func(bson.Raw) (bson.Timestamp, error)

running bool
changeEventBatchChan chan changeEventBatch
writesOffTs *util.Eventual[bson.Timestamp]
readerError *util.Eventual[error]
doneChan chan struct{}

startAtTs *bson.Timestamp

lag *msync.TypedAtomic[option.Option[time.Duration]]
batchSizeHistory *history.History[int]

onDDLEvent ddlEventHandling
}

func (rc *ChangeReaderCommon) getWhichCluster() whichCluster {
return rc.readerType
}

func (rc *ChangeReaderCommon) getError() *util.Eventual[error] {
return rc.readerError
}

func (rc *ChangeReaderCommon) getStartTimestamp() option.Option[bson.Timestamp] {
return option.FromPointer(rc.startAtTs)
}

func (rc *ChangeReaderCommon) setWritesOff(ts bson.Timestamp) {
rc.writesOffTs.Set(ts)
}

func (rc *ChangeReaderCommon) isRunning() bool {
return rc.running
}

func (rc *ChangeReaderCommon) getReadChannel() <-chan changeEventBatch {
return rc.changeEventBatchChan
}

func (rc *ChangeReaderCommon) done() <-chan struct{} {
return rc.doneChan
}

// getBufferSaturation returns the reader’s internal buffer’s saturation level
// as a fraction. If saturation rises, that means we’re reading events faster
// than we can persist them.
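// For example (illustrative): with batchChanBufferSize = 100, a channel
// currently holding 25 unread batches yields a saturation of 0.25.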
func (rc *ChangeReaderCommon) getBufferSaturation() float64 {
return util.DivideToF64(len(rc.changeEventBatchChan), cap(rc.changeEventBatchChan))
}

// getLag returns the observed change stream lag (i.e., the delta between
// cluster time and the most-recently-seen change event).
func (rc *ChangeReaderCommon) getLag() option.Option[time.Duration] {
return rc.lag.Load()
}

// getEventsPerSecond returns the number of change events per second we’ve been
// seeing “recently”. (See implementation for the actual period over which we
// compile this metric.)
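// Worked example (illustrative): given logs at t=0s (Datum=7), t=10s
// (Datum=50), and t=20s (Datum=40), the span is 20s. The first Datum counts
// events from before t=0s and is excluded, so totalEvents is 50+40=90,
// yielding 90/20 = 4.5 events per second.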
func (rc *ChangeReaderCommon) getEventsPerSecond() option.Option[float64] {
logs := rc.batchSizeHistory.Get()
lastLog, hasLogs := lo.Last(logs)

if hasLogs && lastLog.At != logs[0].At {
span := lastLog.At.Sub(logs[0].At)

// Each log contains a time and a # of events that happened since
// the prior log. Thus, each log’s Datum is a count of events that
// happened before the timestamp. Since we want the # of events that
// happened between the first & last times, we only want events *after*
// the first time. Thus, we skip the first log entry here.
totalEvents := 0
for _, log := range logs[1:] {
totalEvents += log.Datum
}

return option.Some(util.DivideToF64(totalEvents, span.Seconds()))
}

return option.None[float64]()
}

// persistResumeToken upserts the given resume token into the verifier’s
// metadata collection so that a later run can resume from it.
func (rc *ChangeReaderCommon) persistResumeToken(ctx context.Context, token bson.Raw) error {
coll := rc.metaDB.Collection(changeReaderCollectionName)
_, err := coll.ReplaceOne(
ctx,
bson.D{{"_id", rc.resumeTokenDocID()}},
token,
options.Replace().SetUpsert(true),
)

if err == nil {
ts, err := rc.resumeTokenTSExtractor(token)

logEvent := rc.logger.Debug()

if err == nil {
logEvent = addTimestampToLogEvent(ts, logEvent)
} else {
rc.logger.Warn().Err(err).
Msg("failed to extract resume token timestamp")
}

logEvent.Msgf("Persisted %s's resume token.", rc.readerType)

return nil
}

return errors.Wrapf(err, "failed to persist %s resume token (%v)", rc.readerType, token)
}
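
// Illustrative sketch (hypothetical, not part of this change): a reader’s
// event loop might persist the resume token after each handled batch, so a
// restart can pick up from the last persisted point:
//
//	for cs.Next(ctx) {
//	    // ... buffer/handle the event ...
//	    if err := rc.persistResumeToken(ctx, cs.ResumeToken()); err != nil {
//	        return err
//	    }
//	}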

func (rc *ChangeReaderCommon) resumeTokenDocID() string {
switch rc.readerType {
case src:
return "srcResumeToken"
case dst:
return "dstResumeToken"
default:
panic("unknown readerType: " + rc.readerType)
}
}

func (rc *ChangeReaderCommon) getMetadataCollection() *mongo.Collection {
return rc.metaDB.Collection(changeReaderCollectionName)
}

// loadResumeToken fetches the reader’s persisted resume token, or None if
// no token has been persisted.
func (rc *ChangeReaderCommon) loadResumeToken(ctx context.Context) (option.Option[bson.Raw], error) {
coll := rc.getMetadataCollection()

token, err := coll.FindOne(
ctx,
bson.D{{"_id", rc.resumeTokenDocID()}},
).Raw()

if errors.Is(err, mongo.ErrNoDocuments) {
return option.None[bson.Raw](), nil
}

return option.Some(token), err
}
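
// Illustrative sketch (hypothetical, not part of this change): on startup a
// reader could feed a previously-persisted token into its change stream
// options, falling back to a fresh stream when none was saved. (This assumes
// the option package exposes a Get() (T, bool) accessor.)
//
//	opts := options.ChangeStream()
//	tokenOpt, err := rc.loadResumeToken(ctx)
//	if err != nil {
//	    return err
//	}
//	if token, has := tokenOpt.Get(); has {
//	    opts.SetResumeAfter(token)
//	}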

// updateLag recomputes the reader’s lag: the difference between the
// session’s operation (cluster) time and the resume token’s timestamp.
func (rc *ChangeReaderCommon) updateLag(sess *mongo.Session, token bson.Raw) {
tokenTs, err := rc.resumeTokenTSExtractor(token)
if err == nil {
lagSecs := int64(sess.OperationTime().T) - int64(tokenTs.T)
rc.lag.Store(option.Some(time.Second * time.Duration(lagSecs)))
} else {
rc.logger.Warn().
Err(err).
Msgf("Failed to extract timestamp from %s's resume token to compute lag.", rc.readerType)
}
}
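
// Worked example for updateLag (illustrative): an operation time of
// {T: 1700000060} against a token timestamp of {T: 1700000050} stores a lag
// of 10s. Only the seconds component (T) is compared, so the computed lag
// has one-second granularity.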

func (rc *ChangeReaderCommon) logIgnoredDDL(rawEvent bson.Raw) {
rc.logger.Info().
Str("reader", string(rc.readerType)).
Stringer("event", rawEvent).
Msg("Ignoring event with unrecognized type on destination. (It’s assumedly internal to the migration.)")
}

func addTimestampToLogEvent(ts bson.Timestamp, event *zerolog.Event) *zerolog.Event {
return event.
Any("timestamp", ts).
Time("time", time.Unix(int64(ts.T), int64(0)))
}