-
Notifications
You must be signed in to change notification settings - Fork 170
Redesign applySchemaDeltas to only apply added columns to catalog #3768
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account-related emails.
Already on GitHub? Sign in to your account
base: main
Are you sure you want to change the base?
Changes from all commits
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
| Original file line number | Diff line number | Diff line change |
|---|---|---|
|
|
@@ -6,7 +6,6 @@ | |
| "errors" | ||
| "fmt" | ||
| "log/slog" | ||
| "slices" | ||
| "sync/atomic" | ||
| "time" | ||
|
|
||
|
|
@@ -64,31 +63,57 @@ | |
|
|
||
| func (a *FlowableActivity) applySchemaDeltas( | ||
|
Contributor
There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. Did a quick code search and I see a few other places that are using
Contributor
Author
There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. Good call-out, will take a look |
||
| ctx context.Context, | ||
| config *protos.FlowConnectionConfigsCore, | ||
| options *protos.SyncFlowOptions, | ||
| flowJobName string, | ||
| schemaDeltas []*protos.TableSchemaDelta, | ||
| ) error { | ||
| filteredTableMappings := make([]*protos.TableMapping, 0, len(schemaDeltas)) | ||
| for _, tableMapping := range options.TableMappings { | ||
| if slices.ContainsFunc(schemaDeltas, func(schemaDelta *protos.TableSchemaDelta) bool { | ||
| return schemaDelta.SrcTableName == tableMapping.SourceTableIdentifier && | ||
| schemaDelta.DstTableName == tableMapping.DestinationTableIdentifier | ||
| }) { | ||
| filteredTableMappings = append(filteredTableMappings, tableMapping) | ||
| } | ||
| } | ||
|
|
||
| if len(schemaDeltas) > 0 { | ||
| if err := a.SetupTableSchema(ctx, &protos.SetupTableSchemaBatchInput{ | ||
| PeerName: config.SourceName, | ||
| TableMappings: filteredTableMappings, | ||
| FlowName: config.FlowJobName, | ||
| System: config.System, | ||
| Env: config.Env, | ||
| Version: config.Version, | ||
| }); err != nil { | ||
| return a.Alerter.LogFlowError(ctx, config.FlowJobName, fmt.Errorf("failed to execute schema update at source: %w", err)) | ||
| logger := internal.LoggerFromCtx(ctx) | ||
| destinationNameListInDeltas := make([]string, 0, len(schemaDeltas)) | ||
| for _, tableSchemaDelta := range schemaDeltas { | ||
| destinationNameListInDeltas = append(destinationNameListInDeltas, tableSchemaDelta.DstTableName) | ||
| } | ||
| logger.Info("loading table schemas from catalog for applying schema deltas", | ||
| slog.Int("numDeltas", len(schemaDeltas)), | ||
| slog.String("flowJobName", flowJobName), | ||
| ) | ||
| schemasInCatalog, err := internal.LoadTableSchemasFromCatalog(ctx, a.CatalogPool, flowJobName, destinationNameListInDeltas) | ||
| if err != nil { | ||
| return fmt.Errorf("failed to load table schemas from catalog for applying schema deltas: %w", err) | ||
| } | ||
| for _, tableSchemaDelta := range schemaDeltas { | ||
| columnsInCatalog := schemasInCatalog[tableSchemaDelta.DstTableName].GetColumns() | ||
| addedColumns := tableSchemaDelta.GetAddedColumns() | ||
|
|
||
| // Create a map to track existing column names to avoid duplicates | ||
| existingColumnNames := make(map[string]bool) | ||
| for _, col := range columnsInCatalog { | ||
| existingColumnNames[col.Name] = true | ||
| } | ||
|
|
||
| // Only add columns that don't already exist | ||
| var newColumnsToAdd []*protos.FieldDescription | ||
| for _, addedCol := range addedColumns { | ||
| if !existingColumnNames[addedCol.Name] { | ||
| newColumnsToAdd = append(newColumnsToAdd, addedCol) | ||
| existingColumnNames[addedCol.Name] = true | ||
| } | ||
| } | ||
| updatedColumnsInCatalog := append(columnsInCatalog, newColumnsToAdd...) | ||
| schemasInCatalog[tableSchemaDelta.DstTableName].Columns = updatedColumnsInCatalog | ||
| } | ||
| logger.Info("applying schema deltas to catalog", | ||
| slog.Int("numTables", len(schemasInCatalog)), | ||
| slog.Int("numDeltas", len(schemaDeltas)), | ||
| slog.String("flowJobName", flowJobName), | ||
| ) | ||
| err = internal.UpdateTableSchemasInCatalog( | ||
| ctx, | ||
| a.CatalogPool, | ||
| logger, | ||
| flowJobName, | ||
| schemasInCatalog, | ||
| ) | ||
| if err != nil { | ||
| return fmt.Errorf("failed to update table schemas in catalog: %w", err) | ||
| } | ||
| return nil | ||
| } | ||
|
|
@@ -223,7 +248,7 @@ | |
| return nil, fmt.Errorf("failed to sync schema: %w", err) | ||
| } | ||
|
|
||
| return nil, a.applySchemaDeltas(ctx, config, options, recordBatchSync.SchemaDeltas) | ||
| return nil, a.applySchemaDeltas(ctx, config.FlowJobName, recordBatchSync.SchemaDeltas) | ||
| } | ||
|
|
||
| var res *model.SyncResponse | ||
|
|
@@ -319,7 +344,7 @@ | |
| a.OtelManager.Metrics.CurrentBatchIdGauge.Record(ctx, res.CurrentSyncBatchID) | ||
|
|
||
| syncState.Store(shared.Ptr("updating schema")) | ||
| if err := a.applySchemaDeltas(ctx, config, options, res.TableSchemaDeltas); err != nil { | ||
| if err := a.applySchemaDeltas(ctx, config.FlowJobName, res.TableSchemaDeltas); err != nil { | ||
| return nil, err | ||
| } | ||
|
|
||
|
|
||
Uh oh!
There was an error while loading. Please reload this page.
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
For
MigratePostgresTableOIDs: IIUC, on pause/restart, we also sync what's in the source DB to our catalog. So there may be a chance here too that, if there are schema changes between pause and resume, we would end up syncing the catalog to the latest schema, and ApplySchemaDelta could miss column additions.
I'm wondering what the motivation is here for always syncing the schema to latest on pause/restart, versus just letting CDC do the catch-up via ApplySchemaDelta.
Note this doesn't block your PR, just an observation and maybe a follow-up item.
Uh oh!
There was an error while loading. Please reload this page.
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Actually, this activity doesn't touch Postgres: it moves the OIDs from the
state object to the catalog. The OIDs in state are populated during the initial setup flow and can be extended by the setup flows of table additions, but they are independent of schema changes, so we should be good? P.S.: This migration is what enables table cancellation/addition (added recently); it can be removed after a certain period of time.