@@ -345,19 +345,15 @@ func (ca *changeAggregator) Start(ctx context.Context) {
345
345
346
346
spans , err := ca .setupSpansAndFrontier ()
347
347
if err != nil {
348
- if log .V (2 ) {
349
- log .Dev .Infof (ca .Ctx (), "change aggregator moving to draining due to error setting up spans and frontier: %v" , err )
350
- }
348
+ log .Dev .Warningf (ca .Ctx (), "moving to draining due to error setting up spans and frontier: %v" , err )
351
349
ca .MoveToDraining (err )
352
350
ca .cancel ()
353
351
return
354
352
}
355
353
356
354
feed , err := makeChangefeedConfigFromJobDetails (ctx , ca .spec .Feed , ca .FlowCtx .Cfg .ExecutorConfig .(* sql.ExecutorConfig ))
357
355
if err != nil {
358
- if log .V (2 ) {
359
- log .Infof (ca .Ctx (), "change aggregator moving to draining due to error making changefeed config: %v" , err )
360
- }
356
+ log .Dev .Warningf (ca .Ctx (), "moving to draining due to error making changefeed config: %v" , err )
361
357
ca .MoveToDraining (err )
362
358
ca .cancel ()
363
359
return
@@ -380,19 +376,15 @@ func (ca *changeAggregator) Start(ctx context.Context) {
380
376
scope , _ := opts .GetMetricScope ()
381
377
ca .sliMetrics , err = ca .metrics .getSLIMetrics (scope )
382
378
if err != nil {
383
- if log .V (2 ) {
384
- log .Dev .Infof (ca .Ctx (), "change aggregator moving to draining due to error getting sli metrics: %v" , err )
385
- }
379
+ log .Dev .Warningf (ca .Ctx (), "moving to draining due to error getting sli metrics: %v" , err )
386
380
ca .MoveToDraining (err )
387
381
ca .cancel ()
388
382
return
389
383
}
390
384
ca .sliMetricsID = ca .sliMetrics .claimId ()
391
385
ca .targets , err = AllTargets (ctx , ca .spec .Feed , ca .FlowCtx .Cfg .ExecutorConfig .(* sql.ExecutorConfig ))
392
386
if err != nil {
393
- if log .V (2 ) {
394
- log .Infof (ca .Ctx (), "change aggregator moving to draining due to error getting targets: %v" , err )
395
- }
387
+ log .Dev .Warningf (ca .Ctx (), "moving to draining due to error getting targets: %v" , err )
396
388
ca .MoveToDraining (err )
397
389
ca .cancel ()
398
390
return
@@ -402,9 +394,7 @@ func (ca *changeAggregator) Start(ctx context.Context) {
402
394
recorder , err = ca .wrapMetricsRecorderWithTelemetry (ctx , recorder , ca .targets )
403
395
404
396
if err != nil {
405
- if log .V (2 ) {
406
- log .Dev .Infof (ca .Ctx (), "change aggregator moving to draining due to error wrapping metrics controller: %v" , err )
407
- }
397
+ log .Dev .Warningf (ca .Ctx (), "moving to draining due to error wrapping metrics controller: %v" , err )
408
398
ca .MoveToDraining (err )
409
399
ca .cancel ()
410
400
}
@@ -413,9 +403,7 @@ func (ca *changeAggregator) Start(ctx context.Context) {
413
403
ca .spec .User (), ca .spec .JobID , recorder , ca .targets )
414
404
if err != nil {
415
405
err = changefeedbase .MarkRetryableError (err )
416
- if log .V (2 ) {
417
- log .Dev .Infof (ca .Ctx (), "change aggregator moving to draining due to error getting sink: %v" , err )
418
- }
406
+ log .Dev .Warningf (ca .Ctx (), "moving to draining due to error getting sink: %v" , err )
419
407
ca .MoveToDraining (err )
420
408
ca .cancel ()
421
409
return
@@ -447,9 +435,7 @@ func (ca *changeAggregator) Start(ctx context.Context) {
447
435
limit := changefeedbase .PerChangefeedMemLimit .Get (& ca .FlowCtx .Cfg .Settings .SV )
448
436
ca .eventProducer , ca .kvFeedDoneCh , ca .errCh , err = ca .startKVFeed (ctx , spans , kvFeedHighWater , needsInitialScan , feed , pool , limit , opts )
449
437
if err != nil {
450
- if log .V (2 ) {
451
- log .Dev .Infof (ca .Ctx (), "change aggregator moving to draining due to error starting kv feed: %v" , err )
452
- }
438
+ log .Dev .Warningf (ca .Ctx (), "moving to draining due to error starting kv feed: %v" , err )
453
439
ca .MoveToDraining (err )
454
440
ca .cancel ()
455
441
return
@@ -459,9 +445,7 @@ func (ca *changeAggregator) Start(ctx context.Context) {
459
445
ctx , ca .FlowCtx .Cfg , ca .spec , feed , ca .frontier , kvFeedHighWater ,
460
446
ca .sink , ca .metrics , ca .sliMetrics , ca .knobs )
461
447
if err != nil {
462
- if log .V (2 ) {
463
- log .Dev .Infof (ca .Ctx (), "change aggregator moving to draining due to error creating event consumer: %v" , err )
464
- }
448
+ log .Dev .Warningf (ca .Ctx (), "moving to draining due to error creating event consumer: %v" , err )
465
449
ca .MoveToDraining (err )
466
450
ca .cancel ()
467
451
return
@@ -661,7 +645,7 @@ func (ca *changeAggregator) setupSpansAndFrontier() (spans []roachpb.Span, err e
661
645
// Checkpointed spans are spans that were above the highwater mark, and we
662
646
// must preserve that information in the frontier for future checkpointing.
663
647
if err := checkpoint .Restore (ca .frontier , ca .spec .SpanLevelCheckpoint ); err != nil {
664
- return nil , err
648
+ return nil , errors . Wrapf ( err , "failed to restore span-level checkpoint" )
665
649
}
666
650
667
651
return spans , nil
@@ -777,9 +761,7 @@ func (ca *changeAggregator) Next() (rowenc.EncDatumRow, *execinfrapb.ProducerMet
777
761
// NB: we do not invoke ca.cancel here -- merely moving
778
762
// to drain state so that the trailing metadata callback
779
763
// has a chance to produce a shutdown checkpoint.
780
- if log .V (2 ) {
781
- log .Dev .Infof (ca .Ctx (), "change aggregator moving to draining due to error while checking for node drain: %v" , err )
782
- }
764
+ log .Dev .Warningf (ca .Ctx (), "moving to draining due to error while checking for node drain: %v" , err )
783
765
ca .MoveToDraining (err )
784
766
break
785
767
}
@@ -810,9 +792,7 @@ func (ca *changeAggregator) Next() (rowenc.EncDatumRow, *execinfrapb.ProducerMet
810
792
}
811
793
// Shut down the poller if it wasn't already.
812
794
ca .cancel ()
813
- if log .V (2 ) {
814
- log .Dev .Infof (ca .Ctx (), "change aggregator moving to draining due to error from tick: %v" , err )
815
- }
795
+ log .Dev .Warningf (ca .Ctx (), "moving to draining due to error from tick: %v" , err )
816
796
ca .MoveToDraining (err )
817
797
break
818
798
}
@@ -1378,9 +1358,7 @@ func (cf *changeFrontier) Start(ctx context.Context) {
1378
1358
scope := cf .spec .Feed .Opts [changefeedbase .OptMetricsScope ]
1379
1359
sli , err := cf .metrics .getSLIMetrics (scope )
1380
1360
if err != nil {
1381
- if log .V (2 ) {
1382
- log .Dev .Infof (cf .Ctx (), "change frontier moving to draining due to error getting sli metrics: %v" , err )
1383
- }
1361
+ log .Dev .Warningf (cf .Ctx (), "moving to draining due to error getting sli metrics: %v" , err )
1384
1362
cf .MoveToDraining (err )
1385
1363
return
1386
1364
}
@@ -1389,9 +1367,7 @@ func (cf *changeFrontier) Start(ctx context.Context) {
1389
1367
cf .spec .User (), cf .spec .JobID , sli , cf .targets )
1390
1368
if err != nil {
1391
1369
err = changefeedbase .MarkRetryableError (err )
1392
- if log .V (2 ) {
1393
- log .Dev .Infof (cf .Ctx (), "change frontier moving to draining due to error getting sink: %v" , err )
1394
- }
1370
+ log .Dev .Warningf (cf .Ctx (), "moving to draining due to error getting sink: %v" , err )
1395
1371
cf .MoveToDraining (err )
1396
1372
return
1397
1373
}
@@ -1404,9 +1380,7 @@ func (cf *changeFrontier) Start(ctx context.Context) {
1404
1380
1405
1381
cf .highWaterAtStart = cf .spec .Feed .StatementTime
1406
1382
if cf .evalCtx .ChangefeedState == nil {
1407
- if log .V (2 ) {
1408
- log .Dev .Infof (cf .Ctx (), "change frontier moving to draining due to missing changefeed state" )
1409
- }
1383
+ log .Dev .Warningf (cf .Ctx (), "moving to draining due to missing changefeed state" )
1410
1384
cf .MoveToDraining (errors .AssertionFailedf ("expected initialized local state" ))
1411
1385
return
1412
1386
}
@@ -1418,9 +1392,7 @@ func (cf *changeFrontier) Start(ctx context.Context) {
1418
1392
if cf .spec .JobID != 0 {
1419
1393
job , err := cf .FlowCtx .Cfg .JobRegistry .LoadClaimedJob (ctx , cf .spec .JobID )
1420
1394
if err != nil {
1421
- if log .V (2 ) {
1422
- log .Dev .Infof (cf .Ctx (), "change frontier moving to draining due to error loading claimed job: %v" , err )
1423
- }
1395
+ log .Dev .Warningf (cf .Ctx (), "moving to draining due to error loading claimed job: %v" , err )
1424
1396
cf .MoveToDraining (err )
1425
1397
return
1426
1398
}
@@ -1472,15 +1444,16 @@ func (cf *changeFrontier) Start(ctx context.Context) {
1472
1444
perTableTracking ,
1473
1445
cf .spec .TrackedSpans ... )
1474
1446
if err != nil {
1475
- log .Dev .Infof (cf .Ctx (), "change frontier moving to draining due to error setting up frontier: %v" , err )
1447
+ log .Dev .Warningf (cf .Ctx (), "moving to draining due to error setting up frontier: %v" , err )
1476
1448
cf .MoveToDraining (err )
1477
1449
return
1478
1450
}
1479
1451
1480
1452
if err := checkpoint .Restore (cf .frontier , cf .spec .SpanLevelCheckpoint ); err != nil {
1481
- if log .V (2 ) {
1482
- log .Dev .Infof (cf .Ctx (), "change frontier encountered error on checkpoint restore: %v" , err )
1483
- }
1453
+ log .Dev .Warningf (cf .Ctx (),
1454
+ "moving to draining due to error restoring span-level checkpoint: %v" , err )
1455
+ cf .MoveToDraining (err )
1456
+ return
1484
1457
}
1485
1458
1486
1459
if cf .knobs .AfterCoordinatorFrontierRestore != nil {
@@ -1637,39 +1610,31 @@ func (cf *changeFrontier) Next() (rowenc.EncDatumRow, *execinfrapb.ProducerMetad
1637
1610
}
1638
1611
}
1639
1612
1640
- if log .V (2 ) {
1641
- log .Dev .Infof (cf .Ctx (),
1642
- "change frontier moving to draining after reaching resolved span boundary (%s): %v" ,
1643
- boundaryType , err )
1644
- }
1613
+ log .Dev .Warningf (cf .Ctx (),
1614
+ "moving to draining after reaching resolved span boundary (%s): %v" ,
1615
+ boundaryType , err )
1645
1616
cf .MoveToDraining (err )
1646
1617
break
1647
1618
}
1648
1619
1649
1620
row , meta := cf .input .Next ()
1650
1621
if meta != nil {
1651
1622
if meta .Err != nil {
1652
- if log .V (2 ) {
1653
- log .Dev .Infof (cf .Ctx (), "change frontier moving to draining after getting error from aggregator: %v" , meta .Err )
1654
- }
1623
+ log .Dev .Warningf (cf .Ctx (), "moving to draining after getting error from aggregator: %v" , meta .Err )
1655
1624
cf .MoveToDraining (nil /* err */ )
1656
1625
}
1657
1626
if meta .Changefeed != nil && meta .Changefeed .DrainInfo != nil {
1658
1627
// Seeing changefeed drain info metadata from the aggregator means
1659
1628
// that the aggregator exited due to node shutdown. Transition to
1660
1629
// draining so that the remaining aggregators will shut down and
1661
1630
// transmit their up-to-date frontier.
1662
- if log .V (2 ) {
1663
- log .Dev .Infof (cf .Ctx (), "change frontier moving to draining due to aggregator shutdown: %s" , meta .Changefeed )
1664
- }
1631
+ log .Dev .Warningf (cf .Ctx (), "moving to draining due to aggregator shutdown: %s" , meta .Changefeed )
1665
1632
cf .MoveToDraining (changefeedbase .ErrNodeDraining )
1666
1633
}
1667
1634
return nil , meta
1668
1635
}
1669
1636
if row == nil {
1670
- if log .V (2 ) {
1671
- log .Dev .Infof (cf .Ctx (), "change frontier moving to draining after getting nil row from aggregator" )
1672
- }
1637
+ log .Dev .Warningf (cf .Ctx (), "moving to draining after getting nil row from aggregator" )
1673
1638
cf .MoveToDraining (nil /* err */ )
1674
1639
break
1675
1640
}
@@ -1684,9 +1649,7 @@ func (cf *changeFrontier) Next() (rowenc.EncDatumRow, *execinfrapb.ProducerMetad
1684
1649
}
1685
1650
1686
1651
if err := cf .noteAggregatorProgress (cf .Ctx (), row [0 ]); err != nil {
1687
- if log .V (2 ) {
1688
- log .Dev .Infof (cf .Ctx (), "change frontier moving to draining after error while processing aggregator progress: %v" , err )
1689
- }
1652
+ log .Dev .Warningf (cf .Ctx (), "moving to draining after error while processing aggregator progress: %v" , err )
1690
1653
cf .MoveToDraining (err )
1691
1654
break
1692
1655
}
0 commit comments