Commit 9cbe554

fix some bad merging in the batch examples (#227)
1 parent 1b92568 commit 9cbe554

1 file changed

docs/02-use-cases/06-batch-job.md

Lines changed: 28 additions & 27 deletions
@@ -29,7 +29,7 @@ Heartbeating cadence activities are activities who emit their progress at an app
 
 - This is for high-throughput operations where work may able to fit into a single long-running activity, or partitioned across multiple activities which can run for a longer duration.
 - This addresses problems customers may have running workflows which are returning large blocks of data where the data is hitting up against Cadence activity limits
-- This is a good way avoid hitting Cadence workflow history limits Cadence History entries (since this only is a single activity which is long running vs many small short-lived activities).
+- Because heartbeat data is only temporarily recorded, this is a good way avoid hitting Cadence workflow limits on the number of history events: there only is a single activity which is long running vs many small short-lived activities (each of which needs multiple history events).
 
 ### High level concept:
 
@@ -39,16 +39,15 @@ The idea is to create an activity which will handle a lot of records and record
 func (a *ABatchActivity) Execute(ctx context.Context, params Params) error {
 
 	// in this case this is just a struct with a mutex protecting it
-	var state State
-
-	// when starting the activity, check at start time for a previous iteration
-	err := activity.GetHeartbeatDetails(ctx, &state)
-	if err != nil {
-		return err
-	}
-	log.Info("resuming from a previous state", zap.Any("state", state))
-	}
-}
+	var state State
+	if activity.HasHeartbeatDetails(ctx) {
+		// when starting the activity, check at start time for a previous iteration
+		err := activity.GetHeartbeatDetails(ctx, &state)
+		if err != nil {
+			return err
+		}
+		log.Info("resuming from a previous state", zap.Any("state", state))
+	}
 
 	// in the background, every 5 seconds, emit where we're up to
 	// so the cadence server knows the activity is still alive, and
@@ -61,6 +60,7 @@ func (a *ABatchActivity) Execute(ctx context.Context, params Params) error {
 		select {
 		case <-ctx.Done():
 			return
+		case <-ticker.C:
 			reportState := state.Clone()
 			activity.RecordHeartbeat(ctx, reportState)
 		}
@@ -71,14 +71,14 @@ func (a *ABatchActivity) Execute(ctx context.Context, params Params) error {
 	// records which will take a while to get through. Importantly,
 	// if we have to restart, don't start from the beginning, use the
 	// offset so we don't redo work.
-	batchDataToProcess := a.DB.GetDataFromOffset(state.GetOffset())
+	batchDataToProcess := a.DB.GetDataFromOffset(state.GetOffset())
 
 	// go through and process all the records through whatever side-effects are appropriate
 	for i := range batchDataToProcess {
 		a.rpc.UpdateRecord(i)
 		state.Finished(i)
 	}
-	return nil
+	return nil
 }
 ```
 
@@ -88,36 +88,37 @@ And run this activity in a workflow with settings:
 // retry if the activity gets stopped for any reason
 func setActivityOptions(ctx workflow.Context) workflow.Context {
 
-	ctx = workflow.WithActivityOptions(ctx, workflow.ActivityOptions{
-		ScheduleToStartTimeout: time.Minute, // how long we expect this task to sit waiting to be picked up.
+	ctx = workflow.WithActivityOptions(ctx, workflow.ActivityOptions{
+		ScheduleToStartTimeout: time.Minute, // how long we expect this task to sit waiting to be picked up.
 		// Typically subseconds unless heavily contended
-		StartToCloseTimeout: time.Hour, // however long this activity is expected to take, maximum, from end to end.
+		StartToCloseTimeout: time.Hour, // however long this activity is expected to take, maximum, from end to end.
 		// This is workload dependent
-		HeartbeatTimeout: time.Second * 30, // How long we should wait before deciding to restart the activity because the
+		HeartbeatTimeout: time.Second * 30, // How long we should wait before deciding to restart the activity because the
 		// background thread hasn't checked in. Half a a minute is probably a bit
 		// overgenous. In the example above we're picking 5 seconds to heartbeat
-
+
 		// It is unrealistic to assume that a long running activity will succeed
 		// so add a retry-policy to restart it when there's a failure.
 		RetryPolicy: &workflow.RetryPolicy{
-			InitialInterval: time.Second,
-			MaximumInterval: time.Minute * 10,
-		},
-	})
-	return ctx
+			InitialInterval: time.Second,
+			MaximumInterval: time.Minute * 10,
+			MaximumAttempts: 10, // we expect this to have to restart a maximum of 10 times before giving up.
+		},
+	})
+	return ctx
 }
 
 func Workflow(ctx workflow.Context, config entity.Config) error {
 
-	log := workflow.GetLogger(ctx)
-	ctx = setActivityOptions(ctx, config)
+	log := workflow.GetLogger(ctx)
+	ctx = setActivityOptions(ctx, config)
 	err := workflow.ExecuteActivity(ctx, ABatchActivityName, config).Get(ctx, nil)
 	if err != nil {
 		log.Error("failed to execute activity", zap.Error(err), zap.Any("input", config))
 
 	}
 
-	log.Info("Workflow complete")
-	return nil
+	log.Info("Workflow complete")
+	return nil
 }
 ```
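Taken together, the corrected example has three moving parts: resume from any previously recorded heartbeat details, a background ticker that reports progress, and a processing loop that continues from the recovered offset. The sketch below assembles that pattern against the Cadence Go client's `activity` package (`HasHeartbeatDetails`, `GetHeartbeatDetails`, `RecordHeartbeat`); the `Progress` payload, the `records` parameter, the `processRecord` helper and the 5-second cadence are illustrative stand-ins for the doc's `State`, `a.DB.GetDataFromOffset` and `a.rpc.UpdateRecord`, not part of this commit.

```go
package batch

import (
	"context"
	"sync"
	"time"

	"go.uber.org/cadence/activity"
	"go.uber.org/zap"
)

// Progress is the heartbeat payload: how far through the batch we have got.
// (Illustrative stand-in for the doc's mutex-protected State struct.)
type Progress struct {
	Offset int
}

// BatchActivity resumes from recorded heartbeat details, heartbeats every
// 5 seconds in the background, and processes records from the recovered offset.
func BatchActivity(ctx context.Context, records []string) error {
	logger := activity.GetLogger(ctx)

	var (
		mu       sync.Mutex
		progress Progress
	)
	// On a retry, pick up where the previous attempt's last heartbeat left off.
	if activity.HasHeartbeatDetails(ctx) {
		if err := activity.GetHeartbeatDetails(ctx, &progress); err != nil {
			return err
		}
		logger.Info("resuming from a previous state", zap.Int("offset", progress.Offset))
	}
	start := progress.Offset

	// Report progress periodically so the Cadence server knows the activity
	// is alive; the reported offset is what a retry will resume from.
	ticker := time.NewTicker(5 * time.Second)
	defer ticker.Stop()
	go func() {
		for {
			select {
			case <-ctx.Done():
				return
			case <-ticker.C:
				mu.Lock()
				snapshot := progress
				mu.Unlock()
				activity.RecordHeartbeat(ctx, snapshot)
			}
		}
	}()

	// Work through the batch, recording each completed record in the shared state.
	for i := start; i < len(records); i++ {
		processRecord(records[i]) // stand-in for the doc's a.rpc.UpdateRecord(i)
		mu.Lock()
		progress.Offset = i + 1
		mu.Unlock()
	}
	return nil
}

func processRecord(_ string) { /* whatever per-record side effect the batch needs */ }
```

This only pays off when the activity runs with the options shown in the second half of the diff: a heartbeat timeout so a silent activity is restarted, and a retry policy so the retry attempt receives the last recorded heartbeat details and resumes from them.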
