-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathexecutor_pool.go
More file actions
690 lines (600 loc) · 17.4 KB
/
executor_pool.go
File metadata and controls
690 lines (600 loc) · 17.4 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
package taskman
import (
"container/heap"
"context"
"errors"
"fmt"
"sync"
"sync/atomic"
"time"
"github.com/rs/zerolog"
)
// poolExecutor is an implementation of executor that uses a worker pool to execute tasks.
// It owns the scheduling loop (run), the job priority queue, and the channels that feed
// tasks into the worker pool.
type poolExecutor struct {
	log    zerolog.Logger
	ctx    context.Context    // Executor lifetime; cancelled exactly once by Stop
	cancel context.CancelFunc // Cancels ctx
	// Queue
	mu              sync.RWMutex         // Guards jobQueue and pausedJobs
	jobQueue        priorityQueue        // A priority queue to hold the scheduled jobs
	queueUpdateChan chan bool            // Channel to signal that new tasks have entered the queue
	pausedJobs      map[string]pausedJob // Jobs currently paused outside the queue; allocated in Start, nil before
	// Operations
	runDone  chan struct{} // Channel to signal run has stopped
	stopOnce sync.Once     // Ensures Stop is only called once
	// Worker pool
	workerPool     *workerPool
	workerPoolDone chan struct{} // Channel to receive signal that the worker pool has stopped
	errorChan      chan error    // Channel to receive errors from the worker pool; caller-owned if provided
	taskChan       chan Task     // Channel to send tasks to the worker pool
	poolScaler     *poolScaler
	// Options
	channelBufferSize int           // Buffer size for task channels
	minWorkerCount    int           // Minimum number of workers in the pool
	scaleInterval     time.Duration // Interval for automatic scaling of the worker pool
	// Metrics
	jobExecChan chan struct{}    // Channel to signal that a job has been executed
	metrics     *executorMetrics // Metrics for the overall task manager
	maxJobWidth atomic.Int32     // Widest job in the queue in terms of number of tasks
}
// pausedJob captures a job removed from the queue by Pause, together with the
// delay that remained until its next execution at the moment it was paused.
// Resume uses `remaining` to recompute the job's NextExec.
type pausedJob struct {
	job       *Job          // The paused job, removed from jobQueue
	remaining time.Duration // Time left until the job's NextExec when paused (clamped to >= 0)
}
// periodicWorkerScaling scales the worker pool at regular intervals, based on the state of the
// job queue. The worker pool is already scaled every time a job is added or removed, but this
// function provides a way to scale the worker pool over time.
func (e *poolExecutor) periodicWorkerScaling() {
	ticker := time.NewTicker(e.scaleInterval)
	defer ticker.Stop()
	for {
		select {
		case <-e.ctx.Done():
			// Executor is shutting down; stop periodic scaling.
			return
		case <-ticker.C:
			// Re-evaluate pool size with no immediate worker demand.
			e.scaleWorkerPool(0)
		}
	}
}
// run runs the main loop of the pool executor.
//
// Each iteration snapshots the head of the job priority queue under lock, then:
//   - empty queue: blocks until a queue update or shutdown;
//   - head job due: dispatches its tasks to the worker pool without holding the
//     lock, then reschedules the job or retires it when its run limit is reached;
//   - head job not yet due: waits on a reusable timer, preemptible by queue
//     updates and shutdown.
//
// Closes runDone on exit so Stop can wait for the loop to finish.
//
// revive:disable:function-length valid exception
// revive:disable:cognitive-complexity valid exception
// revive:disable:cyclomatic valid exception
func (e *poolExecutor) run() {
	defer close(e.runDone)
	// Reusable timer to avoid goroutine churn from time.After
	var (
		timer *time.Timer
		fires <-chan time.Time
	)
	// stopTimer stops the timer, draining it if it already fired, and clears
	// `fires` so a stale expiry cannot be selected later.
	stopTimer := func() {
		if timer != nil {
			if !timer.Stop() {
				// Drain if already fired
				select {
				case <-timer.C:
				default:
				}
			}
		}
		fires = nil
	}
	for {
		// Check for context cancellation
		select {
		case <-e.ctx.Done():
			return
		default:
			// Do nothing if the executor is running
		}
		// Snapshot only what's needed under lock
		e.mu.Lock()
		queueLen := e.jobQueue.Len()
		var (
			jobID    string
			tasks    []Task
			nextExec time.Time
			cadence  time.Duration
			index    int
		)
		if queueLen > 0 {
			next := e.jobQueue[0]
			jobID = next.ID
			tasks = next.Tasks
			nextExec = next.NextExec
			cadence = next.Cadence
			index = next.index
		}
		e.mu.Unlock()
		if queueLen == 0 {
			// No jobs: wait for new job or stop
			stopTimer()
			select {
			case <-e.queueUpdateChan:
				continue
			case <-e.ctx.Done():
				return
			}
		}
		now := time.Now()
		delay := nextExec.Sub(now)
		if delay <= 0 {
			// Dispatch without holding lock
			e.log.Trace().Msgf("Dispatching job %s", jobID)
			for _, task := range tasks {
				select {
				case <-e.ctx.Done():
					return
				case e.taskChan <- task:
				}
			}
			// Signal that a job has been executed
			// Note: we actually don't know the execution status here but can assume that by
			// dispatching the tasks, the job has been executed
			// NOTE(review): this send blocks once the jobExecChan buffer fills if the
			// metrics consumer falls behind — confirm consumeJobExecChan outlives run.
			e.jobExecChan <- struct{}{}
			// Reschedule the job under lock or retire it if run limit reached
			jobRemoved := false
			e.mu.Lock()
			jobRemoved = e.rescheduleOrRemoveAtLocked(index, jobID, nextExec, cadence, now)
			e.mu.Unlock()
			if jobRemoved {
				// A job left the queue; the pool may now be oversized.
				e.scaleWorkerPool(0)
			}
			continue
		}
		// Wait until due, but reuse timer so we can preempt on new jobs/stop
		if timer == nil {
			timer = time.NewTimer(delay)
			fires = timer.C
		} else {
			if !timer.Stop() {
				select {
				case <-timer.C:
				default:
				}
			}
			timer.Reset(delay)
			fires = timer.C
		}
		select {
		case <-fires:
			// Time to execute next job
			continue
		case <-e.queueUpdateChan:
			// New job added; re-evaluate queue head
			continue
		case <-e.ctx.Done():
			return
		}
	}
}
// revive:enable:function-length
// revive:enable:cognitive-complexity
// revive:enable:cyclomatic
// scaleWorkerPool scales the worker pool based on the current pool state and configuration.
// workersNeededNow expresses immediate demand (e.g. tasks of a job just added); pass 0
// when no instant demand is known.
func (e *poolExecutor) scaleWorkerPool(workersNeededNow int) {
	e.poolScaler.scale(time.Now(), workersNeededNow)
}
// rescheduleOrRemoveAtLocked handles rescheduling a job entry at the given index or removing
// it if its run limit has been reached. It assumes `e.mu` is already held.
//
// The index/ID pair guards against the queue having shifted since the caller's
// snapshot: the entry is touched only if the job at `index` still carries `jobID`.
// Returns true if the job was removed from the queue, false otherwise (including
// when the guard does not match).
func (e *poolExecutor) rescheduleOrRemoveAtLocked(
	index int,
	jobID string,
	nextExec time.Time,
	cadence time.Duration,
	now time.Time,
) bool {
	if index < len(e.jobQueue) && e.jobQueue[index].ID == jobID {
		entry := e.jobQueue[index]
		if entry.consumeRun() {
			// Run limit reached: retire the job entirely.
			removed := heap.Remove(&e.jobQueue, index)
			if removedJob, ok := removed.(*Job); ok {
				e.finalizeJobRemovalLocked(removedJob)
			}
			return true
		}
		// advance nextExec by whole cadences so that it's after now
		n := nextExec
		if cadence > 0 {
			if !n.After(now) {
				// Skip missed executions rather than replaying them back-to-back.
				steps := 1 + int(now.Sub(n)/cadence)
				n = n.Add(time.Duration(steps) * cadence)
			}
		} else {
			// cadence should be > 0 per validation; fallback to single step
			// NOTE(review): with cadence <= 0 this does not advance n past now, which
			// would leave the job immediately due again — confirm job validation truly
			// excludes non-positive cadences.
			n = n.Add(cadence)
		}
		e.jobQueue[index].NextExec = n
		heap.Fix(&e.jobQueue, index)
	}
	return false
}
// Job returns a copy of the job with the given ID, whether the job is currently
// queued or paused. For a paused job, NextExec is projected forward from now by
// the remaining delay captured at pause time.
func (e *poolExecutor) Job(jobID string) (Job, error) {
	e.mu.RLock()
	defer e.mu.RUnlock()
	if idx, err := e.jobQueue.JobInQueue(jobID); err == nil {
		return *e.jobQueue[idx], nil
	}
	// Not in the queue; it may be paused.
	paused, ok := e.pausedJobs[jobID]
	if !ok {
		return Job{}, fmt.Errorf("job with ID %s not found", jobID)
	}
	snapshot := *paused.job
	snapshot.NextExec = time.Now().Add(paused.remaining)
	return snapshot, nil
}
// Metrics returns the metrics for the executor, combining a snapshot of the
// job/task counters with live worker-pool gauges.
func (e *poolExecutor) Metrics() TaskManagerMetrics {
	snap := e.metrics.snapshot()
	// Read the pool gauges directly from their atomics.
	pool := &PoolMetrics{
		WidestJobWidth:      int(e.maxJobWidth.Load()),
		WorkerCountTarget:   int(e.workerPool.workerCountTarget.Load()),
		WorkerScalingEvents: int(e.workerPool.workerScalingEvents.Load()),
		WorkerUtilization:   float32(e.workerPool.utilization()),
		WorkersActive:       int(e.workerPool.workersActive.Load()),
		WorkersRunning:      int(e.workerPool.workersRunning.Load()),
	}
	return TaskManagerMetrics{
		ManagedJobs:          int(snap.JobsManaged),
		JobsPerSecond:        snap.JobsPerSecond,
		JobsTotalExecutions:  int(snap.JobsTotalExecutions),
		ManagedTasks:         int(snap.TasksManaged),
		TasksPerSecond:       snap.TasksPerSecond,
		TasksAverageExecTime: snap.TasksAverageExecTime,
		TasksTotalExecutions: int(snap.TasksTotalExecutions),
		PoolMetrics:          pool,
	}
}
// Remove removes a job from the queue, or from the paused set if it is not
// queued. Metrics and pool sizing are updated accordingly.
func (e *poolExecutor) Remove(jobID string) error {
	e.mu.Lock()
	defer e.mu.Unlock()

	jobIndex, err := e.jobQueue.JobInQueue(jobID)
	if err != nil {
		// Not queued; the job may be paused instead.
		paused, ok := e.pausedJobs[jobID]
		if !ok {
			return fmt.Errorf("job with ID %s not found", jobID)
		}
		delete(e.pausedJobs, jobID)
		e.metrics.updateMetrics(-1, -len(paused.job.Tasks), paused.job.Cadence)
		e.scaleWorkerPool(0)
		return nil
	}

	// Remove the queued job and finalize bookkeeping.
	removed := heap.Remove(&e.jobQueue, jobIndex)
	if removed == nil {
		return fmt.Errorf("job with ID %s not found", jobID)
	}
	if job, ok := removed.(*Job); ok {
		e.finalizeJobRemovalLocked(job)
	}
	// A job left the queue; the pool may now be oversized.
	e.scaleWorkerPool(0)
	return nil
}
// Pause removes the job from the execution queue while preserving its remaining delay.
//
// The job is moved into pausedJobs keyed by its ID; Resume later restores it
// using the captured delay. Returns ErrExecutorContextDone if the executor has
// been stopped, and an error if the executor was never started, the job is
// already paused, or the job is not in the queue.
func (e *poolExecutor) Pause(jobID string) error {
	select {
	case <-e.ctx.Done():
		return ErrExecutorContextDone
	default:
	}
	e.mu.Lock()
	// pausedJobs is only allocated in Start; nil means Start never ran.
	if e.pausedJobs == nil {
		e.mu.Unlock()
		return errors.New("executor not started")
	}
	if _, exists := e.pausedJobs[jobID]; exists {
		e.mu.Unlock()
		return fmt.Errorf("job %s already paused", jobID)
	}
	jobIndex, err := e.jobQueue.JobInQueue(jobID)
	if err != nil {
		e.mu.Unlock()
		return fmt.Errorf("pause job %q: %w", jobID, err)
	}
	job := e.jobQueue[jobIndex]
	now := time.Now()
	// Capture the time left until the next execution; clamp to zero if overdue.
	remaining := max(job.NextExec.Sub(now), 0)
	removed := heap.Remove(&e.jobQueue, jobIndex)
	pausedPtr, ok := removed.(*Job)
	if !ok || pausedPtr == nil {
		e.mu.Unlock()
		return fmt.Errorf("pause job %q: failed to remove job from queue", jobID)
	}
	e.pausedJobs[jobID] = pausedJob{
		job:       pausedPtr,
		remaining: remaining,
	}
	// If the paused job was (one of) the widest, recompute the widest width
	// across the jobs still queued.
	if len(pausedPtr.Tasks) == int(e.maxJobWidth.Load()) {
		widest := 0
		for _, j := range e.jobQueue {
			if l := len(j.Tasks); l > widest {
				widest = l
			}
		}
		e.maxJobWidth.Store(int32(widest))
	}
	e.mu.Unlock()
	// Scaling and run-loop signaling happen outside the lock.
	e.scaleWorkerPool(0)
	e.notifyQueueUpdate()
	return nil
}
// Resume requeues a previously paused job using the remaining delay captured when it was paused.
// Returns ErrExecutorContextDone if the executor has been stopped, and an error if the
// executor was never started or the job is not currently paused.
func (e *poolExecutor) Resume(jobID string) error {
	select {
	case <-e.ctx.Done():
		return ErrExecutorContextDone
	default:
	}
	e.mu.Lock()
	if e.pausedJobs == nil {
		e.mu.Unlock()
		return errors.New("executor not started")
	}
	entry, found := e.pausedJobs[jobID]
	if !found {
		e.mu.Unlock()
		return fmt.Errorf("job %s is not paused", jobID)
	}
	delete(e.pausedJobs, jobID)
	// Clamp negative remainders so the job becomes due immediately, not in the past.
	remaining := entry.remaining
	if remaining < 0 {
		remaining = 0
	}
	entry.job.NextExec = time.Now().Add(remaining)
	width := len(entry.job.Tasks)
	heap.Push(&e.jobQueue, entry.job)
	if int32(width) > e.maxJobWidth.Load() {
		e.maxJobWidth.Store(int32(width))
	}
	e.mu.Unlock()
	// Scaling and run-loop signaling happen outside the lock.
	e.scaleWorkerPool(width)
	e.notifyQueueUpdate()
	return nil
}
// notifyQueueUpdate signals the run loop that the queue contents changed so it can
// re-evaluate the queue head. The signal is best-effort and never blocks: if no
// one is listening, the update is dropped.
func (e *poolExecutor) notifyQueueUpdate() {
	if e.queueUpdateChan == nil {
		return
	}
	// Skip signaling entirely once shutdown has begun.
	select {
	case <-e.ctx.Done():
		return
	default:
	}
	// NOTE(review): Stop closes queueUpdateChan after cancelling ctx; a send racing
	// that close could panic — confirm callers cannot overlap with Stop.
	select {
	case e.queueUpdateChan <- true:
	default:
		// No listener ready; the run loop will see the change on its next pass.
	}
}
// finalizeJobRemovalLocked finalizes the removal of a job from the queue:
// it refreshes the widest-job gauge if needed and decrements the managed
// job/task metrics. Assumes the executor lock is already held when called.
func (e *poolExecutor) finalizeJobRemovalLocked(job *Job) {
	if job == nil {
		return
	}
	// If the removed job was (one of) the widest, recompute the widest width
	// across the remaining queue.
	if int32(len(job.Tasks)) == e.maxJobWidth.Load() {
		var widest int
		for _, queued := range e.jobQueue {
			if width := len(queued.Tasks); width > widest {
				widest = width
			}
		}
		e.maxJobWidth.Store(int32(widest))
	}
	e.metrics.updateMetrics(-1, -len(job.Tasks), job.Cadence)
}
// Replace replaces a job in the queue.
//
// The new job inherits the old entry's NextExec, heap index, and execution
// limit, so the replacement does not disturb the schedule. Returns an error if
// the job is invalid or not currently in the queue (a paused job cannot be
// replaced through this method).
func (e *poolExecutor) Replace(job Job) error {
	if err := job.Validate(); err != nil {
		return fmt.Errorf("invalid job: %w", err)
	}
	e.mu.Lock()
	defer e.mu.Unlock()
	// Get the job's index in the queue
	jobIndex, err := e.jobQueue.JobInQueue(job.ID)
	if err != nil {
		return fmt.Errorf("replace job %q: %w", job.ID, err)
	}
	// Replace the job in the queue, preserving scheduling fields
	oldJob := e.jobQueue[jobIndex]
	job.NextExec = oldJob.NextExec
	job.index = oldJob.index
	job.inheritExecLimit(oldJob)
	e.jobQueue[jobIndex] = &job
	// Preserve heap invariants if ordering-related fields ever change
	heap.Fix(&e.jobQueue, job.index)
	// Executor metrics updates
	oldTasks := len(oldJob.Tasks)
	newTasks := len(job.Tasks)
	deltaTasks := newTasks - oldTasks
	if deltaTasks != 0 {
		// Jobs managed unchanged (replace), but tasks managed changes by delta
		// NOTE(review): when both the task count and cadence change, only this
		// delta path runs — confirm updateMetrics also accounts for the cadence
		// change of the pre-existing tasks.
		e.metrics.updateMetrics(0, deltaTasks, job.Cadence)
	} else if oldJob.Cadence != job.Cadence {
		e.metrics.updateCadence(newTasks, oldJob.Cadence, job.Cadence)
	}
	// Widest-job updates
	currentMax := int(e.maxJobWidth.Load())
	if newTasks > currentMax {
		e.maxJobWidth.Store(int32(newTasks))
	} else if oldTasks == currentMax && newTasks < currentMax {
		// The widest job got narrower; recompute widest across queue
		widest := 0
		for _, j := range e.jobQueue {
			if l := len(j.Tasks); l > widest {
				widest = l
			}
		}
		e.maxJobWidth.Store(int32(widest))
	}
	return nil
}
// Schedule schedules a job for execution.
//
// The job is validated, checked for ID collisions against both the queue and
// the paused set, given a default NextExec if unset, and pushed onto the
// priority queue. Metrics and pool sizing are updated, and the run loop is
// signaled (best-effort) to re-evaluate the queue head. Returns
// ErrExecutorContextDone if the executor has been stopped.
func (e *poolExecutor) Schedule(job Job) error {
	if err := job.Validate(); err != nil {
		return fmt.Errorf("invalid job: %w", err)
	}
	job.initializeExecLimit()
	e.mu.Lock()
	defer e.mu.Unlock()
	// Validate job ID duplicity and job requirements
	if _, ok := e.jobQueue.JobInQueue(job.ID); ok == nil {
		return errors.New("invalid job: duplicate job ID")
	}
	if e.pausedJobs != nil {
		if _, exists := e.pausedJobs[job.ID]; exists {
			return errors.New("invalid job: duplicate job ID")
		}
	}
	// Check executor context state
	select {
	case <-e.ctx.Done():
		// If the executor is stopped, do not continue adding the job
		return ErrExecutorContextDone
	default:
		// Pass through if the executor is running
	}
	e.log.Debug().Msgf(
		"Scheduling job with %d tasks with ID '%s' and cadence %v",
		len(job.Tasks), job.ID, job.Cadence,
	)
	// Default NextExec to one cadence from now when the caller did not set it
	if job.NextExec.IsZero() {
		job.NextExec = time.Now().Add(job.Cadence)
	}
	// Update task metrics
	taskCount := len(job.Tasks)
	if taskCount > int(e.maxJobWidth.Load()) {
		e.maxJobWidth.Store(int32(taskCount))
	}
	e.metrics.updateMetrics(1, taskCount, job.Cadence)
	// Scale worker pool if needed
	e.scaleWorkerPool(taskCount)
	// Push the job to the queue
	heap.Push(&e.jobQueue, &job)
	// Signal the executor to check for new tasks
	select {
	case <-e.ctx.Done():
		// Do nothing if the executor is stopped
		return ErrExecutorContextDone
	default:
		select {
		case e.queueUpdateChan <- true:
			e.log.Trace().Msg("Signaled new job added")
		default:
			// Do nothing if no one is listening
		}
	}
	return nil
}
// Start starts the executor by setting up the job queue, channels, and worker pool,
// then launching the metrics consumers, the run loop, and the periodic scaler as
// goroutines. Start must be called before Pause/Resume (they require pausedJobs
// to be allocated).
func (e *poolExecutor) Start() {
	// Metrics: reuse provided metrics but validate context
	if e.metrics == nil {
		e.metrics = newExecutorMetrics()
	} else if e.metrics.ctx == nil {
		// Provided metrics lacked a context; give it one so it can be cancelled in Stop.
		ctx, cancel := context.WithCancel(context.Background())
		e.metrics.ctx = ctx
		e.metrics.cancel = cancel
	}
	// Job queue
	e.jobQueue = make(priorityQueue, 0)
	heap.Init(&e.jobQueue)
	e.pausedJobs = make(map[string]pausedJob)
	// Channels (ownership):
	// - executor owns: taskChan, queueUpdateChan
	// - workerPool owns: taskExecChan, workerPoolDone signaling
	// - caller owns: errorChan
	e.taskChan = make(chan Task, e.channelBufferSize)
	if e.errorChan == nil {
		// Create internal error channel if caller didn't provide one
		e.errorChan = make(chan error, e.channelBufferSize)
	}
	e.workerPoolDone = make(chan struct{})
	e.runDone = make(chan struct{})
	e.queueUpdateChan = make(chan bool, 2)
	e.jobExecChan = make(chan struct{}, e.channelBufferSize)
	// Worker pool
	taskExecChan := make(chan time.Duration, e.channelBufferSize)
	e.workerPool = newWorkerPool(
		e.log, // Pass on logger instance
		e.errorChan,
		taskExecChan,
		e.taskChan,
		e.workerPoolDone,
		workerPoolCfg{
			initialWorkers:       e.minWorkerCount,
			maxWorkers:           e.poolScaler.cfg.MaxWorkers,
			utilizationThreshold: e.poolScaler.cfg.TargetUtilization,
			downScaleMinInterval: e.poolScaler.cfg.CooldownDown,
		},
	)
	// Wire the scaler to the pool it controls (the scaler is created before the pool).
	e.poolScaler.workerPool = e.workerPool
	go e.metrics.consumeTaskExecChan(taskExecChan)
	go e.metrics.consumeJobExecChan(e.jobExecChan)
	go e.run()
	go e.periodicWorkerScaling()
}
// Stop signals the executor to stop processing tasks and exit. The executor will block until the
// run loop has exited, and the worker pool has stopped. Safe to call multiple times;
// only the first call performs the shutdown sequence.
func (e *poolExecutor) Stop() {
	e.stopOnce.Do(func() {
		// Stop sequence and channel ownership:
		// - executor owns queueUpdateChan and taskChan
		// - workerPool owns taskExecChan and workerPoolDone
		// - caller owns errorChan (never closed here)
		// 1) Signal cancellation to all components
		e.cancel()
		// 2) Close queueUpdateChan to unblock run loop when queue is empty
		close(e.queueUpdateChan)
		// 3) Wait for run loop to exit cleanly
		<-e.runDone
		// 4) Stop the worker pool and wait for it to finish
		e.workerPool.stop()
		<-e.workerPoolDone
		// 5) Stop metrics
		e.metrics.cancel()
		// 6) Close taskChan after workers have exited to avoid sends after close
		close(e.taskChan)
		// 7) Close jobExecChan
		close(e.jobExecChan)
		// 8) Clear paused jobs map to release references
		e.mu.Lock()
		e.pausedJobs = nil
		e.mu.Unlock()
		e.log.Debug().Msg("Executor stopped")
	})
}
// newPoolExecutor creates a new pool executor. The executor is not running until
// Start is called; its context is derived from parentCtx and cancelled by Stop.
func newPoolExecutor(
	parentCtx context.Context,
	logger zerolog.Logger,
	errorChan chan error,
	metrics *executorMetrics,
	channelBufferSize int,
	minWorkerCount int,
	scaleInterval time.Duration,
	scalerConfig PoolScaleConfig,
) *poolExecutor {
	execCtx, cancelExec := context.WithCancel(parentCtx)
	componentLog := logger.With().Str("component", "executor").Logger()
	// The scaler's worker pool is wired up later, in Start.
	scaler := newPoolScaler(logger, nil, metrics, scalerConfig)
	return &poolExecutor{
		log:               componentLog,
		ctx:               execCtx,
		cancel:            cancelExec,
		errorChan:         errorChan,
		metrics:           metrics,
		poolScaler:        scaler,
		channelBufferSize: channelBufferSize,
		minWorkerCount:    minWorkerCount,
		scaleInterval:     scaleInterval,
	}
}