asynq/processor.go

// Copyright 2020 Kentaro Hibino. All rights reserved.
// Use of this source code is governed by a MIT license
// that can be found in the LICENSE file.

package asynq

import (
	"fmt"
	"log"
	"sync"
	"time"

	"github.com/hibiken/asynq/internal/base"
	"github.com/hibiken/asynq/internal/rdb"
)

// processor pulls tasks out of the queue and runs each of them in its own
// worker goroutine, using sema to cap how many workers run at the same time.
type processor struct {
	// rdb is used to dequeue tasks and to record what happened to them
	// (done, retry, kill, requeue, restore).
	rdb *rdb.RDB

	// handler is called (through perform) for every dequeued task.
	handler Handler

	// retryDelayFunc computes how long to wait before a failed task is retried.
	retryDelayFunc retryDelayFunc

	// timeout for blocking dequeue operation.
	// dequeue needs to timeout to avoid blocking forever
	// in case of a program shutdown or addition of a new queue.
	dequeueTimeout time.Duration

	// sema is a counting semaphore to ensure the number of active workers
	// does not exceed the limit.
	// exec sends a value to acquire a token, each worker receives one to
	// release it, and terminate fills the channel to wait for all workers.
	sema chan struct{}

	// channel to communicate back to the long running "processor" goroutine.
	// once is used to send value to the channel only once.
	done chan struct{}
	once sync.Once

	// abort channel is closed when the shutdown of the "processor" goroutine starts.
	abort chan struct{}

	// quit channel communicates to the in-flight worker goroutines to stop.
	// It is closed by a timer that terminate starts.
	quit chan struct{}
}

// retryDelayFunc returns how long to wait before the next attempt of a
// failed task. The processor calls it with the message's Retried count, the
// error produced by the handler and a Task built from the message, and
// schedules the retry at the current time plus the returned duration.
type retryDelayFunc func(n int, err error, task *Task) time.Duration

// newProcessor builds a processor that talks to r, runs at most n workers at
// the same time and uses fn to compute retry delays.
//
// The returned processor has a 2 second dequeue timeout and a placeholder
// handler that fails every task with "handler not set".
func newProcessor(r *rdb.RDB, n int, fn retryDelayFunc) *processor {
	// Placeholder used until a real handler is assigned to the processor.
	unset := HandlerFunc(func(t *Task) error {
		return fmt.Errorf("handler not set")
	})

	p := new(processor)
	p.rdb = r
	p.handler = unset
	p.retryDelayFunc = fn
	p.dequeueTimeout = 2 * time.Second
	p.sema = make(chan struct{}, n) // one slot per concurrent worker
	p.done = make(chan struct{})
	p.abort = make(chan struct{})
	p.quit = make(chan struct{})
	return p
}

// stop shuts down the "processor" goroutine only; workers that are already
// running are left alone.
// Calling it more than once is safe: only the first call has any effect.
func (p *processor) stop() {
	shutdown := func() {
		log.Println("[INFO] Processor shutting down...")
		// Closing abort wakes up exec if it is blocked waiting for a sema token.
		close(p.abort)
		// Tell the processor goroutine to stop pulling tasks from the queue.
		p.done <- struct{}{}
	}
	p.once.Do(shutdown)
}

// terminate stops the processor goroutine and then waits for the workers.
// A timer closes the quit channel after a fixed grace period so that workers
// still waiting on their handler give up. Once every semaphore token has
// been collected, restore is called to move unfinished tasks back to the queue.
//
// NOTE: once terminated, processor cannot be re-started.
func (p *processor) terminate() {
	p.stop()

	// IDEA: Allow user to customize this timeout value.
	const gracePeriod = 8 * time.Second
	signalQuit := func() { close(p.quit) }
	time.AfterFunc(gracePeriod, signalQuit)

	log.Println("[INFO] Waiting for all workers to finish...")
	// Taking every token of the semaphore is only possible once all
	// workers have given theirs back.
	for remaining := cap(p.sema); remaining > 0; remaining-- {
		p.sema <- struct{}{}
	}
	log.Println("[INFO] All workers have finished.")

	// move any unfinished tasks back to the queue.
	p.restore()
}

// start restores unfinished tasks and then launches the "processor"
// goroutine, which keeps calling exec until a value arrives on done.
func (p *processor) start() {
	// NOTE: The call to "restore" needs to complete before starting
	// the processor goroutine.
	p.restore()

	loop := func() {
		for {
			// Non-blocking check for the stop signal before each round.
			select {
			case <-p.done:
				log.Println("[INFO] Processor done.")
				return
			default:
			}
			p.exec()
		}
	}
	go loop()
}

// exec pulls a task out of the queue and starts a worker goroutine to
// process the task.
//
// It returns without starting a worker when the dequeue times out or fails.
// When shutdown has started (abort is closed) the dequeued message is
// requeued instead of being processed.
func (p *processor) exec() {
	msg, err := p.rdb.Dequeue(p.dequeueTimeout)
	if err == rdb.ErrDequeueTimeout {
		// timed out, this is a normal behavior.
		return
	}
	if err != nil {
		log.Printf("[ERROR] unexpected error while pulling a task out of queue: %v\n", err)
		return
	}

	// Check abort on its own first: when both abort and sema are ready, a
	// single select picks one of them at random and could start a new
	// worker even though shutdown has already begun.
	select {
	case <-p.abort:
		p.requeue(msg)
		return
	default:
	}

	select {
	case <-p.abort:
		// shutdown started while waiting for a token,
		// return immediately after requeuing the message.
		p.requeue(msg)
		return
	case p.sema <- struct{}{}: // acquire token
		go func() {
			defer func() { <-p.sema /* release token */ }()

			// Buffered so the handler goroutine can always deliver its result
			// and exit, even if this worker has already returned on quit.
			resCh := make(chan error, 1)
			task := &Task{Type: msg.Type, Payload: msg.Payload}
			go func() {
				resCh <- perform(p.handler, task)
			}()

			select {
			case <-p.quit:
				// time is up, quit this worker goroutine.
				log.Printf("[WARN] Terminating in-progress task %+v\n", msg)
				return
			case resErr := <-resCh:
				// Note: One of three things should happen.
				// 1) Done  -> Removes the message from InProgress
				// 2) Retry -> Removes the message from InProgress & Adds the message to Retry
				// 3) Kill  -> Removes the message from InProgress & Adds the message to Dead
				if resErr != nil {
					if msg.Retried >= msg.Retry {
						p.kill(msg, resErr)
					} else {
						p.retry(msg, resErr)
					}
					return
				}
				p.markAsDone(msg)
			}
		}()
	}
}

// restore asks rdb to move every task that is still marked "in-progress"
// back to the queue, logging a failure and, when at least one task was
// moved, the number of restored tasks.
func (p *processor) restore() {
	restored, err := p.rdb.RestoreUnfinished()
	if err != nil {
		log.Printf("[ERROR] Could not restore unfinished tasks: %v\n", err)
	}
	if restored <= 0 {
		// nothing was moved, nothing to report.
		return
	}
	log.Printf("[INFO] Restored %d unfinished tasks back to queue.\n", restored)
}

// requeue hands msg back to rdb.Requeue. A failure is only logged.
func (p *processor) requeue(msg *base.TaskMessage) {
	if err := p.rdb.Requeue(msg); err != nil {
		log.Printf("[ERROR] Could not move task from InProgress back to queue: %v\n", err)
	}
}

// markAsDone reports msg as completed through rdb.Done. A failure is only logged.
func (p *processor) markAsDone(msg *base.TaskMessage) {
	if err := p.rdb.Done(msg); err != nil {
		log.Printf("[ERROR] Could not remove task from InProgress queue: %v\n", err)
	}
}

// retry schedules msg for another attempt. The delay comes from
// retryDelayFunc, which receives the number of retries so far, the error e
// and a Task built from msg; e's text is stored along with the message.
// A failure to schedule the retry is only logged.
func (p *processor) retry(msg *base.TaskMessage, e error) {
	task := &Task{Type: msg.Type, Payload: msg.Payload}
	delay := p.retryDelayFunc(msg.Retried, e, task)
	if err := p.rdb.Retry(msg, time.Now().Add(delay), e.Error()); err != nil {
		log.Printf("[ERROR] Could not send task %+v to Retry queue: %v\n", msg, err)
	}
}

// kill logs that msg has run out of retries and passes it to rdb.Kill
// together with the text of e. A failure of that call is only logged.
func (p *processor) kill(msg *base.TaskMessage, e error) {
	log.Printf("[WARN] Retry exhausted for task(Type: %q, ID: %v)\n", msg.Type, msg.ID)
	if err := p.rdb.Kill(msg, e.Error()); err != nil {
		log.Printf("[ERROR] Could not send task %+v to Dead queue: %v\n", msg, err)
	}
}

// perform runs h.ProcessTask on task and returns its result.
// A panic raised by the handler does not propagate: it is recovered and
// reported as an error whose message is "panic: " followed by the panic value.
func perform(h Handler, task *Task) (err error) {
	defer func() {
		r := recover()
		if r == nil {
			return
		}
		// Overwrite the named result so the caller sees the panic as an error.
		err = fmt.Errorf("panic: %v", r)
	}()
	err = h.ProcessTask(task)
	return err
}
Add license comment to all src files 2020-01-03 10:13:16 +08:00			`// Copyright 2020 Kentaro Hibino. All rights reserved.`
			`// Use of this source code is governed by a MIT license`
			`// that can be found in the LICENSE file.`

Extract manager to its own type 2019-11-19 22:48:54 +08:00			`package asynq`

			`import (`
			`"fmt"`
			`"log"`
Stop processing more tasks from the queue once TSTP signal is received 2019-12-17 22:18:22 +08:00			`"sync"`
Extract manager to its own type 2019-11-19 22:48:54 +08:00			`"time"`
Extract rdb to internal package 2019-12-04 13:01:26 +08:00
Create base internal package 2019-12-22 23:15:45 +08:00			`"github.com/hibiken/asynq/internal/base"`
Extract rdb to internal package 2019-12-04 13:01:26 +08:00			`"github.com/hibiken/asynq/internal/rdb"`
Extract manager to its own type 2019-11-19 22:48:54 +08:00			`)`

Rename manager to processor 2019-11-21 12:08:03 +08:00			`type processor struct {`
Extract rdb to internal package 2019-12-04 13:01:26 +08:00			`rdb *rdb.RDB`
Extract manager to its own type 2019-11-19 22:48:54 +08:00
Change Background API to take Handler interface 2019-12-03 12:42:21 +08:00			`handler Handler`
Extract manager to its own type 2019-11-19 22:48:54 +08:00
Allow user to specify retry delay duration 2019-12-30 09:43:19 +08:00			`retryDelayFunc retryDelayFunc`

Add test for processor 2019-11-30 04:48:54 +08:00			`// timeout for blocking dequeue operation.`
			`// dequeue needs to timeout to avoid blocking forever`
			`// in case of a program shutdown or additon of a new queue.`
			`dequeueTimeout time.Duration`

Extract manager to its own type 2019-11-19 22:48:54 +08:00			`// sema is a counting semaphore to ensure the number of active workers`
Add test for processor 2019-11-30 04:48:54 +08:00			`// does not exceed the limit.`
Extract manager to its own type 2019-11-19 22:48:54 +08:00			`sema chan struct{}`

Rename manager to processor 2019-11-21 12:08:03 +08:00			`// channel to communicate back to the long running "processor" goroutine.`
Use sync.Once 2019-12-18 12:34:56 +08:00			`// once is used to send value to the channel only once.`
Extract manager to its own type 2019-11-19 22:48:54 +08:00			`done chan struct{}`
Use sync.Once 2019-12-18 12:34:56 +08:00			`once sync.Once`
Unblock processor shutdown process if processor is waiting for semaphore token 2019-12-18 12:07:17 +08:00
Rename channel name 2019-12-19 10:57:48 +08:00			`// abort channel is closed when the shutdown of the "processor" goroutine starts.`
			`abort chan struct{}`
Add timeout to worker goroutines when TERM signal is received Wait for a certain amount of time to allow for worker goroutines to finish. If the goroutines don't finish with the timeout duration, processor will quit the goroutines and restore any unfinished tasks from the in_progress queue back to the default queue. 2019-12-16 13:00:09 +08:00
			`// quit channel communicates to the in-flight worker goroutines to stop.`
			`quit chan struct{}`
Extract manager to its own type 2019-11-19 22:48:54 +08:00			`}`

Allow user to specify retry delay duration 2019-12-30 09:43:19 +08:00			`type retryDelayFunc func(n int, err error, task *Task) time.Duration`

			`func newProcessor(r rdb.RDB, n int, fn retryDelayFunc) processor {`
Rename manager to processor 2019-11-21 12:08:03 +08:00			`return &processor{`
Extract rdb to internal package 2019-12-04 13:01:26 +08:00			`rdb: r,`
Allow user to specify retry delay duration 2019-12-30 09:43:19 +08:00			`retryDelayFunc: fn,`
Unblock processor shutdown process if processor is waiting for semaphore token 2019-12-18 12:07:17 +08:00			`dequeueTimeout: 2 * time.Second,`
Allow user to specify retry delay duration 2019-12-30 09:43:19 +08:00			`sema: make(chan struct{}, n),`
Add test for processor 2019-11-30 04:48:54 +08:00			`done: make(chan struct{}),`
Rename channel name 2019-12-19 10:57:48 +08:00			`abort: make(chan struct{}),`
Add timeout to worker goroutines when TERM signal is received Wait for a certain amount of time to allow for worker goroutines to finish. If the goroutines don't finish with the timeout duration, processor will quit the goroutines and restore any unfinished tasks from the in_progress queue back to the default queue. 2019-12-16 13:00:09 +08:00			`quit: make(chan struct{}),`
Allow user to specify retry delay duration 2019-12-30 09:43:19 +08:00			`handler: HandlerFunc(func(t *Task) error { return fmt.Errorf("handler not set") }),`
Extract manager to its own type 2019-11-19 22:48:54 +08:00			`}`
			`}`

Stop processing more tasks from the queue once TSTP signal is received 2019-12-17 22:18:22 +08:00			`// Note: stops only the "processor" goroutine, does not stop workers.`
			`// It's safe to call this method multiple times.`
			`func (p *processor) stop() {`
Use sync.Once 2019-12-18 12:34:56 +08:00			`p.once.Do(func() {`
			`log.Println("[INFO] Processor shutting down...")`
			`// Unblock if processor is waiting for sema token.`
Rename channel name 2019-12-19 10:57:48 +08:00			`close(p.abort)`
Use sync.Once 2019-12-18 12:34:56 +08:00			`// Signal the processor goroutine to stop processing tasks`
			`// from the queue.`
			`p.done <- struct{}{}`
			`})`
Stop processing more tasks from the queue once TSTP signal is received 2019-12-17 22:18:22 +08:00			`}`

Add test for processor 2019-11-30 04:48:54 +08:00			`// NOTE: once terminated, processor cannot be re-started.`
Rename manager to processor 2019-11-21 12:08:03 +08:00			`func (p *processor) terminate() {`
Stop processing more tasks from the queue once TSTP signal is received 2019-12-17 22:18:22 +08:00			`p.stop()`
Gracefully shutdown all scheduled goroutines on (*Launcher).Stop 2019-11-19 23:38:09 +08:00
Minor cleanup 2019-12-30 23:10:13 +08:00			`// IDEA: Allow user to customize this timeout value.`
Add timeout to worker goroutines when TERM signal is received Wait for a certain amount of time to allow for worker goroutines to finish. If the goroutines don't finish with the timeout duration, processor will quit the goroutines and restore any unfinished tasks from the in_progress queue back to the default queue. 2019-12-16 13:00:09 +08:00			`const timeout = 8 * time.Second`
			`time.AfterFunc(timeout, func() { close(p.quit) })`
Change shutdown message to use info level logging 2019-11-29 23:14:28 +08:00			`log.Println("[INFO] Waiting for all workers to finish...")`
Minor cleanup 2019-11-28 11:36:56 +08:00			`// block until all workers have released the token`
Rename manager to processor 2019-11-21 12:08:03 +08:00			`for i := 0; i < cap(p.sema); i++ {`
			`p.sema <- struct{}{}`
Gracefully shutdown all scheduled goroutines on (*Launcher).Stop 2019-11-19 23:38:09 +08:00			`}`
Change shutdown message to use info level logging 2019-11-29 23:14:28 +08:00			`log.Println("[INFO] All workers have finished.")`
Add timeout to worker goroutines when TERM signal is received Wait for a certain amount of time to allow for worker goroutines to finish. If the goroutines don't finish with the timeout duration, processor will quit the goroutines and restore any unfinished tasks from the in_progress queue back to the default queue. 2019-12-16 13:00:09 +08:00			`p.restore() // move any unfinished tasks back to the queue.`
Extract manager to its own type 2019-11-19 22:48:54 +08:00			`}`

Rename manager to processor 2019-11-21 12:08:03 +08:00			`func (p *processor) start() {`
Add logic to restore unfinished tasks back into the default queue if there are any uncompleted tasks 2019-11-24 07:09:50 +08:00			`// NOTE: The call to "restore" needs to complete before starting`
			`// the processor goroutine.`
			`p.restore()`
Extract manager to its own type 2019-11-19 22:48:54 +08:00			`go func() {`
			`for {`
			`select {`
Rename manager to processor 2019-11-21 12:08:03 +08:00			`case <-p.done:`
Change shutdown message to use info level logging 2019-11-29 23:14:28 +08:00			`log.Println("[INFO] Processor done.")`
Gracefully shutdown all scheduled goroutines on (*Launcher).Stop 2019-11-19 23:38:09 +08:00			`return`
Extract manager to its own type 2019-11-19 22:48:54 +08:00			`default:`
Rename manager to processor 2019-11-21 12:08:03 +08:00			`p.exec()`
Extract manager to its own type 2019-11-19 22:48:54 +08:00			`}`
			`}`
			`}()`
			`}`

Track in-progress tasks with redis SET 2019-11-22 13:45:27 +08:00			`// exec pulls a task out of the queue and starts a worker goroutine to`
			`// process the task.`
Rename manager to processor 2019-11-21 12:08:03 +08:00			`func (p *processor) exec() {`
Change rdb Dequeue signature 2019-12-04 22:25:58 +08:00			`msg, err := p.rdb.Dequeue(p.dequeueTimeout)`
Extract rdb to internal package 2019-12-04 13:01:26 +08:00			`if err == rdb.ErrDequeueTimeout {`
Minor cleanup 2019-11-28 11:36:56 +08:00			`// timed out, this is a normal behavior.`
			`return`
			`}`
Extract manager to its own type 2019-11-19 22:48:54 +08:00			`if err != nil {`
Minor cleanup 2019-11-28 11:36:56 +08:00			`log.Printf("[ERROR] unexpected error while pulling a task out of queue: %v\n", err)`
			`return`
Extract manager to its own type 2019-11-19 22:48:54 +08:00			`}`

Unblock processor shutdown process if processor is waiting for semaphore token 2019-12-18 12:07:17 +08:00			`select {`
Rename channel name 2019-12-19 10:57:48 +08:00			`case <-p.abort:`
Unblock processor shutdown process if processor is waiting for semaphore token 2019-12-18 12:07:17 +08:00			`// shutdown is starting, return immediately after requeuing the message.`
			`p.requeue(msg)`
			`return`
			`case p.sema <- struct{}{}: // acquire token`
Add timeout to worker goroutines when TERM signal is received Wait for a certain amount of time to allow for worker goroutines to finish. If the goroutines don't finish with the timeout duration, processor will quit the goroutines and restore any unfinished tasks from the in_progress queue back to the default queue. 2019-12-16 13:00:09 +08:00			`go func() {`
Unblock processor shutdown process if processor is waiting for semaphore token 2019-12-18 12:07:17 +08:00			`defer func() { <-p.sema /* release token */ }()`

			`resCh := make(chan error, 1)`
			`task := &Task{Type: msg.Type, Payload: msg.Payload}`
			`go func() {`
			`resCh <- perform(p.handler, task)`
			`}()`
Add timeout to worker goroutines when TERM signal is received Wait for a certain amount of time to allow for worker goroutines to finish. If the goroutines don't finish with the timeout duration, processor will quit the goroutines and restore any unfinished tasks from the in_progress queue back to the default queue. 2019-12-16 13:00:09 +08:00
Unblock processor shutdown process if processor is waiting for semaphore token 2019-12-18 12:07:17 +08:00			`select {`
			`case <-p.quit:`
			`// time is up, quit this worker goroutine.`
Log warning and info messages when unfinished tasks get aborted 2019-12-19 10:55:08 +08:00			`log.Printf("[WARN] Terminating in-progress task %+v\n", msg)`
Unblock processor shutdown process if processor is waiting for semaphore token 2019-12-18 12:07:17 +08:00			`return`
			`case resErr := <-resCh:`
			`// Note: One of three things should happen.`
			`// 1) Done -> Removes the message from InProgress`
			`// 2) Retry -> Removes the message from InProgress & Adds the message to Retry`
			`// 3) Kill -> Removes the message from InProgress & Adds the message to Dead`
			`if resErr != nil {`
			`if msg.Retried >= msg.Retry {`
Allow user to specify retry delay duration 2019-12-30 09:43:19 +08:00			`p.kill(msg, resErr)`
Minor cleanup 2019-12-26 12:04:29 +08:00			`} else {`
Allow user to specify retry delay duration 2019-12-30 09:43:19 +08:00			`p.retry(msg, resErr)`
Unblock processor shutdown process if processor is waiting for semaphore token 2019-12-18 12:07:17 +08:00			`}`
Add timeout to worker goroutines when TERM signal is received Wait for a certain amount of time to allow for worker goroutines to finish. If the goroutines don't finish with the timeout duration, processor will quit the goroutines and restore any unfinished tasks from the in_progress queue back to the default queue. 2019-12-16 13:00:09 +08:00			`return`
			`}`
Unblock processor shutdown process if processor is waiting for semaphore token 2019-12-18 12:07:17 +08:00			`p.markAsDone(msg)`
Track in-progress tasks with redis SET 2019-11-22 13:45:27 +08:00			`}`
Unblock processor shutdown process if processor is waiting for semaphore token 2019-12-18 12:07:17 +08:00			`}()`
			`}`
Extract manager to its own type 2019-11-19 22:48:54 +08:00			`}`
Add logic to restore unfinished tasks back into the default queue if there are any uncompleted tasks 2019-11-24 07:09:50 +08:00
			`// restore moves all tasks from "in-progress" back to queue`
			`// to restore all unfinished tasks.`
			`func (p *processor) restore() {`
Log warning and info messages when unfinished tasks get aborted 2019-12-19 10:55:08 +08:00			`n, err := p.rdb.RestoreUnfinished()`
Add logic to restore unfinished tasks back into the default queue if there are any uncompleted tasks 2019-11-24 07:09:50 +08:00			`if err != nil {`
Add timeout to worker goroutines when TERM signal is received Wait for a certain amount of time to allow for worker goroutines to finish. If the goroutines don't finish with the timeout duration, processor will quit the goroutines and restore any unfinished tasks from the in_progress queue back to the default queue. 2019-12-16 13:00:09 +08:00			`log.Printf("[ERROR] Could not restore unfinished tasks: %v\n", err)`
			`}`
Log warning and info messages when unfinished tasks get aborted 2019-12-19 10:55:08 +08:00			`if n > 0 {`
			`log.Printf("[INFO] Restored %d unfinished tasks back to queue.\n", n)`
			`}`
Add timeout to worker goroutines when TERM signal is received Wait for a certain amount of time to allow for worker goroutines to finish. If the goroutines don't finish with the timeout duration, processor will quit the goroutines and restore any unfinished tasks from the in_progress queue back to the default queue. 2019-12-16 13:00:09 +08:00			`}`

Create base internal package 2019-12-22 23:15:45 +08:00			`func (p processor) requeue(msg base.TaskMessage) {`
Unblock processor shutdown process if processor is waiting for semaphore token 2019-12-18 12:07:17 +08:00			`err := p.rdb.Requeue(msg)`
			`if err != nil {`
			`log.Printf("[ERROR] Could not move task from InProgress back to queue: %v\n", err)`
			`}`
			`}`

Create base internal package 2019-12-22 23:15:45 +08:00			`func (p processor) markAsDone(msg base.TaskMessage) {`
Add timeout to worker goroutines when TERM signal is received Wait for a certain amount of time to allow for worker goroutines to finish. If the goroutines don't finish with the timeout duration, processor will quit the goroutines and restore any unfinished tasks from the in_progress queue back to the default queue. 2019-12-16 13:00:09 +08:00			`err := p.rdb.Done(msg)`
			`if err != nil {`
			`log.Printf("[ERROR] Could not remove task from InProgress queue: %v\n", err)`
			`}`
			`}`

Allow user to specify retry delay duration 2019-12-30 09:43:19 +08:00			`func (p processor) retry(msg base.TaskMessage, e error) {`
			`d := p.retryDelayFunc(msg.Retried, e, &Task{Type: msg.Type, Payload: msg.Payload})`
			`retryAt := time.Now().Add(d)`
			`err := p.rdb.Retry(msg, retryAt, e.Error())`
Add timeout to worker goroutines when TERM signal is received Wait for a certain amount of time to allow for worker goroutines to finish. If the goroutines don't finish with the timeout duration, processor will quit the goroutines and restore any unfinished tasks from the in_progress queue back to the default queue. 2019-12-16 13:00:09 +08:00			`if err != nil {`
			`log.Printf("[ERROR] Could not send task %+v to Retry queue: %v\n", msg, err)`
			`}`
			`}`

Allow user to specify retry delay duration 2019-12-30 09:43:19 +08:00			`func (p processor) kill(msg base.TaskMessage, e error) {`
Add timeout to worker goroutines when TERM signal is received Wait for a certain amount of time to allow for worker goroutines to finish. If the goroutines don't finish with the timeout duration, processor will quit the goroutines and restore any unfinished tasks from the in_progress queue back to the default queue. 2019-12-16 13:00:09 +08:00			`log.Printf("[WARN] Retry exhausted for task(Type: %q, ID: %v)\n", msg.Type, msg.ID)`
Allow user to specify retry delay duration 2019-12-30 09:43:19 +08:00			`err := p.rdb.Kill(msg, e.Error())`
Add timeout to worker goroutines when TERM signal is received Wait for a certain amount of time to allow for worker goroutines to finish. If the goroutines don't finish with the timeout duration, processor will quit the goroutines and restore any unfinished tasks from the in_progress queue back to the default queue. 2019-12-16 13:00:09 +08:00			`if err != nil {`
			`log.Printf("[ERROR] Could not send task %+v to Dead queue: %v\n", msg, err)`
Add logic to restore unfinished tasks back into the default queue if there are any uncompleted tasks 2019-11-24 07:09:50 +08:00			`}`
			`}`
Protect handler call against panic 2019-11-28 06:03:04 +08:00
			`// perform calls the handler with the given task.`
			`// If the call returns without panic, it simply returns the value,`
			`// otherwise, it recovers from panic and returns an error.`
Change Background API to take Handler interface 2019-12-03 12:42:21 +08:00			`func perform(h Handler, task *Task) (err error) {`
Protect handler call against panic 2019-11-28 06:03:04 +08:00			`defer func() {`
			`if x := recover(); x != nil {`
			`err = fmt.Errorf("panic: %v", x)`
			`}`
			`}()`
Change Background API to take Handler interface 2019-12-03 12:42:21 +08:00			`return h.ProcessTask(task)`
Protect handler call against panic 2019-11-28 06:03:04 +08:00			`}`