mirror of
				https://github.com/hibiken/asynq.git
				synced 2025-10-26 11:16:12 +08:00 
			
		
		
		
	
		
			
				
	
	
		
			490 lines
		
	
	
		
			14 KiB
		
	
	
	
		
			Go
		
	
	
	
	
	
			
		
		
	
	
			490 lines
		
	
	
		
			14 KiB
		
	
	
	
		
			Go
		
	
	
	
	
	
| // Copyright 2020 Kentaro Hibino. All rights reserved.
 | |
| // Use of this source code is governed by a MIT license
 | |
| // that can be found in the LICENSE file.
 | |
| 
 | |
| package asynq
 | |
| 
 | |
| import (
 | |
| 	"context"
 | |
| 	"errors"
 | |
| 	"fmt"
 | |
| 	"math"
 | |
| 	"math/rand"
 | |
| 	"runtime"
 | |
| 	"strings"
 | |
| 	"sync"
 | |
| 	"time"
 | |
| 
 | |
| 	"github.com/hibiken/asynq/internal/base"
 | |
| 	"github.com/hibiken/asynq/internal/log"
 | |
| 	"github.com/hibiken/asynq/internal/rdb"
 | |
| )
 | |
| 
 | |
| // Server is responsible for managing the background-task processing.
 | |
| //
 | |
| // Server pulls tasks off queues and processes them.
 | |
| // If the processing of a task is unsuccessful, server will
 | |
| // schedule it for a retry.
 | |
| // A task will be retried until either the task gets processed successfully
 | |
| // or until it reaches its max retry count.
 | |
| //
 | |
| // If a task exhausts its retries, it will be moved to the "dead" queue and
 | |
| // will be kept in the queue for some time until a certain condition is met
 | |
| // (e.g., queue size reaches a certain limit, or the task has been in the
 | |
| // queue for a certain amount of time).
 | |
| type Server struct {
 | |
| 	logger *log.Logger
 | |
| 
 | |
| 	broker base.Broker
 | |
| 
 | |
| 	status *base.ServerStatus
 | |
| 
 | |
| 	// wait group to wait for all goroutines to finish.
 | |
| 	wg            sync.WaitGroup
 | |
| 	scheduler     *scheduler
 | |
| 	processor     *processor
 | |
| 	syncer        *syncer
 | |
| 	heartbeater   *heartbeater
 | |
| 	subscriber    *subscriber
 | |
| 	recoverer     *recoverer
 | |
| 	healthchecker *healthchecker
 | |
| }
 | |
| 
 | |
| // Config specifies the server's background-task processing behavior.
 | |
| type Config struct {
 | |
| 	// Maximum number of concurrent processing of tasks.
 | |
| 	//
 | |
| 	// If set to a zero or negative value, NewServer will overwrite the value
 | |
| 	// to the number of CPUs usable by the currennt process.
 | |
| 	Concurrency int
 | |
| 
 | |
| 	// Function to calculate retry delay for a failed task.
 | |
| 	//
 | |
| 	// By default, it uses exponential backoff algorithm to calculate the delay.
 | |
| 	//
 | |
| 	// n is the number of times the task has been retried.
 | |
| 	// e is the error returned by the task handler.
 | |
| 	// t is the task in question.
 | |
| 	RetryDelayFunc func(n int, e error, t *Task) time.Duration
 | |
| 
 | |
| 	// List of queues to process with given priority value. Keys are the names of the
 | |
| 	// queues and values are associated priority value.
 | |
| 	//
 | |
| 	// If set to nil or not specified, the server will process only the "default" queue.
 | |
| 	//
 | |
| 	// Priority is treated as follows to avoid starving low priority queues.
 | |
| 	//
 | |
| 	// Example:
 | |
| 	// Queues: map[string]int{
 | |
| 	//     "critical": 6,
 | |
| 	//     "default":  3,
 | |
| 	//     "low":      1,
 | |
| 	// }
 | |
| 	// With the above config and given that all queues are not empty, the tasks
 | |
| 	// in "critical", "default", "low" should be processed 60%, 30%, 10% of
 | |
| 	// the time respectively.
 | |
| 	//
 | |
| 	// If a queue has a zero or negative priority value, the queue will be ignored.
 | |
| 	Queues map[string]int
 | |
| 
 | |
| 	// StrictPriority indicates whether the queue priority should be treated strictly.
 | |
| 	//
 | |
| 	// If set to true, tasks in the queue with the highest priority is processed first.
 | |
| 	// The tasks in lower priority queues are processed only when those queues with
 | |
| 	// higher priorities are empty.
 | |
| 	StrictPriority bool
 | |
| 
 | |
| 	// ErrorHandler handles errors returned by the task handler.
 | |
| 	//
 | |
| 	// HandleError is invoked only if the task handler returns a non-nil error.
 | |
| 	//
 | |
| 	// Example:
 | |
| 	// func reportError(task *asynq.Task, err error, retried, maxRetry int) {
 | |
| 	// 	   if retried >= maxRetry {
 | |
| 	//         err = fmt.Errorf("retry exhausted for task %s: %w", task.Type, err)
 | |
| 	// 	   }
 | |
| 	//     errorReportingService.Notify(err)
 | |
| 	// })
 | |
| 	//
 | |
| 	// ErrorHandler: asynq.ErrorHandlerFunc(reportError)
 | |
| 	ErrorHandler ErrorHandler
 | |
| 
 | |
| 	// Logger specifies the logger used by the server instance.
 | |
| 	//
 | |
| 	// If unset, default logger is used.
 | |
| 	Logger Logger
 | |
| 
 | |
| 	// LogLevel specifies the minimum log level to enable.
 | |
| 	//
 | |
| 	// If unset, InfoLevel is used by default.
 | |
| 	LogLevel LogLevel
 | |
| 
 | |
| 	// ShutdownTimeout specifies the duration to wait to let workers finish their tasks
 | |
| 	// before forcing them to abort when stopping the server.
 | |
| 	//
 | |
| 	// If unset or zero, default timeout of 8 seconds is used.
 | |
| 	ShutdownTimeout time.Duration
 | |
| 
 | |
| 	// HealthCheckFunc is called periodically with any errors encountered during ping to the
 | |
| 	// connected redis server.
 | |
| 	HealthCheckFunc func(error)
 | |
| 
 | |
| 	// HealthCheckInterval specifies the interval between healthchecks.
 | |
| 	//
 | |
| 	// If unset or zero, the interval is set to 15 seconds.
 | |
| 	HealthCheckInterval time.Duration
 | |
| }
 | |
| 
 | |
| // An ErrorHandler handles an error occured during task processing.
 | |
| type ErrorHandler interface {
 | |
| 	HandleError(ctx context.Context, task *Task, err error)
 | |
| }
 | |
| 
 | |
| // The ErrorHandlerFunc type is an adapter to allow the use of  ordinary functions as a ErrorHandler.
 | |
| // If f is a function with the appropriate signature, ErrorHandlerFunc(f) is a ErrorHandler that calls f.
 | |
| type ErrorHandlerFunc func(ctx context.Context, task *Task, err error)
 | |
| 
 | |
| // HandleError calls fn(ctx, task, err)
 | |
| func (fn ErrorHandlerFunc) HandleError(ctx context.Context, task *Task, err error) {
 | |
| 	fn(ctx, task, err)
 | |
| }
 | |
| 
 | |
| // Logger supports logging at various log levels.
 | |
| type Logger interface {
 | |
| 	// Debug logs a message at Debug level.
 | |
| 	Debug(args ...interface{})
 | |
| 
 | |
| 	// Info logs a message at Info level.
 | |
| 	Info(args ...interface{})
 | |
| 
 | |
| 	// Warn logs a message at Warning level.
 | |
| 	Warn(args ...interface{})
 | |
| 
 | |
| 	// Error logs a message at Error level.
 | |
| 	Error(args ...interface{})
 | |
| 
 | |
| 	// Fatal logs a message at Fatal level
 | |
| 	// and process will exit with status set to 1.
 | |
| 	Fatal(args ...interface{})
 | |
| }
 | |
| 
 | |
| // LogLevel represents logging level.
 | |
| //
 | |
| // It satisfies flag.Value interface.
 | |
| type LogLevel int32
 | |
| 
 | |
| const (
 | |
| 	// Note: reserving value zero to differentiate unspecified case.
 | |
| 	level_unspecified LogLevel = iota
 | |
| 
 | |
| 	// DebugLevel is the lowest level of logging.
 | |
| 	// Debug logs are intended for debugging and development purposes.
 | |
| 	DebugLevel
 | |
| 
 | |
| 	// InfoLevel is used for general informational log messages.
 | |
| 	InfoLevel
 | |
| 
 | |
| 	// WarnLevel is used for undesired but relatively expected events,
 | |
| 	// which may indicate a problem.
 | |
| 	WarnLevel
 | |
| 
 | |
| 	// ErrorLevel is used for undesired and unexpected events that
 | |
| 	// the program can recover from.
 | |
| 	ErrorLevel
 | |
| 
 | |
| 	// FatalLevel is used for undesired and unexpected events that
 | |
| 	// the program cannot recover from.
 | |
| 	FatalLevel
 | |
| )
 | |
| 
 | |
| // String is part of the flag.Value interface.
 | |
| func (l *LogLevel) String() string {
 | |
| 	switch *l {
 | |
| 	case DebugLevel:
 | |
| 		return "debug"
 | |
| 	case InfoLevel:
 | |
| 		return "info"
 | |
| 	case WarnLevel:
 | |
| 		return "warn"
 | |
| 	case ErrorLevel:
 | |
| 		return "error"
 | |
| 	case FatalLevel:
 | |
| 		return "fatal"
 | |
| 	}
 | |
| 	panic(fmt.Sprintf("asynq: unexpected log level: %v", *l))
 | |
| }
 | |
| 
 | |
| // Set is part of the flag.Value interface.
 | |
| func (l *LogLevel) Set(val string) error {
 | |
| 	switch strings.ToLower(val) {
 | |
| 	case "debug":
 | |
| 		*l = DebugLevel
 | |
| 	case "info":
 | |
| 		*l = InfoLevel
 | |
| 	case "warn", "warning":
 | |
| 		*l = WarnLevel
 | |
| 	case "error":
 | |
| 		*l = ErrorLevel
 | |
| 	case "fatal":
 | |
| 		*l = FatalLevel
 | |
| 	default:
 | |
| 		return fmt.Errorf("asynq: unsupported log level %q", val)
 | |
| 	}
 | |
| 	return nil
 | |
| }
 | |
| 
 | |
| func toInternalLogLevel(l LogLevel) log.Level {
 | |
| 	switch l {
 | |
| 	case DebugLevel:
 | |
| 		return log.DebugLevel
 | |
| 	case InfoLevel:
 | |
| 		return log.InfoLevel
 | |
| 	case WarnLevel:
 | |
| 		return log.WarnLevel
 | |
| 	case ErrorLevel:
 | |
| 		return log.ErrorLevel
 | |
| 	case FatalLevel:
 | |
| 		return log.FatalLevel
 | |
| 	}
 | |
| 	panic(fmt.Sprintf("asynq: unexpected log level: %v", l))
 | |
| }
 | |
| 
 | |
| // Formula taken from https://github.com/mperham/sidekiq.
 | |
| func defaultDelayFunc(n int, e error, t *Task) time.Duration {
 | |
| 	r := rand.New(rand.NewSource(time.Now().UnixNano()))
 | |
| 	s := int(math.Pow(float64(n), 4)) + 15 + (r.Intn(30) * (n + 1))
 | |
| 	return time.Duration(s) * time.Second
 | |
| }
 | |
| 
 | |
| var defaultQueueConfig = map[string]int{
 | |
| 	base.DefaultQueueName: 1,
 | |
| }
 | |
| 
 | |
| const (
 | |
| 	defaultShutdownTimeout = 8 * time.Second
 | |
| 
 | |
| 	defaultHealthCheckInterval = 15 * time.Second
 | |
| )
 | |
| 
 | |
| // NewServer returns a new Server given a redis connection option
 | |
| // and background processing configuration.
 | |
| func NewServer(r RedisConnOpt, cfg Config) *Server {
 | |
| 	n := cfg.Concurrency
 | |
| 	if n < 1 {
 | |
| 		n = runtime.NumCPU()
 | |
| 	}
 | |
| 	delayFunc := cfg.RetryDelayFunc
 | |
| 	if delayFunc == nil {
 | |
| 		delayFunc = defaultDelayFunc
 | |
| 	}
 | |
| 	queues := make(map[string]int)
 | |
| 	for qname, p := range cfg.Queues {
 | |
| 		if p > 0 {
 | |
| 			queues[qname] = p
 | |
| 		}
 | |
| 	}
 | |
| 	if len(queues) == 0 {
 | |
| 		queues = defaultQueueConfig
 | |
| 	}
 | |
| 	shutdownTimeout := cfg.ShutdownTimeout
 | |
| 	if shutdownTimeout == 0 {
 | |
| 		shutdownTimeout = defaultShutdownTimeout
 | |
| 	}
 | |
| 	healthcheckInterval := cfg.HealthCheckInterval
 | |
| 	if healthcheckInterval == 0 {
 | |
| 		healthcheckInterval = defaultHealthCheckInterval
 | |
| 	}
 | |
| 	logger := log.NewLogger(cfg.Logger)
 | |
| 	loglevel := cfg.LogLevel
 | |
| 	if loglevel == level_unspecified {
 | |
| 		loglevel = InfoLevel
 | |
| 	}
 | |
| 	logger.SetLevel(toInternalLogLevel(loglevel))
 | |
| 
 | |
| 	rdb := rdb.NewRDB(createRedisClient(r))
 | |
| 	starting := make(chan *base.TaskMessage)
 | |
| 	finished := make(chan *base.TaskMessage)
 | |
| 	syncCh := make(chan *syncRequest)
 | |
| 	status := base.NewServerStatus(base.StatusIdle)
 | |
| 	cancels := base.NewCancelations()
 | |
| 
 | |
| 	syncer := newSyncer(syncerParams{
 | |
| 		logger:     logger,
 | |
| 		requestsCh: syncCh,
 | |
| 		interval:   5 * time.Second,
 | |
| 	})
 | |
| 	heartbeater := newHeartbeater(heartbeaterParams{
 | |
| 		logger:         logger,
 | |
| 		broker:         rdb,
 | |
| 		interval:       5 * time.Second,
 | |
| 		concurrency:    n,
 | |
| 		queues:         queues,
 | |
| 		strictPriority: cfg.StrictPriority,
 | |
| 		status:         status,
 | |
| 		starting:       starting,
 | |
| 		finished:       finished,
 | |
| 	})
 | |
| 	scheduler := newScheduler(schedulerParams{
 | |
| 		logger:   logger,
 | |
| 		broker:   rdb,
 | |
| 		interval: 5 * time.Second,
 | |
| 	})
 | |
| 	subscriber := newSubscriber(subscriberParams{
 | |
| 		logger:       logger,
 | |
| 		broker:       rdb,
 | |
| 		cancelations: cancels,
 | |
| 	})
 | |
| 	processor := newProcessor(processorParams{
 | |
| 		logger:          logger,
 | |
| 		broker:          rdb,
 | |
| 		retryDelayFunc:  delayFunc,
 | |
| 		syncCh:          syncCh,
 | |
| 		cancelations:    cancels,
 | |
| 		concurrency:     n,
 | |
| 		queues:          queues,
 | |
| 		strictPriority:  cfg.StrictPriority,
 | |
| 		errHandler:      cfg.ErrorHandler,
 | |
| 		shutdownTimeout: shutdownTimeout,
 | |
| 		starting:        starting,
 | |
| 		finished:        finished,
 | |
| 	})
 | |
| 	recoverer := newRecoverer(recovererParams{
 | |
| 		logger:         logger,
 | |
| 		broker:         rdb,
 | |
| 		retryDelayFunc: delayFunc,
 | |
| 		interval:       1 * time.Minute,
 | |
| 	})
 | |
| 	healthchecker := newHealthChecker(healthcheckerParams{
 | |
| 		logger:          logger,
 | |
| 		broker:          rdb,
 | |
| 		interval:        healthcheckInterval,
 | |
| 		healthcheckFunc: cfg.HealthCheckFunc,
 | |
| 	})
 | |
| 	return &Server{
 | |
| 		logger:        logger,
 | |
| 		broker:        rdb,
 | |
| 		status:        status,
 | |
| 		scheduler:     scheduler,
 | |
| 		processor:     processor,
 | |
| 		syncer:        syncer,
 | |
| 		heartbeater:   heartbeater,
 | |
| 		subscriber:    subscriber,
 | |
| 		recoverer:     recoverer,
 | |
| 		healthchecker: healthchecker,
 | |
| 	}
 | |
| }
 | |
| 
 | |
| // A Handler processes tasks.
 | |
| //
 | |
| // ProcessTask should return nil if the processing of a task
 | |
| // is successful.
 | |
| //
 | |
| // If ProcessTask return a non-nil error or panics, the task
 | |
| // will be retried after delay.
 | |
| type Handler interface {
 | |
| 	ProcessTask(context.Context, *Task) error
 | |
| }
 | |
| 
 | |
| // The HandlerFunc type is an adapter to allow the use of
 | |
| // ordinary functions as a Handler. If f is a function
 | |
| // with the appropriate signature, HandlerFunc(f) is a
 | |
| // Handler that calls f.
 | |
| type HandlerFunc func(context.Context, *Task) error
 | |
| 
 | |
| // ProcessTask calls fn(ctx, task)
 | |
| func (fn HandlerFunc) ProcessTask(ctx context.Context, task *Task) error {
 | |
| 	return fn(ctx, task)
 | |
| }
 | |
| 
 | |
| // ErrServerStopped indicates that the operation is now illegal because of the server being stopped.
 | |
| var ErrServerStopped = errors.New("asynq: the server has been stopped")
 | |
| 
 | |
| // Run starts the background-task processing and blocks until
 | |
| // an os signal to exit the program is received. Once it receives
 | |
| // a signal, it gracefully shuts down all active workers and other
 | |
| // goroutines to process the tasks.
 | |
| //
 | |
| // Run returns any error encountered during server startup time.
 | |
| // If the server has already been stopped, ErrServerStopped is returned.
 | |
| func (srv *Server) Run(handler Handler) error {
 | |
| 	if err := srv.Start(handler); err != nil {
 | |
| 		return err
 | |
| 	}
 | |
| 	srv.waitForSignals()
 | |
| 	srv.Stop()
 | |
| 	return nil
 | |
| }
 | |
| 
 | |
| // Start starts the worker server. Once the server has started,
 | |
| // it pulls tasks off queues and starts a worker goroutine for each task.
 | |
| // Tasks are processed concurrently by the workers  up to the number of
 | |
| // concurrency specified at the initialization time.
 | |
| //
 | |
| // Start returns any error encountered during server startup time.
 | |
| // If the server has already been stopped, ErrServerStopped is returned.
 | |
| func (srv *Server) Start(handler Handler) error {
 | |
| 	if handler == nil {
 | |
| 		return fmt.Errorf("asynq: server cannot run with nil handler")
 | |
| 	}
 | |
| 	switch srv.status.Get() {
 | |
| 	case base.StatusRunning:
 | |
| 		return fmt.Errorf("asynq: the server is already running")
 | |
| 	case base.StatusStopped:
 | |
| 		return ErrServerStopped
 | |
| 	}
 | |
| 	srv.status.Set(base.StatusRunning)
 | |
| 	srv.processor.handler = handler
 | |
| 
 | |
| 	srv.logger.Info("Starting processing")
 | |
| 
 | |
| 	srv.heartbeater.start(&srv.wg)
 | |
| 	srv.healthchecker.start(&srv.wg)
 | |
| 	srv.subscriber.start(&srv.wg)
 | |
| 	srv.syncer.start(&srv.wg)
 | |
| 	srv.recoverer.start(&srv.wg)
 | |
| 	srv.scheduler.start(&srv.wg)
 | |
| 	srv.processor.start(&srv.wg)
 | |
| 	return nil
 | |
| }
 | |
| 
 | |
| // Stop stops the worker server.
 | |
| // It gracefully closes all active workers. The server will wait for
 | |
| // active workers to finish processing tasks for duration specified in Config.ShutdownTimeout.
 | |
| // If worker didn't finish processing a task during the timeout, the task will be pushed back to Redis.
 | |
| func (srv *Server) Stop() {
 | |
| 	switch srv.status.Get() {
 | |
| 	case base.StatusIdle, base.StatusStopped:
 | |
| 		// server is not running, do nothing and return.
 | |
| 		return
 | |
| 	}
 | |
| 
 | |
| 	srv.logger.Info("Starting graceful shutdown")
 | |
| 	// Note: The order of termination is important.
 | |
| 	// Sender goroutines should be terminated before the receiver goroutines.
 | |
| 	// processor -> syncer (via syncCh)
 | |
| 	// processor -> heartbeater (via starting, finished channels)
 | |
| 	srv.scheduler.terminate()
 | |
| 	srv.processor.terminate()
 | |
| 	srv.recoverer.terminate()
 | |
| 	srv.syncer.terminate()
 | |
| 	srv.subscriber.terminate()
 | |
| 	srv.healthchecker.terminate()
 | |
| 	srv.heartbeater.terminate()
 | |
| 
 | |
| 	srv.wg.Wait()
 | |
| 
 | |
| 	srv.broker.Close()
 | |
| 	srv.status.Set(base.StatusStopped)
 | |
| 
 | |
| 	srv.logger.Info("Exiting")
 | |
| }
 | |
| 
 | |
| // Quiet signals the server to stop pulling new tasks off queues.
 | |
| // Quiet should be used before stopping the server.
 | |
| func (srv *Server) Quiet() {
 | |
| 	srv.logger.Info("Stopping processor")
 | |
| 	srv.processor.stop()
 | |
| 	srv.status.Set(base.StatusQuiet)
 | |
| 	srv.logger.Info("Processor stopped")
 | |
| }
 |