From cc3c95e75714699a639d64f0c33437e89de2811f Mon Sep 17 00:00:00 2001
From: Valery Piashchynski
Date: Sun, 12 May 2024 13:31:53 +0200
Subject: [PATCH] Initial commit

---
 pool/async_pool/debug.go      | 147 ++++++++++++
 pool/async_pool/options.go    |  19 ++
 pool/async_pool/pool.go       | 418 ++++++++++++++++++++++++++++++++++
 pool/async_pool/stream.go     |  31 +++
 pool/async_pool/supervisor.go | 180 +++++++++++++++
 worker/worker.go              |   5 +-
 6 files changed, 799 insertions(+), 1 deletion(-)
 create mode 100644 pool/async_pool/debug.go
 create mode 100644 pool/async_pool/options.go
 create mode 100644 pool/async_pool/pool.go
 create mode 100644 pool/async_pool/stream.go
 create mode 100644 pool/async_pool/supervisor.go

diff --git a/pool/async_pool/debug.go b/pool/async_pool/debug.go
new file mode 100644
index 0000000..d4b0cf5
--- /dev/null
+++ b/pool/async_pool/debug.go
@@ -0,0 +1,147 @@
+package async_pool //nolint:stylecheck
+
+import (
+	"context"
+	"runtime"
+
+	"github.com/roadrunner-server/goridge/v3/pkg/frame"
+	"github.com/roadrunner-server/sdk/v4/events"
+	"github.com/roadrunner-server/sdk/v4/fsm"
+	"github.com/roadrunner-server/sdk/v4/payload"
+	"go.uber.org/zap"
+)
+
+// execDebug is used when debug mode is enabled: a worker is allocated per request and destroyed after the response is received
+// TODO DRY
+func (sp *Pool) execDebug(ctx context.Context, p *payload.Payload, stopCh chan struct{}) (chan *PExec, error) {
+	sp.log.Debug("executing in debug mode, worker will be destroyed after response is received")
+	w, err := sp.allocator()
+	if err != nil {
+		return nil, err
+	}
+
+	go func() {
+		// read the exit status to prevent the process from becoming a zombie
+		_ = w.Wait()
+	}()
+
+	rsp, err := w.Exec(ctx, p)
+	if err != nil {
+		return nil, err
+	}
+
+	switch {
+	case rsp.Flags&frame.STREAM != 0:
+		// create a channel for the stream (only if there are no errors)
+		resp := make(chan *PExec, 5)
+		// send the initial frame
+		resp <- newPExec(rsp, nil)
+
+		// in case of a stream, we should not return the worker immediately
+		go func() {
+			// would be called on Goexit
+			defer func() {
+				sp.log.Debug("stopping [stream] worker", zap.Int("pid", int(w.Pid())), zap.String("state", w.State().String()))
+				close(resp)
+				// destroy the worker
+				errD := w.Stop()
+				if errD != nil {
+					sp.log.Debug(
+						"debug mode: worker stopped with error",
+						zap.String("reason", "worker error"),
+						zap.Int64("pid", w.Pid()),
+						zap.String("internal_event_name", events.EventWorkerError.String()),
+						zap.Error(errD),
+					)
+				}
+			}()
+
+			// stream iterator
+			for {
+				select {
+				// we received stop signal
+				case <-stopCh:
+					sp.log.Debug("stream stop signal received", zap.Int("pid", int(w.Pid())), zap.String("state", w.State().String()))
+					ctxT, cancelT := context.WithTimeout(ctx, sp.cfg.StreamTimeout)
+					err = w.StreamCancel(ctxT)
+					cancelT()
+					if err != nil {
+						w.State().Transition(fsm.StateErrored)
+						sp.log.Warn("stream cancel error", zap.Error(err))
+					} else {
+						// successfully canceled
+						w.State().Transition(fsm.StateReady)
+						sp.log.Debug("transition to the ready state", zap.String("from", w.State().String()))
+					}
+
+					runtime.Goexit()
+				default:
+					// we have to set a stream timeout on every request
+					switch sp.supervisedExec {
+					case true:
+						ctxT, cancelT := context.WithTimeout(context.Background(), sp.cfg.Supervisor.ExecTTL)
+						pld, next, errI := w.StreamIterWithContext(ctxT)
+						cancelT()
+						if errI != nil {
+							sp.log.Warn("stream error", zap.Error(errI))
+
+							resp <- newPExec(nil, errI)
+
+							// move the worker to the invalid state to restart it
+							w.State().Transition(fsm.StateInvalid)
+							runtime.Goexit()
+						}
+
+						resp <- newPExec(pld, nil)
+
+						if !next {
+							w.State().Transition(fsm.StateReady)
+							// we've got the last frame
+							runtime.Goexit()
+						}
+					case false:
+						// non-supervised execution, can potentially hang here
+						pld, next, errI := w.StreamIter()
+						if errI != nil {
+							sp.log.Warn("stream iter error", zap.Error(errI))
+							// send error response
+							resp <- newPExec(nil, errI)
+
+							// move the worker to the invalid state to restart it
+							w.State().Transition(fsm.StateInvalid)
+							runtime.Goexit()
+						}
+
+						resp <- newPExec(pld, nil)
+
+						if !next {
+							w.State().Transition(fsm.StateReady)
+							// we've got the last frame
+							runtime.Goexit()
+						}
+					}
+				}
+			}
+		}()
+
+		return resp, nil
+	default:
+		resp := make(chan *PExec, 1)
+		resp <- newPExec(rsp, nil)
+		// close the channel
+		close(resp)
+
+		errD := w.Stop()
+		if errD != nil {
+			sp.log.Debug(
+				"debug mode: worker stopped with error",
+				zap.String("reason", "worker error"),
+				zap.Int64("pid", w.Pid()),
+				zap.String("internal_event_name", events.EventWorkerError.String()),
+				zap.Error(errD),
+			)
+		}
+
+		return resp, nil
+	}
+}
diff --git a/pool/async_pool/options.go b/pool/async_pool/options.go
new file mode 100644
index 0000000..822404f
--- /dev/null
+++ b/pool/async_pool/options.go
@@ -0,0 +1,19 @@
+package async_pool //nolint:stylecheck
+
+import (
+	"go.uber.org/zap"
+)
+
+type Options func(p *Pool)
+
+func WithLogger(z *zap.Logger) Options {
+	return func(p *Pool) {
+		p.log = z
+	}
+}
+
+func WithQueueSize(l uint64) Options {
+	return func(p *Pool) {
+		p.maxQueueSize = l
+	}
+}
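
Usage sketch for the options above (illustrative only, not part of the diff; `ctx`, `cmd` (pool.Command) and `factory` (pool.Factory) are assumed to be supplied by the caller, and the import paths are the ones this package already uses):

	// assumed imports: "context", "go.uber.org/zap",
	// "github.com/roadrunner-server/sdk/v4/pool" and this package (async_pool)
	func newAsyncPool(ctx context.Context, cmd pool.Command, factory pool.Factory, cfg *pool.Config) (*async_pool.Pool, error) {
		z, err := zap.NewDevelopment()
		if err != nil {
			return nil, err
		}
		// a nil logger is allowed here: WithLogger overrides it before the fallback logger is created
		return async_pool.NewPool(ctx, cmd, factory, cfg, nil,
			async_pool.WithLogger(z),      // custom logger
			async_pool.WithQueueSize(100), // reject new requests once 100 are already queued
		)
	}
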
diff --git a/pool/async_pool/pool.go b/pool/async_pool/pool.go
new file mode 100644
index 0000000..584254c
--- /dev/null
+++ b/pool/async_pool/pool.go
@@ -0,0 +1,418 @@
+package async_pool //nolint:stylecheck
+
+import (
+	"context"
+	"runtime"
+	"sync"
+	"sync/atomic"
+	"unsafe"
+
+	"github.com/roadrunner-server/errors"
+	"github.com/roadrunner-server/goridge/v3/pkg/frame"
+	"github.com/roadrunner-server/sdk/v4/events"
+	"github.com/roadrunner-server/sdk/v4/fsm"
+	"github.com/roadrunner-server/sdk/v4/payload"
+	"github.com/roadrunner-server/sdk/v4/pool"
+	"github.com/roadrunner-server/sdk/v4/worker"
+	workerWatcher "github.com/roadrunner-server/sdk/v4/worker_watcher"
+	"go.uber.org/zap"
+)
+
+const (
+	// StopRequest can be sent by a worker to indicate that a restart is required.
+	StopRequest = `{"stop":true}`
+)
+
+// Pool controls worker creation, destruction and task routing. The pool uses a fixed number of workers.
+type Pool struct {
+	// pool configuration
+	cfg *pool.Config
+	// logger
+	log *zap.Logger
+	// worker command creator
+	cmd pool.Command
+	// creates and connects to workers
+	factory pool.Factory
+	// manages worker states and TTLs
+	ww *workerWatcher.WorkerWatcher
+	// allocate new worker
+	allocator func() (*worker.Process, error)
+	// exec queue size
+	queue        uint64
+	maxQueueSize uint64
+	// used in the supervised mode
+	supervisedExec bool
+	stopCh         chan struct{}
+	mu             sync.RWMutex
+}
+
+// NewPool creates a new worker pool and task multiplexer. The pool pre-allocates the configured number of workers.
+// If a supervisor configuration is provided, the supervisor is started; a non-zero ExecTTL additionally switches the pool into supervisedExec mode.
+func NewPool(ctx context.Context, cmd pool.Command, factory pool.Factory, cfg *pool.Config, log *zap.Logger, options ...Options) (*Pool, error) {
+	if factory == nil {
+		return nil, errors.Str("no factory initialized")
+	}
+
+	if cfg == nil {
+		return nil, errors.Str("nil configuration provided")
+	}
+
+	cfg.InitDefaults()
+
+	// for debug mode we need to set the number of workers to 0 (no pre-allocated workers) and max jobs to 1
+	if cfg.Debug {
+		cfg.NumWorkers = 0
+		cfg.MaxJobs = 1
+		cfg.MaxQueueSize = 0
+	}
+
+	p := &Pool{
+		cfg:     cfg,
+		cmd:     cmd,
+		factory: factory,
+		log:     log,
+		queue:   0,
+		// stop channel used by the supervisor loop (see Start/Stop)
+		stopCh: make(chan struct{}, 1),
+	}
+
+	// apply options
+	for i := 0; i < len(options); i++ {
+		options[i](p)
+	}
+
+	if p.log == nil {
+		var err error
+		p.log, err = zap.NewDevelopment()
+		if err != nil {
+			return nil, err
+		}
+	}
+
+	// set up workers allocator
+	p.allocator = pool.NewPoolAllocator(ctx, p.cfg.AllocateTimeout, p.cfg.MaxJobs, factory, cmd, p.cfg.Command, p.log)
+	// set up workers watcher
+	p.ww = workerWatcher.NewSyncWorkerWatcher(p.allocator, p.log, p.cfg.NumWorkers, p.cfg.AllocateTimeout)
+
+	// allocate requested number of workers
+	workers, err := pool.AllocateParallel(p.cfg.NumWorkers, p.allocator)
+	if err != nil {
+		return nil, err
+	}
+
+	// add workers to the watcher
+	err = p.ww.Watch(workers)
+	if err != nil {
+		return nil, err
+	}
+
+	if p.cfg.Supervisor != nil {
+		if p.cfg.Supervisor.ExecTTL != 0 {
+			// we use supervisedExec ExecWithTTL mode only when ExecTTL is set
+			// otherwise we may use a faster Exec
+			p.supervisedExec = true
+		}
+		// start the supervisor
+		p.Start()
+	}
+
+	return p, nil
+}
+
+// GetConfig returns associated pool configuration. Immutable.
+func (sp *Pool) GetConfig() *pool.Config {
+	return sp.cfg
+}
+
+// Workers returns the worker list associated with the pool.
+func (sp *Pool) Workers() (workers []*worker.Process) {
+	return sp.ww.List()
+}
+
+func (sp *Pool) RemoveWorker(ctx context.Context) error {
+	if sp.cfg.Debug {
+		sp.log.Warn("remove worker operation is not allowed in debug mode")
+		return nil
+	}
+	var cancel context.CancelFunc
+	_, ok := ctx.Deadline()
+	if !ok {
+		ctx, cancel = context.WithTimeout(ctx, sp.cfg.DestroyTimeout)
+		defer cancel()
+	}
+
+	return sp.ww.RemoveWorker(ctx)
+}
+
+func (sp *Pool) AddWorker() error {
+	if sp.cfg.Debug {
+		sp.log.Warn("add worker operation is not allowed in debug mode")
+		return nil
+	}
+	return sp.ww.AddWorker()
+}
+
+// Exec executes the provided payload on a worker
+func (sp *Pool) Exec(ctx context.Context, p *payload.Payload, stopCh chan struct{}) (chan *PExec, error) {
+	const op = errors.Op("async_pool_exec")
+
+	if len(p.Body) == 0 && len(p.Context) == 0 {
+		return nil, errors.E(op, errors.Str("payload can not be empty"))
+	}
+
+	// check if we have space to put the request
+	if atomic.LoadUint64(&sp.maxQueueSize) != 0 && atomic.LoadUint64(&sp.queue) >= atomic.LoadUint64(&sp.maxQueueSize) {
+		return nil, errors.E(op, errors.QueueSize, errors.Str("max queue size reached"))
+	}
+
+	if sp.cfg.Debug {
+		switch sp.supervisedExec {
+		case true:
+			ctxTTL, cancel := context.WithTimeout(ctx, sp.cfg.Supervisor.ExecTTL)
+			defer cancel()
+			return sp.execDebug(ctxTTL, p, stopCh)
+		case false:
+			return sp.execDebug(context.Background(), p, stopCh)
+		}
+	}
+
+	/*
+		register request in the QUEUE
+	*/
+	atomic.AddUint64(&sp.queue, 1)
+	defer atomic.AddUint64(&sp.queue, ^uint64(0))
+
+	// see notes at the end of the file
+begin:
+	ctxGetFree, cancel := context.WithTimeout(ctx, sp.cfg.AllocateTimeout)
+	defer cancel()
+	w, err := sp.takeWorker(ctxGetFree, op)
+	if err != nil {
+		return nil, errors.E(op, err)
+	}
+
+	var rsp *payload.Payload
+	switch sp.supervisedExec {
+	case true:
+		// in the supervisedExec mode we're limiting the allowed time for the execution inside the PHP worker
+		ctxT, cancelT := context.WithTimeout(ctx, sp.cfg.Supervisor.ExecTTL)
+		defer cancelT()
+		rsp, err = w.Exec(ctxT, p)
+	case false:
+		// no context here
+		// potential problem: if the worker is hung, we can't stop it
+		rsp, err = w.Exec(context.Background(), p)
+	}
+
+	if w.MaxExecsReached() {
+		sp.log.Debug("requests execution limit reached, worker will be restarted", zap.Int64("pid", w.Pid()), zap.Uint64("execs", w.State().NumExecs()))
+		w.State().Transition(fsm.StateMaxJobsReached)
+	}
+
+	if err != nil {
+		// push an event if a timeout error occurred at any stage
+		switch {
+		case errors.Is(errors.ExecTTL, err):
+			// for this case, the worker is already killed in the ExecTTL function
+			sp.log.Warn("worker stopped, and will be restarted", zap.String("reason", "execTTL timeout elapsed"), zap.Int64("pid", w.Pid()), zap.String("internal_event_name", events.EventExecTTL.String()), zap.Error(err))
+			w.State().Transition(fsm.StateExecTTLReached)
+
+			// worker should already be reallocated
+			return nil, err
+		case errors.Is(errors.SoftJob, err):
+			/*
+				in case of a soft job error we should not kill the worker, this is just an error payload from the worker.
+			*/
+			w.State().Transition(fsm.StateReady)
+			sp.log.Warn("soft worker error", zap.String("reason", "SoftJob"), zap.Int64("pid", w.Pid()), zap.String("internal_event_name", events.EventWorkerSoftError.String()), zap.Error(err))
+			sp.ww.Release(w)
+
+			return nil, err
+		case errors.Is(errors.Network, err):
+			// in case of a network error we can't stop the worker, we should kill it
+			w.State().Transition(fsm.StateErrored)
+			sp.log.Warn("RoadRunner can't communicate with the worker", zap.String("reason", "worker hung or process was killed"), zap.Int64("pid", w.Pid()), zap.String("internal_event_name", events.EventWorkerError.String()), zap.Error(err))
+			// kill the worker instead of sending a net packet to it
+			_ = w.Kill()
+
+			// do not return it, should be reallocated on Kill
+			return nil, err
+		case errors.Is(errors.Retry, err):
+			// put the worker back to the stack and retry the request with a new one
+			sp.ww.Release(w)
+			goto begin
+
+		default:
+			w.State().Transition(fsm.StateErrored)
+			sp.log.Warn("worker will be restarted", zap.Int64("pid", w.Pid()), zap.String("internal_event_name", events.EventWorkerDestruct.String()), zap.Error(err))
+
+			sp.ww.Release(w)
+			return nil, err
+		}
+	}
+
+	// worker wants to be terminated
+	// unsafe is used to quickly transform []byte to string
+	if len(rsp.Body) == 0 && unsafe.String(unsafe.SliceData(rsp.Context), len(rsp.Context)) == StopRequest {
+		w.State().Transition(fsm.StateInvalid)
+		sp.ww.Release(w)
+		goto begin
+	}
+
+	switch {
+	case rsp.Flags&frame.STREAM != 0:
+		sp.log.Debug("stream mode", zap.Int64("pid", w.Pid()))
+		// create a channel for the stream (only if there are no errors)
+		// we need to create a buffered channel to prevent blocking
+		// the stream buffer size should be bigger than the regular one, to have some payloads ready (optimization)
+		resp := make(chan *PExec, 5)
+		// send the initial frame
+		resp <- newPExec(rsp, nil)
+
+		// in case of a stream we should not return the worker back immediately
+		go func() {
+			// would be called on Goexit
+			defer func() {
+				sp.log.Debug("release [stream] worker", zap.Int("pid", int(w.Pid())), zap.String("state", w.State().String()))
+				close(resp)
+				sp.ww.Release(w)
+			}()
+
+			// stream iterator
+			for {
+				select {
+				// we received stop signal
+				case <-stopCh:
+					sp.log.Debug("stream stop signal received", zap.Int("pid", int(w.Pid())), zap.String("state", w.State().String()))
+					ctxT, cancelT := context.WithTimeout(ctx, sp.cfg.StreamTimeout)
+					err = w.StreamCancel(ctxT)
+					cancelT()
+					if err != nil {
+						w.State().Transition(fsm.StateErrored)
+						sp.log.Warn("stream cancel error", zap.Error(err))
+					} else {
+						// successfully canceled
+						w.State().Transition(fsm.StateReady)
+						sp.log.Debug("transition to the ready state", zap.String("from", w.State().String()))
+					}
+
+					runtime.Goexit()
+				default:
+					// we have to set a stream timeout on every request
+					switch sp.supervisedExec {
+					case true:
+						ctxT, cancelT := context.WithTimeout(context.Background(), sp.cfg.Supervisor.ExecTTL)
+						pld, next, errI := w.StreamIterWithContext(ctxT)
+						cancelT()
+						if errI != nil {
+							sp.log.Warn("stream error", zap.Error(errI))
+
+							resp <- newPExec(nil, errI)
+
+							// move the worker to the invalid state to restart it
+							w.State().Transition(fsm.StateInvalid)
+							runtime.Goexit()
+						}
+
+						resp <- newPExec(pld, nil)
+
+						if !next {
+							w.State().Transition(fsm.StateReady)
+							// we've got the last frame
+							runtime.Goexit()
+						}
+					case false:
+						// non-supervised execution, can potentially hang here
+						pld, next, errI := w.StreamIter()
+						if errI != nil {
sp.log.Warn("stream iter error", zap.Error(err)) + // send error response + resp <- newPExec(nil, errI) + + // move worker to the invalid state to restart + w.State().Transition(fsm.StateInvalid) + runtime.Goexit() + } + + resp <- newPExec(pld, nil) + + if !next { + w.State().Transition(fsm.StateReady) + // we've got the last frame + runtime.Goexit() + } + } + } + } + }() + + return resp, nil + default: + resp := make(chan *PExec, 1) + // send the initial frame + resp <- newPExec(rsp, nil) + sp.log.Debug("req-resp mode", zap.Int64("pid", w.Pid())) + if w.State().Compare(fsm.StateWorking) { + w.State().Transition(fsm.StateReady) + } + // return worker back + sp.ww.Release(w) + // close the channel + close(resp) + return resp, nil + } +} + +func (sp *Pool) QueueSize() uint64 { + return atomic.LoadUint64(&sp.queue) +} + +// Destroy all underlying stack (but let them complete the task). +func (sp *Pool) Destroy(ctx context.Context) { + sp.log.Info("destroy signal received", zap.Duration("timeout", sp.cfg.DestroyTimeout)) + var cancel context.CancelFunc + _, ok := ctx.Deadline() + if !ok { + ctx, cancel = context.WithTimeout(ctx, sp.cfg.DestroyTimeout) + defer cancel() + } + sp.ww.Destroy(ctx) + atomic.StoreUint64(&sp.queue, 0) +} + +func (sp *Pool) Reset(ctx context.Context) error { + // set timeout + ctx, cancel := context.WithTimeout(ctx, sp.cfg.ResetTimeout) + defer cancel() + // reset all workers + numToAllocate := sp.ww.Reset(ctx) + // re-allocate all workers + workers, err := pool.AllocateParallel(numToAllocate, sp.allocator) + if err != nil { + return err + } + // add the NEW workers to the watcher + err = sp.ww.Watch(workers) + if err != nil { + return err + } + + return nil +} + +func (sp *Pool) takeWorker(ctxGetFree context.Context, op errors.Op) (*worker.Process, error) { + // Get function consumes context with timeout + w, err := sp.ww.Take(ctxGetFree) + if err != nil { + // if the error is of kind NoFreeWorkers, it means, that we can't get worker from the stack during the allocate timeout + if errors.Is(errors.NoFreeWorkers, err) { + sp.log.Error( + "no free workers in the pool, wait timeout exceed", + zap.String("reason", "no free workers"), + zap.String("internal_event_name", events.EventNoFreeWorkers.String()), + zap.Error(err), + ) + return nil, errors.E(op, err) + } + // else if err not nil - return error + return nil, errors.E(op, err) + } + return w, nil +} diff --git a/pool/async_pool/stream.go b/pool/async_pool/stream.go new file mode 100644 index 0000000..0915ad7 --- /dev/null +++ b/pool/async_pool/stream.go @@ -0,0 +1,31 @@ +package async_pool //nolint:stylecheck + +import "github.com/roadrunner-server/sdk/v4/payload" + +type PExec struct { + pld *payload.Payload + err error +} + +func newPExec(pld *payload.Payload, err error) *PExec { + return &PExec{ + pld: pld, + err: err, + } +} + +func (p *PExec) Payload() *payload.Payload { + return p.pld +} + +func (p *PExec) Body() []byte { + return p.pld.Body +} + +func (p *PExec) Context() []byte { + return p.pld.Context +} + +func (p *PExec) Error() error { + return p.err +} diff --git a/pool/async_pool/supervisor.go b/pool/async_pool/supervisor.go new file mode 100644 index 0000000..2afdfe4 --- /dev/null +++ b/pool/async_pool/supervisor.go @@ -0,0 +1,180 @@ +package async_pool //nolint:stylecheck + +import ( + "time" + + "github.com/roadrunner-server/sdk/v4/events" + "github.com/roadrunner-server/sdk/v4/fsm" + "github.com/roadrunner-server/sdk/v4/state/process" + "go.uber.org/zap" +) + +const ( + MB = 1024 * 1024 + + // 
diff --git a/pool/async_pool/supervisor.go b/pool/async_pool/supervisor.go
new file mode 100644
index 0000000..2afdfe4
--- /dev/null
+++ b/pool/async_pool/supervisor.go
@@ -0,0 +1,180 @@
+package async_pool //nolint:stylecheck
+
+import (
+	"time"
+
+	"github.com/roadrunner-server/sdk/v4/events"
+	"github.com/roadrunner-server/sdk/v4/fsm"
+	"github.com/roadrunner-server/sdk/v4/state/process"
+	"go.uber.org/zap"
+)
+
+const (
+	MB = 1024 * 1024
+
+	// NsecInSec is the number of nanoseconds in a second
+	NsecInSec int64 = 1000000000
+)
+
+func (sp *Pool) Start() {
+	go func() {
+		watchTout := time.NewTicker(sp.cfg.Supervisor.WatchTick)
+		defer watchTout.Stop()
+
+		for {
+			select {
+			// stop here
+			case <-sp.stopCh:
+				return
+			case <-watchTout.C:
+				sp.mu.Lock()
+				sp.control()
+				sp.mu.Unlock()
+			}
+		}
+	}()
+}
+
+func (sp *Pool) Stop() {
+	sp.stopCh <- struct{}{}
+}
+
+func (sp *Pool) control() {
+	now := time.Now()
+
+	// MIGHT BE OUTDATED
+	// It's a copy of the Workers pointers
+	workers := sp.Workers()
+
+	for i := 0; i < len(workers); i++ {
+		// if the worker is not in the Ready OR Working state,
+		// skip it
+		switch workers[i].State().CurrentState() {
+		case
+			fsm.StateInactive,
+			fsm.StateErrored,
+			fsm.StateStopping,
+			fsm.StateStopped,
+			fsm.StateInvalid,
+			fsm.StateMaxJobsReached:
+
+			// do not touch the bad worker until it is pushed back to the stack
+			continue
+
+		case
+			fsm.StateMaxMemoryReached,
+			fsm.StateIdleTTLReached,
+			fsm.StateTTLReached:
+			// we can stop workers that have reached one of these limit states
+			// workers can be moved into these states ONLY by the supervisor and ONLY if the worker is in the StateReady
+			if workers[i] != nil {
+				_ = workers[i].Stop()
+			}
+
+			// call cleanup callback
+			workers[i].Callback()
+
+			continue
+		}
+
+		s, err := process.WorkerProcessState(workers[i])
+		if err != nil {
+			// the worker is no longer valid for supervision
+			continue
+		}
+
+		if sp.cfg.Supervisor.TTL != 0 && now.Sub(workers[i].Created()).Seconds() >= sp.cfg.Supervisor.TTL.Seconds() {
+			/*
+				worker at this point might be in the middle of request execution:
+
+				---> REQ ---> WORKER -----------------> RESP (at this point we should not set the Ready state) ------> | ----> Worker gets between supervisor checks and gets killed in the ww.Release
+				                                                               ^
+				                                               TTL Reached, state - invalid                            |
+				                                                                                                       -----> Worker Stopped here
+			*/
+
+			// if the worker is in StateReady, it is not working on a request and we can safely stop/kill it,
+			// but if the worker is in any other state, we can't stop it, because it might be in the middle of a request execution; instead, we set the Invalid state
+			if workers[i].State().Compare(fsm.StateReady) {
+				workers[i].State().Transition(fsm.StateTTLReached)
+			} else {
+				workers[i].State().Transition(fsm.StateInvalid)
+			}
+
+			sp.log.Debug("ttl", zap.String("reason", "ttl is reached"), zap.Int64("pid", workers[i].Pid()), zap.String("internal_event_name", events.EventTTL.String()))
+			continue
+		}
+
+		if sp.cfg.Supervisor.MaxWorkerMemory != 0 && s.MemoryUsage >= sp.cfg.Supervisor.MaxWorkerMemory*MB {
+			/*
+				worker at this point might be in the middle of request execution:
+
+				---> REQ ---> WORKER -----------------> RESP (at this point we should not set the Ready state) ------> | ----> Worker gets between supervisor checks and gets killed in the ww.Release
+				                                                               ^
+				                                               TTL Reached, state - invalid                            |
+				                                                                                                       -----> Worker Stopped here
+			*/
+
+			// if the worker is in StateReady, it is not working on a request and we can safely stop/kill it,
+			// but if the worker is in any other state, we can't stop it, because it might be in the middle of a request execution; instead, we set the Invalid state
+			if workers[i].State().Compare(fsm.StateReady) {
+				workers[i].State().Transition(fsm.StateMaxMemoryReached)
+			} else {
+				workers[i].State().Transition(fsm.StateInvalid)
+			}
+
+			sp.log.Debug("memory_limit", zap.String("reason", "max memory is reached"), zap.Int64("pid", workers[i].Pid()), zap.String("internal_event_name", events.EventMaxMemory.String()))
+			continue
+		}
+
+		// first we check the worker idle TTL
+		if sp.cfg.Supervisor.IdleTTL != 0 {
+			// then check the worker state
+			if !workers[i].State().Compare(fsm.StateReady) {
+				continue
+			}
+
+			/*
+				Calculate the idle time:
+				if the worker is in StateReady, we read its LastUsed timestamp as UnixNano uint64.
+				For example, if maxWorkerIdle is equal to 5s, then, if (time.Now - LastUsed) > maxWorkerIdle,
+				we assume the worker has exceeded its idle time and has to be killed
+			*/
+
+			// 1610530005534416045 lu
+			// lu - now = -7811150814 - nanoseconds
+			// 7.8 seconds
+			// get last used unix nano
+			lu := workers[i].State().LastUsed()
+			// worker not used yet, skip
+			if lu == 0 {
+				continue
+			}
+
+			// convert last used to unixNano and subtract time.Now to get seconds
+			// negative number, because lu is always in the past, except for the `back to the future` :)
+			res := ((int64(lu) - now.UnixNano()) / NsecInSec) * -1
+
+			// maxWorkerIdle is more than the diff between now and last used
+			// for example:
+			// after exec the worker goes to rest
+			// and rests for 5 seconds.
+			// IdleTTL is 1 second.
+			// After the control check, res will be 5, idle is 1
+			// 5 - 1 = 4, more than 0, YOU ARE FIRED (removed). Done.
+			if int64(sp.cfg.Supervisor.IdleTTL.Seconds())-res <= 0 {
+				/*
+					worker at this point might be in the middle of request execution:
+
+					---> REQ ---> WORKER -----------------> RESP (at this point we should not set the Ready state) ------> | ----> Worker gets between supervisor checks and gets killed in the ww.Release
+					                                                               ^
+					                                               TTL Reached, state - invalid                            |
+					                                                                                                       -----> Worker Stopped here
+				*/
+
+				workers[i].State().Transition(fsm.StateIdleTTLReached)
+				sp.log.Debug("idle_ttl", zap.String("reason", "idle ttl is reached"), zap.Int64("pid", workers[i].Pid()), zap.String("internal_event_name", events.EventTTL.String()))
+			}
+		}
+	}
+}
diff --git a/worker/worker.go b/worker/worker.go
index c1b28c9..84b6c23 100644
--- a/worker/worker.go
+++ b/worker/worker.go
@@ -29,6 +29,9 @@ type Process struct {
 	created time.Time
 	log     *zap.Logger
 
+	// number of requests consumed by the async worker
+	numRequests uint64 //nolint:unused
+
 	// calculated maximum value with jitter
 	maxExecs uint64
 
@@ -244,7 +247,7 @@ func (w *Process) StreamIter() (*payload.Payload, bool, error) {
 	return pld, pld.Flags&frame.STREAM != 0, nil
 }
 
-// StreamIter returns true if stream is available and payload
+// StreamIterWithContext returns the next stream payload and true while more frames are expected
 func (w *Process) StreamIterWithContext(ctx context.Context) (*payload.Payload, bool, error) {
 	c := w.getCh()
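
Runtime-management sketch for the new pool (illustrative only, not part of the diff; `cfg` is assumed to carry a Supervisor section with a non-zero ExecTTL so that supervisedExec mode and the supervisor loop from supervisor.go are active, and `cmd`/`factory` come from the SDK as above):

	func manage(ctx context.Context, cmd pool.Command, factory pool.Factory, cfg *pool.Config, log *zap.Logger) error {
		p, err := async_pool.NewPool(ctx, cmd, factory, cfg, log)
		if err != nil {
			return err
		}

		// scale the pool at runtime
		if err := p.AddWorker(); err != nil {
			return err
		}
		if err := p.RemoveWorker(ctx); err != nil {
			return err
		}

		// drop and re-allocate all workers (bounded by cfg.ResetTimeout)
		if err := p.Reset(ctx); err != nil {
			return err
		}

		// shutdown: stop the supervisor loop first, then destroy the workers
		p.Stop()
		p.Destroy(context.Background())
		return nil
	}
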