From f7dd603f3886691af6c1fb1c10a0cf03035b33d9 Mon Sep 17 00:00:00 2001 From: Kyle Xiao Date: Thu, 2 Jan 2025 11:54:08 +0800 Subject: [PATCH] feat: now gopool pkg --- concurrency/gopool/gopool.go | 227 ++++++++++++++++++++++++++++++ concurrency/gopool/gopool_test.go | 199 ++++++++++++++++++++++++++ 2 files changed, 426 insertions(+) create mode 100644 concurrency/gopool/gopool.go create mode 100644 concurrency/gopool/gopool_test.go diff --git a/concurrency/gopool/gopool.go b/concurrency/gopool/gopool.go new file mode 100644 index 0000000..9f095a0 --- /dev/null +++ b/concurrency/gopool/gopool.go @@ -0,0 +1,227 @@ +/* + * Copyright 2025 CloudWeGo Authors + * + * Licensed under the Apache License, Version 2.0 (the "License"); + * you may not use this file except in compliance with the License. + * You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package gopool + +import ( + "context" + "log" + "runtime/debug" + "sync/atomic" + "time" +) + +// Option holds the tunable settings of a GoPool; it is passed to NewGoPool. +type Option struct { + // MaxIdleWorkers is the max number of idle workers kept in the pool waiting for tasks. + // These workers will exit after `WorkerMaxAge`. + MaxIdleWorkers int + + // WorkerMaxAge is the max age of a worker in the pool. + WorkerMaxAge time.Duration + + // TaskChanBuffer is the capacity of the task queue. + // If it's full, we will fall back to use `go` directly without using the pool. + // Normally, the queue length should be small, + // because we will create new workers to pick up tasks if necessary. + TaskChanBuffer int +} + +// DefaultOption returns the default values of Option. 
+func DefaultOption() *Option { + return &Option{ + MaxIdleWorkers: 1000, + WorkerMaxAge: time.Minute, + TaskChanBuffer: 1000, + } +} + +var defaultGoPool = NewGoPool("__default__", nil) + +// Go runs the given func in background +func Go(f func()) { + defaultGoPool.Go(f) +} + +// GoCtx runs the given func in background, and it passes ctx to panic handler when happens. +func GoCtx(ctx context.Context, f func()) { + defaultGoPool.GoCtx(ctx, f) +} + +// SetPanicHandler sets a func for handling panic cases. +// +// check the comment of (*GoPool).SetPanicHandler for details +func SetPanicHandler(f func(ctx context.Context, r interface{})) { + defaultGoPool.SetPanicHandler(f) +} + +type task struct { + ctx context.Context + f func() +} + +// GoPool represents a simple worker pool which manages goroutines for background tasks. +type GoPool struct { + name string + + workers int32 + maxIdle int32 + maxage int64 // milliseconds + + panicHandler func(ctx context.Context, r interface{}) + + tasks chan task + unixMilli int64 + + createWorker func() +} + +// NewGoPool create a new instance for goroutine worker +func NewGoPool(name string, o *Option) *GoPool { + if o == nil { + o = DefaultOption() + } + p := &GoPool{ + name: name, + tasks: make(chan task, o.TaskChanBuffer), + maxage: o.WorkerMaxAge.Milliseconds(), + maxIdle: int32(o.MaxIdleWorkers), + } + + // fix: func literal escapes to heap + p.createWorker = func() { + p.runWorker() + } + return p +} + +// Go runs the given func in background +func (p *GoPool) Go(f func()) { + p.GoCtx(context.Background(), f) +} + +// GoCtx runs the given func in background, and it passes ctx to panic handler when happens. +func (p *GoPool) GoCtx(ctx context.Context, f func()) { + select { + case p.tasks <- task{ctx: ctx, f: f}: + default: + // full? fall back to use go directly + go p.runTask(ctx, f) + return + } + // luckily ... it's true when there're many workers. 
+ if len(p.tasks) == 0 { + return + } + // all worker is busy, create a new one + go p.createWorker() +} + +// SetPanicHandler sets a func for handling panic cases. +// +// Panic handler takes two args, `ctx` and `r`. +// `ctx` is the one provided when calling GoCtx, and `r` is returned by recover() +// +// By default, GoPool will use log.Printf to record the err and stack. +// +// It's recommended to set your own handler. +func (p *GoPool) SetPanicHandler(f func(ctx context.Context, r interface{})) { + p.panicHandler = f +} + +func (p *GoPool) runTask(ctx context.Context, f func()) { + defer func(p *GoPool, ctx context.Context) { + if r := recover(); r != nil { + if p.panicHandler != nil { + p.panicHandler(ctx, r) + } else { + log.Printf("GOPOOL: panic in pool: %s: %v: %s", p.name, r, debug.Stack()) + } + } + }(p, ctx) + f() +} + +func (p *GoPool) CurrentWorkers() int { + return int(atomic.LoadInt32(&p.workers)) +} + +func (p *GoPool) runWorker() { + id := atomic.AddInt32(&p.workers, 1) + defer atomic.AddInt32(&p.workers, -1) + + if id > p.maxIdle { + // drain task chan and exit without waiting + for { + select { + case t := <-p.tasks: + p.runTask(t.ctx, t.f) + default: + return + } + } + } + + createdAt := time.Now().UnixMilli() // for checking maxage + for t := range p.tasks { + p.runTask(t.ctx, t.f) + + now := atomic.LoadInt64(&p.unixMilli) + + // check if ticker is NOT alive + // p.unixMilli will be set to zero if it's not running + if now == 0 { + // cas and create a new ticker + now = time.Now().UnixMilli() + if atomic.CompareAndSwapInt64(&p.unixMilli, 0, now) { + go p.runTicker() + } + } + + // check maxage + if now-createdAt > p.maxage { + return + } + } +} + +// noopTask is used by runTicker() to wake up workers and checks their age. 
+var noopTask = task{f: func() {}} + +func (p *GoPool) runTicker() { + // mark it zero to trigger ticker to be created when we have active workers + defer atomic.StoreInt64(&p.unixMilli, 0) + + // If p.maxage=1s, it updates `unixMilli` and sends 100 noop tasks per second. + // As a result, workers may take longer time to exit, and this is expected. + d := time.Duration(p.maxage) * time.Millisecond / 100 + + // set a minimum value to avoid performance issues. + if d < time.Millisecond { + d = time.Millisecond + } + + t := time.NewTicker(d) + defer t.Stop() + + for now := range t.C { + if p.CurrentWorkers() == 0 { + return + } + atomic.StoreInt64(&p.unixMilli, now.UnixMilli()) + p.tasks <- noopTask + } +} diff --git a/concurrency/gopool/gopool_test.go b/concurrency/gopool/gopool_test.go new file mode 100644 index 0000000..37887fe --- /dev/null +++ b/concurrency/gopool/gopool_test.go @@ -0,0 +1,199 @@ +/* + * Copyright 2025 CloudWeGo Authors + * + * Licensed under the Apache License, Version 2.0 (the "License"); + * you may not use this file except in compliance with the License. + * You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. 
+ */ + +package gopool + +import ( + "context" + "fmt" + "math" + "runtime" + "sync" + "sync/atomic" + "testing" + "time" + + "github.com/stretchr/testify/require" + + "github.com/bytedance/gopkg/util/gopool" +) + +func TestGoPool(t *testing.T) { + { // test normal case + p := NewGoPool("TestGoPool", nil) + n := 10 + wg := sync.WaitGroup{} + wg.Add(n) + v := int32(0) + for i := 0; i < n; i++ { + p.Go(func() { + time.Sleep(time.Millisecond) + atomic.AddInt32(&v, 1) + wg.Done() + }) + } + wg.Wait() + require.Equal(t, int32(n), atomic.LoadInt32(&v)) + } + + { // test without PanicHandler + p := NewGoPool("TestGoPool", nil) + p.Go(func() { panic("x") }) + time.Sleep(time.Millisecond) + } + + { // test SetPanicHandler + wg := sync.WaitGroup{} + p := NewGoPool("TestGoPool", nil) // fix p.SetPanicHandler data race + ctx, cancel := context.WithCancel(context.Background()) + defer cancel() + x := "testpanic" + p.SetPanicHandler(func(c context.Context, r interface{}) { + defer wg.Done() + require.Equal(t, x, r) + require.Same(t, ctx, c) + }) + wg.Add(1) + p.GoCtx(ctx, func() { + panic(x) + }) + wg.Wait() + } +} + +func TestGoPool_Ticker(t *testing.T) { + o := DefaultOption() + o.WorkerMaxAge = 100 * time.Millisecond + p := NewGoPool("TestGoPool_Ticker", o) + for i := 0; i < 10; i++ { + p.Go(func() { time.Sleep(o.WorkerMaxAge / 10) }) + } + time.Sleep(10 * time.Millisecond) // wait all goroutines to run + require.Equal(t, 10, p.CurrentWorkers()) + time.Sleep(o.WorkerMaxAge + o.WorkerMaxAge/10) // ticker will trigger worker to exit + require.Equal(t, 0, p.CurrentWorkers()) +} + +func TestGoPool_Full(t *testing.T) { + o := DefaultOption() + o.TaskChanBuffer = 1 // smaller value, easier to be full. 
+ p := NewGoPool("TestGoPool_Full", o) + + v := int32(0) + n := 10000 + for i := 0; i < n; i++ { + p.Go(func() { atomic.AddInt32(&v, 1) }) + } + time.Sleep(10 * time.Millisecond) // wait all goroutines done + require.Equal(t, int32(n), atomic.LoadInt32(&v)) +} + +func TestGoPool_MaxIdle(t *testing.T) { + o := DefaultOption() + o.MaxIdleWorkers = 7 + p := NewGoPool("TestGoPool_MaxIdle", o) + + v := int32(0) + n := 10000 + for i := 0; i < n; i++ { + p.Go(func() { atomic.AddInt32(&v, 1) }) + } + time.Sleep(10 * time.Millisecond) // wait all goroutines done + require.Equal(t, int32(n), atomic.LoadInt32(&v)) + require.Equal(t, o.MaxIdleWorkers, p.CurrentWorkers()) +} + +// ======== Benchmarks ... + +// must be const then make() will allocate on stack +const stacksize = 120 + +var ( + testDepths = []int{2, 32, 128} + benchBatch = 2 +) + +func recursiveFunc(depth int) { + if depth < 0 { + return + } + b := make([]byte, stacksize) + recursiveFunc(depth - 1) + runtime.KeepAlive(b) +} + +func makefunc(depth int, wg *sync.WaitGroup) func() { + return func() { + recursiveFunc(depth) + wg.Done() + } +} + +func BenchmarkGoPool(b *testing.B) { + newHandler := func(depth int, wg *sync.WaitGroup) func() { + o := DefaultOption() + p := NewGoPool("BenchmarkGoPool", o) + f := makefunc(depth, wg) + return func() { + p.Go(f) + } + } + benchmarkGo(newHandler, b) +} + +func BenchmarkBytedanceGoPool(b *testing.B) { + newHandler := func(depth int, wg *sync.WaitGroup) func() { + p := gopool.NewPool("BenchmarkBytedanceGoPool", math.MaxInt32, gopool.NewConfig()) + f := makefunc(depth, wg) + return func() { + p.Go(f) + } + } + benchmarkGo(newHandler, b) +} + +func BenchmarkGoWithoutPool(b *testing.B) { + newHandler := func(depth int, wg *sync.WaitGroup) func() { + p := &GoPool{} + f := makefunc(depth, wg) + testf := func() { + // reuse runTask method + p.runTask(context.Background(), f) + } + return func() { + go testf() + } + } + benchmarkGo(newHandler, b) +} + +func benchmarkGo(newHandler 
func(int, *sync.WaitGroup) func(), b *testing.B) { + for _, depth := range testDepths { + b.Run(fmt.Sprintf("batch_%d_stacksize_%d", benchBatch, depth*stacksize), func(b *testing.B) { + b.RunParallel(func(pb *testing.PB) { + var wg sync.WaitGroup + f := newHandler(depth, &wg) + for pb.Next() { + wg.Add(benchBatch) + for i := 0; i < benchBatch; i++ { + f() + } + wg.Wait() + } + }) + }) + } +}