123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202 |
- package p2c
- import (
- "context"
- "fmt"
- "math"
- "math/rand"
- "strings"
- "sync"
- "sync/atomic"
- "time"
- "github.com/tal-tech/go-zero/core/logx"
- "github.com/tal-tech/go-zero/core/syncx"
- "github.com/tal-tech/go-zero/core/timex"
- "github.com/tal-tech/go-zero/zrpc/internal/codes"
- "google.golang.org/grpc/balancer"
- "google.golang.org/grpc/balancer/base"
- "google.golang.org/grpc/resolver"
- )
- const (
- Name = "p2c_ewma"
- decayTime = int64(time.Second * 10) // default value from finagle
- forcePick = int64(time.Second)
- initSuccess = 1000
- throttleSuccess = initSuccess / 2
- penalty = int64(math.MaxInt32)
- pickTimes = 3
- logInterval = time.Minute
- )
- func init() {
- balancer.Register(newBuilder())
- }
- type p2cPickerBuilder struct {
- }
- func newBuilder() balancer.Builder {
- return base.NewBalancerBuilder(Name, new(p2cPickerBuilder))
- }
- func (b *p2cPickerBuilder) Build(readySCs map[resolver.Address]balancer.SubConn) balancer.Picker {
- if len(readySCs) == 0 {
- return base.NewErrPicker(balancer.ErrNoSubConnAvailable)
- }
- var conns []*subConn
- for addr, conn := range readySCs {
- conns = append(conns, &subConn{
- addr: addr,
- conn: conn,
- success: initSuccess,
- })
- }
- return &p2cPicker{
- conns: conns,
- r: rand.New(rand.NewSource(time.Now().UnixNano())),
- stamp: syncx.NewAtomicDuration(),
- }
- }
- type p2cPicker struct {
- conns []*subConn
- r *rand.Rand
- stamp *syncx.AtomicDuration
- lock sync.Mutex
- }
- func (p *p2cPicker) Pick(ctx context.Context, info balancer.PickInfo) (
- conn balancer.SubConn, done func(balancer.DoneInfo), err error) {
- p.lock.Lock()
- defer p.lock.Unlock()
- var chosen *subConn
- switch len(p.conns) {
- case 0:
- return nil, nil, balancer.ErrNoSubConnAvailable
- case 1:
- chosen = p.choose(p.conns[0], nil)
- case 2:
- chosen = p.choose(p.conns[0], p.conns[1])
- default:
- var node1, node2 *subConn
- for i := 0; i < pickTimes; i++ {
- a := p.r.Intn(len(p.conns))
- b := p.r.Intn(len(p.conns) - 1)
- if b >= a {
- b++
- }
- node1 = p.conns[a]
- node2 = p.conns[b]
- if node1.healthy() && node2.healthy() {
- break
- }
- }
- chosen = p.choose(node1, node2)
- }
- atomic.AddInt64(&chosen.inflight, 1)
- atomic.AddInt64(&chosen.requests, 1)
- return chosen.conn, p.buildDoneFunc(chosen), nil
- }
- func (p *p2cPicker) buildDoneFunc(c *subConn) func(info balancer.DoneInfo) {
- start := int64(timex.Now())
- return func(info balancer.DoneInfo) {
- atomic.AddInt64(&c.inflight, -1)
- now := timex.Now()
- last := atomic.SwapInt64(&c.last, int64(now))
- td := int64(now) - last
- if td < 0 {
- td = 0
- }
- w := math.Exp(float64(-td) / float64(decayTime))
- lag := int64(now) - start
- if lag < 0 {
- lag = 0
- }
- olag := atomic.LoadUint64(&c.lag)
- if olag == 0 {
- w = 0
- }
- atomic.StoreUint64(&c.lag, uint64(float64(olag)*w+float64(lag)*(1-w)))
- success := initSuccess
- if info.Err != nil && !codes.Acceptable(info.Err) {
- success = 0
- }
- osucc := atomic.LoadUint64(&c.success)
- atomic.StoreUint64(&c.success, uint64(float64(osucc)*w+float64(success)*(1-w)))
- stamp := p.stamp.Load()
- if now-stamp >= logInterval {
- if p.stamp.CompareAndSwap(stamp, now) {
- p.logStats()
- }
- }
- }
- }
- func (p *p2cPicker) choose(c1, c2 *subConn) *subConn {
- start := int64(timex.Now())
- if c2 == nil {
- atomic.StoreInt64(&c1.pick, start)
- return c1
- }
- if c1.load() > c2.load() {
- c1, c2 = c2, c1
- }
- pick := atomic.LoadInt64(&c2.pick)
- if start-pick > forcePick && atomic.CompareAndSwapInt64(&c2.pick, pick, start) {
- return c2
- }
- atomic.StoreInt64(&c1.pick, start)
- return c1
- }
- func (p *p2cPicker) logStats() {
- var stats []string
- p.lock.Lock()
- defer p.lock.Unlock()
- for _, conn := range p.conns {
- stats = append(stats, fmt.Sprintf("conn: %s, load: %d, reqs: %d",
- conn.addr.Addr, conn.load(), atomic.SwapInt64(&conn.requests, 0)))
- }
- logx.Statf("p2c - %s", strings.Join(stats, "; "))
- }
- type subConn struct {
- addr resolver.Address
- conn balancer.SubConn
- lag uint64
- inflight int64
- success uint64
- requests int64
- last int64
- pick int64
- }
- func (c *subConn) healthy() bool {
- return atomic.LoadUint64(&c.success) > throttleSuccess
- }
- func (c *subConn) load() int64 {
- // plus one to avoid multiply zero
- lag := int64(math.Sqrt(float64(atomic.LoadUint64(&c.lag) + 1)))
- load := lag * (atomic.LoadInt64(&c.inflight) + 1)
- if load == 0 {
- return penalty
- }
- return load
- }
|