diff --git a/internal/client/retry/backoff.go b/internal/client/retry/backoff.go deleted file mode 100644 index 229d9766c..000000000 --- a/internal/client/retry/backoff.go +++ /dev/null @@ -1,399 +0,0 @@ -// Copyright 2021 TiKV Authors -// -// Licensed under the Apache License, Version 2.0 (the "License"); -// you may not use this file except in compliance with the License. -// You may obtain a copy of the License at -// -// http://www.apache.org/licenses/LICENSE-2.0 -// -// Unless required by applicable law or agreed to in writing, software -// distributed under the License is distributed on an "AS IS" BASIS, -// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -// See the License for the specific language governing permissions and -// limitations under the License. - -// NOTE: The code in this file is based on code from the -// TiDB project, licensed under the Apache License v 2.0 -// -// https://github.com/pingcap/tidb/tree/cc5e161ac06827589c4966674597c137cc9e809c/store/tikv/retry/backoff.go -// - -// Copyright 2016 PingCAP, Inc. -// -// Licensed under the Apache License, Version 2.0 (the "License"); -// you may not use this file except in compliance with the License. -// You may obtain a copy of the License at -// -// http://www.apache.org/licenses/LICENSE-2.0 -// -// Unless required by applicable law or agreed to in writing, software -// distributed under the License is distributed on an "AS IS" BASIS, -// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -// See the License for the specific language governing permissions and -// limitations under the License. - -package retry - -import ( - "bytes" - "context" - "fmt" - "math" - "strconv" - "strings" - "sync/atomic" - "time" - - "github.com/opentracing/opentracing-go" - "github.com/pingcap/log" - "github.com/pkg/errors" - tikverr "github.com/tikv/client-go/v2/error" - "github.com/tikv/client-go/v2/internal/logutil" - "github.com/tikv/client-go/v2/kv" - "github.com/tikv/client-go/v2/util" - "go.uber.org/zap" - "go.uber.org/zap/zapcore" -) - -// Backoffer is a utility for retrying queries. -type Backoffer struct { - ctx context.Context - - fn map[string]backoffFn - maxSleep int - totalSleep int - excludedSleep int - - vars *kv.Variables - noop bool - - errors []error - configs []*Config - backoffSleepMS map[string]int - backoffTimes map[string]int - parent *Backoffer -} - -type txnStartCtxKeyType struct{} - -// TxnStartKey is a key for transaction start_ts info in context.Context. -var TxnStartKey interface{} = txnStartCtxKeyType{} - -// NewBackoffer (Deprecated) creates a Backoffer with maximum sleep time(in ms). -func NewBackoffer(ctx context.Context, maxSleep int) *Backoffer { - return &Backoffer{ - ctx: ctx, - maxSleep: maxSleep, - vars: kv.DefaultVars, - } -} - -// NewBackofferWithVars creates a Backoffer with maximum sleep time(in ms) and kv.Variables. -func NewBackofferWithVars(ctx context.Context, maxSleep int, vars *kv.Variables) *Backoffer { - return NewBackoffer(ctx, maxSleep).withVars(vars) -} - -// NewNoopBackoff create a Backoffer do nothing just return error directly -func NewNoopBackoff(ctx context.Context) *Backoffer { - return &Backoffer{ctx: ctx, noop: true} -} - -// withVars sets the kv.Variables to the Backoffer and return it. -func (b *Backoffer) withVars(vars *kv.Variables) *Backoffer { - if vars != nil { - b.vars = vars - } - // maxSleep is the max sleep time in millisecond. - // When it is multiplied by BackOffWeight, it should not be greater than MaxInt32. - if b.maxSleep > 0 && math.MaxInt32/b.vars.BackOffWeight >= b.maxSleep { - b.maxSleep *= b.vars.BackOffWeight - } - return b -} - -// Backoff sleeps a while base on the Config and records the error message. -// It returns a retryable error if total sleep time exceeds maxSleep. -func (b *Backoffer) Backoff(cfg *Config, err error) error { - if span := opentracing.SpanFromContext(b.ctx); span != nil && span.Tracer() != nil { - span1 := span.Tracer().StartSpan(fmt.Sprintf("tikv.backoff.%s", cfg), opentracing.ChildOf(span.Context())) - defer span1.Finish() - opentracing.ContextWithSpan(b.ctx, span1) - } - return b.BackoffWithCfgAndMaxSleep(cfg, -1, err) -} - -// BackoffWithMaxSleepTxnLockFast sleeps a while base on the MaxSleepTxnLock and records the error message -// and never sleep more than maxSleepMs for each sleep. -func (b *Backoffer) BackoffWithMaxSleepTxnLockFast(maxSleepMs int, err error) error { - cfg := BoTxnLockFast - return b.BackoffWithCfgAndMaxSleep(cfg, maxSleepMs, err) -} - -// BackoffWithCfgAndMaxSleep sleeps a while base on the Config and records the error message -// and never sleep more than maxSleepMs for each sleep. -func (b *Backoffer) BackoffWithCfgAndMaxSleep(cfg *Config, maxSleepMs int, err error) error { - if strings.Contains(err.Error(), tikverr.MismatchClusterID) { - logutil.Logger(b.ctx).Fatal("critical error", zap.Error(err)) - } - select { - case <-b.ctx.Done(): - return errors.WithStack(err) - default: - } - if b.noop { - return err - } - maxBackoffTimeExceeded := (b.totalSleep - b.excludedSleep) >= b.maxSleep - maxExcludedTimeExceeded := false - if maxLimit, ok := isSleepExcluded[cfg.name]; ok { - maxExcludedTimeExceeded = b.excludedSleep >= maxLimit && b.excludedSleep >= b.maxSleep - } - maxTimeExceeded := maxBackoffTimeExceeded || maxExcludedTimeExceeded - if b.maxSleep > 0 && maxTimeExceeded { - longestSleepCfg, longestSleepTime := b.longestSleepCfg() - errMsg := fmt.Sprintf("%s backoffer.maxSleep %dms is exceeded, errors:", cfg.String(), b.maxSleep) - for i, err := range b.errors { - // Print only last 3 errors for non-DEBUG log levels. - if log.GetLevel() == zapcore.DebugLevel || i >= len(b.errors)-3 { - errMsg += "\n" + err.Error() - } - } - var backoffDetail bytes.Buffer - totalTimes := 0 - for name, times := range b.backoffTimes { - totalTimes += times - if backoffDetail.Len() > 0 { - backoffDetail.WriteString(", ") - } - backoffDetail.WriteString(name) - backoffDetail.WriteString(":") - backoffDetail.WriteString(strconv.Itoa(times)) - } - errMsg += fmt.Sprintf("\ntotal-backoff-times: %v, backoff-detail: %v, maxBackoffTimeExceeded: %v, maxExcludedTimeExceeded: %v", - totalTimes, backoffDetail.String(), maxBackoffTimeExceeded, maxExcludedTimeExceeded) - returnedErr := err - if longestSleepCfg != nil { - errMsg += fmt.Sprintf("\nlongest sleep type: %s, time: %dms", longestSleepCfg.String(), longestSleepTime) - returnedErr = longestSleepCfg.err - } - logutil.Logger(b.ctx).Warn(errMsg) - // Use the backoff type that contributes most to the timeout to generate a MySQL error. - return errors.WithStack(returnedErr) - } - b.errors = append(b.errors, errors.Errorf("%s at %s", err.Error(), time.Now().Format(time.RFC3339Nano))) - b.configs = append(b.configs, cfg) - - // Lazy initialize. - if b.fn == nil { - b.fn = make(map[string]backoffFn) - } - f, ok := b.fn[cfg.name] - if !ok { - f = cfg.createBackoffFn(b.vars) - b.fn[cfg.name] = f - } - realSleep := f(b.ctx, maxSleepMs) - if cfg.metric != nil { - (*cfg.metric).Observe(float64(realSleep) / 1000) - } - - b.totalSleep += realSleep - if _, ok := isSleepExcluded[cfg.name]; ok { - b.excludedSleep += realSleep - } - if b.backoffSleepMS == nil { - b.backoffSleepMS = make(map[string]int) - } - b.backoffSleepMS[cfg.name] += realSleep - if b.backoffTimes == nil { - b.backoffTimes = make(map[string]int) - } - b.backoffTimes[cfg.name]++ - - stmtExec := b.ctx.Value(util.ExecDetailsKey) - if stmtExec != nil { - detail := stmtExec.(*util.ExecDetails) - atomic.AddInt64(&detail.BackoffDuration, int64(realSleep)*int64(time.Millisecond)) - atomic.AddInt64(&detail.BackoffCount, 1) - } - - err2 := b.checkKilled() - if err2 != nil { - return err2 - } - - var startTs interface{} - if ts := b.ctx.Value(TxnStartKey); ts != nil { - startTs = ts - } - logutil.Logger(b.ctx).Debug( - "retry later", - zap.Error(err), - zap.Int("totalSleep", b.totalSleep), - zap.Int("excludedSleep", b.excludedSleep), - zap.Int("maxSleep", b.maxSleep), - zap.Stringer("type", cfg), - zap.Reflect("txnStartTS", startTs), - ) - return nil -} - -func (b *Backoffer) checkKilled() error { - if b.vars != nil && b.vars.Killed != nil { - killed := atomic.LoadUint32(b.vars.Killed) - if killed != 0 { - logutil.BgLogger().Info( - "backoff stops because a killed signal is received", - zap.Uint32("signal", killed), - ) - return errors.WithStack(tikverr.ErrQueryInterruptedWithSignal{Signal: killed}) - } - } - return nil -} - -func (b *Backoffer) String() string { - if b.totalSleep == 0 { - return "" - } - return fmt.Sprintf(" backoff(%dms %v)", b.totalSleep, b.configs) -} - -// copyMapWithoutRecursive is only used to deep copy map fields in the Backoffer type. -func copyMapWithoutRecursive(srcMap map[string]int) map[string]int { - result := map[string]int{} - for k, v := range srcMap { - result[k] = v - } - return result -} - -// Clone creates a new Backoffer which keeps current Backoffer's sleep time and errors, and shares -// current Backoffer's context. -// Some fields like `configs` and `vars` are concurrently used by all the backoffers in different threads, -// try not to modify the referenced content directly. -func (b *Backoffer) Clone() *Backoffer { - return &Backoffer{ - ctx: b.ctx, - maxSleep: b.maxSleep, - totalSleep: b.totalSleep, - excludedSleep: b.excludedSleep, - vars: b.vars, - errors: append([]error{}, b.errors...), - configs: append([]*Config{}, b.configs...), - backoffSleepMS: copyMapWithoutRecursive(b.backoffSleepMS), - backoffTimes: copyMapWithoutRecursive(b.backoffTimes), - parent: b.parent, - } -} - -// Fork creates a new Backoffer which keeps current Backoffer's sleep time and errors, and holds -// a child context of current Backoffer's context. -// Some fields like `configs` and `vars` are concurrently used by all the backoffers in different threads, -// try not to modify the referenced content directly. -func (b *Backoffer) Fork() (*Backoffer, context.CancelFunc) { - ctx, cancel := context.WithCancel(b.ctx) - return &Backoffer{ - ctx: ctx, - maxSleep: b.maxSleep, - totalSleep: b.totalSleep, - excludedSleep: b.excludedSleep, - errors: append([]error{}, b.errors...), - configs: append([]*Config{}, b.configs...), - backoffSleepMS: copyMapWithoutRecursive(b.backoffSleepMS), - backoffTimes: copyMapWithoutRecursive(b.backoffTimes), - vars: b.vars, - parent: b, - }, cancel -} - -// GetVars returns the binded vars. -func (b *Backoffer) GetVars() *kv.Variables { - return b.vars -} - -// GetTotalSleep returns total sleep time. -func (b *Backoffer) GetTotalSleep() int { - return b.totalSleep -} - -// GetTypes returns type list of this backoff and all its ancestors. -func (b *Backoffer) GetTypes() []string { - typs := make([]string, 0, len(b.configs)) - for b != nil { - for _, cfg := range b.configs { - typs = append(typs, cfg.String()) - } - b = b.parent - } - return typs -} - -// GetCtx returns the binded context. -func (b *Backoffer) GetCtx() context.Context { - return b.ctx -} - -// SetCtx sets the binded context to ctx. -func (b *Backoffer) SetCtx(ctx context.Context) { - b.ctx = ctx -} - -// GetBackoffTimes returns a map contains backoff time count by type. -func (b *Backoffer) GetBackoffTimes() map[string]int { - return b.backoffTimes -} - -// GetTotalBackoffTimes returns the total backoff times of the backoffer. -func (b *Backoffer) GetTotalBackoffTimes() int { - total := 0 - for _, time := range b.backoffTimes { - total += time - } - return total -} - -// GetBackoffSleepMS returns a map contains backoff sleep time by type. -func (b *Backoffer) GetBackoffSleepMS() map[string]int { - return b.backoffSleepMS -} - -// ErrorsNum returns the number of errors. -func (b *Backoffer) ErrorsNum() int { - return len(b.errors) -} - -// Reset resets the sleep state of the backoffer, so that following backoff -// can sleep shorter. The reason why we don't create a new backoffer is that -// backoffer is similar to context and it records some metrics that we -// want to record for an entire process which is composed of serveral stages. -func (b *Backoffer) Reset() { - b.fn = nil - b.totalSleep = 0 - b.excludedSleep = 0 -} - -// ResetMaxSleep resets the sleep state and max sleep limit of the backoffer. -// It's used when switches to the next stage of the process. -func (b *Backoffer) ResetMaxSleep(maxSleep int) { - b.Reset() - b.maxSleep = maxSleep - b.withVars(b.vars) -} - -func (b *Backoffer) longestSleepCfg() (*Config, int) { - candidate := "" - maxSleep := 0 - for cfgName, sleepTime := range b.backoffSleepMS { - if _, ok := isSleepExcluded[cfgName]; sleepTime > maxSleep && !ok { - maxSleep = sleepTime - candidate = cfgName - } - } - for _, cfg := range b.configs { - if cfg.name == candidate { - return cfg, maxSleep - } - } - return nil, 0 -} diff --git a/internal/client/retry/backoff_test.go b/internal/client/retry/backoff_test.go deleted file mode 100644 index cdd6b46ff..000000000 --- a/internal/client/retry/backoff_test.go +++ /dev/null @@ -1,112 +0,0 @@ -// Copyright 2021 TiKV Authors -// -// Licensed under the Apache License, Version 2.0 (the "License"); -// you may not use this file except in compliance with the License. -// You may obtain a copy of the License at -// -// http://www.apache.org/licenses/LICENSE-2.0 -// -// Unless required by applicable law or agreed to in writing, software -// distributed under the License is distributed on an "AS IS" BASIS, -// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -// See the License for the specific language governing permissions and -// limitations under the License. - -// NOTE: The code in this file is based on code from the -// TiDB project, licensed under the Apache License v 2.0 -// -// https://github.com/pingcap/tidb/tree/cc5e161ac06827589c4966674597c137cc9e809c/store/tikv/retry/backoff_test.go -// - -// Copyright 2019 PingCAP, Inc. -// -// Licensed under the Apache License, Version 2.0 (the "License"); -// you may not use this file except in compliance with the License. -// You may obtain a copy of the License at -// -// http://www.apache.org/licenses/LICENSE-2.0 -// -// Unless required by applicable law or agreed to in writing, software -// distributed under the License is distributed on an "AS IS" BASIS, -// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -// See the License for the specific language governing permissions and -// limitations under the License. - -package retry - -import ( - "context" - "errors" - "testing" - - "github.com/stretchr/testify/assert" -) - -func TestBackoffWithMax(t *testing.T) { - b := NewBackofferWithVars(context.TODO(), 2000, nil) - err := b.BackoffWithMaxSleepTxnLockFast(5, errors.New("test")) - - assert.Nil(t, err) - assert.Equal(t, 5, b.totalSleep) -} - -func TestBackoffErrorType(t *testing.T) { - // the actual maxSleep is multiplied by weight, which is 1600ms - b := NewBackofferWithVars(context.TODO(), 800, nil) - err := b.Backoff(BoRegionMiss, errors.New("region miss")) // 2ms sleep - assert.Nil(t, err) - // 6ms sleep at most in total - for i := 0; i < 2; i++ { - err = b.Backoff(BoMaxDataNotReady, errors.New("data not ready")) - assert.Nil(t, err) - } - // 100ms sleep at most in total - err = b.Backoff(BoRegionRecoveryInProgress, errors.New("recovery in progress")) - assert.Nil(t, err) - - // sleep from ServerIsBusy is not counted - err = b.Backoff(BoTiKVServerBusy, errors.New("server is busy")) - assert.Nil(t, err) - // 1000ms sleep at most in total - err = b.Backoff(BoIsWitness, errors.New("peer is witness")) - assert.Nil(t, err) - // wait it exceed max sleep - for i := 0; i < 15; i++ { - err = b.Backoff(BoTxnNotFound, errors.New("txn not found")) - if err != nil { - // Next backoff should return error of backoff that sleeps for longest time. - assert.ErrorIs(t, err, BoTxnNotFound.err) - return - } - } - assert.Fail(t, "should not be here") -} - -func TestBackoffDeepCopy(t *testing.T) { - var err error - b := NewBackofferWithVars(context.TODO(), 4, nil) - // 700 ms sleep in total and the backoffer will return an error next time. - for i := 0; i < 3; i++ { - err = b.Backoff(BoMaxDataNotReady, errors.New("data not ready")) - assert.Nil(t, err) - } - bForked, cancel := b.Fork() - defer cancel() - bCloned := b.Clone() - for _, b := range []*Backoffer{bForked, bCloned} { - err = b.Backoff(BoTiKVRPC, errors.New("tikv rpc")) - assert.ErrorIs(t, err, BoMaxDataNotReady.err) - } -} - -func TestBackoffWithMaxExcludedExceed(t *testing.T) { - setBackoffExcluded(BoTiKVServerBusy.name, 1) - b := NewBackofferWithVars(context.TODO(), 1, nil) - err := b.Backoff(BoTiKVServerBusy, errors.New("server is busy")) - assert.Nil(t, err) - - // As the total excluded sleep is greater than the max limited value, error should be returned. - err = b.Backoff(BoTiKVServerBusy, errors.New("server is busy")) - assert.NotNil(t, err) - assert.Greater(t, b.excludedSleep, b.maxSleep) -} diff --git a/internal/client/retry/config.go b/internal/client/retry/config.go deleted file mode 100644 index 17b524786..000000000 --- a/internal/client/retry/config.go +++ /dev/null @@ -1,203 +0,0 @@ -// Copyright 2021 TiKV Authors -// -// Licensed under the Apache License, Version 2.0 (the "License"); -// you may not use this file except in compliance with the License. -// You may obtain a copy of the License at -// -// http://www.apache.org/licenses/LICENSE-2.0 -// -// Unless required by applicable law or agreed to in writing, software -// distributed under the License is distributed on an "AS IS" BASIS, -// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -// See the License for the specific language governing permissions and -// limitations under the License. - -// NOTE: The code in this file is based on code from the -// TiDB project, licensed under the Apache License v 2.0 -// -// https://github.com/pingcap/tidb/tree/cc5e161ac06827589c4966674597c137cc9e809c/store/tikv/retry/config.go -// - -// Copyright 2021 PingCAP, Inc. -// -// Licensed under the Apache License, Version 2.0 (the "License"); -// you may not use this file except in compliance with the License. -// You may obtain a copy of the License at -// -// http://www.apache.org/licenses/LICENSE-2.0 -// -// Unless required by applicable law or agreed to in writing, software -// distributed under the License is distributed on an "AS IS" BASIS, -// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -// See the License for the specific language governing permissions and -// limitations under the License. - -package retry - -import ( - "context" - "math" - "math/rand" - "strings" - "time" - - "github.com/prometheus/client_golang/prometheus" - tikverr "github.com/tikv/client-go/v2/error" - "github.com/tikv/client-go/v2/internal/logutil" - "github.com/tikv/client-go/v2/kv" - "github.com/tikv/client-go/v2/metrics" - "go.uber.org/zap" -) - -// Config is the configuration of the Backoff function. -type Config struct { - name string - metric *prometheus.Observer - fnCfg *BackoffFnCfg - err error -} - -// backoffFn is the backoff function which compute the sleep time and do sleep. -type backoffFn func(ctx context.Context, maxSleepMs int) int - -func (c *Config) createBackoffFn(vars *kv.Variables) backoffFn { - if strings.EqualFold(c.name, txnLockFastName) { - return newBackoffFn(vars.BackoffLockFast, c.fnCfg.cap, c.fnCfg.jitter) - } - return newBackoffFn(c.fnCfg.base, c.fnCfg.cap, c.fnCfg.jitter) -} - -// BackoffFnCfg is the configuration for the backoff func which implements exponential backoff with -// optional jitters. -// See http://www.awsarchitectureblog.com/2015/03/backoff.html -type BackoffFnCfg struct { - base int - cap int - jitter int -} - -// NewBackoffFnCfg creates the config for BackoffFn. -func NewBackoffFnCfg(base, cap, jitter int) *BackoffFnCfg { - return &BackoffFnCfg{ - base, - cap, - jitter, - } -} - -// NewConfig creates a new Config for the Backoff operation. -func NewConfig(name string, metric *prometheus.Observer, backoffFnCfg *BackoffFnCfg, err error) *Config { - return &Config{ - name: name, - metric: metric, - fnCfg: backoffFnCfg, - err: err, - } -} - -func (c *Config) String() string { - return c.name -} - -// SetErrors sets a more detailed error instead of the default bo config. -func (c *Config) SetErrors(err error) { - c.err = err -} - -const txnLockFastName = "txnLockFast" - -// Backoff Config variables. -var ( - // TODO: distinguish tikv and tiflash in metrics - BoTiKVRPC = NewConfig("tikvRPC", &metrics.BackoffHistogramRPC, NewBackoffFnCfg(100, 2000, EqualJitter), tikverr.ErrTiKVServerTimeout) - BoTiFlashRPC = NewConfig("tiflashRPC", &metrics.BackoffHistogramRPC, NewBackoffFnCfg(100, 2000, EqualJitter), tikverr.ErrTiFlashServerTimeout) - BoTxnLock = NewConfig("txnLock", &metrics.BackoffHistogramLock, NewBackoffFnCfg(100, 3000, EqualJitter), tikverr.ErrResolveLockTimeout) - BoPDRPC = NewConfig("pdRPC", &metrics.BackoffHistogramPD, NewBackoffFnCfg(500, 3000, EqualJitter), tikverr.NewErrPDServerTimeout("")) - // change base time to 2ms, because it may recover soon. - BoRegionMiss = NewConfig("regionMiss", &metrics.BackoffHistogramRegionMiss, NewBackoffFnCfg(2, 500, NoJitter), tikverr.ErrRegionUnavailable) - BoRegionScheduling = NewConfig("regionScheduling", &metrics.BackoffHistogramRegionScheduling, NewBackoffFnCfg(2, 500, NoJitter), tikverr.ErrRegionUnavailable) - BoTiKVServerBusy = NewConfig("tikvServerBusy", &metrics.BackoffHistogramServerBusy, NewBackoffFnCfg(2000, 10000, EqualJitter), tikverr.ErrTiKVServerBusy) - BoTiKVDiskFull = NewConfig("tikvDiskFull", &metrics.BackoffHistogramTiKVDiskFull, NewBackoffFnCfg(500, 5000, NoJitter), tikverr.ErrTiKVDiskFull) - BoRegionRecoveryInProgress = NewConfig("regionRecoveryInProgress", &metrics.BackoffHistogramRegionRecoveryInProgress, NewBackoffFnCfg(100, 10000, EqualJitter), tikverr.ErrRegionRecoveryInProgress) - BoTiFlashServerBusy = NewConfig("tiflashServerBusy", &metrics.BackoffHistogramServerBusy, NewBackoffFnCfg(2000, 10000, EqualJitter), tikverr.ErrTiFlashServerBusy) - BoTxnNotFound = NewConfig("txnNotFound", &metrics.BackoffHistogramEmpty, NewBackoffFnCfg(2, 500, NoJitter), tikverr.ErrResolveLockTimeout) - BoStaleCmd = NewConfig("staleCommand", &metrics.BackoffHistogramStaleCmd, NewBackoffFnCfg(2, 1000, NoJitter), tikverr.ErrTiKVStaleCommand) - BoMaxTsNotSynced = NewConfig("maxTsNotSynced", &metrics.BackoffHistogramEmpty, NewBackoffFnCfg(2, 500, NoJitter), tikverr.ErrTiKVMaxTimestampNotSynced) - BoMaxDataNotReady = NewConfig("dataNotReady", &metrics.BackoffHistogramDataNotReady, NewBackoffFnCfg(2, 2000, NoJitter), tikverr.ErrRegionDataNotReady) - BoMaxRegionNotInitialized = NewConfig("regionNotInitialized", &metrics.BackoffHistogramEmpty, NewBackoffFnCfg(2, 1000, NoJitter), tikverr.ErrRegionNotInitialized) - BoIsWitness = NewConfig("isWitness", &metrics.BackoffHistogramIsWitness, NewBackoffFnCfg(1000, 10000, EqualJitter), tikverr.ErrIsWitness) - // TxnLockFast's `base` load from vars.BackoffLockFast when create BackoffFn. - BoTxnLockFast = NewConfig(txnLockFastName, &metrics.BackoffHistogramLockFast, NewBackoffFnCfg(2, 3000, EqualJitter), tikverr.ErrResolveLockTimeout) -) - -var isSleepExcluded = map[string]int{ - BoTiKVServerBusy.name: 600000, // The max excluded limit is 10min. - // add BoTiFlashServerBusy if appropriate -} - -// setBackoffExcluded is used for test only. -func setBackoffExcluded(name string, maxVal int) { - if _, ok := isSleepExcluded[name]; ok { - isSleepExcluded[name] = maxVal - } -} - -const ( - // NoJitter makes the backoff sequence strict exponential. - NoJitter = 1 + iota - // FullJitter applies random factors to strict exponential. - FullJitter - // EqualJitter is also randomized, but prevents very short sleeps. - EqualJitter - // DecorrJitter increases the maximum jitter based on the last random value. - DecorrJitter -) - -// newBackoffFn creates a backoff func which implements exponential backoff with -// optional jitters. -// See http://www.awsarchitectureblog.com/2015/03/backoff.html -func newBackoffFn(base, cap, jitter int) backoffFn { - if base < 2 { - // Top prevent panic in 'rand.Intn'. - base = 2 - } - attempts := 0 - lastSleep := base - return func(ctx context.Context, maxSleepMs int) int { - var sleep int - switch jitter { - case NoJitter: - sleep = expo(base, cap, attempts) - case FullJitter: - v := expo(base, cap, attempts) - sleep = rand.Intn(v) - case EqualJitter: - v := expo(base, cap, attempts) - sleep = v/2 + rand.Intn(v/2) - case DecorrJitter: - sleep = int(math.Min(float64(cap), float64(base+rand.Intn(lastSleep*3-base)))) - } - logutil.BgLogger().Debug("backoff", - zap.Int("base", base), - zap.Int("sleep", sleep), - zap.Int("attempts", attempts)) - - realSleep := sleep - // when set maxSleepMs >= 0 in `tikv.BackoffWithMaxSleep` will force sleep maxSleepMs milliseconds. - if maxSleepMs >= 0 && realSleep > maxSleepMs { - realSleep = maxSleepMs - } - select { - case <-time.After(time.Duration(realSleep) * time.Millisecond): - attempts++ - lastSleep = sleep - return realSleep - case <-ctx.Done(): - return 0 - } - } -} - -func expo(base, cap, n int) int { - return int(math.Min(float64(cap), float64(base)*math.Pow(2.0, float64(n)))) -}