From 65f0ea2b6d2e60bab33f8331af9f9d04f2ecfa82 Mon Sep 17 00:00:00 2001 From: Yongbo Jiang Date: Mon, 1 Apr 2024 10:33:15 +0800 Subject: [PATCH 1/2] This is an automated cherry-pick of #7722 close tikv/pd#7726 Signed-off-by: ti-chi-bot --- pkg/progress/progress.go | 103 ++++- pkg/progress/progress_test.go | 138 +++++- pkg/schedule/coordinator.go | 835 ++++++++++++++++++++++++++++++++++ server/cluster/cluster.go | 18 +- 4 files changed, 1064 insertions(+), 30 deletions(-) create mode 100644 pkg/schedule/coordinator.go diff --git a/pkg/progress/progress.go b/pkg/progress/progress.go index 345e4928c41..6940ad1dd01 100644 --- a/pkg/progress/progress.go +++ b/pkg/progress/progress.go @@ -24,8 +24,14 @@ import ( "github.com/tikv/pd/pkg/utils/syncutil" ) -// speedStatisticalWindow is the speed calculation window -const speedStatisticalWindow = 10 * time.Minute +const ( + // maxSpeedCalculationWindow is the maximum size of the time window used to calculate the speed, + // but it does not mean that all data in it will be used to calculate the speed, + // which data is used depends on the patrol region duration + maxSpeedCalculationWindow = 2 * time.Hour + // minSpeedCalculationWindow is the minimum speed calculation window + minSpeedCalculationWindow = 10 * time.Minute +) // Manager is used to maintain the progresses we care about. type Manager struct { @@ -46,12 +52,28 @@ type progressIndicator struct { remaining float64 // We use a fixed interval's history to calculate the latest average speed. history *list.List - // We use speedStatisticalWindow / updateInterval to get the windowLengthLimit. - // Assume that the windowLengthLimit is 3, the init value is 1. after update 3 times with 2, 3, 4 separately. The window will become [1, 2, 3, 4]. + // We use (maxSpeedCalculationWindow / updateInterval + 1) to get the windowCapacity. + // Assume that the windowCapacity is 4, the init value is 1. After update 3 times with 2, 3, 4 separately. The window will become [1, 2, 3, 4]. // Then we update it again with 5, the window will become [2, 3, 4, 5]. - windowLengthLimit int - updateInterval time.Duration - lastSpeed float64 + windowCapacity int + // windowLength is used to determine what data will be computed. + // Assume that the windowLength is 2, the init value is 1. The value that will be calculated are [1]. + // After update 3 times with 2, 3, 4 separately. The value that will be calculated are [3,4] and the values in queue are [(1,2),3,4]. + // It helps us avoid calculation results jumping change when patrol-region-interval changes. + windowLength int + // front is the first element which should be used. + // currentWindowLength indicates where the front is currently in the queue. + // Assume that the windowLength is 2, the init value is 1. The front is [1] and currentWindowLength is 1. + // After update 3 times with 2, 3, 4 separately. + // The front is [3], the currentWindowLength is 2, and values in queue are [(1,2),3,4] + // ^ front + // - - currentWindowLength = len([3,4]) = 2 + // We will always keep the currentWindowLength equal to windowLength if the actual size is enough. + front *list.Element + currentWindowLength int + + updateInterval time.Duration + lastSpeed float64 } // Reset resets the progress manager. @@ -62,13 +84,29 @@ func (m *Manager) Reset() { m.progesses = make(map[string]*progressIndicator) } +// Option is used to do some action for progressIndicator. +type Option func(*progressIndicator) + +// WindowDurationOption changes the time window size. 
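For orientation, the sizing rule behind these new fields can be reproduced in a few lines. The sketch below is not part of the patch: the helper name windowSizes and the 10-second update interval are assumptions for illustration only; it mirrors the clamp in WindowDurationOption (whose body follows) and the capacity computed in AddProgress further down.

package main

import (
	"fmt"
	"time"
)

const (
	minWindow = 10 * time.Minute // corresponds to minSpeedCalculationWindow
	maxWindow = 2 * time.Hour    // corresponds to maxSpeedCalculationWindow
)

// windowSizes clamps the requested duration and derives how many history
// samples are kept (capacity) and how many feed the speed calculation (length).
func windowSizes(requested, updateInterval time.Duration) (capacity, length int) {
	if requested < minWindow {
		requested = minWindow
	} else if requested > maxWindow {
		requested = maxWindow
	}
	capacity = int(maxWindow/updateInterval) + 1
	length = int(requested/updateInterval) + 1
	return capacity, length
}

func main() {
	// A 10s update interval with a 20-minute window keeps 721 samples and uses 121 of them.
	fmt.Println(windowSizes(20*time.Minute, 10*time.Second))
}

The same arithmetic produces the 721 and 121 values asserted in the tests further down.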
+func WindowDurationOption(dur time.Duration) func(*progressIndicator) { + return func(pi *progressIndicator) { + if dur < minSpeedCalculationWindow { + dur = minSpeedCalculationWindow + } else if dur > maxSpeedCalculationWindow { + dur = maxSpeedCalculationWindow + } + pi.windowLength = int(dur/pi.updateInterval) + 1 + } +} + // AddProgress adds a progress into manager if it doesn't exist. -func (m *Manager) AddProgress(progress string, current, total float64, updateInterval time.Duration) (exist bool) { +func (m *Manager) AddProgress(progress string, current, total float64, updateInterval time.Duration, opts ...Option) (exist bool) { m.Lock() defer m.Unlock() history := list.New() history.PushBack(current) +<<<<<<< HEAD if _, exist = m.progesses[progress]; !exist { m.progesses[progress] = &progressIndicator{ total: total, @@ -76,38 +114,73 @@ func (m *Manager) AddProgress(progress string, current, total float64, updateInt history: history, windowLengthLimit: int(speedStatisticalWindow / updateInterval), updateInterval: updateInterval, +======= + if _, exist = m.progresses[progress]; !exist { + pi := &progressIndicator{ + total: total, + remaining: total, + history: history, + windowCapacity: int(maxSpeedCalculationWindow/updateInterval) + 1, + windowLength: int(minSpeedCalculationWindow / updateInterval), + updateInterval: updateInterval, +>>>>>>> 945e29c03 (cluster: dynamic progress time window for offline scene (#7722)) + } + for _, op := range opts { + op(pi) } + m.progresses[progress] = pi + pi.front = history.Front() + pi.currentWindowLength = 1 } return } // UpdateProgress updates the progress if it exists. -func (m *Manager) UpdateProgress(progress string, current, remaining float64, isInc bool) { +func (m *Manager) UpdateProgress(progress string, current, remaining float64, isInc bool, opts ...Option) { m.Lock() defer m.Unlock() +<<<<<<< HEAD if p, exist := m.progesses[progress]; exist { +======= + if p, exist := m.progresses[progress]; exist { + for _, op := range opts { + op(p) + } +>>>>>>> 945e29c03 (cluster: dynamic progress time window for offline scene (#7722)) p.remaining = remaining if p.total < remaining { p.total = remaining } - if p.history.Len() > p.windowLengthLimit { + p.history.PushBack(current) + p.currentWindowLength++ + + // try to move `front` into correct place. 
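	// Added illustration (not in the upstream code): the list may keep up to
	// windowCapacity samples, but only the newest currentWindowLength of them
	// (capped at windowLength) feed the speed. After `current` is pushed, the
	// first loop below advances `front` to shrink an over-long window, and the
	// second walks `front` back over retained history to grow a window that is
	// still too short, e.g. right after WindowDurationOption enlarged it.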
+ for p.currentWindowLength > p.windowLength { + p.front = p.front.Next() + p.currentWindowLength-- + } + for p.currentWindowLength < p.windowLength && p.front.Prev() != nil { + p.front = p.front.Prev() + p.currentWindowLength++ + } + + for p.history.Len() > p.windowCapacity { p.history.Remove(p.history.Front()) } - p.history.PushBack(current) // It means it just init and we haven't update the progress if p.history.Len() <= 1 { p.lastSpeed = 0 } else if isInc { // the value increases, e.g., [1, 2, 3] - p.lastSpeed = (p.history.Back().Value.(float64) - p.history.Front().Value.(float64)) / - (float64(p.history.Len()-1) * p.updateInterval.Seconds()) + p.lastSpeed = (current - p.front.Value.(float64)) / + (float64(p.currentWindowLength-1) * p.updateInterval.Seconds()) } else { // the value decreases, e.g., [3, 2, 1] - p.lastSpeed = (p.history.Front().Value.(float64) - p.history.Back().Value.(float64)) / - (float64(p.history.Len()-1) * p.updateInterval.Seconds()) + p.lastSpeed = (p.front.Value.(float64) - current) / + (float64(p.currentWindowLength-1) * p.updateInterval.Seconds()) } if p.lastSpeed < 0 { p.lastSpeed = 0 diff --git a/pkg/progress/progress_test.go b/pkg/progress/progress_test.go index e6799fb0ff8..524d216d0ea 100644 --- a/pkg/progress/progress_test.go +++ b/pkg/progress/progress_test.go @@ -24,7 +24,6 @@ import ( ) func TestProgress(t *testing.T) { - t.Parallel() re := require.New(t) n := "test" m := NewManager() @@ -41,15 +40,17 @@ func TestProgress(t *testing.T) { p, ls, cs, err = m.Status(n) re.NoError(err) re.Equal(0.7, p) - // 30/(70/1s+) > 30/70 - re.Greater(ls, 30.0/70.0) - // 70/1s+ > 70 - re.Less(cs, 70.0) + re.Less(math.Abs(ls-30.0/7.0), 1e-6) + re.Less(math.Abs(cs-7), 1e-6) // there is no scheduling - for i := 0; i < 100; i++ { + for i := 0; i < 1000; i++ { m.UpdateProgress(n, 30, 30, false) } +<<<<<<< HEAD re.Equal(61, m.progesses[n].history.Len()) +======= + re.Equal(721, m.progresses[n].history.Len()) +>>>>>>> 945e29c03 (cluster: dynamic progress time window for offline scene (#7722)) p, ls, cs, err = m.Status(n) re.NoError(err) re.Equal(0.7, p) @@ -70,7 +71,6 @@ func TestProgress(t *testing.T) { } func TestAbnormal(t *testing.T) { - t.Parallel() re := require.New(t) n := "test" m := NewManager() @@ -95,3 +95,127 @@ func TestAbnormal(t *testing.T) { re.Equal(0.0, ls) re.Equal(0.0, cs) } + +func TestProgressWithDynamicWindow(t *testing.T) { + // The full capacity of queue is 721. 
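	// 721 = maxSpeedCalculationWindow/updateInterval + 1 = 2h/10s + 1.
	// Worked example for the first assertions: after UpdateProgress(31) the
	// window is [100, 31], so the speed is (100-31)/(1*10s) = 6.9 per second
	// and the remaining 31 should take 31/6.9 seconds. Once
	// WindowDurationOption(20*time.Minute) stretches the window across all
	// three samples [100, 31, 30], the speed becomes (100-30)/(2*10s) = 3.5.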
+ re := require.New(t) + n := "test" + m := NewManager() + re.False(m.AddProgress(n, 100, 100, 10*time.Second)) + p, ls, cs, err := m.Status(n) + re.NoError(err) + re.Equal(0.0, p) + re.Equal(math.MaxFloat64, ls) + re.Equal(0.0, cs) + time.Sleep(time.Second) + re.True(m.AddProgress(n, 100, 100, 10*time.Second)) + + m.UpdateProgress(n, 31, 31, false) + p, ls, cs, err = m.Status(n) + re.NoError(err) + re.Equal(0.69, p) + re.Less(math.Abs(ls-31.0/6.9), 1e-6) + re.Less(math.Abs(cs-6.9), 1e-6) + re.Equal(2, m.progresses[n].currentWindowLength) + re.Equal(100.0, m.progresses[n].front.Value.(float64)) + + m.UpdateProgress(n, 30, 30, false, WindowDurationOption(time.Minute*20)) + re.Equal(3, m.progresses[n].currentWindowLength) + re.Equal(100.0, m.progresses[n].front.Value.(float64)) + p, ls, cs, err = m.Status(n) + re.NoError(err) + re.Equal(0.7, p) + re.Less(math.Abs(ls-30.0/(7.0/2)), 1e-6) + re.Less(math.Abs(cs-3.5), 1e-6) + + for i := 0; i < 1000; i++ { + m.UpdateProgress(n, 30, 30, false) + } + re.Equal(721, m.progresses[n].history.Len()) + p, ls, cs, err = m.Status(n) + re.NoError(err) + re.Equal(0.7, p) + re.Equal(math.MaxFloat64, ls) + re.Equal(0.0, cs) + m.UpdateProgress(n, 29, 29, false, WindowDurationOption(time.Minute*20)) + re.Equal(121, m.progresses[n].currentWindowLength) + re.Equal(30.0, m.progresses[n].front.Value.(float64)) + re.Equal(721, m.progresses[n].history.Len()) + + for i := 0; i < 60; i++ { + m.UpdateProgress(n, 28, 28, false) + } + re.Equal(721, m.progresses[n].history.Len()) + p, ls, cs, err = m.Status(n) + re.NoError(err) + re.Equal(0.72, p) + re.Equal(float64(28/(2./120)*10.), ls) + re.Equal(float64(2./120/10.), cs) + + m.UpdateProgress(n, 28, 28, false, WindowDurationOption(time.Minute*10)) + re.Equal(721, m.progresses[n].history.Len()) + re.Equal(61, m.progresses[n].currentWindowLength) + re.Equal(28.0, m.progresses[n].front.Value.(float64)) + p, ls, cs, err = m.Status(n) + re.NoError(err) + re.Equal(0.72, p) + re.Equal(math.MaxFloat64, ls) + re.Equal(0.0, cs) + + m.UpdateProgress(n, 28, 28, false, WindowDurationOption(time.Minute*20)) + re.Equal(121, m.progresses[n].currentWindowLength) + re.Equal(30.0, m.progresses[n].front.Value.(float64)) + p, ls, cs, err = m.Status(n) + re.NoError(err) + re.Equal(0.72, p) + re.Equal(float64(28/(2./120)*10.), ls) + re.Equal(float64(2./120/10.), cs) + + m.UpdateProgress(n, 1, 1, false, WindowDurationOption(time.Minute*12)) + re.Equal(73, m.progresses[n].currentWindowLength) + re.Equal(30.0, m.progresses[n].front.Value.(float64)) + p, ls, cs, err = m.Status(n) + re.NoError(err) + re.Equal(0.99, p) + re.Equal(float64(1/(29./72)*10.), ls) + re.Equal(float64(29./72/10.), cs) + + m.UpdateProgress(n, 1, 1, false, WindowDurationOption(time.Minute*5)) + re.Equal(61, m.progresses[n].currentWindowLength) + re.Equal(28.0, m.progresses[n].front.Value.(float64)) + p, ls, cs, err = m.Status(n) + re.NoError(err) + re.Equal(0.99, p) + re.Equal(float64(1/(27./60)*10.), ls) + re.Equal(float64(27./60/10.), cs) + + m.UpdateProgress(n, 1, 1, false, WindowDurationOption(time.Minute*180)) + p, ls, cs, err = m.Status(n) + re.Equal(721, m.progresses[n].currentWindowLength) + re.Equal(30.0, m.progresses[n].front.Value.(float64)) + re.NoError(err) + re.Equal(0.99, p) + re.Equal(float64(1/(29./720)*10.), ls) + re.Equal(float64(29./720/10.), cs) + for i := 0; i < 2000; i++ { + m.UpdateProgress(n, 1, 1, false) + } + re.Equal(721, m.progresses[n].history.Len()) + p, ls, cs, err = m.Status(n) + re.NoError(err) + re.Equal(0.99, p) + re.Equal(math.MaxFloat64, 
ls) + re.Equal(0.0, cs) + + ps := m.GetProgresses(func(p string) bool { + return strings.Contains(p, n) + }) + re.Len(ps, 1) + re.Equal(n, ps[0]) + ps = m.GetProgresses(func(p string) bool { + return strings.Contains(p, "a") + }) + re.Empty(ps) + re.True(m.RemoveProgress(n)) + re.False(m.RemoveProgress(n)) +} diff --git a/pkg/schedule/coordinator.go b/pkg/schedule/coordinator.go new file mode 100644 index 00000000000..35d9c2029a1 --- /dev/null +++ b/pkg/schedule/coordinator.go @@ -0,0 +1,835 @@ +// Copyright 2016 TiKV Project Authors. +// +// Licensed under the Apache License, Version 2.0 (the "License"); +// you may not use this file except in compliance with the License. +// You may obtain a copy of the License at +// +// http://www.apache.org/licenses/LICENSE-2.0 +// +// Unless required by applicable law or agreed to in writing, software +// distributed under the License is distributed on an "AS IS" BASIS, +// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +// See the License for the specific language governing permissions and +// limitations under the License. + +package schedule + +import ( + "bytes" + "context" + "strconv" + "sync" + "time" + + "github.com/pingcap/errors" + "github.com/pingcap/failpoint" + "github.com/pingcap/log" + "github.com/tikv/pd/pkg/cache" + "github.com/tikv/pd/pkg/core" + "github.com/tikv/pd/pkg/errs" + "github.com/tikv/pd/pkg/schedule/checker" + sc "github.com/tikv/pd/pkg/schedule/config" + sche "github.com/tikv/pd/pkg/schedule/core" + "github.com/tikv/pd/pkg/schedule/diagnostic" + "github.com/tikv/pd/pkg/schedule/hbstream" + "github.com/tikv/pd/pkg/schedule/operator" + "github.com/tikv/pd/pkg/schedule/scatter" + "github.com/tikv/pd/pkg/schedule/schedulers" + "github.com/tikv/pd/pkg/schedule/splitter" + "github.com/tikv/pd/pkg/statistics" + "github.com/tikv/pd/pkg/statistics/utils" + "github.com/tikv/pd/pkg/utils/logutil" + "github.com/tikv/pd/pkg/utils/syncutil" + "go.uber.org/zap" +) + +const ( + runSchedulerCheckInterval = 3 * time.Second + checkSuspectRangesInterval = 100 * time.Millisecond + collectFactor = 0.9 + collectTimeout = 5 * time.Minute + maxLoadConfigRetries = 10 + // pushOperatorTickInterval is the interval try to push the operator. + pushOperatorTickInterval = 500 * time.Millisecond + + patrolScanRegionLimit = 128 // It takes about 14 minutes to iterate 1 million regions. + // PluginLoad means action for load plugin + PluginLoad = "PluginLoad" + // PluginUnload means action for unload plugin + PluginUnload = "PluginUnload" +) + +var ( + // WithLabelValues is a heavy operation, define variable to avoid call it every time. + waitingListGauge = regionListGauge.WithLabelValues("waiting_list") + priorityListGauge = regionListGauge.WithLabelValues("priority_list") +) + +// Coordinator is used to manage all schedulers and checkers to decide if the region needs to be scheduled. +type Coordinator struct { + syncutil.RWMutex + + wg sync.WaitGroup + ctx context.Context + cancel context.CancelFunc + + schedulersInitialized bool + patrolRegionsDuration time.Duration + + cluster sche.ClusterInformer + prepareChecker *prepareChecker + checkers *checker.Controller + regionScatterer *scatter.RegionScatterer + regionSplitter *splitter.RegionSplitter + schedulers *schedulers.Controller + opController *operator.Controller + hbStreams *hbstream.HeartbeatStreams + pluginInterface *PluginInterface + diagnosticManager *diagnostic.Manager +} + +// NewCoordinator creates a new Coordinator. 
+func NewCoordinator(parentCtx context.Context, cluster sche.ClusterInformer, hbStreams *hbstream.HeartbeatStreams) *Coordinator { + ctx, cancel := context.WithCancel(parentCtx) + opController := operator.NewController(ctx, cluster.GetBasicCluster(), cluster.GetSharedConfig(), hbStreams) + schedulers := schedulers.NewController(ctx, cluster, cluster.GetStorage(), opController) + checkers := checker.NewController(ctx, cluster, cluster.GetCheckerConfig(), cluster.GetRuleManager(), cluster.GetRegionLabeler(), opController) + return &Coordinator{ + ctx: ctx, + cancel: cancel, + schedulersInitialized: false, + cluster: cluster, + prepareChecker: newPrepareChecker(), + checkers: checkers, + regionScatterer: scatter.NewRegionScatterer(ctx, cluster, opController, checkers.AddSuspectRegions), + regionSplitter: splitter.NewRegionSplitter(cluster, splitter.NewSplitRegionsHandler(cluster, opController), checkers.AddSuspectRegions), + schedulers: schedulers, + opController: opController, + hbStreams: hbStreams, + pluginInterface: NewPluginInterface(), + diagnosticManager: diagnostic.NewManager(schedulers, cluster.GetSchedulerConfig()), + } +} + +// GetPatrolRegionsDuration returns the duration of the last patrol region round. +func (c *Coordinator) GetPatrolRegionsDuration() time.Duration { + if c == nil { + return 0 + } + c.RLock() + defer c.RUnlock() + return c.patrolRegionsDuration +} + +func (c *Coordinator) setPatrolRegionsDuration(dur time.Duration) { + c.Lock() + defer c.Unlock() + c.patrolRegionsDuration = dur +} + +// markSchedulersInitialized marks the scheduler initialization is finished. +func (c *Coordinator) markSchedulersInitialized() { + c.Lock() + defer c.Unlock() + c.schedulersInitialized = true +} + +// AreSchedulersInitialized returns whether the schedulers have been initialized. +func (c *Coordinator) AreSchedulersInitialized() bool { + c.RLock() + defer c.RUnlock() + return c.schedulersInitialized +} + +// GetWaitingRegions returns the regions in the waiting list. +func (c *Coordinator) GetWaitingRegions() []*cache.Item { + return c.checkers.GetWaitingRegions() +} + +// IsPendingRegion returns if the region is in the pending list. +func (c *Coordinator) IsPendingRegion(region uint64) bool { + return c.checkers.IsPendingRegion(region) +} + +// PatrolRegions is used to scan regions. +// The checkers will check these regions to decide if they need to do some operations. +// The function is exposed for test purpose. +func (c *Coordinator) PatrolRegions() { + defer logutil.LogPanic() + + defer c.wg.Done() + ticker := time.NewTicker(c.cluster.GetCheckerConfig().GetPatrolRegionInterval()) + defer ticker.Stop() + + log.Info("coordinator starts patrol regions") + start := time.Now() + var ( + key []byte + regions []*core.RegionInfo + ) + for { + select { + case <-ticker.C: + // Note: we reset the ticker here to support updating configuration dynamically. + ticker.Reset(c.cluster.GetCheckerConfig().GetPatrolRegionInterval()) + case <-c.ctx.Done(): + patrolCheckRegionsGauge.Set(0) + c.setPatrolRegionsDuration(0) + log.Info("patrol regions has been stopped") + return + } + if c.isSchedulingHalted() { + continue + } + + // Check priority regions first. + c.checkPriorityRegions() + // Check suspect regions first. + c.checkSuspectRegions() + // Check regions in the waiting list + c.checkWaitingRegions() + + key, regions = c.checkRegions(key) + if len(regions) == 0 { + continue + } + // Updates the label level isolation statistics. 
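		// Note (added, not in the upstream code): when checkRegions above
		// returns an empty key, the scan has wrapped around the whole key
		// space; the branch a few lines below then records the elapsed round
		// time via setPatrolRegionsDuration, and cluster.go feeds that value
		// into progress.WindowDurationOption for the removing-store progress.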
+ c.cluster.UpdateRegionsLabelLevelStats(regions) + if len(key) == 0 { + dur := time.Since(start) + patrolCheckRegionsGauge.Set(dur.Seconds()) + c.setPatrolRegionsDuration(dur) + start = time.Now() + } + failpoint.Inject("break-patrol", func() { + failpoint.Break() + }) + } +} + +func (c *Coordinator) isSchedulingHalted() bool { + return c.cluster.GetSchedulerConfig().IsSchedulingHalted() +} + +func (c *Coordinator) checkRegions(startKey []byte) (key []byte, regions []*core.RegionInfo) { + regions = c.cluster.ScanRegions(startKey, nil, patrolScanRegionLimit) + if len(regions) == 0 { + // Resets the scan key. + key = nil + return + } + + for _, region := range regions { + c.tryAddOperators(region) + key = region.GetEndKey() + } + return +} + +func (c *Coordinator) checkSuspectRegions() { + for _, id := range c.checkers.GetSuspectRegions() { + region := c.cluster.GetRegion(id) + c.tryAddOperators(region) + } +} + +func (c *Coordinator) checkWaitingRegions() { + items := c.checkers.GetWaitingRegions() + waitingListGauge.Set(float64(len(items))) + for _, item := range items { + region := c.cluster.GetRegion(item.Key) + c.tryAddOperators(region) + } +} + +// checkPriorityRegions checks priority regions +func (c *Coordinator) checkPriorityRegions() { + items := c.checkers.GetPriorityRegions() + removes := make([]uint64, 0) + priorityListGauge.Set(float64(len(items))) + for _, id := range items { + region := c.cluster.GetRegion(id) + if region == nil { + removes = append(removes, id) + continue + } + ops := c.checkers.CheckRegion(region) + // it should skip if region needs to merge + if len(ops) == 0 || ops[0].Kind()&operator.OpMerge != 0 { + continue + } + if !c.opController.ExceedStoreLimit(ops...) { + c.opController.AddWaitingOperator(ops...) + } + } + for _, v := range removes { + c.checkers.RemovePriorityRegions(v) + } +} + +// checkSuspectRanges would pop one suspect key range group +// The regions of new version key range and old version key range would be placed into +// the suspect regions map +func (c *Coordinator) checkSuspectRanges() { + defer logutil.LogPanic() + defer c.wg.Done() + log.Info("coordinator begins to check suspect key ranges") + ticker := time.NewTicker(checkSuspectRangesInterval) + defer ticker.Stop() + for { + select { + case <-c.ctx.Done(): + log.Info("check suspect key ranges has been stopped") + return + case <-ticker.C: + keyRange, success := c.checkers.PopOneSuspectKeyRange() + if !success { + continue + } + limit := 1024 + regions := c.cluster.ScanRegions(keyRange[0], keyRange[1], limit) + if len(regions) == 0 { + continue + } + regionIDList := make([]uint64, 0, len(regions)) + for _, region := range regions { + regionIDList = append(regionIDList, region.GetID()) + } + + // if the last region's end key is smaller the keyRange[1] which means there existed the remaining regions between + // keyRange[0] and keyRange[1] after scan regions, so we put the end key and keyRange[1] into Suspect KeyRanges + lastRegion := regions[len(regions)-1] + if lastRegion.GetEndKey() != nil && bytes.Compare(lastRegion.GetEndKey(), keyRange[1]) < 0 { + c.checkers.AddSuspectKeyRange(lastRegion.GetEndKey(), keyRange[1]) + } + c.checkers.AddSuspectRegions(regionIDList...) + } + } +} + +func (c *Coordinator) tryAddOperators(region *core.RegionInfo) { + if region == nil { + // the region could be recent split, continue to wait. 
+ return + } + id := region.GetID() + if c.opController.GetOperator(id) != nil { + c.checkers.RemoveWaitingRegion(id) + c.checkers.RemoveSuspectRegion(id) + return + } + ops := c.checkers.CheckRegion(region) + if len(ops) == 0 { + return + } + + if !c.opController.ExceedStoreLimit(ops...) { + c.opController.AddWaitingOperator(ops...) + c.checkers.RemoveWaitingRegion(id) + c.checkers.RemoveSuspectRegion(id) + } else { + c.checkers.AddWaitingRegion(region) + } +} + +// drivePushOperator is used to push the unfinished operator to the executor. +func (c *Coordinator) drivePushOperator() { + defer logutil.LogPanic() + + defer c.wg.Done() + log.Info("coordinator begins to actively drive push operator") + ticker := time.NewTicker(pushOperatorTickInterval) + defer ticker.Stop() + for { + select { + case <-c.ctx.Done(): + log.Info("drive push operator has been stopped") + return + case <-ticker.C: + c.opController.PushOperators(c.RecordOpStepWithTTL) + } + } +} + +// driveSlowNodeScheduler is used to enable slow node scheduler when using `raft-kv2`. +func (c *Coordinator) driveSlowNodeScheduler() { + defer logutil.LogPanic() + defer c.wg.Done() + + ticker := time.NewTicker(time.Minute) + defer ticker.Stop() + for { + select { + case <-c.ctx.Done(): + log.Info("drive slow node scheduler is stopped") + return + case <-ticker.C: + { + // If enabled, exit. + if exists, _ := c.schedulers.IsSchedulerExisted(schedulers.EvictSlowTrendName); exists { + return + } + // If the cluster was set up with `raft-kv2` engine, this cluster should + // enable `evict-slow-trend` scheduler as default. + if c.GetCluster().GetStoreConfig().IsRaftKV2() { + typ := schedulers.EvictSlowTrendType + args := []string{} + + s, err := schedulers.CreateScheduler(typ, c.opController, c.cluster.GetStorage(), schedulers.ConfigSliceDecoder(typ, args), c.schedulers.RemoveScheduler) + if err != nil { + log.Warn("initializing evict-slow-trend scheduler failed", errs.ZapError(err)) + } else if err = c.schedulers.AddScheduler(s, args...); err != nil { + log.Error("can not add scheduler", zap.String("scheduler-name", s.GetName()), zap.Strings("scheduler-args", args), errs.ZapError(err)) + } + } + } + } + } +} + +// RunUntilStop runs the coordinator until receiving the stop signal. +func (c *Coordinator) RunUntilStop(collectWaitTime ...time.Duration) { + c.Run(collectWaitTime...) + <-c.ctx.Done() + log.Info("coordinator is stopping") + c.GetSchedulersController().Wait() + c.wg.Wait() + log.Info("coordinator has been stopped") +} + +// Run starts coordinator. +func (c *Coordinator) Run(collectWaitTime ...time.Duration) { + ticker := time.NewTicker(runSchedulerCheckInterval) + failpoint.Inject("changeCoordinatorTicker", func() { + ticker = time.NewTicker(100 * time.Millisecond) + }) + defer ticker.Stop() + log.Info("coordinator starts to collect cluster information") + for { + if c.ShouldRun(collectWaitTime...) { + log.Info("coordinator has finished cluster information preparation") + break + } + select { + case <-ticker.C: + case <-c.ctx.Done(): + log.Info("coordinator stops running") + return + } + } + log.Info("coordinator starts to run schedulers") + c.InitSchedulers(true) + + c.wg.Add(4) + // Starts to patrol regions. + go c.PatrolRegions() + // Checks suspect key ranges + go c.checkSuspectRanges() + go c.drivePushOperator() + // Checks whether to create evict-slow-trend scheduler. + go c.driveSlowNodeScheduler() +} + +// InitSchedulers initializes schedulers. 
+func (c *Coordinator) InitSchedulers(needRun bool) { + var ( + scheduleNames []string + configs []string + err error + ) + for i := 0; i < maxLoadConfigRetries; i++ { + scheduleNames, configs, err = c.cluster.GetStorage().LoadAllSchedulerConfigs() + select { + case <-c.ctx.Done(): + log.Info("init schedulers has been stopped") + return + default: + } + if err == nil { + break + } + log.Error("cannot load schedulers' config", zap.Int("retry-times", i), errs.ZapError(err)) + } + if err != nil { + log.Fatal("cannot load schedulers' config", errs.ZapError(err)) + } + scheduleCfg := c.cluster.GetSchedulerConfig().GetScheduleConfig().Clone() + // The new way to create scheduler with the independent configuration. + for i, name := range scheduleNames { + data := configs[i] + typ := schedulers.FindSchedulerTypeByName(name) + var cfg sc.SchedulerConfig + for _, c := range scheduleCfg.Schedulers { + if c.Type == typ { + cfg = c + break + } + } + if len(cfg.Type) == 0 { + log.Error("the scheduler type not found", zap.String("scheduler-name", name), errs.ZapError(errs.ErrSchedulerNotFound)) + continue + } + if cfg.Disable { + log.Info("skip create scheduler with independent configuration", zap.String("scheduler-name", name), zap.String("scheduler-type", cfg.Type), zap.Strings("scheduler-args", cfg.Args)) + continue + } + s, err := schedulers.CreateScheduler(cfg.Type, c.opController, c.cluster.GetStorage(), schedulers.ConfigJSONDecoder([]byte(data)), c.schedulers.RemoveScheduler) + if err != nil { + log.Error("can not create scheduler with independent configuration", zap.String("scheduler-name", name), zap.Strings("scheduler-args", cfg.Args), errs.ZapError(err)) + continue + } + if needRun { + log.Info("create scheduler with independent configuration", zap.String("scheduler-name", s.GetName())) + if err = c.schedulers.AddScheduler(s); err != nil { + log.Error("can not add scheduler with independent configuration", zap.String("scheduler-name", s.GetName()), zap.Strings("scheduler-args", cfg.Args), errs.ZapError(err)) + } + } else { + log.Info("create scheduler handler with independent configuration", zap.String("scheduler-name", s.GetName())) + if err = c.schedulers.AddSchedulerHandler(s); err != nil { + log.Error("can not add scheduler handler with independent configuration", zap.String("scheduler-name", s.GetName()), zap.Strings("scheduler-args", cfg.Args), errs.ZapError(err)) + } + } + } + + // The old way to create the scheduler. 
+ k := 0 + for _, schedulerCfg := range scheduleCfg.Schedulers { + if schedulerCfg.Disable { + scheduleCfg.Schedulers[k] = schedulerCfg + k++ + log.Info("skip create scheduler", zap.String("scheduler-type", schedulerCfg.Type), zap.Strings("scheduler-args", schedulerCfg.Args)) + continue + } + + s, err := schedulers.CreateScheduler(schedulerCfg.Type, c.opController, c.cluster.GetStorage(), schedulers.ConfigSliceDecoder(schedulerCfg.Type, schedulerCfg.Args), c.schedulers.RemoveScheduler) + if err != nil { + log.Error("can not create scheduler", zap.String("scheduler-type", schedulerCfg.Type), zap.Strings("scheduler-args", schedulerCfg.Args), errs.ZapError(err)) + continue + } + + if needRun { + log.Info("create scheduler", zap.String("scheduler-name", s.GetName()), zap.Strings("scheduler-args", schedulerCfg.Args)) + if err = c.schedulers.AddScheduler(s, schedulerCfg.Args...); err != nil && !errors.ErrorEqual(err, errs.ErrSchedulerExisted.FastGenByArgs()) { + log.Error("can not add scheduler", zap.String("scheduler-name", s.GetName()), zap.Strings("scheduler-args", schedulerCfg.Args), errs.ZapError(err)) + } else { + // Only records the valid scheduler config. + scheduleCfg.Schedulers[k] = schedulerCfg + k++ + } + } else { + log.Info("create scheduler handler", zap.String("scheduler-name", s.GetName()), zap.Strings("scheduler-args", schedulerCfg.Args)) + if err = c.schedulers.AddSchedulerHandler(s, schedulerCfg.Args...); err != nil && !errors.ErrorEqual(err, errs.ErrSchedulerExisted.FastGenByArgs()) { + log.Error("can not add scheduler handler", zap.String("scheduler-name", s.GetName()), zap.Strings("scheduler-args", schedulerCfg.Args), errs.ZapError(err)) + } else { + scheduleCfg.Schedulers[k] = schedulerCfg + k++ + } + } + } + + // Removes the invalid scheduler config and persist. + scheduleCfg.Schedulers = scheduleCfg.Schedulers[:k] + c.cluster.GetSchedulerConfig().SetScheduleConfig(scheduleCfg) + if err := c.cluster.GetSchedulerConfig().Persist(c.cluster.GetStorage()); err != nil { + log.Error("cannot persist schedule config", errs.ZapError(err)) + } + log.Info("scheduler config is updated", zap.Reflect("scheduler-config", scheduleCfg.Schedulers)) + + c.markSchedulersInitialized() +} + +// LoadPlugin load user plugin +func (c *Coordinator) LoadPlugin(pluginPath string, ch chan string) { + log.Info("load plugin", zap.String("plugin-path", pluginPath)) + // get func: SchedulerType from plugin + SchedulerType, err := c.pluginInterface.GetFunction(pluginPath, "SchedulerType") + if err != nil { + log.Error("GetFunction SchedulerType error", errs.ZapError(err)) + return + } + schedulerType := SchedulerType.(func() string) + // get func: SchedulerArgs from plugin + SchedulerArgs, err := c.pluginInterface.GetFunction(pluginPath, "SchedulerArgs") + if err != nil { + log.Error("GetFunction SchedulerArgs error", errs.ZapError(err)) + return + } + schedulerArgs := SchedulerArgs.(func() []string) + // create and add user scheduler + s, err := schedulers.CreateScheduler(schedulerType(), c.opController, c.cluster.GetStorage(), schedulers.ConfigSliceDecoder(schedulerType(), schedulerArgs()), c.schedulers.RemoveScheduler) + if err != nil { + log.Error("can not create scheduler", zap.String("scheduler-type", schedulerType()), errs.ZapError(err)) + return + } + log.Info("create scheduler", zap.String("scheduler-name", s.GetName())) + // TODO: handle the plugin in API service mode. 
+ if err = c.schedulers.AddScheduler(s); err != nil { + log.Error("can't add scheduler", zap.String("scheduler-name", s.GetName()), errs.ZapError(err)) + return + } + + c.wg.Add(1) + go c.waitPluginUnload(pluginPath, s.GetName(), ch) +} + +func (c *Coordinator) waitPluginUnload(pluginPath, schedulerName string, ch chan string) { + defer logutil.LogPanic() + defer c.wg.Done() + // Get signal from channel which means user unload the plugin + for { + select { + case action := <-ch: + if action == PluginUnload { + err := c.schedulers.RemoveScheduler(schedulerName) + if err != nil { + log.Error("can not remove scheduler", zap.String("scheduler-name", schedulerName), errs.ZapError(err)) + } else { + log.Info("unload plugin", zap.String("plugin", pluginPath)) + return + } + } else { + log.Error("unknown action", zap.String("action", action)) + } + case <-c.ctx.Done(): + log.Info("unload plugin has been stopped") + return + } + } +} + +// Stop stops the coordinator. +func (c *Coordinator) Stop() { + c.cancel() +} + +// GetHotRegionsByType gets hot regions' statistics by RWType. +func (c *Coordinator) GetHotRegionsByType(typ utils.RWType) *statistics.StoreHotPeersInfos { + isTraceFlow := c.cluster.GetSchedulerConfig().IsTraceRegionFlow() + storeLoads := c.cluster.GetStoresLoads() + stores := c.cluster.GetStores() + var infos *statistics.StoreHotPeersInfos + switch typ { + case utils.Write: + regionStats := c.cluster.RegionWriteStats() + infos = statistics.GetHotStatus(stores, storeLoads, regionStats, utils.Write, isTraceFlow) + case utils.Read: + regionStats := c.cluster.RegionReadStats() + infos = statistics.GetHotStatus(stores, storeLoads, regionStats, utils.Read, isTraceFlow) + default: + } + // update params `IsLearner` and `LastUpdateTime` + s := []statistics.StoreHotPeersStat{infos.AsLeader, infos.AsPeer} + for i, stores := range s { + for j, store := range stores { + for k := range store.Stats { + h := &s[i][j].Stats[k] + region := c.cluster.GetRegion(h.RegionID) + if region != nil { + h.IsLearner = core.IsLearner(region.GetPeer(h.StoreID)) + } + switch typ { + case utils.Write: + if region != nil { + h.LastUpdateTime = time.Unix(int64(region.GetInterval().GetEndTimestamp()), 0) + } + case utils.Read: + store := c.cluster.GetStore(h.StoreID) + if store != nil { + ts := store.GetMeta().GetLastHeartbeat() + h.LastUpdateTime = time.Unix(ts/1e9, ts%1e9) + } + default: + } + } + } + } + return infos +} + +// GetHotRegions gets hot regions' statistics by RWType and storeIDs. +// If storeIDs is empty, it returns all hot regions' statistics by RWType. +func (c *Coordinator) GetHotRegions(typ utils.RWType, storeIDs ...uint64) *statistics.StoreHotPeersInfos { + hotRegions := c.GetHotRegionsByType(typ) + if len(storeIDs) > 0 && hotRegions != nil { + asLeader := statistics.StoreHotPeersStat{} + asPeer := statistics.StoreHotPeersStat{} + for _, storeID := range storeIDs { + asLeader[storeID] = hotRegions.AsLeader[storeID] + asPeer[storeID] = hotRegions.AsPeer[storeID] + } + return &statistics.StoreHotPeersInfos{ + AsLeader: asLeader, + AsPeer: asPeer, + } + } + return hotRegions +} + +// GetWaitGroup returns the wait group. Only for test purpose. +func (c *Coordinator) GetWaitGroup() *sync.WaitGroup { + return &c.wg +} + +// CollectHotSpotMetrics collects hot spot metrics. +func (c *Coordinator) CollectHotSpotMetrics() { + stores := c.cluster.GetStores() + // Collects hot write region metrics. + collectHotMetrics(c.cluster, stores, utils.Write) + // Collects hot read region metrics. 
+ collectHotMetrics(c.cluster, stores, utils.Read) +} + +func collectHotMetrics(cluster sche.ClusterInformer, stores []*core.StoreInfo, typ utils.RWType) { + var ( + kind string + regionStats map[uint64][]*statistics.HotPeerStat + ) + + switch typ { + case utils.Read: + regionStats = cluster.RegionReadStats() + kind = utils.Read.String() + case utils.Write: + regionStats = cluster.RegionWriteStats() + kind = utils.Write.String() + } + status := statistics.CollectHotPeerInfos(stores, regionStats) // only returns TotalBytesRate,TotalKeysRate,TotalQueryRate,Count + + for _, s := range stores { + // TODO: pre-allocate gauge metrics + storeAddress := s.GetAddress() + storeID := s.GetID() + storeLabel := strconv.FormatUint(storeID, 10) + stat, hasHotLeader := status.AsLeader[storeID] + if hasHotLeader { + hotSpotStatusGauge.WithLabelValues(storeAddress, storeLabel, "total_"+kind+"_bytes_as_leader").Set(stat.TotalBytesRate) + hotSpotStatusGauge.WithLabelValues(storeAddress, storeLabel, "total_"+kind+"_keys_as_leader").Set(stat.TotalKeysRate) + hotSpotStatusGauge.WithLabelValues(storeAddress, storeLabel, "total_"+kind+"_query_as_leader").Set(stat.TotalQueryRate) + hotSpotStatusGauge.WithLabelValues(storeAddress, storeLabel, "hot_"+kind+"_region_as_leader").Set(float64(stat.Count)) + } else { + hotSpotStatusGauge.DeleteLabelValues(storeAddress, storeLabel, "total_"+kind+"_bytes_as_leader") + hotSpotStatusGauge.DeleteLabelValues(storeAddress, storeLabel, "total_"+kind+"_keys_as_leader") + hotSpotStatusGauge.DeleteLabelValues(storeAddress, storeLabel, "total_"+kind+"_query_as_leader") + hotSpotStatusGauge.DeleteLabelValues(storeAddress, storeLabel, "hot_"+kind+"_region_as_leader") + } + + stat, hasHotPeer := status.AsPeer[storeID] + if hasHotPeer { + hotSpotStatusGauge.WithLabelValues(storeAddress, storeLabel, "total_"+kind+"_bytes_as_peer").Set(stat.TotalBytesRate) + hotSpotStatusGauge.WithLabelValues(storeAddress, storeLabel, "total_"+kind+"_keys_as_peer").Set(stat.TotalKeysRate) + hotSpotStatusGauge.WithLabelValues(storeAddress, storeLabel, "total_"+kind+"_query_as_peer").Set(stat.TotalQueryRate) + hotSpotStatusGauge.WithLabelValues(storeAddress, storeLabel, "hot_"+kind+"_region_as_peer").Set(float64(stat.Count)) + } else { + hotSpotStatusGauge.DeleteLabelValues(storeAddress, storeLabel, "total_"+kind+"_bytes_as_peer") + hotSpotStatusGauge.DeleteLabelValues(storeAddress, storeLabel, "total_"+kind+"_keys_as_peer") + hotSpotStatusGauge.DeleteLabelValues(storeAddress, storeLabel, "total_"+kind+"_query_as_peer") + hotSpotStatusGauge.DeleteLabelValues(storeAddress, storeLabel, "hot_"+kind+"_region_as_peer") + } + + if !hasHotLeader && !hasHotPeer { + utils.ForeachRegionStats(func(rwTy utils.RWType, dim int, _ utils.RegionStatKind) { + schedulers.HotPendingSum.DeleteLabelValues(storeLabel, rwTy.String(), utils.DimToString(dim)) + }) + } + } +} + +// ResetHotSpotMetrics resets hot spot metrics. +func ResetHotSpotMetrics() { + hotSpotStatusGauge.Reset() + schedulers.HotPendingSum.Reset() +} + +// ShouldRun returns true if the coordinator should run. +func (c *Coordinator) ShouldRun(collectWaitTime ...time.Duration) bool { + return c.prepareChecker.check(c.cluster.GetBasicCluster(), collectWaitTime...) +} + +// GetSchedulersController returns the schedulers controller. +func (c *Coordinator) GetSchedulersController() *schedulers.Controller { + return c.schedulers +} + +// PauseOrResumeChecker pauses or resumes a checker by name. 
+func (c *Coordinator) PauseOrResumeChecker(name string, t int64) error { + c.Lock() + defer c.Unlock() + if c.cluster == nil { + return errs.ErrNotBootstrapped.FastGenByArgs() + } + p, err := c.checkers.GetPauseController(name) + if err != nil { + return err + } + p.PauseOrResume(t) + return nil +} + +// IsCheckerPaused returns whether a checker is paused. +func (c *Coordinator) IsCheckerPaused(name string) (bool, error) { + c.RLock() + defer c.RUnlock() + if c.cluster == nil { + return false, errs.ErrNotBootstrapped.FastGenByArgs() + } + p, err := c.checkers.GetPauseController(name) + if err != nil { + return false, err + } + return p.IsPaused(), nil +} + +// GetRegionScatterer returns the region scatterer. +func (c *Coordinator) GetRegionScatterer() *scatter.RegionScatterer { + return c.regionScatterer +} + +// GetRegionSplitter returns the region splitter. +func (c *Coordinator) GetRegionSplitter() *splitter.RegionSplitter { + return c.regionSplitter +} + +// GetOperatorController returns the operator controller. +func (c *Coordinator) GetOperatorController() *operator.Controller { + return c.opController +} + +// GetCheckerController returns the checker controller. +func (c *Coordinator) GetCheckerController() *checker.Controller { + return c.checkers +} + +// GetMergeChecker returns the merge checker. +func (c *Coordinator) GetMergeChecker() *checker.MergeChecker { + return c.checkers.GetMergeChecker() +} + +// GetRuleChecker returns the rule checker. +func (c *Coordinator) GetRuleChecker() *checker.RuleChecker { + return c.checkers.GetRuleChecker() +} + +// GetPrepareChecker returns the prepare checker. +func (c *Coordinator) GetPrepareChecker() *prepareChecker { + return c.prepareChecker +} + +// GetHeartbeatStreams returns the heartbeat streams. Only for test purpose. +func (c *Coordinator) GetHeartbeatStreams() *hbstream.HeartbeatStreams { + return c.hbStreams +} + +// GetCluster returns the cluster. Only for test purpose. +func (c *Coordinator) GetCluster() sche.ClusterInformer { + return c.cluster +} + +// GetDiagnosticResult returns the diagnostic result. 
+func (c *Coordinator) GetDiagnosticResult(name string) (*schedulers.DiagnosticResult, error) { + return c.diagnosticManager.GetDiagnosticResult(name) +} + +// RecordOpStepWithTTL records OpStep with TTL +func (c *Coordinator) RecordOpStepWithTTL(regionID uint64) { + c.GetRuleChecker().RecordRegionPromoteToNonWitness(regionID) +} diff --git a/server/cluster/cluster.go b/server/cluster/cluster.go index 1637c2a8612..660e7347bd2 100644 --- a/server/cluster/cluster.go +++ b/server/cluster/cluster.go @@ -1430,7 +1430,7 @@ func (c *RaftCluster) RemoveStore(storeID uint64, physicallyDestroyed bool) erro if err == nil { regionSize := float64(c.core.GetStoreRegionSize(storeID)) c.resetProgress(storeID, store.GetAddress()) - c.progressManager.AddProgress(encodeRemovingProgressKey(storeID), regionSize, regionSize, nodeStateCheckJobInterval) + c.progressManager.AddProgress(encodeRemovingProgressKey(storeID), regionSize, regionSize, nodeStateCheckJobInterval, progress.WindowDurationOption(c.GetCoordinator().GetPatrolRegionsDuration())) // record the current store limit in memory c.prevStoreLimit[storeID] = map[storelimit.Type]float64{ storelimit.AddPeer: c.GetStoreLimitByType(storeID, storelimit.AddPeer), @@ -1969,21 +1969,23 @@ func updateTopology(topology map[string]interface{}, sortedLabels []*metapb.Stor func (c *RaftCluster) updateProgress(storeID uint64, storeAddress, action string, current, remaining float64, isInc bool) { storeLabel := strconv.FormatUint(storeID, 10) - var progress string + var progressName string + var opts []progress.Option switch action { case removingAction: - progress = encodeRemovingProgressKey(storeID) + progressName = encodeRemovingProgressKey(storeID) + opts = []progress.Option{progress.WindowDurationOption(c.coordinator.GetPatrolRegionsDuration())} case preparingAction: - progress = encodePreparingProgressKey(storeID) + progressName = encodePreparingProgressKey(storeID) } - if exist := c.progressManager.AddProgress(progress, current, remaining, nodeStateCheckJobInterval); !exist { + if exist := c.progressManager.AddProgress(progressName, current, remaining, nodeStateCheckJobInterval, opts...); !exist { return } - c.progressManager.UpdateProgress(progress, current, remaining, isInc) - process, ls, cs, err := c.progressManager.Status(progress) + c.progressManager.UpdateProgress(progressName, current, remaining, isInc, opts...) + process, ls, cs, err := c.progressManager.Status(progressName) if err != nil { - log.Error("get progress status failed", zap.String("progress", progress), zap.Float64("remaining", remaining), errs.ZapError(err)) + log.Error("get progress status failed", zap.String("progress", progressName), zap.Float64("remaining", remaining), errs.ZapError(err)) return } storesProgressGauge.WithLabelValues(storeAddress, storeLabel, action).Set(process) From f443732c31a278d2e2c7e3794e43bfb093b54243 Mon Sep 17 00:00:00 2001 From: Cabinfever_B Date: Mon, 1 Apr 2024 11:07:10 +0800 Subject: [PATCH 2/2] fix conflict Signed-off-by: Cabinfever_B --- pkg/progress/progress.go | 30 +- pkg/progress/progress_test.go | 4 - pkg/schedule/coordinator.go | 835 ---------------------------------- server/cluster/coordinator.go | 23 +- 4 files changed, 30 insertions(+), 862 deletions(-) delete mode 100644 pkg/schedule/coordinator.go diff --git a/pkg/progress/progress.go b/pkg/progress/progress.go index 6940ad1dd01..855aa793a83 100644 --- a/pkg/progress/progress.go +++ b/pkg/progress/progress.go @@ -36,13 +36,13 @@ const ( // Manager is used to maintain the progresses we care about. 
type Manager struct { syncutil.RWMutex - progesses map[string]*progressIndicator + progresses map[string]*progressIndicator } // NewManager creates a new Manager. func NewManager() *Manager { return &Manager{ - progesses: make(map[string]*progressIndicator), + progresses: make(map[string]*progressIndicator), } } @@ -81,7 +81,7 @@ func (m *Manager) Reset() { m.Lock() defer m.Unlock() - m.progesses = make(map[string]*progressIndicator) + m.progresses = make(map[string]*progressIndicator) } // Option is used to do some action for progressIndicator. @@ -106,15 +106,6 @@ func (m *Manager) AddProgress(progress string, current, total float64, updateInt history := list.New() history.PushBack(current) -<<<<<<< HEAD - if _, exist = m.progesses[progress]; !exist { - m.progesses[progress] = &progressIndicator{ - total: total, - remaining: total, - history: history, - windowLengthLimit: int(speedStatisticalWindow / updateInterval), - updateInterval: updateInterval, -======= if _, exist = m.progresses[progress]; !exist { pi := &progressIndicator{ total: total, @@ -123,7 +114,6 @@ func (m *Manager) AddProgress(progress string, current, total float64, updateInt windowCapacity: int(maxSpeedCalculationWindow/updateInterval) + 1, windowLength: int(minSpeedCalculationWindow / updateInterval), updateInterval: updateInterval, ->>>>>>> 945e29c03 (cluster: dynamic progress time window for offline scene (#7722)) } for _, op := range opts { op(pi) @@ -140,14 +130,10 @@ func (m *Manager) UpdateProgress(progress string, current, remaining float64, is m.Lock() defer m.Unlock() -<<<<<<< HEAD - if p, exist := m.progesses[progress]; exist { -======= if p, exist := m.progresses[progress]; exist { for _, op := range opts { op(p) } ->>>>>>> 945e29c03 (cluster: dynamic progress time window for offline scene (#7722)) p.remaining = remaining if p.total < remaining { p.total = remaining @@ -193,7 +179,7 @@ func (m *Manager) UpdateProgressTotal(progress string, total float64) { m.Lock() defer m.Unlock() - if p, exist := m.progesses[progress]; exist { + if p, exist := m.progresses[progress]; exist { p.total = total } } @@ -203,8 +189,8 @@ func (m *Manager) RemoveProgress(progress string) (exist bool) { m.Lock() defer m.Unlock() - if _, exist = m.progesses[progress]; exist { - delete(m.progesses, progress) + if _, exist = m.progresses[progress]; exist { + delete(m.progresses, progress) return } return @@ -216,7 +202,7 @@ func (m *Manager) GetProgresses(filter func(p string) bool) []string { defer m.RUnlock() processes := []string{} - for p := range m.progesses { + for p := range m.progresses { if filter(p) { processes = append(processes, p) } @@ -229,7 +215,7 @@ func (m *Manager) Status(progress string) (process, leftSeconds, currentSpeed fl m.RLock() defer m.RUnlock() - if p, exist := m.progesses[progress]; exist { + if p, exist := m.progresses[progress]; exist { process = 1 - p.remaining/p.total if process < 0 { process = 0 diff --git a/pkg/progress/progress_test.go b/pkg/progress/progress_test.go index 524d216d0ea..a7b159bc907 100644 --- a/pkg/progress/progress_test.go +++ b/pkg/progress/progress_test.go @@ -46,11 +46,7 @@ func TestProgress(t *testing.T) { for i := 0; i < 1000; i++ { m.UpdateProgress(n, 30, 30, false) } -<<<<<<< HEAD - re.Equal(61, m.progesses[n].history.Len()) -======= re.Equal(721, m.progresses[n].history.Len()) ->>>>>>> 945e29c03 (cluster: dynamic progress time window for offline scene (#7722)) p, ls, cs, err = m.Status(n) re.NoError(err) re.Equal(0.7, p) diff --git a/pkg/schedule/coordinator.go 
b/pkg/schedule/coordinator.go deleted file mode 100644 index 35d9c2029a1..00000000000 --- a/pkg/schedule/coordinator.go +++ /dev/null @@ -1,835 +0,0 @@ -// Copyright 2016 TiKV Project Authors. -// -// Licensed under the Apache License, Version 2.0 (the "License"); -// you may not use this file except in compliance with the License. -// You may obtain a copy of the License at -// -// http://www.apache.org/licenses/LICENSE-2.0 -// -// Unless required by applicable law or agreed to in writing, software -// distributed under the License is distributed on an "AS IS" BASIS, -// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -// See the License for the specific language governing permissions and -// limitations under the License. - -package schedule - -import ( - "bytes" - "context" - "strconv" - "sync" - "time" - - "github.com/pingcap/errors" - "github.com/pingcap/failpoint" - "github.com/pingcap/log" - "github.com/tikv/pd/pkg/cache" - "github.com/tikv/pd/pkg/core" - "github.com/tikv/pd/pkg/errs" - "github.com/tikv/pd/pkg/schedule/checker" - sc "github.com/tikv/pd/pkg/schedule/config" - sche "github.com/tikv/pd/pkg/schedule/core" - "github.com/tikv/pd/pkg/schedule/diagnostic" - "github.com/tikv/pd/pkg/schedule/hbstream" - "github.com/tikv/pd/pkg/schedule/operator" - "github.com/tikv/pd/pkg/schedule/scatter" - "github.com/tikv/pd/pkg/schedule/schedulers" - "github.com/tikv/pd/pkg/schedule/splitter" - "github.com/tikv/pd/pkg/statistics" - "github.com/tikv/pd/pkg/statistics/utils" - "github.com/tikv/pd/pkg/utils/logutil" - "github.com/tikv/pd/pkg/utils/syncutil" - "go.uber.org/zap" -) - -const ( - runSchedulerCheckInterval = 3 * time.Second - checkSuspectRangesInterval = 100 * time.Millisecond - collectFactor = 0.9 - collectTimeout = 5 * time.Minute - maxLoadConfigRetries = 10 - // pushOperatorTickInterval is the interval try to push the operator. - pushOperatorTickInterval = 500 * time.Millisecond - - patrolScanRegionLimit = 128 // It takes about 14 minutes to iterate 1 million regions. - // PluginLoad means action for load plugin - PluginLoad = "PluginLoad" - // PluginUnload means action for unload plugin - PluginUnload = "PluginUnload" -) - -var ( - // WithLabelValues is a heavy operation, define variable to avoid call it every time. - waitingListGauge = regionListGauge.WithLabelValues("waiting_list") - priorityListGauge = regionListGauge.WithLabelValues("priority_list") -) - -// Coordinator is used to manage all schedulers and checkers to decide if the region needs to be scheduled. -type Coordinator struct { - syncutil.RWMutex - - wg sync.WaitGroup - ctx context.Context - cancel context.CancelFunc - - schedulersInitialized bool - patrolRegionsDuration time.Duration - - cluster sche.ClusterInformer - prepareChecker *prepareChecker - checkers *checker.Controller - regionScatterer *scatter.RegionScatterer - regionSplitter *splitter.RegionSplitter - schedulers *schedulers.Controller - opController *operator.Controller - hbStreams *hbstream.HeartbeatStreams - pluginInterface *PluginInterface - diagnosticManager *diagnostic.Manager -} - -// NewCoordinator creates a new Coordinator. 
-func NewCoordinator(parentCtx context.Context, cluster sche.ClusterInformer, hbStreams *hbstream.HeartbeatStreams) *Coordinator { - ctx, cancel := context.WithCancel(parentCtx) - opController := operator.NewController(ctx, cluster.GetBasicCluster(), cluster.GetSharedConfig(), hbStreams) - schedulers := schedulers.NewController(ctx, cluster, cluster.GetStorage(), opController) - checkers := checker.NewController(ctx, cluster, cluster.GetCheckerConfig(), cluster.GetRuleManager(), cluster.GetRegionLabeler(), opController) - return &Coordinator{ - ctx: ctx, - cancel: cancel, - schedulersInitialized: false, - cluster: cluster, - prepareChecker: newPrepareChecker(), - checkers: checkers, - regionScatterer: scatter.NewRegionScatterer(ctx, cluster, opController, checkers.AddSuspectRegions), - regionSplitter: splitter.NewRegionSplitter(cluster, splitter.NewSplitRegionsHandler(cluster, opController), checkers.AddSuspectRegions), - schedulers: schedulers, - opController: opController, - hbStreams: hbStreams, - pluginInterface: NewPluginInterface(), - diagnosticManager: diagnostic.NewManager(schedulers, cluster.GetSchedulerConfig()), - } -} - -// GetPatrolRegionsDuration returns the duration of the last patrol region round. -func (c *Coordinator) GetPatrolRegionsDuration() time.Duration { - if c == nil { - return 0 - } - c.RLock() - defer c.RUnlock() - return c.patrolRegionsDuration -} - -func (c *Coordinator) setPatrolRegionsDuration(dur time.Duration) { - c.Lock() - defer c.Unlock() - c.patrolRegionsDuration = dur -} - -// markSchedulersInitialized marks the scheduler initialization is finished. -func (c *Coordinator) markSchedulersInitialized() { - c.Lock() - defer c.Unlock() - c.schedulersInitialized = true -} - -// AreSchedulersInitialized returns whether the schedulers have been initialized. -func (c *Coordinator) AreSchedulersInitialized() bool { - c.RLock() - defer c.RUnlock() - return c.schedulersInitialized -} - -// GetWaitingRegions returns the regions in the waiting list. -func (c *Coordinator) GetWaitingRegions() []*cache.Item { - return c.checkers.GetWaitingRegions() -} - -// IsPendingRegion returns if the region is in the pending list. -func (c *Coordinator) IsPendingRegion(region uint64) bool { - return c.checkers.IsPendingRegion(region) -} - -// PatrolRegions is used to scan regions. -// The checkers will check these regions to decide if they need to do some operations. -// The function is exposed for test purpose. -func (c *Coordinator) PatrolRegions() { - defer logutil.LogPanic() - - defer c.wg.Done() - ticker := time.NewTicker(c.cluster.GetCheckerConfig().GetPatrolRegionInterval()) - defer ticker.Stop() - - log.Info("coordinator starts patrol regions") - start := time.Now() - var ( - key []byte - regions []*core.RegionInfo - ) - for { - select { - case <-ticker.C: - // Note: we reset the ticker here to support updating configuration dynamically. - ticker.Reset(c.cluster.GetCheckerConfig().GetPatrolRegionInterval()) - case <-c.ctx.Done(): - patrolCheckRegionsGauge.Set(0) - c.setPatrolRegionsDuration(0) - log.Info("patrol regions has been stopped") - return - } - if c.isSchedulingHalted() { - continue - } - - // Check priority regions first. - c.checkPriorityRegions() - // Check suspect regions first. - c.checkSuspectRegions() - // Check regions in the waiting list - c.checkWaitingRegions() - - key, regions = c.checkRegions(key) - if len(regions) == 0 { - continue - } - // Updates the label level isolation statistics. 
- c.cluster.UpdateRegionsLabelLevelStats(regions) - if len(key) == 0 { - dur := time.Since(start) - patrolCheckRegionsGauge.Set(dur.Seconds()) - c.setPatrolRegionsDuration(dur) - start = time.Now() - } - failpoint.Inject("break-patrol", func() { - failpoint.Break() - }) - } -} - -func (c *Coordinator) isSchedulingHalted() bool { - return c.cluster.GetSchedulerConfig().IsSchedulingHalted() -} - -func (c *Coordinator) checkRegions(startKey []byte) (key []byte, regions []*core.RegionInfo) { - regions = c.cluster.ScanRegions(startKey, nil, patrolScanRegionLimit) - if len(regions) == 0 { - // Resets the scan key. - key = nil - return - } - - for _, region := range regions { - c.tryAddOperators(region) - key = region.GetEndKey() - } - return -} - -func (c *Coordinator) checkSuspectRegions() { - for _, id := range c.checkers.GetSuspectRegions() { - region := c.cluster.GetRegion(id) - c.tryAddOperators(region) - } -} - -func (c *Coordinator) checkWaitingRegions() { - items := c.checkers.GetWaitingRegions() - waitingListGauge.Set(float64(len(items))) - for _, item := range items { - region := c.cluster.GetRegion(item.Key) - c.tryAddOperators(region) - } -} - -// checkPriorityRegions checks priority regions -func (c *Coordinator) checkPriorityRegions() { - items := c.checkers.GetPriorityRegions() - removes := make([]uint64, 0) - priorityListGauge.Set(float64(len(items))) - for _, id := range items { - region := c.cluster.GetRegion(id) - if region == nil { - removes = append(removes, id) - continue - } - ops := c.checkers.CheckRegion(region) - // it should skip if region needs to merge - if len(ops) == 0 || ops[0].Kind()&operator.OpMerge != 0 { - continue - } - if !c.opController.ExceedStoreLimit(ops...) { - c.opController.AddWaitingOperator(ops...) - } - } - for _, v := range removes { - c.checkers.RemovePriorityRegions(v) - } -} - -// checkSuspectRanges would pop one suspect key range group -// The regions of new version key range and old version key range would be placed into -// the suspect regions map -func (c *Coordinator) checkSuspectRanges() { - defer logutil.LogPanic() - defer c.wg.Done() - log.Info("coordinator begins to check suspect key ranges") - ticker := time.NewTicker(checkSuspectRangesInterval) - defer ticker.Stop() - for { - select { - case <-c.ctx.Done(): - log.Info("check suspect key ranges has been stopped") - return - case <-ticker.C: - keyRange, success := c.checkers.PopOneSuspectKeyRange() - if !success { - continue - } - limit := 1024 - regions := c.cluster.ScanRegions(keyRange[0], keyRange[1], limit) - if len(regions) == 0 { - continue - } - regionIDList := make([]uint64, 0, len(regions)) - for _, region := range regions { - regionIDList = append(regionIDList, region.GetID()) - } - - // if the last region's end key is smaller the keyRange[1] which means there existed the remaining regions between - // keyRange[0] and keyRange[1] after scan regions, so we put the end key and keyRange[1] into Suspect KeyRanges - lastRegion := regions[len(regions)-1] - if lastRegion.GetEndKey() != nil && bytes.Compare(lastRegion.GetEndKey(), keyRange[1]) < 0 { - c.checkers.AddSuspectKeyRange(lastRegion.GetEndKey(), keyRange[1]) - } - c.checkers.AddSuspectRegions(regionIDList...) - } - } -} - -func (c *Coordinator) tryAddOperators(region *core.RegionInfo) { - if region == nil { - // the region could be recent split, continue to wait. 
- return - } - id := region.GetID() - if c.opController.GetOperator(id) != nil { - c.checkers.RemoveWaitingRegion(id) - c.checkers.RemoveSuspectRegion(id) - return - } - ops := c.checkers.CheckRegion(region) - if len(ops) == 0 { - return - } - - if !c.opController.ExceedStoreLimit(ops...) { - c.opController.AddWaitingOperator(ops...) - c.checkers.RemoveWaitingRegion(id) - c.checkers.RemoveSuspectRegion(id) - } else { - c.checkers.AddWaitingRegion(region) - } -} - -// drivePushOperator is used to push the unfinished operator to the executor. -func (c *Coordinator) drivePushOperator() { - defer logutil.LogPanic() - - defer c.wg.Done() - log.Info("coordinator begins to actively drive push operator") - ticker := time.NewTicker(pushOperatorTickInterval) - defer ticker.Stop() - for { - select { - case <-c.ctx.Done(): - log.Info("drive push operator has been stopped") - return - case <-ticker.C: - c.opController.PushOperators(c.RecordOpStepWithTTL) - } - } -} - -// driveSlowNodeScheduler is used to enable slow node scheduler when using `raft-kv2`. -func (c *Coordinator) driveSlowNodeScheduler() { - defer logutil.LogPanic() - defer c.wg.Done() - - ticker := time.NewTicker(time.Minute) - defer ticker.Stop() - for { - select { - case <-c.ctx.Done(): - log.Info("drive slow node scheduler is stopped") - return - case <-ticker.C: - { - // If enabled, exit. - if exists, _ := c.schedulers.IsSchedulerExisted(schedulers.EvictSlowTrendName); exists { - return - } - // If the cluster was set up with `raft-kv2` engine, this cluster should - // enable `evict-slow-trend` scheduler as default. - if c.GetCluster().GetStoreConfig().IsRaftKV2() { - typ := schedulers.EvictSlowTrendType - args := []string{} - - s, err := schedulers.CreateScheduler(typ, c.opController, c.cluster.GetStorage(), schedulers.ConfigSliceDecoder(typ, args), c.schedulers.RemoveScheduler) - if err != nil { - log.Warn("initializing evict-slow-trend scheduler failed", errs.ZapError(err)) - } else if err = c.schedulers.AddScheduler(s, args...); err != nil { - log.Error("can not add scheduler", zap.String("scheduler-name", s.GetName()), zap.Strings("scheduler-args", args), errs.ZapError(err)) - } - } - } - } - } -} - -// RunUntilStop runs the coordinator until receiving the stop signal. -func (c *Coordinator) RunUntilStop(collectWaitTime ...time.Duration) { - c.Run(collectWaitTime...) - <-c.ctx.Done() - log.Info("coordinator is stopping") - c.GetSchedulersController().Wait() - c.wg.Wait() - log.Info("coordinator has been stopped") -} - -// Run starts coordinator. -func (c *Coordinator) Run(collectWaitTime ...time.Duration) { - ticker := time.NewTicker(runSchedulerCheckInterval) - failpoint.Inject("changeCoordinatorTicker", func() { - ticker = time.NewTicker(100 * time.Millisecond) - }) - defer ticker.Stop() - log.Info("coordinator starts to collect cluster information") - for { - if c.ShouldRun(collectWaitTime...) { - log.Info("coordinator has finished cluster information preparation") - break - } - select { - case <-ticker.C: - case <-c.ctx.Done(): - log.Info("coordinator stops running") - return - } - } - log.Info("coordinator starts to run schedulers") - c.InitSchedulers(true) - - c.wg.Add(4) - // Starts to patrol regions. - go c.PatrolRegions() - // Checks suspect key ranges - go c.checkSuspectRanges() - go c.drivePushOperator() - // Checks whether to create evict-slow-trend scheduler. - go c.driveSlowNodeScheduler() -} - -// InitSchedulers initializes schedulers. 
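// Illustrative sketch only: the startup sequence in Run/RunUntilStop above.
// The coordinator polls until the cluster information is ready, then launches
// its background workers under one WaitGroup and stops them all by cancelling
// the shared context. shouldRun and the worker bodies are hypothetical.
package main

import (
	"context"
	"fmt"
	"sync"
	"time"
)

func runUntilStop(ctx context.Context, shouldRun func() bool, workers ...func(context.Context)) {
	ticker := time.NewTicker(10 * time.Millisecond)
	defer ticker.Stop()
	for !shouldRun() {
		select {
		case <-ticker.C:
		case <-ctx.Done():
			return
		}
	}
	var wg sync.WaitGroup
	for _, w := range workers {
		wg.Add(1)
		go func(w func(context.Context)) {
			defer wg.Done()
			w(ctx)
		}(w)
	}
	<-ctx.Done() // block until the coordinator is asked to stop
	wg.Wait()    // then wait for every worker to drain
}

func main() {
	ctx, cancel := context.WithTimeout(context.Background(), 100*time.Millisecond)
	defer cancel()
	ready := time.Now().Add(30 * time.Millisecond)
	runUntilStop(ctx,
		func() bool { return time.Now().After(ready) },
		func(ctx context.Context) { <-ctx.Done(); fmt.Println("worker stopped") })
}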
-func (c *Coordinator) InitSchedulers(needRun bool) { - var ( - scheduleNames []string - configs []string - err error - ) - for i := 0; i < maxLoadConfigRetries; i++ { - scheduleNames, configs, err = c.cluster.GetStorage().LoadAllSchedulerConfigs() - select { - case <-c.ctx.Done(): - log.Info("init schedulers has been stopped") - return - default: - } - if err == nil { - break - } - log.Error("cannot load schedulers' config", zap.Int("retry-times", i), errs.ZapError(err)) - } - if err != nil { - log.Fatal("cannot load schedulers' config", errs.ZapError(err)) - } - scheduleCfg := c.cluster.GetSchedulerConfig().GetScheduleConfig().Clone() - // The new way to create scheduler with the independent configuration. - for i, name := range scheduleNames { - data := configs[i] - typ := schedulers.FindSchedulerTypeByName(name) - var cfg sc.SchedulerConfig - for _, c := range scheduleCfg.Schedulers { - if c.Type == typ { - cfg = c - break - } - } - if len(cfg.Type) == 0 { - log.Error("the scheduler type not found", zap.String("scheduler-name", name), errs.ZapError(errs.ErrSchedulerNotFound)) - continue - } - if cfg.Disable { - log.Info("skip create scheduler with independent configuration", zap.String("scheduler-name", name), zap.String("scheduler-type", cfg.Type), zap.Strings("scheduler-args", cfg.Args)) - continue - } - s, err := schedulers.CreateScheduler(cfg.Type, c.opController, c.cluster.GetStorage(), schedulers.ConfigJSONDecoder([]byte(data)), c.schedulers.RemoveScheduler) - if err != nil { - log.Error("can not create scheduler with independent configuration", zap.String("scheduler-name", name), zap.Strings("scheduler-args", cfg.Args), errs.ZapError(err)) - continue - } - if needRun { - log.Info("create scheduler with independent configuration", zap.String("scheduler-name", s.GetName())) - if err = c.schedulers.AddScheduler(s); err != nil { - log.Error("can not add scheduler with independent configuration", zap.String("scheduler-name", s.GetName()), zap.Strings("scheduler-args", cfg.Args), errs.ZapError(err)) - } - } else { - log.Info("create scheduler handler with independent configuration", zap.String("scheduler-name", s.GetName())) - if err = c.schedulers.AddSchedulerHandler(s); err != nil { - log.Error("can not add scheduler handler with independent configuration", zap.String("scheduler-name", s.GetName()), zap.Strings("scheduler-args", cfg.Args), errs.ZapError(err)) - } - } - } - - // The old way to create the scheduler. 
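// Illustrative sketch only: the bounded retry loop at the top of InitSchedulers
// above. It interleaves a non-blocking context check with each attempt so
// shutdown is not delayed by retries; after the last failure the error is
// treated as fatal. loadConfigs is a hypothetical stand-in for the storage call.
package main

import (
	"context"
	"errors"
	"fmt"
)

func loadWithRetries(ctx context.Context, retries int, loadConfigs func() ([]string, error)) ([]string, error) {
	var (
		cfgs []string
		err  error
	)
	for i := 0; i < retries; i++ {
		select {
		case <-ctx.Done():
			return nil, ctx.Err()
		default:
		}
		if cfgs, err = loadConfigs(); err == nil {
			return cfgs, nil
		}
		fmt.Printf("load failed, retry %d: %v\n", i, err)
	}
	return nil, err
}

func main() {
	attempts := 0
	cfgs, err := loadWithRetries(context.Background(), 3, func() ([]string, error) {
		attempts++
		if attempts < 2 {
			return nil, errors.New("transient storage error")
		}
		return []string{"balance-region", "balance-leader"}, nil
	})
	fmt.Println(cfgs, err)
}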
- k := 0 - for _, schedulerCfg := range scheduleCfg.Schedulers { - if schedulerCfg.Disable { - scheduleCfg.Schedulers[k] = schedulerCfg - k++ - log.Info("skip create scheduler", zap.String("scheduler-type", schedulerCfg.Type), zap.Strings("scheduler-args", schedulerCfg.Args)) - continue - } - - s, err := schedulers.CreateScheduler(schedulerCfg.Type, c.opController, c.cluster.GetStorage(), schedulers.ConfigSliceDecoder(schedulerCfg.Type, schedulerCfg.Args), c.schedulers.RemoveScheduler) - if err != nil { - log.Error("can not create scheduler", zap.String("scheduler-type", schedulerCfg.Type), zap.Strings("scheduler-args", schedulerCfg.Args), errs.ZapError(err)) - continue - } - - if needRun { - log.Info("create scheduler", zap.String("scheduler-name", s.GetName()), zap.Strings("scheduler-args", schedulerCfg.Args)) - if err = c.schedulers.AddScheduler(s, schedulerCfg.Args...); err != nil && !errors.ErrorEqual(err, errs.ErrSchedulerExisted.FastGenByArgs()) { - log.Error("can not add scheduler", zap.String("scheduler-name", s.GetName()), zap.Strings("scheduler-args", schedulerCfg.Args), errs.ZapError(err)) - } else { - // Only records the valid scheduler config. - scheduleCfg.Schedulers[k] = schedulerCfg - k++ - } - } else { - log.Info("create scheduler handler", zap.String("scheduler-name", s.GetName()), zap.Strings("scheduler-args", schedulerCfg.Args)) - if err = c.schedulers.AddSchedulerHandler(s, schedulerCfg.Args...); err != nil && !errors.ErrorEqual(err, errs.ErrSchedulerExisted.FastGenByArgs()) { - log.Error("can not add scheduler handler", zap.String("scheduler-name", s.GetName()), zap.Strings("scheduler-args", schedulerCfg.Args), errs.ZapError(err)) - } else { - scheduleCfg.Schedulers[k] = schedulerCfg - k++ - } - } - } - - // Removes the invalid scheduler config and persist. - scheduleCfg.Schedulers = scheduleCfg.Schedulers[:k] - c.cluster.GetSchedulerConfig().SetScheduleConfig(scheduleCfg) - if err := c.cluster.GetSchedulerConfig().Persist(c.cluster.GetStorage()); err != nil { - log.Error("cannot persist schedule config", errs.ZapError(err)) - } - log.Info("scheduler config is updated", zap.Reflect("scheduler-config", scheduleCfg.Schedulers)) - - c.markSchedulersInitialized() -} - -// LoadPlugin load user plugin -func (c *Coordinator) LoadPlugin(pluginPath string, ch chan string) { - log.Info("load plugin", zap.String("plugin-path", pluginPath)) - // get func: SchedulerType from plugin - SchedulerType, err := c.pluginInterface.GetFunction(pluginPath, "SchedulerType") - if err != nil { - log.Error("GetFunction SchedulerType error", errs.ZapError(err)) - return - } - schedulerType := SchedulerType.(func() string) - // get func: SchedulerArgs from plugin - SchedulerArgs, err := c.pluginInterface.GetFunction(pluginPath, "SchedulerArgs") - if err != nil { - log.Error("GetFunction SchedulerArgs error", errs.ZapError(err)) - return - } - schedulerArgs := SchedulerArgs.(func() []string) - // create and add user scheduler - s, err := schedulers.CreateScheduler(schedulerType(), c.opController, c.cluster.GetStorage(), schedulers.ConfigSliceDecoder(schedulerType(), schedulerArgs()), c.schedulers.RemoveScheduler) - if err != nil { - log.Error("can not create scheduler", zap.String("scheduler-type", schedulerType()), errs.ZapError(err)) - return - } - log.Info("create scheduler", zap.String("scheduler-name", s.GetName())) - // TODO: handle the plugin in API service mode. 
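// Illustrative sketch only: the index-k compaction used above to keep only the
// scheduler configs that were registered successfully (or are intentionally
// disabled), so the persisted schedule config no longer carries invalid
// entries. schedulerCfg is a hypothetical simplification of PD's config type.
package main

import "fmt"

type schedulerCfg struct {
	Type    string
	Disable bool
}

// compactValid keeps every config that is disabled or accepted by keep, in
// order, reusing the original backing array, and drops the rest.
func compactValid(cfgs []schedulerCfg, keep func(schedulerCfg) bool) []schedulerCfg {
	k := 0
	for _, cfg := range cfgs {
		if cfg.Disable || keep(cfg) {
			cfgs[k] = cfg
			k++
		}
	}
	return cfgs[:k]
}

func main() {
	cfgs := []schedulerCfg{{Type: "balance-region"}, {Type: "unknown"}, {Type: "evict-leader", Disable: true}}
	valid := compactValid(cfgs, func(c schedulerCfg) bool { return c.Type != "unknown" })
	fmt.Println(valid) // [{balance-region false} {evict-leader true}]
}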
- if err = c.schedulers.AddScheduler(s); err != nil { - log.Error("can't add scheduler", zap.String("scheduler-name", s.GetName()), errs.ZapError(err)) - return - } - - c.wg.Add(1) - go c.waitPluginUnload(pluginPath, s.GetName(), ch) -} - -func (c *Coordinator) waitPluginUnload(pluginPath, schedulerName string, ch chan string) { - defer logutil.LogPanic() - defer c.wg.Done() - // Get signal from channel which means user unload the plugin - for { - select { - case action := <-ch: - if action == PluginUnload { - err := c.schedulers.RemoveScheduler(schedulerName) - if err != nil { - log.Error("can not remove scheduler", zap.String("scheduler-name", schedulerName), errs.ZapError(err)) - } else { - log.Info("unload plugin", zap.String("plugin", pluginPath)) - return - } - } else { - log.Error("unknown action", zap.String("action", action)) - } - case <-c.ctx.Done(): - log.Info("unload plugin has been stopped") - return - } - } -} - -// Stop stops the coordinator. -func (c *Coordinator) Stop() { - c.cancel() -} - -// GetHotRegionsByType gets hot regions' statistics by RWType. -func (c *Coordinator) GetHotRegionsByType(typ utils.RWType) *statistics.StoreHotPeersInfos { - isTraceFlow := c.cluster.GetSchedulerConfig().IsTraceRegionFlow() - storeLoads := c.cluster.GetStoresLoads() - stores := c.cluster.GetStores() - var infos *statistics.StoreHotPeersInfos - switch typ { - case utils.Write: - regionStats := c.cluster.RegionWriteStats() - infos = statistics.GetHotStatus(stores, storeLoads, regionStats, utils.Write, isTraceFlow) - case utils.Read: - regionStats := c.cluster.RegionReadStats() - infos = statistics.GetHotStatus(stores, storeLoads, regionStats, utils.Read, isTraceFlow) - default: - } - // update params `IsLearner` and `LastUpdateTime` - s := []statistics.StoreHotPeersStat{infos.AsLeader, infos.AsPeer} - for i, stores := range s { - for j, store := range stores { - for k := range store.Stats { - h := &s[i][j].Stats[k] - region := c.cluster.GetRegion(h.RegionID) - if region != nil { - h.IsLearner = core.IsLearner(region.GetPeer(h.StoreID)) - } - switch typ { - case utils.Write: - if region != nil { - h.LastUpdateTime = time.Unix(int64(region.GetInterval().GetEndTimestamp()), 0) - } - case utils.Read: - store := c.cluster.GetStore(h.StoreID) - if store != nil { - ts := store.GetMeta().GetLastHeartbeat() - h.LastUpdateTime = time.Unix(ts/1e9, ts%1e9) - } - default: - } - } - } - } - return infos -} - -// GetHotRegions gets hot regions' statistics by RWType and storeIDs. -// If storeIDs is empty, it returns all hot regions' statistics by RWType. -func (c *Coordinator) GetHotRegions(typ utils.RWType, storeIDs ...uint64) *statistics.StoreHotPeersInfos { - hotRegions := c.GetHotRegionsByType(typ) - if len(storeIDs) > 0 && hotRegions != nil { - asLeader := statistics.StoreHotPeersStat{} - asPeer := statistics.StoreHotPeersStat{} - for _, storeID := range storeIDs { - asLeader[storeID] = hotRegions.AsLeader[storeID] - asPeer[storeID] = hotRegions.AsPeer[storeID] - } - return &statistics.StoreHotPeersInfos{ - AsLeader: asLeader, - AsPeer: asPeer, - } - } - return hotRegions -} - -// GetWaitGroup returns the wait group. Only for test purpose. -func (c *Coordinator) GetWaitGroup() *sync.WaitGroup { - return &c.wg -} - -// CollectHotSpotMetrics collects hot spot metrics. -func (c *Coordinator) CollectHotSpotMetrics() { - stores := c.cluster.GetStores() - // Collects hot write region metrics. - collectHotMetrics(c.cluster, stores, utils.Write) - // Collects hot read region metrics. 
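// Illustrative sketch only: the store filter in GetHotRegions above. When the
// caller passes store IDs, only those stores' leader/peer statistics are kept;
// otherwise the full result is returned. The map type below is a hypothetical
// simplification of PD's StoreHotPeersStat.
package main

import "fmt"

type storeHotPeersStat map[uint64]int // storeID -> hot peer count (simplified)

type hotPeersInfos struct {
	AsLeader storeHotPeersStat
	AsPeer   storeHotPeersStat
}

func filterByStores(all hotPeersInfos, storeIDs ...uint64) hotPeersInfos {
	if len(storeIDs) == 0 {
		return all
	}
	filtered := hotPeersInfos{AsLeader: storeHotPeersStat{}, AsPeer: storeHotPeersStat{}}
	for _, id := range storeIDs {
		filtered.AsLeader[id] = all.AsLeader[id]
		filtered.AsPeer[id] = all.AsPeer[id]
	}
	return filtered
}

func main() {
	all := hotPeersInfos{
		AsLeader: storeHotPeersStat{1: 3, 2: 5},
		AsPeer:   storeHotPeersStat{1: 7, 2: 9},
	}
	fmt.Println(filterByStores(all, 2)) // {map[2:5] map[2:9]}
}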
- collectHotMetrics(c.cluster, stores, utils.Read) -} - -func collectHotMetrics(cluster sche.ClusterInformer, stores []*core.StoreInfo, typ utils.RWType) { - var ( - kind string - regionStats map[uint64][]*statistics.HotPeerStat - ) - - switch typ { - case utils.Read: - regionStats = cluster.RegionReadStats() - kind = utils.Read.String() - case utils.Write: - regionStats = cluster.RegionWriteStats() - kind = utils.Write.String() - } - status := statistics.CollectHotPeerInfos(stores, regionStats) // only returns TotalBytesRate,TotalKeysRate,TotalQueryRate,Count - - for _, s := range stores { - // TODO: pre-allocate gauge metrics - storeAddress := s.GetAddress() - storeID := s.GetID() - storeLabel := strconv.FormatUint(storeID, 10) - stat, hasHotLeader := status.AsLeader[storeID] - if hasHotLeader { - hotSpotStatusGauge.WithLabelValues(storeAddress, storeLabel, "total_"+kind+"_bytes_as_leader").Set(stat.TotalBytesRate) - hotSpotStatusGauge.WithLabelValues(storeAddress, storeLabel, "total_"+kind+"_keys_as_leader").Set(stat.TotalKeysRate) - hotSpotStatusGauge.WithLabelValues(storeAddress, storeLabel, "total_"+kind+"_query_as_leader").Set(stat.TotalQueryRate) - hotSpotStatusGauge.WithLabelValues(storeAddress, storeLabel, "hot_"+kind+"_region_as_leader").Set(float64(stat.Count)) - } else { - hotSpotStatusGauge.DeleteLabelValues(storeAddress, storeLabel, "total_"+kind+"_bytes_as_leader") - hotSpotStatusGauge.DeleteLabelValues(storeAddress, storeLabel, "total_"+kind+"_keys_as_leader") - hotSpotStatusGauge.DeleteLabelValues(storeAddress, storeLabel, "total_"+kind+"_query_as_leader") - hotSpotStatusGauge.DeleteLabelValues(storeAddress, storeLabel, "hot_"+kind+"_region_as_leader") - } - - stat, hasHotPeer := status.AsPeer[storeID] - if hasHotPeer { - hotSpotStatusGauge.WithLabelValues(storeAddress, storeLabel, "total_"+kind+"_bytes_as_peer").Set(stat.TotalBytesRate) - hotSpotStatusGauge.WithLabelValues(storeAddress, storeLabel, "total_"+kind+"_keys_as_peer").Set(stat.TotalKeysRate) - hotSpotStatusGauge.WithLabelValues(storeAddress, storeLabel, "total_"+kind+"_query_as_peer").Set(stat.TotalQueryRate) - hotSpotStatusGauge.WithLabelValues(storeAddress, storeLabel, "hot_"+kind+"_region_as_peer").Set(float64(stat.Count)) - } else { - hotSpotStatusGauge.DeleteLabelValues(storeAddress, storeLabel, "total_"+kind+"_bytes_as_peer") - hotSpotStatusGauge.DeleteLabelValues(storeAddress, storeLabel, "total_"+kind+"_keys_as_peer") - hotSpotStatusGauge.DeleteLabelValues(storeAddress, storeLabel, "total_"+kind+"_query_as_peer") - hotSpotStatusGauge.DeleteLabelValues(storeAddress, storeLabel, "hot_"+kind+"_region_as_peer") - } - - if !hasHotLeader && !hasHotPeer { - utils.ForeachRegionStats(func(rwTy utils.RWType, dim int, _ utils.RegionStatKind) { - schedulers.HotPendingSum.DeleteLabelValues(storeLabel, rwTy.String(), utils.DimToString(dim)) - }) - } - } -} - -// ResetHotSpotMetrics resets hot spot metrics. -func ResetHotSpotMetrics() { - hotSpotStatusGauge.Reset() - schedulers.HotPendingSum.Reset() -} - -// ShouldRun returns true if the coordinator should run. -func (c *Coordinator) ShouldRun(collectWaitTime ...time.Duration) bool { - return c.prepareChecker.check(c.cluster.GetBasicCluster(), collectWaitTime...) -} - -// GetSchedulersController returns the schedulers controller. -func (c *Coordinator) GetSchedulersController() *schedulers.Controller { - return c.schedulers -} - -// PauseOrResumeChecker pauses or resumes a checker by name. 
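// Illustrative sketch only: the set-or-delete pattern used by collectHotMetrics
// above. A store that currently has hot peers gets its gauge updated; a store
// that no longer has any gets the stale label series deleted so it stops being
// exported. The metric name and labels here are hypothetical, not PD's.
package main

import (
	"fmt"

	"github.com/prometheus/client_golang/prometheus"
)

var hotStatusGauge = prometheus.NewGaugeVec(
	prometheus.GaugeOpts{Name: "sketch_hot_region_status", Help: "example gauge"},
	[]string{"store", "type"},
)

func reportStore(store string, rate float64, hasHotPeers bool) {
	if hasHotPeers {
		hotStatusGauge.WithLabelValues(store, "total_write_bytes").Set(rate)
		return
	}
	// Deleting the series avoids exporting stale values for quiet stores.
	hotStatusGauge.DeleteLabelValues(store, "total_write_bytes")
}

func main() {
	prometheus.MustRegister(hotStatusGauge)
	reportStore("1", 42.0, true)
	reportStore("2", 0, false)
	fmt.Println("metrics updated")
}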
-func (c *Coordinator) PauseOrResumeChecker(name string, t int64) error { - c.Lock() - defer c.Unlock() - if c.cluster == nil { - return errs.ErrNotBootstrapped.FastGenByArgs() - } - p, err := c.checkers.GetPauseController(name) - if err != nil { - return err - } - p.PauseOrResume(t) - return nil -} - -// IsCheckerPaused returns whether a checker is paused. -func (c *Coordinator) IsCheckerPaused(name string) (bool, error) { - c.RLock() - defer c.RUnlock() - if c.cluster == nil { - return false, errs.ErrNotBootstrapped.FastGenByArgs() - } - p, err := c.checkers.GetPauseController(name) - if err != nil { - return false, err - } - return p.IsPaused(), nil -} - -// GetRegionScatterer returns the region scatterer. -func (c *Coordinator) GetRegionScatterer() *scatter.RegionScatterer { - return c.regionScatterer -} - -// GetRegionSplitter returns the region splitter. -func (c *Coordinator) GetRegionSplitter() *splitter.RegionSplitter { - return c.regionSplitter -} - -// GetOperatorController returns the operator controller. -func (c *Coordinator) GetOperatorController() *operator.Controller { - return c.opController -} - -// GetCheckerController returns the checker controller. -func (c *Coordinator) GetCheckerController() *checker.Controller { - return c.checkers -} - -// GetMergeChecker returns the merge checker. -func (c *Coordinator) GetMergeChecker() *checker.MergeChecker { - return c.checkers.GetMergeChecker() -} - -// GetRuleChecker returns the rule checker. -func (c *Coordinator) GetRuleChecker() *checker.RuleChecker { - return c.checkers.GetRuleChecker() -} - -// GetPrepareChecker returns the prepare checker. -func (c *Coordinator) GetPrepareChecker() *prepareChecker { - return c.prepareChecker -} - -// GetHeartbeatStreams returns the heartbeat streams. Only for test purpose. -func (c *Coordinator) GetHeartbeatStreams() *hbstream.HeartbeatStreams { - return c.hbStreams -} - -// GetCluster returns the cluster. Only for test purpose. -func (c *Coordinator) GetCluster() sche.ClusterInformer { - return c.cluster -} - -// GetDiagnosticResult returns the diagnostic result. -func (c *Coordinator) GetDiagnosticResult(name string) (*schedulers.DiagnosticResult, error) { - return c.diagnosticManager.GetDiagnosticResult(name) -} - -// RecordOpStepWithTTL records OpStep with TTL -func (c *Coordinator) RecordOpStepWithTTL(regionID uint64) { - c.GetRuleChecker().RecordRegionPromoteToNonWitness(regionID) -} diff --git a/server/cluster/coordinator.go b/server/cluster/coordinator.go index 157931c9db4..2f8ebcb3a45 100644 --- a/server/cluster/coordinator.go +++ b/server/cluster/coordinator.go @@ -81,6 +81,8 @@ type coordinator struct { hbStreams *hbstream.HeartbeatStreams pluginInterface *schedule.PluginInterface diagnosticManager *diagnosticManager + + patrolRegionsDuration time.Duration } // newCoordinator creates a new coordinator. @@ -104,6 +106,22 @@ func newCoordinator(ctx context.Context, cluster *RaftCluster, hbStreams *hbstre } } +// GetPatrolRegionsDuration returns the duration of the last patrol region round. 
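// Illustrative sketch only: one plausible shape for the pause/resume controller
// behind PauseOrResumeChecker/IsCheckerPaused above, assuming t is a pause
// duration in seconds and t == 0 means resume (an assumption for illustration,
// not a statement about PD's actual PauseController).
package main

import (
	"fmt"
	"sync/atomic"
	"time"
)

type pauseController struct {
	pausedUntil atomic.Int64 // unix seconds; zero or a past time means not paused
}

func (p *pauseController) PauseOrResume(t int64) {
	if t == 0 {
		p.pausedUntil.Store(0) // resume immediately
		return
	}
	p.pausedUntil.Store(time.Now().Unix() + t)
}

func (p *pauseController) IsPaused() bool {
	return time.Now().Unix() < p.pausedUntil.Load()
}

func main() {
	var c pauseController
	c.PauseOrResume(60) // pause for 60 seconds
	fmt.Println("paused:", c.IsPaused())
	c.PauseOrResume(0) // resume
	fmt.Println("paused:", c.IsPaused())
}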
+func (c *coordinator) GetPatrolRegionsDuration() time.Duration { + if c == nil { + return 0 + } + c.RLock() + defer c.RUnlock() + return c.patrolRegionsDuration +} + +func (c *coordinator) setPatrolRegionsDuration(dur time.Duration) { + c.Lock() + defer c.Unlock() + c.patrolRegionsDuration = dur +} + func (c *coordinator) GetWaitingRegions() []*cache.Item { return c.checkers.GetWaitingRegions() } @@ -132,6 +150,7 @@ func (c *coordinator) patrolRegions() { case <-timer.C: timer.Reset(c.cluster.GetOpts().GetPatrolRegionInterval()) case <-c.ctx.Done(): + c.setPatrolRegionsDuration(0) log.Info("patrol regions has been stopped") return } @@ -154,7 +173,9 @@ func (c *coordinator) patrolRegions() { // Updates the label level isolation statistics. c.cluster.updateRegionsLabelLevelStats(regions) if len(key) == 0 { - patrolCheckRegionsGauge.Set(time.Since(start).Seconds()) + dur := time.Since(start) + patrolCheckRegionsGauge.Set(dur.Seconds()) + c.setPatrolRegionsDuration(dur) start = time.Now() } failpoint.Inject("break-patrol", func() {
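// Illustrative sketch only: how the hunks above track the duration of each full
// patrol round. The value is written when a round wraps around, zeroed when
// patrolling stops, and read through a nil-safe, lock-protected getter so other
// components can consume it safely. patrolTracker is a hypothetical stand-in
// for the coordinator fields shown above.
package main

import (
	"fmt"
	"sync"
	"time"
)

type patrolTracker struct {
	sync.RWMutex
	lastRoundDuration time.Duration
}

func (t *patrolTracker) setDuration(d time.Duration) {
	t.Lock()
	defer t.Unlock()
	t.lastRoundDuration = d
}

// GetDuration is safe to call on a nil tracker, mirroring the nil check above.
func (t *patrolTracker) GetDuration() time.Duration {
	if t == nil {
		return 0
	}
	t.RLock()
	defer t.RUnlock()
	return t.lastRoundDuration
}

func main() {
	var t patrolTracker
	start := time.Now()
	time.Sleep(5 * time.Millisecond) // stand-in for one full patrol round
	t.setDuration(time.Since(start)) // a round wrapped around
	fmt.Println("last round:", t.GetDuration())
	t.setDuration(0) // patrolling stopped
	fmt.Println("after stop:", t.GetDuration())
}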