From 4a95bcaabea3bffff0aa75840a4cbf8ec210abb3 Mon Sep 17 00:00:00 2001 From: Song Gao Date: Fri, 18 Sep 2020 17:07:08 +0800 Subject: [PATCH] scheduler: add leader verify in balance-region scheduler (#2966) Signed-off-by: Song Gao --- pkg/mock/mockcluster/mockcluster.go | 8 ++++++-- server/schedule/filter/filters.go | 7 ++----- server/schedulers/balance_region.go | 6 ++++++ server/schedulers/balance_test.go | 17 +++++++++++++++++ 4 files changed, 31 insertions(+), 7 deletions(-) diff --git a/pkg/mock/mockcluster/mockcluster.go b/pkg/mock/mockcluster/mockcluster.go index deb019fdca1..937eeb3b333 100644 --- a/pkg/mock/mockcluster/mockcluster.go +++ b/pkg/mock/mockcluster/mockcluster.go @@ -574,6 +574,7 @@ func (mc *Cluster) RemoveScheduler(name string) error { } // MockRegionInfo returns a mock region +// If leaderStoreID is zero, the regions would have no leader func (mc *Cluster) MockRegionInfo(regionID uint64, leaderStoreID uint64, followerStoreIDs, learnerStoreIDs []uint64, epoch *metapb.RegionEpoch) *core.RegionInfo { @@ -583,8 +584,11 @@ func (mc *Cluster) MockRegionInfo(regionID uint64, leaderStoreID uint64, EndKey: []byte(fmt.Sprintf("%20d", regionID+1)), RegionEpoch: epoch, } - leader, _ := mc.AllocPeer(leaderStoreID) - region.Peers = []*metapb.Peer{leader} + var leader *metapb.Peer + if leaderStoreID != 0 { + leader, _ = mc.AllocPeer(leaderStoreID) + region.Peers = append(region.Peers, leader) + } for _, storeID := range followerStoreIDs { peer, _ := mc.AllocPeer(storeID) region.Peers = append(region.Peers, peer) diff --git a/server/schedule/filter/filters.go b/server/schedule/filter/filters.go index 06fa404e10e..7ae154b3ee9 100644 --- a/server/schedule/filter/filters.go +++ b/server/schedule/filter/filters.go @@ -16,6 +16,7 @@ package filter import ( "fmt" + "github.com/golang/protobuf/proto" "github.com/pingcap/kvproto/pkg/metapb" "github.com/pingcap/log" "github.com/tikv/pd/pkg/slice" @@ -683,11 +684,7 @@ func (f *isolationFilter) Target(opt *config.PersistOptions, store *core.StoreIn // FitRegion in filter func createRegionForRuleFit(startKey, endKey []byte, peers []*metapb.Peer, leader *metapb.Peer, opts ...core.RegionCreateOption) *core.RegionInfo { - copyLeader := &metapb.Peer{ - Id: leader.Id, - StoreId: leader.StoreId, - Role: leader.Role, - } + copyLeader := proto.Clone(leader).(*metapb.Peer) copyPeers := make([]*metapb.Peer, 0, len(peers)) for _, p := range peers { peer := &metapb.Peer{ diff --git a/server/schedulers/balance_region.go b/server/schedulers/balance_region.go index 5f0ed88f83a..6900a7856d5 100644 --- a/server/schedulers/balance_region.go +++ b/server/schedulers/balance_region.go @@ -173,6 +173,12 @@ func (s *balanceRegionScheduler) Schedule(cluster opt.Cluster) []*operator.Opera schedulerCounter.WithLabelValues(s.GetName(), "region-hot").Inc() continue } + // Check region whether have leader + if region.GetLeader() == nil { + log.Warn("region have no leader", zap.String("scheduler", s.GetName()), zap.Uint64("region-id", region.GetID())) + schedulerCounter.WithLabelValues(s.GetName(), "no-leader").Inc() + continue + } oldPeer := region.GetStorePeer(sourceID) if op := s.transferPeer(cluster, region, oldPeer); op != nil { diff --git a/server/schedulers/balance_test.go b/server/schedulers/balance_test.go index 446116ee9e6..9e076cf6edc 100644 --- a/server/schedulers/balance_test.go +++ b/server/schedulers/balance_test.go @@ -900,6 +900,23 @@ func (s *testBalanceRegionSchedulerSuite) checkReplacePendingRegion(c *C, tc *mo testutil.CheckTransferPeer(c, sb.Schedule(tc)[0], operator.OpKind(0), 1, 4) } +func (s *testBalanceRegionSchedulerSuite) TestShouldNotBalance(c *C) { + opt := config.NewTestOptions() + tc := mockcluster.NewCluster(opt) + tc.DisableFeature(versioninfo.JointConsensus) + oc := schedule.NewOperatorController(s.ctx, nil, nil) + sb, err := schedule.CreateScheduler(BalanceRegionType, oc, core.NewStorage(kv.NewMemoryKV()), schedule.ConfigSliceDecoder(BalanceRegionType, []string{"", ""})) + c.Assert(err, IsNil) + region := tc.MockRegionInfo(1, 0, []uint64{2, 3, 4}, nil, nil) + tc.PutRegion(region) + operators := sb.Schedule(tc) + if operators != nil { + c.Assert(len(operators), Equals, 0) + } else { + c.Assert(operators, IsNil) + } +} + var _ = Suite(&testRandomMergeSchedulerSuite{}) type testRandomMergeSchedulerSuite struct{}