From f04a6d1380874bfbc0fba28a4eb94075df1a08a9 Mon Sep 17 00:00:00 2001 From: okJiang <819421878@qq.com> Date: Mon, 17 Jun 2024 15:50:48 +0800 Subject: [PATCH 1/7] fix pkg/core/store_stats.go Signed-off-by: okJiang <819421878@qq.com> --- .golangci.yml | 2 +- pkg/core/store_stats.go | 5 ++--- 2 files changed, 3 insertions(+), 4 deletions(-) diff --git a/.golangci.yml b/.golangci.yml index 4f5c96cd343..382b4f65a74 100644 --- a/.golangci.yml +++ b/.golangci.yml @@ -207,6 +207,6 @@ issues: - path: (pd-analysis|pd-api-bench|pd-backup|pd-ctl|pd-heartbeat-bench|pd-recover|pd-simulator|pd-tso-bench|pd-ut|regions-dump|stores-dump) linters: - errcheck - - path: (pkg/tso/admin.go|pkg/schedule/schedulers/split_bucket.go|server/api/plugin_disable.go|server/api/plugin_disable.go|server/api/operator.go|server/api/region.go|pkg/schedule/schedulers/balance_leader.go|plugin/scheduler_example/evict_leader.go|server/api/.*\.go|pkg/replication/replication_mode.go|pkg/storage/endpoint/gc_safe_point.go|server/.*\.go|pkg/schedule/schedulers/.*\.go|pkg/schedule/placement/rule.go|pkg/tso/allocator_manager.go|pkg/core/store_stats.go|pkg/core/store_stats.go|pkg/storage/hot_region_storage.go|pkg/syncer/server.go) + - path: (pkg/tso/admin.go|pkg/schedule/schedulers/split_bucket.go|server/api/plugin_disable.go|server/api/plugin_disable.go|server/api/operator.go|server/api/region.go|pkg/schedule/schedulers/balance_leader.go|plugin/scheduler_example/evict_leader.go|server/api/.*\.go|pkg/replication/replication_mode.go|pkg/storage/endpoint/gc_safe_point.go|server/.*\.go|pkg/schedule/schedulers/.*\.go|pkg/schedule/placement/rule.go|pkg/tso/allocator_manager.go|pkg/storage/hot_region_storage.go|pkg/syncer/server.go) linters: - errcheck diff --git a/pkg/core/store_stats.go b/pkg/core/store_stats.go index bcc90a58a2b..d68f8b8e43c 100644 --- a/pkg/core/store_stats.go +++ b/pkg/core/store_stats.go @@ -18,6 +18,7 @@ import ( "github.com/pingcap/kvproto/pkg/pdpb" "github.com/tikv/pd/pkg/movingaverage" "github.com/tikv/pd/pkg/utils/syncutil" + "github.com/tikv/pd/pkg/utils/typeutil" ) type storeStats struct { @@ -56,10 +57,8 @@ func (ss *storeStats) GetStoreStats() *pdpb.StoreStats { // CloneStoreStats returns the statistics information cloned from the store. func (ss *storeStats) CloneStoreStats() *pdpb.StoreStats { ss.mu.RLock() - b, _ := ss.rawStats.Marshal() + stats := typeutil.DeepClone(ss.rawStats, StoreStatsFactory) ss.mu.RUnlock() - stats := &pdpb.StoreStats{} - stats.Unmarshal(b) return stats } From 76b49327ff7842027631642ad1d3746c5b14a02a Mon Sep 17 00:00:00 2001 From: okJiang <819421878@qq.com> Date: Mon, 17 Jun 2024 15:58:01 +0800 Subject: [PATCH 2/7] fix pkg/schedule/placement/rule.go Signed-off-by: okJiang <819421878@qq.com> --- .golangci.yml | 2 +- pkg/schedule/placement/rule.go | 4 +--- 2 files changed, 2 insertions(+), 4 deletions(-) diff --git a/.golangci.yml b/.golangci.yml index 382b4f65a74..b050b3de99c 100644 --- a/.golangci.yml +++ b/.golangci.yml @@ -207,6 +207,6 @@ issues: - path: (pd-analysis|pd-api-bench|pd-backup|pd-ctl|pd-heartbeat-bench|pd-recover|pd-simulator|pd-tso-bench|pd-ut|regions-dump|stores-dump) linters: - errcheck - - path: (pkg/tso/admin.go|pkg/schedule/schedulers/split_bucket.go|server/api/plugin_disable.go|server/api/plugin_disable.go|server/api/operator.go|server/api/region.go|pkg/schedule/schedulers/balance_leader.go|plugin/scheduler_example/evict_leader.go|server/api/.*\.go|pkg/replication/replication_mode.go|pkg/storage/endpoint/gc_safe_point.go|server/.*\.go|pkg/schedule/schedulers/.*\.go|pkg/schedule/placement/rule.go|pkg/tso/allocator_manager.go|pkg/storage/hot_region_storage.go|pkg/syncer/server.go) + - path: (pkg/tso/admin.go|pkg/schedule/schedulers/split_bucket.go|server/api/plugin_disable.go|server/api/plugin_disable.go|server/api/operator.go|server/api/region.go|pkg/schedule/schedulers/balance_leader.go|plugin/scheduler_example/evict_leader.go|server/api/.*\.go|pkg/replication/replication_mode.go|pkg/storage/endpoint/gc_safe_point.go|server/.*\.go|pkg/schedule/schedulers/.*\.go|pkg/tso/allocator_manager.go|pkg/storage/hot_region_storage.go|pkg/syncer/server.go) linters: - errcheck diff --git a/pkg/schedule/placement/rule.go b/pkg/schedule/placement/rule.go index 75ccd509ee8..d6df9caa31e 100644 --- a/pkg/schedule/placement/rule.go +++ b/pkg/schedule/placement/rule.go @@ -90,9 +90,7 @@ func (r *Rule) String() string { // Clone returns a copy of Rule. func (r *Rule) Clone() *Rule { var clone Rule - json.Unmarshal([]byte(r.String()), &clone) - clone.StartKey = append(r.StartKey[:0:0], r.StartKey...) - clone.EndKey = append(r.EndKey[:0:0], r.EndKey...) + _ = json.Unmarshal([]byte(r.String()), &clone) return &clone } From 93005549db3d55b309aec8b3f8870e28fc3aad17 Mon Sep 17 00:00:00 2001 From: okJiang <819421878@qq.com> Date: Mon, 17 Jun 2024 16:05:20 +0800 Subject: [PATCH 3/7] fix pkg/tso/allocator_manager.go Signed-off-by: okJiang <819421878@qq.com> --- .golangci.yml | 2 +- pkg/tso/allocator_manager.go | 65 +++++++++--------------------------- 2 files changed, 17 insertions(+), 50 deletions(-) diff --git a/.golangci.yml b/.golangci.yml index b050b3de99c..d9cbaf4710a 100644 --- a/.golangci.yml +++ b/.golangci.yml @@ -207,6 +207,6 @@ issues: - path: (pd-analysis|pd-api-bench|pd-backup|pd-ctl|pd-heartbeat-bench|pd-recover|pd-simulator|pd-tso-bench|pd-ut|regions-dump|stores-dump) linters: - errcheck - - path: (pkg/tso/admin.go|pkg/schedule/schedulers/split_bucket.go|server/api/plugin_disable.go|server/api/plugin_disable.go|server/api/operator.go|server/api/region.go|pkg/schedule/schedulers/balance_leader.go|plugin/scheduler_example/evict_leader.go|server/api/.*\.go|pkg/replication/replication_mode.go|pkg/storage/endpoint/gc_safe_point.go|server/.*\.go|pkg/schedule/schedulers/.*\.go|pkg/tso/allocator_manager.go|pkg/storage/hot_region_storage.go|pkg/syncer/server.go) + - path: (pkg/tso/admin.go|pkg/schedule/schedulers/split_bucket.go|server/api/plugin_disable.go|server/api/plugin_disable.go|server/api/operator.go|server/api/region.go|pkg/schedule/schedulers/balance_leader.go|plugin/scheduler_example/evict_leader.go|server/api/.*\.go|pkg/replication/replication_mode.go|pkg/storage/endpoint/gc_safe_point.go|server/.*\.go|pkg/schedule/schedulers/.*\.go|pkg/storage/hot_region_storage.go|pkg/syncer/server.go) linters: - errcheck diff --git a/pkg/tso/allocator_manager.go b/pkg/tso/allocator_manager.go index f1683de1352..5b36fbabbc9 100644 --- a/pkg/tso/allocator_manager.go +++ b/pkg/tso/allocator_manager.go @@ -624,11 +624,13 @@ func (am *AllocatorManager) campaignAllocatorLeader( dcLocationInfo *pdpb.GetDCLocationInfoResponse, isNextLeader bool, ) { - log.Info("start to campaign local tso allocator leader", + logger := log.With( logutil.CondUint32("keyspace-group-id", am.kgID, am.kgID > 0), zap.String("dc-location", allocator.GetDCLocation()), zap.Any("dc-location-info", dcLocationInfo), - zap.String("name", am.member.Name())) + zap.String("name", am.member.Name()), + ) + logger.Info("start to campaign local tso allocator leader") cmps := make([]clientv3.Cmp, 0) nextLeaderKey := am.nextLeaderKey(allocator.GetDCLocation()) if !isNextLeader { @@ -648,18 +650,9 @@ func (am *AllocatorManager) campaignAllocatorLeader( }) if err := allocator.CampaignAllocatorLeader(am.leaderLease, cmps...); err != nil { if err.Error() == errs.ErrEtcdTxnConflict.Error() { - log.Info("failed to campaign local tso allocator leader due to txn conflict, another allocator may campaign successfully", - logutil.CondUint32("keyspace-group-id", am.kgID, am.kgID > 0), - zap.String("dc-location", allocator.GetDCLocation()), - zap.Any("dc-location-info", dcLocationInfo), - zap.String("name", am.member.Name())) + logger.Info("failed to campaign local tso allocator leader due to txn conflict, another allocator may campaign successfully") } else { - log.Error("failed to campaign local tso allocator leader due to etcd error", - logutil.CondUint32("keyspace-group-id", am.kgID, am.kgID > 0), - zap.String("dc-location", allocator.GetDCLocation()), - zap.Any("dc-location-info", dcLocationInfo), - zap.String("name", am.member.Name()), - errs.ZapError(err)) + logger.Error("failed to campaign local tso allocator leader due to etcd error", errs.ZapError(err)) } return } @@ -670,44 +663,26 @@ func (am *AllocatorManager) campaignAllocatorLeader( defer am.ResetAllocatorGroup(allocator.GetDCLocation()) // Maintain the Local TSO Allocator leader go allocator.KeepAllocatorLeader(ctx) - log.Info("campaign local tso allocator leader ok", - logutil.CondUint32("keyspace-group-id", am.kgID, am.kgID > 0), - zap.String("dc-location", allocator.GetDCLocation()), - zap.Any("dc-location-info", dcLocationInfo), - zap.String("name", am.member.Name())) + logger.Info("campaign local tso allocator leader ok") - log.Info("initialize the local TSO allocator", - logutil.CondUint32("keyspace-group-id", am.kgID, am.kgID > 0), - zap.String("dc-location", allocator.GetDCLocation()), - zap.Any("dc-location-info", dcLocationInfo), - zap.String("name", am.member.Name())) + logger.Info("initialize the local TSO allocator") if err := allocator.Initialize(int(dcLocationInfo.Suffix)); err != nil { - log.Error("failed to initialize the local TSO allocator", - logutil.CondUint32("keyspace-group-id", am.kgID, am.kgID > 0), - zap.String("dc-location", allocator.GetDCLocation()), - zap.Any("dc-location-info", dcLocationInfo), - errs.ZapError(err)) + log.Error("failed to initialize the local TSO allocator", errs.ZapError(err)) return } if dcLocationInfo.GetMaxTs().GetPhysical() != 0 { if err := allocator.WriteTSO(dcLocationInfo.GetMaxTs()); err != nil { - log.Error("failed to write the max local TSO after member changed", - logutil.CondUint32("keyspace-group-id", am.kgID, am.kgID > 0), - zap.String("dc-location", allocator.GetDCLocation()), - zap.Any("dc-location-info", dcLocationInfo), - errs.ZapError(err)) + log.Error("failed to write the max local TSO after member changed", errs.ZapError(err)) return } } am.compareAndSetMaxSuffix(dcLocationInfo.Suffix) allocator.EnableAllocatorLeader() // The next leader is me, delete it to finish campaigning - am.deleteNextLeaderID(allocator.GetDCLocation()) - log.Info("local tso allocator leader is ready to serve", - logutil.CondUint32("keyspace-group-id", am.kgID, am.kgID > 0), - zap.String("dc-location", allocator.GetDCLocation()), - zap.Any("dc-location-info", dcLocationInfo), - zap.String("name", am.member.Name())) + if err := am.deleteNextLeaderID(allocator.GetDCLocation()); err != nil { + logger.Warn("failed to delete next leader key after campaign local tso allocator leader", errs.ZapError(err)) + } + logger.Info("local tso allocator leader is ready to serve") leaderTicker := time.NewTicker(mcsutils.LeaderTickInterval) defer leaderTicker.Stop() @@ -716,20 +691,12 @@ func (am *AllocatorManager) campaignAllocatorLeader( select { case <-leaderTicker.C: if !allocator.IsAllocatorLeader() { - log.Info("no longer a local tso allocator leader because lease has expired, local tso allocator leader will step down", - logutil.CondUint32("keyspace-group-id", am.kgID, am.kgID > 0), - zap.String("dc-location", allocator.GetDCLocation()), - zap.Any("dc-location-info", dcLocationInfo), - zap.String("name", am.member.Name())) + logger.Info("no longer a local tso allocator leader because lease has expired, local tso allocator leader will step down") return } case <-ctx.Done(): // Server is closed and it should return nil. - log.Info("server is closed, reset the local tso allocator", - logutil.CondUint32("keyspace-group-id", am.kgID, am.kgID > 0), - zap.String("dc-location", allocator.GetDCLocation()), - zap.Any("dc-location-info", dcLocationInfo), - zap.String("name", am.member.Name())) + logger.Info("server is closed, reset the local tso allocator") return } } From 936e78dcb352430fa0e0668653e286184d02c28c Mon Sep 17 00:00:00 2001 From: okJiang <819421878@qq.com> Date: Mon, 17 Jun 2024 16:11:17 +0800 Subject: [PATCH 4/7] fix pkg/storage/hot_region_storage.go Signed-off-by: okJiang <819421878@qq.com> --- .golangci.yml | 2 +- pkg/storage/hot_region_storage.go | 4 +++- 2 files changed, 4 insertions(+), 2 deletions(-) diff --git a/.golangci.yml b/.golangci.yml index d9cbaf4710a..bc1b7ddc00e 100644 --- a/.golangci.yml +++ b/.golangci.yml @@ -207,6 +207,6 @@ issues: - path: (pd-analysis|pd-api-bench|pd-backup|pd-ctl|pd-heartbeat-bench|pd-recover|pd-simulator|pd-tso-bench|pd-ut|regions-dump|stores-dump) linters: - errcheck - - path: (pkg/tso/admin.go|pkg/schedule/schedulers/split_bucket.go|server/api/plugin_disable.go|server/api/plugin_disable.go|server/api/operator.go|server/api/region.go|pkg/schedule/schedulers/balance_leader.go|plugin/scheduler_example/evict_leader.go|server/api/.*\.go|pkg/replication/replication_mode.go|pkg/storage/endpoint/gc_safe_point.go|server/.*\.go|pkg/schedule/schedulers/.*\.go|pkg/storage/hot_region_storage.go|pkg/syncer/server.go) + - path: (pkg/tso/admin.go|pkg/schedule/schedulers/split_bucket.go|server/api/plugin_disable.go|server/api/plugin_disable.go|server/api/operator.go|server/api/region.go|pkg/schedule/schedulers/balance_leader.go|plugin/scheduler_example/evict_leader.go|server/api/.*\.go|pkg/replication/replication_mode.go|pkg/storage/endpoint/gc_safe_point.go|server/.*\.go|pkg/schedule/schedulers/.*\.go|pkg/syncer/server.go) linters: - errcheck diff --git a/pkg/storage/hot_region_storage.go b/pkg/storage/hot_region_storage.go index 0393035c85b..c08825dbba1 100644 --- a/pkg/storage/hot_region_storage.go +++ b/pkg/storage/hot_region_storage.go @@ -171,7 +171,9 @@ func (h *HotRegionStorage) backgroundDelete() { there may be residual hot regions, you can remove it manually, [pd-dir]/data/hot-region.`) continue } - h.delete(int(curReservedDays)) + if err := h.delete(int(curReservedDays)); err != nil { + log.Error("delete hot region meet error", errs.ZapError(err)) + } case <-h.hotRegionInfoCtx.Done(): return } From ea9026c786217e05e41d22308010a999b106cb84 Mon Sep 17 00:00:00 2001 From: okJiang <819421878@qq.com> Date: Mon, 17 Jun 2024 16:19:45 +0800 Subject: [PATCH 5/7] fix plugin/scheduler_example/evict_leader.go Signed-off-by: okJiang <819421878@qq.com> --- .golangci.yml | 2 +- plugin/scheduler_example/evict_leader.go | 46 ++++++++++++++---------- 2 files changed, 28 insertions(+), 20 deletions(-) diff --git a/.golangci.yml b/.golangci.yml index bc1b7ddc00e..e938c24cc59 100644 --- a/.golangci.yml +++ b/.golangci.yml @@ -207,6 +207,6 @@ issues: - path: (pd-analysis|pd-api-bench|pd-backup|pd-ctl|pd-heartbeat-bench|pd-recover|pd-simulator|pd-tso-bench|pd-ut|regions-dump|stores-dump) linters: - errcheck - - path: (pkg/tso/admin.go|pkg/schedule/schedulers/split_bucket.go|server/api/plugin_disable.go|server/api/plugin_disable.go|server/api/operator.go|server/api/region.go|pkg/schedule/schedulers/balance_leader.go|plugin/scheduler_example/evict_leader.go|server/api/.*\.go|pkg/replication/replication_mode.go|pkg/storage/endpoint/gc_safe_point.go|server/.*\.go|pkg/schedule/schedulers/.*\.go|pkg/syncer/server.go) + - path: (pkg/tso/admin.go|pkg/schedule/schedulers/split_bucket.go|server/api/plugin_disable.go|server/api/plugin_disable.go|server/api/operator.go|server/api/region.go|pkg/schedule/schedulers/balance_leader.go|server/api/.*\.go|pkg/replication/replication_mode.go|pkg/storage/endpoint/gc_safe_point.go|server/.*\.go|pkg/schedule/schedulers/.*\.go|pkg/syncer/server.go) linters: - errcheck diff --git a/plugin/scheduler_example/evict_leader.go b/plugin/scheduler_example/evict_leader.go index f761b3812c5..1e26a97e12c 100644 --- a/plugin/scheduler_example/evict_leader.go +++ b/plugin/scheduler_example/evict_leader.go @@ -259,7 +259,7 @@ func (handler *evictLeaderHandler) UpdateConfig(w http.ResponseWriter, r *http.R id = (uint64)(idFloat) if _, exists = handler.config.StoreIDWitRanges[id]; !exists { if err := handler.config.cluster.PauseLeaderTransfer(id); err != nil { - handler.rd.JSON(w, http.StatusInternalServerError, err.Error()) + _ = handler.rd.JSON(w, http.StatusInternalServerError, err.Error()) return } } @@ -273,47 +273,55 @@ func (handler *evictLeaderHandler) UpdateConfig(w http.ResponseWriter, r *http.R args = append(args, handler.config.getRanges(id)...) } - handler.config.BuildWithArgs(args) - err := handler.config.Persist() + err := handler.config.BuildWithArgs(args) if err != nil { - handler.rd.JSON(w, http.StatusInternalServerError, err.Error()) + _ = handler.rd.JSON(w, http.StatusBadRequest, err.Error()) + return } - handler.rd.JSON(w, http.StatusOK, nil) + err = handler.config.Persist() + if err != nil { + _ = handler.rd.JSON(w, http.StatusInternalServerError, err.Error()) + return + } + _ = handler.rd.JSON(w, http.StatusOK, nil) } func (handler *evictLeaderHandler) ListConfig(w http.ResponseWriter, _ *http.Request) { conf := handler.config.Clone() - handler.rd.JSON(w, http.StatusOK, conf) + _ = handler.rd.JSON(w, http.StatusOK, conf) } func (handler *evictLeaderHandler) DeleteConfig(w http.ResponseWriter, r *http.Request) { idStr := mux.Vars(r)["store_id"] id, err := strconv.ParseUint(idStr, 10, 64) if err != nil { - handler.rd.JSON(w, http.StatusBadRequest, err.Error()) + _ = handler.rd.JSON(w, http.StatusBadRequest, err.Error()) return } handler.config.mu.Lock() defer handler.config.mu.Unlock() _, exists := handler.config.StoreIDWitRanges[id] - if exists { - delete(handler.config.StoreIDWitRanges, id) - handler.config.cluster.ResumeLeaderTransfer(id) + if !exists { + _ = handler.rd.JSON(w, http.StatusInternalServerError, errors.New("the config does not exist")) + return + } + delete(handler.config.StoreIDWitRanges, id) + handler.config.cluster.ResumeLeaderTransfer(id) - handler.config.mu.Unlock() - handler.config.Persist() + handler.config.mu.Unlock() + if err := handler.config.Persist(); err != nil { handler.config.mu.Lock() - - var resp any - if len(handler.config.StoreIDWitRanges) == 0 { - resp = noStoreInSchedulerInfo - } - handler.rd.JSON(w, http.StatusOK, resp) + _ = handler.rd.JSON(w, http.StatusInternalServerError, err.Error()) return } + handler.config.mu.Lock() - handler.rd.JSON(w, http.StatusInternalServerError, errors.New("the config does not exist")) + var resp any + if len(handler.config.StoreIDWitRanges) == 0 { + resp = noStoreInSchedulerInfo + } + _ = handler.rd.JSON(w, http.StatusOK, resp) } func newEvictLeaderHandler(config *evictLeaderSchedulerConfig) http.Handler { From df7e371b4d249fb839b5749fab17477d2a0689f1 Mon Sep 17 00:00:00 2001 From: okJiang <819421878@qq.com> Date: Tue, 18 Jun 2024 11:07:17 +0800 Subject: [PATCH 6/7] merge log Signed-off-by: okJiang <819421878@qq.com> --- pkg/tso/allocator_manager.go | 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) diff --git a/pkg/tso/allocator_manager.go b/pkg/tso/allocator_manager.go index 5b36fbabbc9..62a4fb97a57 100644 --- a/pkg/tso/allocator_manager.go +++ b/pkg/tso/allocator_manager.go @@ -663,9 +663,8 @@ func (am *AllocatorManager) campaignAllocatorLeader( defer am.ResetAllocatorGroup(allocator.GetDCLocation()) // Maintain the Local TSO Allocator leader go allocator.KeepAllocatorLeader(ctx) - logger.Info("campaign local tso allocator leader ok") - logger.Info("initialize the local TSO allocator") + logger.Info("Complete campaign local tso allocator leader, begin to initialize the local TSO allocator") if err := allocator.Initialize(int(dcLocationInfo.Suffix)); err != nil { log.Error("failed to initialize the local TSO allocator", errs.ZapError(err)) return From 2c4a20389c3d68880cb81b80fc01fa9237667099 Mon Sep 17 00:00:00 2001 From: okJiang <819421878@qq.com> Date: Wed, 19 Jun 2024 13:00:56 +0800 Subject: [PATCH 7/7] fix comment Signed-off-by: okJiang <819421878@qq.com> --- pkg/schedule/placement/rule.go | 2 ++ 1 file changed, 2 insertions(+) diff --git a/pkg/schedule/placement/rule.go b/pkg/schedule/placement/rule.go index d6df9caa31e..07054b7b1cd 100644 --- a/pkg/schedule/placement/rule.go +++ b/pkg/schedule/placement/rule.go @@ -91,6 +91,8 @@ func (r *Rule) String() string { func (r *Rule) Clone() *Rule { var clone Rule _ = json.Unmarshal([]byte(r.String()), &clone) + clone.StartKey = append(r.StartKey[:0:0], r.StartKey...) + clone.EndKey = append(r.EndKey[:0:0], r.EndKey...) return &clone }