From 74ad869edc76e3ed2bff51aef54585be8d562264 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Micha=C5=82=20Leszczy=C5=84ski?= <2000michal@wp.pl>
Date: Mon, 11 Mar 2024 00:34:40 +0100
Subject: [PATCH] feat(repair): add MaxRingParallel

MaxRingParallel is a cleaner and more comprehensible way of
calculating max repair parallelism based on Ring replication strategy.
Non-positive replication factors are handled without dividing by zero.
---
 pkg/service/repair/plan.go        |  48 +++++++++++
 pkg/service/repair/repair_test.go | 135 ++++++++++++++++++++++++++++++
 2 files changed, 183 insertions(+)
 create mode 100644 pkg/service/repair/repair_test.go

diff --git a/pkg/service/repair/plan.go b/pkg/service/repair/plan.go
index cd15c8d933..b2d2631bc1 100644
--- a/pkg/service/repair/plan.go
+++ b/pkg/service/repair/plan.go
@@ -320,6 +320,54 @@ func maxRepairRangesInParallel(shards uint, totalMemory int64) Intensity {
 	return NewIntensity(max)
 }
 
+// MaxRingParallel calculates max amount of repair jobs on ring limited to dcs.
+//
+// For SimpleStrategy it is the number of nodes in dcs divided by ring.RF.
+// For NetworkTopologyStrategy it is the minimum, over dcs with a positive
+// replication factor in ring.DCrf, of the DC node count divided by that factor.
+// It returns 1 for any other strategy, when no DC limits the result,
+// and when SimpleStrategy RF is not positive (instead of dividing by zero).
+func MaxRingParallel(ring scyllaclient.Ring, dcs []string) int {
+	repairedDCs := strset.New(dcs...)
+	dcNodeCnt := make(map[string]int)
+	for _, dc := range ring.HostDC {
+		dcNodeCnt[dc]++
+	}
+
+	switch ring.Replication {
+	case scyllaclient.SimpleStrategy:
+		// Guard against integer division by zero on a malformed ring.
+		if ring.RF <= 0 {
+			return 1
+		}
+		repaired := 0
+		for dc, cnt := range dcNodeCnt {
+			if repairedDCs.Has(dc) {
+				repaired += cnt
+			}
+		}
+		return repaired / ring.RF
+	case scyllaclient.NetworkTopologyStrategy:
+		// Sentinel meaning that no repaired DC has limited the result yet.
+		const unlimited = math.MaxInt / 2
+		minDC := unlimited
+		for dc, rf := range ring.DCrf {
+			// Skip DCs with non-positive rf: dividing by zero would panic,
+			// and such a DC is not treated as a limit on parallelism.
+			if rf <= 0 || !repairedDCs.Has(dc) {
+				continue
+			}
+			minDC = min(minDC, dcNodeCnt[dc]/rf)
+		}
+		if minDC == unlimited {
+			return 1
+		}
+		return minDC
+	default:
+		return 1
+	}
+}
+
 // keyspacePlan describes repair schedule and state for keyspace.
 type keyspacePlan struct {
 	Keyspace string
diff --git a/pkg/service/repair/repair_test.go b/pkg/service/repair/repair_test.go
new file mode 100644
index 0000000000..fc59929e2b
--- /dev/null
+++ b/pkg/service/repair/repair_test.go
@@ -0,0 +1,135 @@
+// Copyright (C) 2024 ScyllaDB
+
+package repair_test
+
+import (
+	"fmt"
+	"testing"
+
+	"github.com/scylladb/scylla-manager/v3/pkg/scyllaclient"
+	"github.com/scylladb/scylla-manager/v3/pkg/service/repair"
+)
+
+// TestMaxRingParallel checks MaxRingParallel on a ring of 3 DCs
+// for both replication strategies and various sets of repaired DCs.
+func TestMaxRingParallel(t *testing.T) {
+	hostDC := map[string]string{
+		// dc1 -> 3
+		"h1": "dc1",
+		"h2": "dc1",
+		"h3": "dc1",
+		// dc2 -> 4
+		"h4": "dc2",
+		"h5": "dc2",
+		"h6": "dc2",
+		"h7": "dc2",
+		// dc3 -> 5
+		"h8":  "dc3",
+		"h9":  "dc3",
+		"h10": "dc3",
+		"h11": "dc3",
+		"h12": "dc3",
+	}
+
+	testCases := []struct {
+		Ring     scyllaclient.Ring
+		DCs      []string
+		Expected int
+	}{
+		{
+			Ring: scyllaclient.Ring{
+				HostDC:      hostDC,
+				Replication: scyllaclient.SimpleStrategy,
+				RF:          4,
+			},
+			DCs:      []string{"dc1", "dc2", "dc3"},
+			Expected: 3,
+		},
+		{
+			Ring: scyllaclient.Ring{
+				HostDC:      hostDC,
+				Replication: scyllaclient.SimpleStrategy,
+				RF:          3,
+			},
+			DCs:      []string{"dc1", "dc2"},
+			Expected: 2,
+		},
+		{
+			Ring: scyllaclient.Ring{
+				HostDC:      hostDC,
+				Replication: scyllaclient.NetworkTopologyStrategy,
+				RF:          5,
+				DCrf: map[string]int{
+					"dc1": 1,
+					"dc2": 2,
+					"dc3": 2,
+				},
+			},
+			DCs:      []string{"dc1", "dc2", "dc3"},
+			Expected: 2,
+		},
+		{
+			Ring: scyllaclient.Ring{
+				HostDC:      hostDC,
+				Replication: scyllaclient.NetworkTopologyStrategy,
+				RF:          8,
+				DCrf: map[string]int{
+					"dc1": 1,
+					"dc2": 2,
+					"dc3": 5,
+				},
+			},
+			DCs:      []string{"dc1", "dc2"},
+			Expected: 2,
+		},
+		{
+			Ring: scyllaclient.Ring{
+				HostDC:      hostDC,
+				Replication: scyllaclient.NetworkTopologyStrategy,
+				RF:          4,
+				DCrf: map[string]int{
+					"dc1": 2,
+					"dc2": 1,
+					"dc3": 1,
+				},
+			},
+			DCs:      []string{"dc1", "dc3"},
+			Expected: 1,
+		},
+		{
+			// Zero RF falls back to 1 instead of dividing by zero.
+			Ring: scyllaclient.Ring{
+				HostDC:      hostDC,
+				Replication: scyllaclient.SimpleStrategy,
+				RF:          0,
+			},
+			DCs:      []string{"dc1", "dc2", "dc3"},
+			Expected: 1,
+		},
+		{
+			// DCs with zero rf are skipped, so only dc2 limits the result.
+			Ring: scyllaclient.Ring{
+				HostDC:      hostDC,
+				Replication: scyllaclient.NetworkTopologyStrategy,
+				RF:          2,
+				DCrf: map[string]int{
+					"dc1": 0,
+					"dc2": 2,
+					"dc3": 0,
+				},
+			},
+			DCs:      []string{"dc1", "dc2", "dc3"},
+			Expected: 2,
+		},
+	}
+
+	for i := range testCases {
+		tc := testCases[i]
+		t.Run(fmt.Sprintf("test %d", i), func(t *testing.T) {
+			t.Parallel()
+			if out := repair.MaxRingParallel(tc.Ring, tc.DCs); out != tc.Expected {
+				t.Fatalf("Expected %d, got %d", tc.Expected, out)
+			}
+		})
+	}
+}