diff --git a/pkg/statistics/handle/bootstrap.go b/pkg/statistics/handle/bootstrap.go index 8504e18f3e53a..4913153acc475 100644 --- a/pkg/statistics/handle/bootstrap.go +++ b/pkg/statistics/handle/bootstrap.go @@ -363,7 +363,7 @@ func (h *Handle) initStatsHistogramsConcurrency(is infoschema.InfoSchema, cache } func (*Handle) initStatsTopN4Chunk(cache statstypes.StatsCache, iter *chunk.Iterator4Chunk, totalMemory uint64) { - if isFullCache(cache, totalMemory) { + if IsFullCacheFunc(cache, totalMemory) { return } affectedIndexes := make(map[*statistics.Index]struct{}) @@ -458,20 +458,20 @@ func (h *Handle) initStatsTopNByPaging(cache statstypes.StatsCache, task initsta } func (h *Handle) initStatsTopNConcurrency(cache statstypes.StatsCache, totalMemory uint64) error { - if isFullCache(cache, totalMemory) { + if IsFullCacheFunc(cache, totalMemory) { return nil } var maxTid = maxTidRecord.tid.Load() tid := int64(0) ls := initstats.NewRangeWorker("TopN", func(task initstats.Task) error { - if isFullCache(cache, totalMemory) { + if IsFullCacheFunc(cache, totalMemory) { return nil } return h.initStatsTopNByPaging(cache, task, totalMemory) }, uint64(maxTid), uint64(initStatsStep), initStatsPercentageInterval) ls.LoadStats() for tid <= maxTid { - if isFullCache(cache, totalMemory) { + if IsFullCacheFunc(cache, totalMemory) { break } ls.SendTask(initstats.Task{ @@ -620,7 +620,7 @@ func (*Handle) initStatsBuckets4Chunk(cache statstypes.StatsCache, iter *chunk.I } func (h *Handle) initStatsBuckets(cache statstypes.StatsCache, totalMemory uint64) error { - if isFullCache(cache, totalMemory) { + if IsFullCacheFunc(cache, totalMemory) { return nil } if config.GetGlobalConfig().Performance.ConcurrentlyInitStats { @@ -691,13 +691,13 @@ func (h *Handle) initStatsBucketsByPaging(cache statstypes.StatsCache, task init } func (h *Handle) initStatsBucketsConcurrency(cache statstypes.StatsCache, totalMemory uint64) error { - if isFullCache(cache, totalMemory) { + if IsFullCacheFunc(cache, totalMemory) { return nil } var maxTid = maxTidRecord.tid.Load() tid := int64(0) ls := initstats.NewRangeWorker("bucket", func(task initstats.Task) error { - if isFullCache(cache, totalMemory) { + if IsFullCacheFunc(cache, totalMemory) { return nil } return h.initStatsBucketsByPaging(cache, task) @@ -709,7 +709,7 @@ func (h *Handle) initStatsBucketsConcurrency(cache statstypes.StatsCache, totalM EndTid: tid + initStatsStep, }) tid += initStatsStep - if isFullCache(cache, totalMemory) { + if IsFullCacheFunc(cache, totalMemory) { break } } @@ -809,6 +809,9 @@ func (h *Handle) InitStats(ctx context.Context, is infoschema.InfoSchema) (err e return nil } +// IsFullCacheFunc is whether the cache is full or not. but we can only change it when to test +var IsFullCacheFunc func(cache statstypes.StatsCache, total uint64) bool = isFullCache + func isFullCache(cache statstypes.StatsCache, total uint64) bool { memQuota := variable.StatsCacheMemQuota.Load() return (uint64(cache.MemConsumed()) >= total/4) || (cache.MemConsumed() >= memQuota && memQuota != 0) diff --git a/pkg/statistics/handle/handletest/initstats/BUILD.bazel b/pkg/statistics/handle/handletest/initstats/BUILD.bazel new file mode 100644 index 0000000000000..c5c3b99b15a86 --- /dev/null +++ b/pkg/statistics/handle/handletest/initstats/BUILD.bazel @@ -0,0 +1,21 @@ +load("@io_bazel_rules_go//go:def.bzl", "go_test") + +go_test( + name = "initstats_test", + timeout = "short", + srcs = [ + "load_stats_test.go", + "main_test.go", + ], + flaky = True, + deps = [ + "//pkg/config", + "//pkg/parser/model", + "//pkg/statistics/handle", + "//pkg/statistics/handle/types", + "//pkg/testkit", + "//pkg/testkit/testsetup", + "@com_github_stretchr_testify//require", + "@org_uber_go_goleak//:goleak", + ], +) diff --git a/pkg/statistics/handle/handletest/initstats/load_stats_test.go b/pkg/statistics/handle/handletest/initstats/load_stats_test.go new file mode 100644 index 0000000000000..8fcaaa769f602 --- /dev/null +++ b/pkg/statistics/handle/handletest/initstats/load_stats_test.go @@ -0,0 +1,103 @@ +// Copyright 2024 PingCAP, Inc. +// +// Licensed under the Apache License, Version 2.0 (the "License"); +// you may not use this file except in compliance with the License. +// You may obtain a copy of the License at +// +// http://www.apache.org/licenses/LICENSE-2.0 +// +// Unless required by applicable law or agreed to in writing, software +// distributed under the License is distributed on an "AS IS" BASIS, +// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +// See the License for the specific language governing permissions and +// limitations under the License. + +package initstats + +import ( + "context" + "fmt" + "testing" + + "github.com/pingcap/tidb/pkg/config" + "github.com/pingcap/tidb/pkg/parser/model" + "github.com/pingcap/tidb/pkg/statistics/handle" + "github.com/pingcap/tidb/pkg/statistics/handle/types" + "github.com/pingcap/tidb/pkg/testkit" + "github.com/stretchr/testify/require" +) + +func TestConcurrentlyInitStatsWithMemoryLimit(t *testing.T) { + restore := config.RestoreFunc() + defer restore() + config.UpdateGlobal(func(conf *config.Config) { + conf.Performance.LiteInitStats = false + conf.Performance.ConcurrentlyInitStats = true + }) + handle.IsFullCacheFunc = func(cache types.StatsCache, total uint64) bool { + return true + } + testConcurrentlyInitStats(t) +} + +func TestConcurrentlyInitStatsWithoutMemoryLimit(t *testing.T) { + restore := config.RestoreFunc() + defer restore() + config.UpdateGlobal(func(conf *config.Config) { + conf.Performance.LiteInitStats = false + conf.Performance.ConcurrentlyInitStats = true + }) + handle.IsFullCacheFunc = func(cache types.StatsCache, total uint64) bool { + return false + } + testConcurrentlyInitStats(t) +} + +func testConcurrentlyInitStats(t *testing.T) { + store, dom := testkit.CreateMockStoreAndDomain(t) + tk := testkit.NewTestKit(t, store) + tk.MustExec("use test") + tk.MustExec("set global tidb_analyze_column_options='ALL'") + tk.MustExec("create table t1 (a int, b int, c int, primary key(c))") + tk.MustExec("insert into t1 values (1,1,1),(2,2,2),(3,3,3),(4,4,4),(5,5,5),(6,7,8)") + tk.MustExec("analyze table t1") + for i := 2; i < 10; i++ { + tk.MustExec(fmt.Sprintf("create table t%v (a int, b int, c int, primary key(c))", i)) + tk.MustExec(fmt.Sprintf("insert into t%v select * from t1", i)) + tk.MustExec(fmt.Sprintf("analyze table t%v all columns", i)) + } + h := dom.StatsHandle() + is := dom.InfoSchema() + h.Clear() + require.Equal(t, h.MemConsumed(), int64(0)) + require.NoError(t, h.InitStats(context.Background(), is)) + for i := 1; i < 10; i++ { + tbl, err := is.TableByName(context.Background(), model.NewCIStr("test"), model.NewCIStr(fmt.Sprintf("t%v", i))) + require.NoError(t, err) + stats, ok := h.StatsCache.Get(tbl.Meta().ID) + require.True(t, ok) + for _, col := range stats.GetColSlice() { + require.True(t, col.IsAllEvicted()) + require.False(t, col.IsFullLoad()) + } + } + for i := 1; i < 10; i++ { + tk.MustQuery(fmt.Sprintf("explain select * from t%v where a = 1", i)).CheckNotContain("pseudo") + } + for i := 1; i < 10; i++ { + tk.MustQuery(fmt.Sprintf("explain select * from t%v where b = 1", i)).CheckNotContain("pseudo") + } + for i := 1; i < 10; i++ { + tk.MustQuery(fmt.Sprintf("explain select * from t%v where c = 1", i)).CheckNotContain("pseudo") + } + for i := 1; i < 10; i++ { + tbl, err := is.TableByName(context.Background(), model.NewCIStr("test"), model.NewCIStr(fmt.Sprintf("t%v", i))) + require.NoError(t, err) + stats, ok := h.StatsCache.Get(tbl.Meta().ID) + require.True(t, ok) + for _, col := range stats.GetColSlice() { + require.True(t, col.IsFullLoad()) + require.False(t, col.IsAllEvicted()) + } + } +} diff --git a/pkg/statistics/handle/handletest/initstats/main_test.go b/pkg/statistics/handle/handletest/initstats/main_test.go new file mode 100644 index 0000000000000..13d11c7eaef3f --- /dev/null +++ b/pkg/statistics/handle/handletest/initstats/main_test.go @@ -0,0 +1,34 @@ +// Copyright 2024 PingCAP, Inc. +// +// Licensed under the Apache License, Version 2.0 (the "License"); +// you may not use this file except in compliance with the License. +// You may obtain a copy of the License at +// +// http://www.apache.org/licenses/LICENSE-2.0 +// +// Unless required by applicable law or agreed to in writing, software +// distributed under the License is distributed on an "AS IS" BASIS, +// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +// See the License for the specific language governing permissions and +// limitations under the License. + +package initstats + +import ( + "testing" + + "github.com/pingcap/tidb/pkg/testkit/testsetup" + "go.uber.org/goleak" +) + +func TestMain(m *testing.M) { + opts := []goleak.Option{ + goleak.IgnoreTopFunction("github.com/golang/glog.(*fileSink).flushDaemon"), + goleak.IgnoreTopFunction("github.com/bazelbuild/rules_go/go/tools/bzltestutil.RegisterTimeoutHandler.func1"), + goleak.IgnoreTopFunction("github.com/lestrrat-go/httprc.runFetchWorker"), + goleak.IgnoreTopFunction("go.etcd.io/etcd/client/pkg/v3/logutil.(*MergeLogger).outputLoop"), + goleak.IgnoreTopFunction("go.opencensus.io/stats/view.(*worker).start"), + } + testsetup.SetupForCommonTest() + goleak.VerifyTestMain(m, opts...) +}