From a39c2c92249c62a0ed21115715caa88d5fa51b11 Mon Sep 17 00:00:00 2001 From: Yuanjia Zhang Date: Thu, 10 Aug 2023 18:25:56 +0800 Subject: [PATCH 1/3] This is an automated cherry-pick of #45962 Signed-off-by: ti-chi-bot --- planner/core/planbuilder.go | 2 +- .../handle/handletest/analyze/analyze_test.go | 298 ++++++++++++++++++ 2 files changed, 299 insertions(+), 1 deletion(-) create mode 100644 statistics/handle/handletest/analyze/analyze_test.go diff --git a/planner/core/planbuilder.go b/planner/core/planbuilder.go index 1612cddf41ca2..3e7e8d285c732 100644 --- a/planner/core/planbuilder.go +++ b/planner/core/planbuilder.go @@ -2775,7 +2775,7 @@ var CMSketchSizeLimit = kv.TxnEntrySizeLimit / binary.MaxVarintLen32 var analyzeOptionLimit = map[ast.AnalyzeOptionType]uint64{ ast.AnalyzeOptNumBuckets: 1024, - ast.AnalyzeOptNumTopN: 1024, + ast.AnalyzeOptNumTopN: 16384, ast.AnalyzeOptCMSketchWidth: CMSketchSizeLimit, ast.AnalyzeOptCMSketchDepth: CMSketchSizeLimit, ast.AnalyzeOptNumSamples: 500000, diff --git a/statistics/handle/handletest/analyze/analyze_test.go b/statistics/handle/handletest/analyze/analyze_test.go new file mode 100644 index 0000000000000..9b5514c1b58a4 --- /dev/null +++ b/statistics/handle/handletest/analyze/analyze_test.go @@ -0,0 +1,298 @@ +// Copyright 2023 PingCAP, Inc. +// +// Licensed under the Apache License, Version 2.0 (the "License"); +// you may not use this file except in compliance with the License. +// You may obtain a copy of the License at +// +// http://www.apache.org/licenses/LICENSE-2.0 +// +// Unless required by applicable law or agreed to in writing, software +// distributed under the License is distributed on an "AS IS" BASIS, +// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +// See the License for the specific language governing permissions and +// limitations under the License. + +package analyze + +import ( + "bytes" + "fmt" + "testing" + + "github.com/pingcap/failpoint" + "github.com/pingcap/tidb/config" + "github.com/pingcap/tidb/domain" + "github.com/pingcap/tidb/parser/model" + "github.com/pingcap/tidb/sessionctx/variable" + "github.com/pingcap/tidb/statistics/handle" + "github.com/pingcap/tidb/testkit" + "github.com/stretchr/testify/require" +) + +// nolint:unused +func checkForGlobalStatsWithOpts(t *testing.T, dom *domain.Domain, db, tt, pp string, topn, buckets int) { + tbl, err := dom.InfoSchema().TableByName(model.NewCIStr(db), model.NewCIStr(tt)) + require.NoError(t, err) + + tblInfo := tbl.Meta() + physicalID := tblInfo.ID + if pp != "global" { + for _, def := range tbl.Meta().GetPartitionInfo().Definitions { + if def.Name.L == pp { + physicalID = def.ID + } + } + } + tblStats, err := dom.StatsHandle().TableStatsFromStorage(tblInfo, physicalID, true, 0) + require.NoError(t, err) + + delta := buckets/2 + 10 + for _, idxStats := range tblStats.Indices { + if len(idxStats.Buckets) == 0 { + continue // it's not loaded + } + numTopN := idxStats.TopN.Num() + numBuckets := len(idxStats.Buckets) + // since the hist-building algorithm doesn't stipulate the final bucket number to be equal to the expected number exactly, + // we have to check the results by a range here. + require.Equal(t, topn, numTopN) + require.GreaterOrEqual(t, numBuckets, buckets-delta) + require.LessOrEqual(t, numBuckets, buckets+delta) + } + for _, colStats := range tblStats.Columns { + if len(colStats.Buckets) == 0 { + continue // it's not loaded + } + numTopN := colStats.TopN.Num() + numBuckets := len(colStats.Buckets) + require.Equal(t, topn, numTopN) + require.GreaterOrEqual(t, numBuckets, buckets-delta) + require.LessOrEqual(t, numBuckets, buckets+delta) + } +} + +// nolint:unused +func prepareForGlobalStatsWithOptsV2(t *testing.T, dom *domain.Domain, tk *testkit.TestKit, tblName, dbName string) { + tk.MustExec("create database if not exists " + dbName) + tk.MustExec("use " + dbName) + tk.MustExec("drop table if exists " + tblName) + tk.MustExec(` create table ` + tblName + ` (a int, key(a)) partition by range (a) ` + + `(partition p0 values less than (100000), partition p1 values less than (200000))`) + buf1 := bytes.NewBufferString("insert into " + tblName + " values (0)") + buf2 := bytes.NewBufferString("insert into " + tblName + " values (100000)") + for i := 0; i < 1000; i++ { + buf1.WriteString(fmt.Sprintf(", (%v)", 2)) + buf2.WriteString(fmt.Sprintf(", (%v)", 100002)) + buf1.WriteString(fmt.Sprintf(", (%v)", 1)) + buf2.WriteString(fmt.Sprintf(", (%v)", 100001)) + buf1.WriteString(fmt.Sprintf(", (%v)", 0)) + buf2.WriteString(fmt.Sprintf(", (%v)", 100000)) + } + for i := 0; i < 5000; i += 3 { + buf1.WriteString(fmt.Sprintf(", (%v)", i)) + buf2.WriteString(fmt.Sprintf(", (%v)", 100000+i)) + } + tk.MustExec(buf1.String()) + tk.MustExec(buf2.String()) + tk.MustExec("set @@tidb_analyze_version=2") + tk.MustExec("set @@tidb_partition_prune_mode='dynamic'") + require.NoError(t, dom.StatsHandle().DumpStatsDeltaToKV(handle.DumpAll)) +} + +// nolint:unused +func prepareForGlobalStatsWithOpts(t *testing.T, dom *domain.Domain, tk *testkit.TestKit, tblName, dbName string) { + tk.MustExec("create database if not exists " + dbName) + tk.MustExec("use " + dbName) + tk.MustExec("drop table if exists " + tblName) + tk.MustExec(` create table ` + tblName + ` (a int, key(a)) partition by range (a) ` + + `(partition p0 values less than (100000), partition p1 values less than (200000))`) + buf1 := bytes.NewBufferString("insert into " + tblName + " values (0)") + buf2 := bytes.NewBufferString("insert into " + tblName + " values (100000)") + for i := 0; i < 5000; i += 3 { + buf1.WriteString(fmt.Sprintf(", (%v)", i)) + buf2.WriteString(fmt.Sprintf(", (%v)", 100000+i)) + } + for i := 0; i < 1000; i++ { + buf1.WriteString(fmt.Sprintf(", (%v)", 0)) + buf2.WriteString(fmt.Sprintf(", (%v)", 100000)) + } + tk.MustExec(buf1.String()) + tk.MustExec(buf2.String()) + tk.MustExec("set @@tidb_analyze_version=2") + tk.MustExec("set @@tidb_partition_prune_mode='dynamic'") + require.NoError(t, dom.StatsHandle().DumpStatsDeltaToKV(handle.DumpAll)) +} + +func TestAnalyzeVirtualCol(t *testing.T) { + store := testkit.CreateMockStore(t) + tk := testkit.NewTestKit(t, store) + tk.MustExec("use test") + tk.MustExec("drop table if exists t") + tk.MustExec("create table t(a int, b int generated always as (-a) virtual, c int generated always as (-a) stored, index (c))") + tk.MustExec("insert into t(a) values(2),(1),(1),(3),(NULL)") + tk.MustExec("set @@tidb_analyze_version = 2") + tk.MustExec("analyze table t") + require.Len(t, tk.MustQuery("show stats_histograms where table_name ='t'").Rows(), 3) +} + +func TestAnalyzeGlobalStatsWithOpts1(t *testing.T) { + store, dom := testkit.CreateMockStoreAndDomain(t) + tk := testkit.NewTestKit(t, store) + prepareForGlobalStatsWithOpts(t, dom, tk, "test_gstats_opt", "test_gstats_opt") + + // nolint:unused + type opt struct { + topn int + buckets int + err bool + } + + cases := []opt{ + {1, 37, false}, + {2, 47, false}, + {10, 77, false}, + {77, 219, false}, + {-31, 222, true}, + {10, -77, true}, + {100000, 47, true}, + {77, 47000, true}, + } + for _, ca := range cases { + sql := fmt.Sprintf("analyze table test_gstats_opt with %v topn, %v buckets", ca.topn, ca.buckets) + if !ca.err { + tk.MustExec(sql) + checkForGlobalStatsWithOpts(t, dom, "test_gstats_opt", "test_gstats_opt", "global", ca.topn, ca.buckets) + checkForGlobalStatsWithOpts(t, dom, "test_gstats_opt", "test_gstats_opt", "p0", ca.topn, ca.buckets) + checkForGlobalStatsWithOpts(t, dom, "test_gstats_opt", "test_gstats_opt", "p1", ca.topn, ca.buckets) + } else { + err := tk.ExecToErr(sql) + require.Error(t, err) + } + } +} + +func TestAnalyzeGlobalStatsWithOpts2(t *testing.T) { + store, dom := testkit.CreateMockStoreAndDomain(t) + tk := testkit.NewTestKit(t, store) + originalVal1 := tk.MustQuery("select @@tidb_persist_analyze_options").Rows()[0][0].(string) + defer func() { + tk.MustExec(fmt.Sprintf("set global tidb_persist_analyze_options = %v", originalVal1)) + }() + tk.MustExec("set global tidb_persist_analyze_options=false") + prepareForGlobalStatsWithOptsV2(t, dom, tk, "test_gstats_opt2", "test_gstats_opt2") + + tk.MustExec("analyze table test_gstats_opt2 with 2 topn, 10 buckets, 1000 samples") + checkForGlobalStatsWithOpts(t, dom, "test_gstats_opt2", "test_gstats_opt2", "global", 2, 10) + checkForGlobalStatsWithOpts(t, dom, "test_gstats_opt2", "test_gstats_opt2", "p0", 2, 10) + checkForGlobalStatsWithOpts(t, dom, "test_gstats_opt2", "test_gstats_opt2", "p1", 2, 10) + + // analyze a partition to let its options be different with others' + tk.MustExec("analyze table test_gstats_opt2 partition p0 with 3 topn, 20 buckets") + checkForGlobalStatsWithOpts(t, dom, "test_gstats_opt2", "test_gstats_opt2", "global", 3, 20) // use new options + checkForGlobalStatsWithOpts(t, dom, "test_gstats_opt2", "test_gstats_opt2", "p0", 3, 20) + checkForGlobalStatsWithOpts(t, dom, "test_gstats_opt2", "test_gstats_opt2", "p1", 2, 10) + + tk.MustExec("analyze table test_gstats_opt2 partition p1 with 1 topn, 15 buckets") + checkForGlobalStatsWithOpts(t, dom, "test_gstats_opt2", "test_gstats_opt2", "global", 1, 15) + checkForGlobalStatsWithOpts(t, dom, "test_gstats_opt2", "test_gstats_opt2", "p0", 3, 20) + checkForGlobalStatsWithOpts(t, dom, "test_gstats_opt2", "test_gstats_opt2", "p1", 1, 15) + + tk.MustExec("analyze table test_gstats_opt2 partition p0 with 2 topn, 10 buckets") // change back to 2 topn + checkForGlobalStatsWithOpts(t, dom, "test_gstats_opt2", "test_gstats_opt2", "global", 2, 10) + checkForGlobalStatsWithOpts(t, dom, "test_gstats_opt2", "test_gstats_opt2", "p0", 2, 10) + checkForGlobalStatsWithOpts(t, dom, "test_gstats_opt2", "test_gstats_opt2", "p1", 1, 15) +} + +func TestAnalyzeWithDynamicPartitionPruneMode(t *testing.T) { + store := testkit.CreateMockStore(t) + tk := testkit.NewTestKit(t, store) + tk.MustExec("use test") + tk.MustExec("set @@tidb_partition_prune_mode = '" + string(variable.Dynamic) + "'") + tk.MustExec("set @@tidb_analyze_version = 2") + tk.MustExec(`create table t (a int, key(a)) partition by range(a) + (partition p0 values less than (10), + partition p1 values less than (22))`) + tk.MustExec(`insert into t values (1), (2), (3), (10), (11)`) + tk.MustExec(`analyze table t with 1 topn, 2 buckets`) + rows := tk.MustQuery("show stats_buckets where partition_name = 'global' and is_index=1").Rows() + require.Len(t, rows, 2) + require.Equal(t, "4", rows[1][6]) + tk.MustExec("insert into t values (1), (2), (2)") + tk.MustExec("analyze table t partition p0 with 1 topn, 2 buckets") + rows = tk.MustQuery("show stats_buckets where partition_name = 'global' and is_index=1").Rows() + require.Len(t, rows, 2) + require.Equal(t, "5", rows[1][6]) + tk.MustExec("insert into t values (3)") + tk.MustExec("analyze table t partition p0 index a with 1 topn, 2 buckets") + rows = tk.MustQuery("show stats_buckets where partition_name = 'global' and is_index=1").Rows() + require.Len(t, rows, 1) + require.Equal(t, "6", rows[0][6]) +} + +func TestFMSWithAnalyzePartition(t *testing.T) { + store := testkit.CreateMockStore(t) + tk := testkit.NewTestKit(t, store) + tk.MustExec("use test") + tk.MustExec("set @@tidb_partition_prune_mode = '" + string(variable.Dynamic) + "'") + tk.MustExec("set @@tidb_analyze_version = 2") + tk.MustExec(`create table t (a int, key(a)) partition by range(a) + (partition p0 values less than (10), + partition p1 values less than (22))`) + tk.MustExec(`insert into t values (1), (2), (3), (10), (11)`) + tk.MustQuery("select count(*) from mysql.stats_fm_sketch").Check(testkit.Rows("0")) + tk.MustExec("analyze table t partition p0 with 1 topn, 2 buckets") + tk.MustQuery("show warnings").Sort().Check(testkit.Rows( + "Note 1105 Analyze use auto adjusted sample rate 1.000000 for table test.t's partition p0, reason to use this rate is \"use min(1, 110000/10000) as the sample-rate=1\"", + "Warning 1105 Ignore columns and options when analyze partition in dynamic mode", + "Warning 8131 Build global-level stats failed due to missing partition-level stats: table `t` partition `p1`", + "Warning 8131 Build global-level stats failed due to missing partition-level stats: table `t` partition `p1`", + )) + tk.MustQuery("select count(*) from mysql.stats_fm_sketch").Check(testkit.Rows("2")) +} + +func TestFastAnalyzeColumnHistWithNullValue(t *testing.T) { + store := testkit.CreateMockStore(t) + testKit := testkit.NewTestKit(t, store) + testKit.MustExec("use test") + testKit.MustExec("drop table if exists t") + testKit.MustExec("create table t (a int)") + testKit.MustExec("insert into t values (1), (2), (3), (4), (NULL)") + testKit.MustExec("set @@session.tidb_analyze_version = 1") + testKit.MustExec("set @@tidb_enable_fast_analyze=1") + defer testKit.MustExec("set @@tidb_enable_fast_analyze=0") + testKit.MustExec("analyze table t with 0 topn, 2 buckets") + // If NULL is in hist, the min(lower_bound) will be "". + testKit.MustQuery("select min(lower_bound) from mysql.stats_buckets").Check(testkit.Rows("1")) +} + +func TestAnalyzeIncrementalEvictedIndex(t *testing.T) { + t.Skip("now we don't support to evict index") + restore := config.RestoreFunc() + defer restore() + config.UpdateGlobal(func(conf *config.Config) { + conf.Performance.EnableStatsCacheMemQuota = true + }) + store, dom := testkit.CreateMockStoreAndDomain(t) + tk := testkit.NewTestKit(t, store) + tk.MustExec("set @@tidb_analyze_version = 1") + tk.MustExec("use test") + tk.MustExec("drop table if exists t") + tk.MustExec("create table t(a int, b varchar(10), index idx_b (b))") + tk.MustExec("analyze table test.t") + tbl, err := dom.InfoSchema().TableByName(model.NewCIStr("test"), model.NewCIStr("t")) + require.Nil(t, err) + tblStats := domain.GetDomain(tk.Session()).StatsHandle().GetTableStats(tbl.Meta()) + for _, index := range tblStats.Indices { + require.False(t, index.IsEvicted()) + } + + domain.GetDomain(tk.Session()).StatsHandle().SetStatsCacheCapacity(1) + tblStats = domain.GetDomain(tk.Session()).StatsHandle().GetTableStats(tbl.Meta()) + for _, index := range tblStats.Indices { + require.True(t, index.IsEvicted()) + } + + require.Nil(t, failpoint.Enable("github.com/pingcap/tidb/executor/assertEvictIndex", `return(true)`)) + tk.MustExec("analyze incremental table test.t index idx_b") + require.Nil(t, failpoint.Disable("github.com/pingcap/tidb/executor/assertEvictIndex")) +} From 6f6f78a3d7b57477278db9edcef0ce3e9b9d8a73 Mon Sep 17 00:00:00 2001 From: qw4990 Date: Thu, 17 Aug 2023 12:14:19 +0800 Subject: [PATCH 2/3] update readme --- .../handle/handletest/analyze/analyze_test.go | 298 ------------------ 1 file changed, 298 deletions(-) delete mode 100644 statistics/handle/handletest/analyze/analyze_test.go diff --git a/statistics/handle/handletest/analyze/analyze_test.go b/statistics/handle/handletest/analyze/analyze_test.go deleted file mode 100644 index 9b5514c1b58a4..0000000000000 --- a/statistics/handle/handletest/analyze/analyze_test.go +++ /dev/null @@ -1,298 +0,0 @@ -// Copyright 2023 PingCAP, Inc. -// -// Licensed under the Apache License, Version 2.0 (the "License"); -// you may not use this file except in compliance with the License. -// You may obtain a copy of the License at -// -// http://www.apache.org/licenses/LICENSE-2.0 -// -// Unless required by applicable law or agreed to in writing, software -// distributed under the License is distributed on an "AS IS" BASIS, -// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -// See the License for the specific language governing permissions and -// limitations under the License. - -package analyze - -import ( - "bytes" - "fmt" - "testing" - - "github.com/pingcap/failpoint" - "github.com/pingcap/tidb/config" - "github.com/pingcap/tidb/domain" - "github.com/pingcap/tidb/parser/model" - "github.com/pingcap/tidb/sessionctx/variable" - "github.com/pingcap/tidb/statistics/handle" - "github.com/pingcap/tidb/testkit" - "github.com/stretchr/testify/require" -) - -// nolint:unused -func checkForGlobalStatsWithOpts(t *testing.T, dom *domain.Domain, db, tt, pp string, topn, buckets int) { - tbl, err := dom.InfoSchema().TableByName(model.NewCIStr(db), model.NewCIStr(tt)) - require.NoError(t, err) - - tblInfo := tbl.Meta() - physicalID := tblInfo.ID - if pp != "global" { - for _, def := range tbl.Meta().GetPartitionInfo().Definitions { - if def.Name.L == pp { - physicalID = def.ID - } - } - } - tblStats, err := dom.StatsHandle().TableStatsFromStorage(tblInfo, physicalID, true, 0) - require.NoError(t, err) - - delta := buckets/2 + 10 - for _, idxStats := range tblStats.Indices { - if len(idxStats.Buckets) == 0 { - continue // it's not loaded - } - numTopN := idxStats.TopN.Num() - numBuckets := len(idxStats.Buckets) - // since the hist-building algorithm doesn't stipulate the final bucket number to be equal to the expected number exactly, - // we have to check the results by a range here. - require.Equal(t, topn, numTopN) - require.GreaterOrEqual(t, numBuckets, buckets-delta) - require.LessOrEqual(t, numBuckets, buckets+delta) - } - for _, colStats := range tblStats.Columns { - if len(colStats.Buckets) == 0 { - continue // it's not loaded - } - numTopN := colStats.TopN.Num() - numBuckets := len(colStats.Buckets) - require.Equal(t, topn, numTopN) - require.GreaterOrEqual(t, numBuckets, buckets-delta) - require.LessOrEqual(t, numBuckets, buckets+delta) - } -} - -// nolint:unused -func prepareForGlobalStatsWithOptsV2(t *testing.T, dom *domain.Domain, tk *testkit.TestKit, tblName, dbName string) { - tk.MustExec("create database if not exists " + dbName) - tk.MustExec("use " + dbName) - tk.MustExec("drop table if exists " + tblName) - tk.MustExec(` create table ` + tblName + ` (a int, key(a)) partition by range (a) ` + - `(partition p0 values less than (100000), partition p1 values less than (200000))`) - buf1 := bytes.NewBufferString("insert into " + tblName + " values (0)") - buf2 := bytes.NewBufferString("insert into " + tblName + " values (100000)") - for i := 0; i < 1000; i++ { - buf1.WriteString(fmt.Sprintf(", (%v)", 2)) - buf2.WriteString(fmt.Sprintf(", (%v)", 100002)) - buf1.WriteString(fmt.Sprintf(", (%v)", 1)) - buf2.WriteString(fmt.Sprintf(", (%v)", 100001)) - buf1.WriteString(fmt.Sprintf(", (%v)", 0)) - buf2.WriteString(fmt.Sprintf(", (%v)", 100000)) - } - for i := 0; i < 5000; i += 3 { - buf1.WriteString(fmt.Sprintf(", (%v)", i)) - buf2.WriteString(fmt.Sprintf(", (%v)", 100000+i)) - } - tk.MustExec(buf1.String()) - tk.MustExec(buf2.String()) - tk.MustExec("set @@tidb_analyze_version=2") - tk.MustExec("set @@tidb_partition_prune_mode='dynamic'") - require.NoError(t, dom.StatsHandle().DumpStatsDeltaToKV(handle.DumpAll)) -} - -// nolint:unused -func prepareForGlobalStatsWithOpts(t *testing.T, dom *domain.Domain, tk *testkit.TestKit, tblName, dbName string) { - tk.MustExec("create database if not exists " + dbName) - tk.MustExec("use " + dbName) - tk.MustExec("drop table if exists " + tblName) - tk.MustExec(` create table ` + tblName + ` (a int, key(a)) partition by range (a) ` + - `(partition p0 values less than (100000), partition p1 values less than (200000))`) - buf1 := bytes.NewBufferString("insert into " + tblName + " values (0)") - buf2 := bytes.NewBufferString("insert into " + tblName + " values (100000)") - for i := 0; i < 5000; i += 3 { - buf1.WriteString(fmt.Sprintf(", (%v)", i)) - buf2.WriteString(fmt.Sprintf(", (%v)", 100000+i)) - } - for i := 0; i < 1000; i++ { - buf1.WriteString(fmt.Sprintf(", (%v)", 0)) - buf2.WriteString(fmt.Sprintf(", (%v)", 100000)) - } - tk.MustExec(buf1.String()) - tk.MustExec(buf2.String()) - tk.MustExec("set @@tidb_analyze_version=2") - tk.MustExec("set @@tidb_partition_prune_mode='dynamic'") - require.NoError(t, dom.StatsHandle().DumpStatsDeltaToKV(handle.DumpAll)) -} - -func TestAnalyzeVirtualCol(t *testing.T) { - store := testkit.CreateMockStore(t) - tk := testkit.NewTestKit(t, store) - tk.MustExec("use test") - tk.MustExec("drop table if exists t") - tk.MustExec("create table t(a int, b int generated always as (-a) virtual, c int generated always as (-a) stored, index (c))") - tk.MustExec("insert into t(a) values(2),(1),(1),(3),(NULL)") - tk.MustExec("set @@tidb_analyze_version = 2") - tk.MustExec("analyze table t") - require.Len(t, tk.MustQuery("show stats_histograms where table_name ='t'").Rows(), 3) -} - -func TestAnalyzeGlobalStatsWithOpts1(t *testing.T) { - store, dom := testkit.CreateMockStoreAndDomain(t) - tk := testkit.NewTestKit(t, store) - prepareForGlobalStatsWithOpts(t, dom, tk, "test_gstats_opt", "test_gstats_opt") - - // nolint:unused - type opt struct { - topn int - buckets int - err bool - } - - cases := []opt{ - {1, 37, false}, - {2, 47, false}, - {10, 77, false}, - {77, 219, false}, - {-31, 222, true}, - {10, -77, true}, - {100000, 47, true}, - {77, 47000, true}, - } - for _, ca := range cases { - sql := fmt.Sprintf("analyze table test_gstats_opt with %v topn, %v buckets", ca.topn, ca.buckets) - if !ca.err { - tk.MustExec(sql) - checkForGlobalStatsWithOpts(t, dom, "test_gstats_opt", "test_gstats_opt", "global", ca.topn, ca.buckets) - checkForGlobalStatsWithOpts(t, dom, "test_gstats_opt", "test_gstats_opt", "p0", ca.topn, ca.buckets) - checkForGlobalStatsWithOpts(t, dom, "test_gstats_opt", "test_gstats_opt", "p1", ca.topn, ca.buckets) - } else { - err := tk.ExecToErr(sql) - require.Error(t, err) - } - } -} - -func TestAnalyzeGlobalStatsWithOpts2(t *testing.T) { - store, dom := testkit.CreateMockStoreAndDomain(t) - tk := testkit.NewTestKit(t, store) - originalVal1 := tk.MustQuery("select @@tidb_persist_analyze_options").Rows()[0][0].(string) - defer func() { - tk.MustExec(fmt.Sprintf("set global tidb_persist_analyze_options = %v", originalVal1)) - }() - tk.MustExec("set global tidb_persist_analyze_options=false") - prepareForGlobalStatsWithOptsV2(t, dom, tk, "test_gstats_opt2", "test_gstats_opt2") - - tk.MustExec("analyze table test_gstats_opt2 with 2 topn, 10 buckets, 1000 samples") - checkForGlobalStatsWithOpts(t, dom, "test_gstats_opt2", "test_gstats_opt2", "global", 2, 10) - checkForGlobalStatsWithOpts(t, dom, "test_gstats_opt2", "test_gstats_opt2", "p0", 2, 10) - checkForGlobalStatsWithOpts(t, dom, "test_gstats_opt2", "test_gstats_opt2", "p1", 2, 10) - - // analyze a partition to let its options be different with others' - tk.MustExec("analyze table test_gstats_opt2 partition p0 with 3 topn, 20 buckets") - checkForGlobalStatsWithOpts(t, dom, "test_gstats_opt2", "test_gstats_opt2", "global", 3, 20) // use new options - checkForGlobalStatsWithOpts(t, dom, "test_gstats_opt2", "test_gstats_opt2", "p0", 3, 20) - checkForGlobalStatsWithOpts(t, dom, "test_gstats_opt2", "test_gstats_opt2", "p1", 2, 10) - - tk.MustExec("analyze table test_gstats_opt2 partition p1 with 1 topn, 15 buckets") - checkForGlobalStatsWithOpts(t, dom, "test_gstats_opt2", "test_gstats_opt2", "global", 1, 15) - checkForGlobalStatsWithOpts(t, dom, "test_gstats_opt2", "test_gstats_opt2", "p0", 3, 20) - checkForGlobalStatsWithOpts(t, dom, "test_gstats_opt2", "test_gstats_opt2", "p1", 1, 15) - - tk.MustExec("analyze table test_gstats_opt2 partition p0 with 2 topn, 10 buckets") // change back to 2 topn - checkForGlobalStatsWithOpts(t, dom, "test_gstats_opt2", "test_gstats_opt2", "global", 2, 10) - checkForGlobalStatsWithOpts(t, dom, "test_gstats_opt2", "test_gstats_opt2", "p0", 2, 10) - checkForGlobalStatsWithOpts(t, dom, "test_gstats_opt2", "test_gstats_opt2", "p1", 1, 15) -} - -func TestAnalyzeWithDynamicPartitionPruneMode(t *testing.T) { - store := testkit.CreateMockStore(t) - tk := testkit.NewTestKit(t, store) - tk.MustExec("use test") - tk.MustExec("set @@tidb_partition_prune_mode = '" + string(variable.Dynamic) + "'") - tk.MustExec("set @@tidb_analyze_version = 2") - tk.MustExec(`create table t (a int, key(a)) partition by range(a) - (partition p0 values less than (10), - partition p1 values less than (22))`) - tk.MustExec(`insert into t values (1), (2), (3), (10), (11)`) - tk.MustExec(`analyze table t with 1 topn, 2 buckets`) - rows := tk.MustQuery("show stats_buckets where partition_name = 'global' and is_index=1").Rows() - require.Len(t, rows, 2) - require.Equal(t, "4", rows[1][6]) - tk.MustExec("insert into t values (1), (2), (2)") - tk.MustExec("analyze table t partition p0 with 1 topn, 2 buckets") - rows = tk.MustQuery("show stats_buckets where partition_name = 'global' and is_index=1").Rows() - require.Len(t, rows, 2) - require.Equal(t, "5", rows[1][6]) - tk.MustExec("insert into t values (3)") - tk.MustExec("analyze table t partition p0 index a with 1 topn, 2 buckets") - rows = tk.MustQuery("show stats_buckets where partition_name = 'global' and is_index=1").Rows() - require.Len(t, rows, 1) - require.Equal(t, "6", rows[0][6]) -} - -func TestFMSWithAnalyzePartition(t *testing.T) { - store := testkit.CreateMockStore(t) - tk := testkit.NewTestKit(t, store) - tk.MustExec("use test") - tk.MustExec("set @@tidb_partition_prune_mode = '" + string(variable.Dynamic) + "'") - tk.MustExec("set @@tidb_analyze_version = 2") - tk.MustExec(`create table t (a int, key(a)) partition by range(a) - (partition p0 values less than (10), - partition p1 values less than (22))`) - tk.MustExec(`insert into t values (1), (2), (3), (10), (11)`) - tk.MustQuery("select count(*) from mysql.stats_fm_sketch").Check(testkit.Rows("0")) - tk.MustExec("analyze table t partition p0 with 1 topn, 2 buckets") - tk.MustQuery("show warnings").Sort().Check(testkit.Rows( - "Note 1105 Analyze use auto adjusted sample rate 1.000000 for table test.t's partition p0, reason to use this rate is \"use min(1, 110000/10000) as the sample-rate=1\"", - "Warning 1105 Ignore columns and options when analyze partition in dynamic mode", - "Warning 8131 Build global-level stats failed due to missing partition-level stats: table `t` partition `p1`", - "Warning 8131 Build global-level stats failed due to missing partition-level stats: table `t` partition `p1`", - )) - tk.MustQuery("select count(*) from mysql.stats_fm_sketch").Check(testkit.Rows("2")) -} - -func TestFastAnalyzeColumnHistWithNullValue(t *testing.T) { - store := testkit.CreateMockStore(t) - testKit := testkit.NewTestKit(t, store) - testKit.MustExec("use test") - testKit.MustExec("drop table if exists t") - testKit.MustExec("create table t (a int)") - testKit.MustExec("insert into t values (1), (2), (3), (4), (NULL)") - testKit.MustExec("set @@session.tidb_analyze_version = 1") - testKit.MustExec("set @@tidb_enable_fast_analyze=1") - defer testKit.MustExec("set @@tidb_enable_fast_analyze=0") - testKit.MustExec("analyze table t with 0 topn, 2 buckets") - // If NULL is in hist, the min(lower_bound) will be "". - testKit.MustQuery("select min(lower_bound) from mysql.stats_buckets").Check(testkit.Rows("1")) -} - -func TestAnalyzeIncrementalEvictedIndex(t *testing.T) { - t.Skip("now we don't support to evict index") - restore := config.RestoreFunc() - defer restore() - config.UpdateGlobal(func(conf *config.Config) { - conf.Performance.EnableStatsCacheMemQuota = true - }) - store, dom := testkit.CreateMockStoreAndDomain(t) - tk := testkit.NewTestKit(t, store) - tk.MustExec("set @@tidb_analyze_version = 1") - tk.MustExec("use test") - tk.MustExec("drop table if exists t") - tk.MustExec("create table t(a int, b varchar(10), index idx_b (b))") - tk.MustExec("analyze table test.t") - tbl, err := dom.InfoSchema().TableByName(model.NewCIStr("test"), model.NewCIStr("t")) - require.Nil(t, err) - tblStats := domain.GetDomain(tk.Session()).StatsHandle().GetTableStats(tbl.Meta()) - for _, index := range tblStats.Indices { - require.False(t, index.IsEvicted()) - } - - domain.GetDomain(tk.Session()).StatsHandle().SetStatsCacheCapacity(1) - tblStats = domain.GetDomain(tk.Session()).StatsHandle().GetTableStats(tbl.Meta()) - for _, index := range tblStats.Indices { - require.True(t, index.IsEvicted()) - } - - require.Nil(t, failpoint.Enable("github.com/pingcap/tidb/executor/assertEvictIndex", `return(true)`)) - tk.MustExec("analyze incremental table test.t index idx_b") - require.Nil(t, failpoint.Disable("github.com/pingcap/tidb/executor/assertEvictIndex")) -} From 1d954c36e735c5c8411722725d8a56dd876332ed Mon Sep 17 00:00:00 2001 From: qw4990 Date: Thu, 17 Aug 2023 12:15:02 +0800 Subject: [PATCH 3/3] update readme --- statistics/handle/handle_test.go | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/statistics/handle/handle_test.go b/statistics/handle/handle_test.go index 0a9363f626ce8..41ab5b9f49918 100644 --- a/statistics/handle/handle_test.go +++ b/statistics/handle/handle_test.go @@ -1002,7 +1002,7 @@ func TestAnalyzeGlobalStatsWithOpts1(t *testing.T) { {77, 219, false}, {-31, 222, true}, {10, -77, true}, - {10000, 47, true}, + {100000, 47, true}, {77, 47000, true}, } for _, ca := range cases {