Skip to content

Commit

Permalink
cluster,dm: replace ENV_LABELS_ENV in prometheus rules (#1238)
Browse files Browse the repository at this point in the history
  • Loading branch information
9547 authored Mar 24, 2021
1 parent 3fbcafb commit 6721fd0
Show file tree
Hide file tree
Showing 3 changed files with 32 additions and 9 deletions.
14 changes: 8 additions & 6 deletions pkg/cluster/spec/prometheus.go
Original file line number Diff line number Diff line change
Expand Up @@ -290,11 +290,11 @@ func (i *MonitorInstance) InitConfig(
}
}

if err := i.installRules(ctx, e, paths.Deploy, clusterVersion); err != nil {
if err := i.installRules(ctx, e, paths.Deploy, clusterName, clusterVersion); err != nil {
return errors.Annotate(err, "install rules")
}

if err := i.initRules(ctx, e, spec, paths); err != nil {
if err := i.initRules(ctx, e, spec, paths, clusterName); err != nil {
return err
}

Expand All @@ -314,7 +314,7 @@ func (i *MonitorInstance) InitConfig(
// cluster), and the rules for dm cluster is packed in the dm-master component. So if deploying tidb
// cluster, the rules is correct, if deploying dm cluster, we should remove rules for tidb and install
// rules for dm.
func (i *MonitorInstance) installRules(ctx context.Context, e ctxt.Executor, deployDir, clusterVersion string) error {
func (i *MonitorInstance) installRules(ctx context.Context, e ctxt.Executor, deployDir, clusterName, clusterVersion string) error {
if i.topo.Type() != TopoTypeDM {
return nil
}
Expand Down Expand Up @@ -346,16 +346,17 @@ func (i *MonitorInstance) installRules(ctx context.Context, e ctxt.Executor, dep
`find %[1]s -type f -name "*.rules.yml" -delete`,
`find %[2]s/dm-master/conf -type f -name "*.rules.yml" -exec cp {} %[1]s \;`,
"rm -rf %[2]s",
`find %[1]s -maxdepth 1 -type f -name "*.rules.yml" -exec sed -i "s/ENV_LABELS_ENV/%[3]s/g" {} \;`,
}
_, stderr, err = e.Execute(ctx, fmt.Sprintf(strings.Join(cmds, " && "), targetDir, tmp), false)
_, stderr, err = e.Execute(ctx, fmt.Sprintf(strings.Join(cmds, " && "), targetDir, tmp, clusterName), false)
if err != nil {
return errors.Annotatef(err, "stderr: %s", string(stderr))
}

return nil
}

func (i *MonitorInstance) initRules(ctx context.Context, e ctxt.Executor, spec *PrometheusSpec, paths meta.DirPaths) error {
func (i *MonitorInstance) initRules(ctx context.Context, e ctxt.Executor, spec *PrometheusSpec, paths meta.DirPaths, clusterName string) error {
if spec.RuleDir != "" {
return i.TransferLocalConfigDir(ctx, e, spec.RuleDir, path.Join(paths.Deploy, "conf"), func(name string) bool {
return strings.HasSuffix(name, ".rules.yml")
Expand All @@ -367,8 +368,9 @@ func (i *MonitorInstance) initRules(ctx context.Context, e ctxt.Executor, spec *
"mkdir -p %[1]s/conf",
`find %[1]s/conf -type f -name "*.rules.yml" -delete`,
`find %[1]s/bin/prometheus -maxdepth 1 -type f -name "*.rules.yml" -exec cp {} %[1]s/conf/ \;`,
`find %[1]s/conf -maxdepth 1 -type f -name "*.rules.yml" -exec sed -i "s/ENV_LABELS_ENV/%[2]s/g" {} \;`,
}
_, stderr, err := e.Execute(ctx, fmt.Sprintf(strings.Join(cmds, " && "), paths.Deploy), false)
_, stderr, err := e.Execute(ctx, fmt.Sprintf(strings.Join(cmds, " && "), paths.Deploy, clusterName), false)
if err != nil {
return errors.Annotatef(err, "stderr: %s", string(stderr))
}
Expand Down
25 changes: 22 additions & 3 deletions pkg/cluster/spec/prometheus_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -58,7 +58,7 @@ func TestLocalRuleDirs(t *testing.T) {
assert.Nil(t, err)

ctx := checkpoint.NewContext(context.Background())
err = promInstance.initRules(ctx, e, promInstance.InstanceSpec.(*PrometheusSpec), meta.DirPaths{Deploy: deployDir})
err = promInstance.initRules(ctx, e, promInstance.InstanceSpec.(*PrometheusSpec), meta.DirPaths{Deploy: deployDir}, "dummy-cluster")
assert.Nil(t, err)

assert.NoFileExists(t, path.Join(deployDir, "conf", "dummy.rules.yml"))
Expand All @@ -78,7 +78,22 @@ func TestNoLocalRuleDirs(t *testing.T) {
localDir, err := filepath.Abs("./testdata/rules")
assert.Nil(t, err)

err = os.WriteFile(path.Join(deployDir, "bin/prometheus", "dummy.rules.yml"), []byte("dummy"), 0644)
err = os.WriteFile(path.Join(deployDir, "bin/prometheus", "dummy.rules.yml"), []byte(`
groups:
- name: alert.rules
rules:
- alert: TiDB_schema_error
expr: increase(tidb_session_schema_lease_error_total{type="outdated"}[15m]) > 0
for: 1m
labels:
env: ENV_LABELS_ENV
level: emergency
expr: increase(tidb_session_schema_lease_error_total{type="outdated"}[15m]) > 0
annotations:
description: "cluster: ENV_LABELS_ENV, instance: {{ $labels.instance }}, values:{{ $value }}"
value: "{{ $value }}"
summary: TiDB schema error
`), 0644)
assert.Nil(t, err)

topo := new(Specification)
Expand All @@ -99,8 +114,12 @@ func TestNoLocalRuleDirs(t *testing.T) {
assert.Nil(t, err)

ctx := checkpoint.NewContext(context.Background())
err = promInstance.initRules(ctx, e, promInstance.InstanceSpec.(*PrometheusSpec), meta.DirPaths{Deploy: deployDir})
err = promInstance.initRules(ctx, e, promInstance.InstanceSpec.(*PrometheusSpec), meta.DirPaths{Deploy: deployDir}, "dummy-cluster")
assert.Nil(t, err)
body, err := os.ReadFile(path.Join(deployDir, "conf", "dummy.rules.yml"))
assert.Nil(t, err)
assert.Contains(t, string(body), "dummy-cluster")
assert.NotContains(t, string(body), "ENV_LABELS_ENV")

assert.FileExists(t, path.Join(deployDir, "conf", "dummy.rules.yml"))
fs, err := os.ReadDir(localDir)
Expand Down
2 changes: 2 additions & 0 deletions tests/tiup-cluster/test_upgrade_tls.sh
Original file line number Diff line number Diff line change
Expand Up @@ -12,6 +12,8 @@ mkdir -p ~/.tiup/bin && cp -f ./root.json ~/.tiup/bin/
yes | tiup-cluster deploy $name $old_version $topo -i ~/.ssh/id_rsa

yes | tiup-cluster start $name
tiup-cluster exec $name -N n1 --command "grep -q ${name} /home/tidb/deploy/prometheus-9090/conf/*.rules.yml"
! tiup-cluster exec $name -N n1 --command "grep -q ENV_LABELS_ENV /home/tidb/deploy/prometheus-9090/conf/*.rules.yml"

tiup-cluster _test $name writable

Expand Down

0 comments on commit 6721fd0

Please sign in to comment.