forked from prometheus/mysqld_exporter
-
Notifications
You must be signed in to change notification settings - Fork 43
/
Copy pathexample.rules
123 lines (108 loc) · 3.83 KB
/
example.rules
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
###
# Sample prometheus rules/alerts for mysqld.
#
# NOTE: Please review these carefully as thresholds and behavior may not meet
# your SLOs or labels.
#
###
# Recording Rules
# Recording rule: pre-compute replication lag as
# `mysql_slave_status_seconds_behind_master` minus
# `mysql_slave_status_sql_delay`, so the SQL delay is taken into account.
mysql_slave_lag_seconds =
  mysql_slave_status_seconds_behind_master - mysql_slave_status_sql_delay
# Recording rule: slave lag via the heartbeat method, i.e. the difference
# between the heartbeat "now" timestamp and the stored heartbeat timestamp.
mysql_heartbeat_lag_seconds =
  mysql_heartbeat_now_timestamp_seconds - mysql_heartbeat_stored_timestamp_seconds
# Recording rule: "Transactions per second" - the 5m rate of commit and
# rollback commands, summed with the `command` label removed (all other
# labels are kept).
# See: https://dev.mysql.com/doc/refman/5.7/en/glossary.html#glos_transaction
job:mysql_transactions:rate5m =
  sum(
    rate(mysql_global_status_commands_total{command=~"(commit|rollback)"}[5m])
  ) without (command)
###
# Galera Alerts
# Alert: a Galera node has reported wsrep_ready != 1 (not "ready") for
# 5 minutes.
ALERT MySQLGaleraNotReady
  IF mysql_global_status_wsrep_ready != 1
  FOR 5m
  LABELS { severity = "warning" }
  ANNOTATIONS {
    summary = "Galera cluster node not ready",
    description = "{{$labels.job}} on {{$labels.instance}} is not ready.",
  }
# Alert: Galera node state is not synced (wsrep_local_state != 4) while
# wsrep_desync is 0, for 5 minutes.
# The local-state comparison is the left operand of AND, so {{$value}} in the
# description is the node's current local state.
ALERT MySQLGaleraOutOfSync
  IF (
    mysql_global_status_wsrep_local_state != 4
    AND
    mysql_global_variables_wsrep_desync == 0
  )
  FOR 5m
  LABELS { severity = "warning" }
  ANNOTATIONS {
    summary = "Galera cluster node out of sync",
    description = "{{$labels.job}} on {{$labels.instance}} is not in sync ({{$value}} != 4).",
  }
# Alert: Galera node is in "donor" state (wsrep_local_state == 2) and is
# behind applying transactions (receive queue > 100) for 5 minutes.
#
# Operand order matters: `A AND B` yields the samples of A, so the receive
# queue comparison must be on the left for {{$value}} in the description to be
# the queue size. With the state check on the left, {{$value}} would always
# render as the state code 2. The set of series that fire is the same either
# way.
ALERT MySQLGaleraDonorFallingBehind
  IF (
    mysql_global_status_wsrep_local_recv_queue > 100
    AND
    mysql_global_status_wsrep_local_state == 2
  )
  FOR 5m
  LABELS {
    severity = "warning"
  }
  ANNOTATIONS {
    summary = "xtradb cluster donor node falling behind",
    description = "{{$labels.job}} on {{$labels.instance}} is a donor (hotbackup) and is falling behind (queue size {{$value}}).",
  }
###
# Replication Alerts
# Alert: the replication IO thread or the replication SQL thread has been
# reported as not running (== 0) for 2 minutes.
ALERT MySQLReplicationNotRunning
  IF
      mysql_slave_status_slave_io_running == 0
    OR
      mysql_slave_status_slave_sql_running == 0
  FOR 2m
  LABELS { severity = "critical" }
  ANNOTATIONS {
    summary = "Slave replication is not running",
    description = "Slave replication (IO or SQL) has been down for more than 2 minutes.",
  }
# Alert: the replication lag is above 30 seconds and, extrapolating the last
# 5 minutes, is predicted to still be above zero 2 minutes from now. The
# 30 second threshold allows for a small amount of replication lag.
# Both conditions are matched per `instance` and must hold for 1 minute.
# NOTE: This alert depends on the `mysql_slave_lag_seconds` recording rule at
# the top of the file.
ALERT MySQLReplicationLag
  IF
      (mysql_slave_lag_seconds > 30)
    AND on (instance)
      (predict_linear(mysql_slave_lag_seconds[5m], 60*2) > 0)
  FOR 1m
  LABELS { severity = "critical" }
  ANNOTATIONS {
    summary = "MySQL slave replication is lagging",
    description = "The mysql slave replication has fallen behind and is not recovering",
  }
# Alert (heartbeat variant): the heartbeat-measured replication lag is above
# 30 seconds and, extrapolating the last 5 minutes, is predicted to still be
# above zero 2 minutes from now. The 30 second threshold allows for a small
# amount of replication lag.
# Both conditions are matched per `instance` and must hold for 1 minute.
# NOTE: This alert depends on the `mysql_heartbeat_lag_seconds` recording rule
# at the top of the file.
# NOTE(review): this rule reuses the alert name MySQLReplicationLag from the
# `mysql_slave_lag_seconds` based rule - confirm that sharing one alert name
# is intended.
ALERT MySQLReplicationLag
  IF
      (mysql_heartbeat_lag_seconds > 30)
    AND on (instance)
      (predict_linear(mysql_heartbeat_lag_seconds[5m], 60*2) > 0)
  FOR 1m
  LABELS { severity = "critical" }
  ANNOTATIONS {
    summary = "MySQL slave replication is lagging",
    description = "The mysql slave replication has fallen behind and is not recovering",
  }
###
# Performance Alerts
# Alert: InnoDB log writes are stalling - the per-second rate of
# `mysql_global_status_innodb_log_waits` over the last 15 minutes exceeds 10.
# This rule has no FOR clause.
ALERT MySQLInnoDBLogWaits
  IF rate(mysql_global_status_innodb_log_waits[15m]) > 10
  LABELS { severity = "warning" }
  ANNOTATIONS {
    summary = "MySQL innodb log writes stalling",
    description = "The innodb logs are waiting for disk at a rate of {{$value}} / second",
  }