---
# Unit tests for alerting rules, in the format consumed by
# `promtool test rules`.

# Rule files whose alerts are exercised by the tests below.
rule_files:
- mixin.yaml

# How often the rules are evaluated during a test run.
evaluation_interval: 1m

# Each entry under `tests` is an independent scenario with its own input
# series and its own list of alert expectations.
tests:
# Scenario: three `up` series for job "etcd" drop to 0 one after another.
# Samples are 1m apart, so 10.10.10.2 reports 0 from 4m, 10.10.10.1 from 8m
# and 10.10.10.0 from 12m.
- interval: 1m
  input_series:
  - series: 'up{job="etcd",instance="10.10.10.0"}'
    values: '1 1 1 1 1 1 1 1 1 1 1 1 0 0 0 0'
  - series: 'up{job="etcd",instance="10.10.10.1"}'
    values: '1 1 1 1 1 1 1 1 0 0 0 0 0 0 0 0'
  - series: 'up{job="etcd",instance="10.10.10.2"}'
    values: '1 1 1 1 0 0 0 0 0 0 0 0 0 0 0 0'
  alert_rule_test:
  # Entries without `exp_alerts` expect the named alert NOT to be firing
  # at that evaluation time.
  - eval_time: 3m
    alertname: etcdInsufficientMembers
  - eval_time: 5m
    alertname: etcdInsufficientMembers
  - eval_time: 5m
    alertname: etcdMembersDown
  # One member has been reporting 0 since 4m.
  - eval_time: 7m
    alertname: etcdMembersDown
    exp_alerts:
    - exp_labels:
        job: etcd
        severity: critical
      exp_annotations:
        message: 'etcd cluster "etcd": members are down (1).'
  - eval_time: 7m
    alertname: etcdInsufficientMembers
  # Two members have been reporting 0 since 8m; the message carries the
  # number of members still up.
  - eval_time: 11m
    alertname: etcdInsufficientMembers
    exp_alerts:
    - exp_labels:
        job: etcd
        severity: critical
      exp_annotations:
        message: 'etcd cluster "etcd": insufficient members (1).'
  # All three members have been reporting 0 since 12m.
  - eval_time: 15m
    alertname: etcdInsufficientMembers
    exp_alerts:
    - exp_labels:
        job: etcd
        severity: critical
      exp_annotations:
        message: 'etcd cluster "etcd": insufficient members (0).'
# Scenario: same `up` series as a staggered outage, but the series for
# 10.10.10.2 has only eight samples (its last sample is at 7m). At 10m the
# test expects etcdMembersDown to report two members down.
- interval: 1m
  input_series:
  - series: 'up{job="etcd",instance="10.10.10.0"}'
    values: '1 1 1 1 1 1 1 1 1 1 1 1 0 0 0 0'
  - series: 'up{job="etcd",instance="10.10.10.1"}'
    values: '1 1 1 1 1 1 1 1 0 0 0 0 0 0 0 0'
  - series: 'up{job="etcd",instance="10.10.10.2"}'
    values: '1 1 1 1 0 0 0 0'
  alert_rule_test:
  - eval_time: 10m
    alertname: etcdMembersDown
    exp_alerts:
    - exp_labels:
        job: etcd
        severity: critical
      exp_annotations:
        message: 'etcd cluster "etcd": members are down (2).'
# Scenario: two `up` series plus a peer send-failure counter that starts
# increasing at 2m. The expected alert at 6m comes before either `up` series
# reports 0 (8m and 12m), so presumably the failure counter is what triggers
# it -- confirm against the rule definition in mixin.yaml.
- interval: 1m
  input_series:
  - series: 'up{job="etcd",instance="10.10.10.0"}'
    values: '1 1 1 1 1 1 1 1 1 1 1 1 0 0 0 0'
  - series: 'up{job="etcd",instance="10.10.10.1"}'
    values: '1 1 1 1 1 1 1 1 0 0 0 0 0 0 0 0'
  - series: 'etcd_network_peer_sent_failures_total{To="member-1",job="etcd",endpoint="test"}'
    values: '0 0 1 2 3 4 5 6 7 8 9 10'
  alert_rule_test:
  # No `exp_alerts`: the alert is expected not to be firing yet at 4m.
  - eval_time: 4m
    alertname: etcdMembersDown
  - eval_time: 6m
    alertname: etcdMembersDown
    exp_alerts:
    - exp_labels:
        job: etcd
        severity: critical
      exp_annotations:
        message: 'etcd cluster "etcd": members are down (1).'
# Scenario: leader-change counters for three instances of job "etcd".
# At 10m the test expects etcdHighNumberOfLeaderChanges to fire with
# severity "warning" and a message reporting 3 leader changes.
- interval: 1m
  input_series:
  - series: 'etcd_server_leader_changes_seen_total{job="etcd",instance="10.10.10.0"}'
    values: '0 0 2 0 0 1 0 0 0 0 0 0 0 0 0 0'
  - series: 'etcd_server_leader_changes_seen_total{job="etcd",instance="10.10.10.1"}'
    values: '0 0 1 0 0 0 0 0 0 0 0 0 0 0 0 0'
  - series: 'etcd_server_leader_changes_seen_total{job="etcd",instance="10.10.10.2"}'
    values: '0 0 0 0 0 0 0 0'
  alert_rule_test:
  - eval_time: 10m
    alertname: etcdHighNumberOfLeaderChanges
    exp_alerts:
    - exp_labels:
        job: etcd
        severity: warning
      exp_annotations:
        # Kept on one line so the expected annotation matches byte-for-byte.
        message: 'etcd cluster "etcd": 3 leader changes within the last 15 minutes. Frequent elections may be a sign of insufficient resources, high network latency, or disruptions by other components and should be investigated.'
- interval : 1m
input_series :
- series : 'etcd_server_leader_changes_seen_total{job="etcd",instance="10.10.10.0"}'
values : '0 0 2 0 0 0 0 0 0 0 0 0 0 0 0 0'
- series : 'etcd_server_leader_changes_seen_total{job="etcd",instance="10.10.10.1"}'
values : '0 0 1 0 0 0 0 0 0 0 0 0 0 0 0 0'
- series : 'etcd_server_leader_changes_seen_total{job="etcd",instance="10.10.10.2"}'
values : '0 0 0 0 0 0 0 0'
alert_rule_test :
- eval_time : 10m
alertname : etcdHighNumberOfLeaderChanges
exp_alerts :