Merge pull request #11768 from brancz/uid

Use UID instead of ID in Grafana dashboard
This commit is contained in:
Brandon Philips 2020-04-29 05:35:06 -07:00 committed by GitHub
commit 1044a8b07c
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
3 changed files with 24 additions and 8 deletions

View File

@@ -217,7 +217,7 @@
grafanaDashboards+:: { grafanaDashboards+:: {
'etcd.json': { 'etcd.json': {
id: 6, uid: std.md5('etcd.json'),
title: 'etcd', title: 'etcd',
description: 'etcd sample Grafana dashboard with Prometheus', description: 'etcd sample Grafana dashboard with Prometheus',
tags: [], tags: [],
@@ -516,7 +516,7 @@
stack: false, stack: false,
steppedLine: false, steppedLine: false,
targets: [{ targets: [{
expr: 'etcd_debugging_mvcc_db_total_size_in_bytes{job="$cluster"}', expr: 'etcd_mvcc_db_total_size_in_bytes{job="$cluster"}',
hide: false, hide: false,
interval: '', interval: '',
intervalFactor: 2, intervalFactor: 2,

View File

@@ -2,6 +2,21 @@
groups: groups:
- name: etcd - name: etcd
rules: rules:
- alert: etcdMembersDown
annotations:
message: 'etcd cluster "{{ $labels.job }}": members are down ({{ $value }}).'
expr: |
max by (job) (
sum by (job) (up{job=~".*etcd.*"} == bool 0)
or
count by (job,endpoint) (
sum by (job,endpoint,To) (rate(etcd_network_peer_sent_failures_total{job=~".*etcd.*"}[3m])) > 0.01
)
)
> 0
for: 3m
labels:
severity: critical
- alert: etcdInsufficientMembers - alert: etcdInsufficientMembers
annotations: annotations:
message: 'etcd cluster "{{ $labels.job }}": insufficient members ({{ $value message: 'etcd cluster "{{ $labels.job }}": insufficient members ({{ $value
@@ -22,11 +37,12 @@ groups:
severity: critical severity: critical
- alert: etcdHighNumberOfLeaderChanges - alert: etcdHighNumberOfLeaderChanges
annotations: annotations:
message: 'etcd cluster "{{ $labels.job }}": instance {{ $labels.instance }} message: 'etcd cluster "{{ $labels.job }}": {{ $value }} leader changes within
has seen {{ $value }} leader changes within the last hour.' the last 15 minutes. Frequent elections may be a sign of insufficient resources,
high network latency, or disruptions by other components and should be investigated.'
expr: | expr: |
rate(etcd_server_leader_changes_seen_total{job=~".*etcd.*"}[15m]) > 3 increase((max by (job) (etcd_server_leader_changes_seen_total{job=~".*etcd.*"}) or 0*absent(etcd_server_leader_changes_seen_total{job=~".*etcd.*"}))[15m:1m]) >= 3
for: 15m for: 5m
labels: labels:
severity: warning severity: warning
- alert: etcdHighNumberOfFailedGRPCRequests - alert: etcdHighNumberOfFailedGRPCRequests
@@ -76,7 +92,7 @@ groups:
- alert: etcdHighNumberOfFailedProposals - alert: etcdHighNumberOfFailedProposals
annotations: annotations:
message: 'etcd cluster "{{ $labels.job }}": {{ $value }} proposal failures within message: 'etcd cluster "{{ $labels.job }}": {{ $value }} proposal failures within
the last hour on etcd instance {{ $labels.instance }}.' the last 30 minutes on etcd instance {{ $labels.instance }}.'
expr: | expr: |
rate(etcd_server_proposals_failed_total{job=~".*etcd.*"}[15m]) > 5 rate(etcd_server_proposals_failed_total{job=~".*etcd.*"}[15m]) > 5
for: 15m for: 15m

View File

@@ -9,7 +9,6 @@
"editable": true, "editable": true,
"gnetId": null, "gnetId": null,
"hideControls": false, "hideControls": false,
"id": 6,
"links": [ "links": [
], ],
@@ -1220,6 +1219,7 @@
}, },
"timezone": "browser", "timezone": "browser",
"title": "etcd", "title": "etcd",
"uid": "c2f4e12cdf69feb95caa41a5a1b423d9",
"version": 215 "version": 215
} }
} }