Installation Prometheus-postgres-exporter #53
2 changed files with 38 additions and 37 deletions
|
@ -33,6 +33,7 @@
|
|||
- alerts.rules.yml
|
||||
- django.rules.yml
|
||||
|
||||
|
||||
- name: Configure Prometheus alerts
|
||||
template:
|
||||
src: "{{ item }}.j2"
|
||||
|
|
|
@ -10,41 +10,41 @@ groups:
|
|||
- name: docker.rules
|
||||
rules:
|
||||
|
||||
- alert: ContainerDown
|
||||
expr: docker_container_running_state
|
||||
for: 0m
|
||||
labels:
|
||||
severity: critical
|
||||
annotations:
|
||||
summary: >-
|
||||
Container Docker mort
|
||||
(instance {{ raw('$labels.instance') }}, container {{ raw('$labels.name') }})
|
||||
- alert: ContainerDown
|
||||
expr: docker_container_running_state != 1
|
||||
for: 0m
|
||||
labels:
|
||||
severity: critical
|
||||
annotations:
|
||||
summary: >-
|
||||
Container Docker mort
|
||||
(instance {{ raw('$labels.instance') }}, container {{ raw('$labels.name') }})
|
||||
|
||||
- alert: ContainerFailed
|
||||
expr: sum(increase(docker_container_restart_count[5m])) > 2
|
||||
for: 0m
|
||||
labels:
|
||||
severity: critical
|
||||
annotations:
|
||||
summary: >-
|
||||
Container Docker redémarre souvent
|
||||
(instance raw('{{ $labels.instance') }}, container {{ raw('$labels.name') }})
|
||||
- alert: ContainerFailed
|
||||
expr: sum(increase(docker_container_restart_count[5m])) > 2
|
||||
for: 0m
|
||||
labels:
|
||||
severity: critical
|
||||
annotations:
|
||||
summary: >-
|
||||
Container Docker redémarre souvent
|
||||
(instance {{ raw('$labels.instance') }}, container {{ raw('$labels.name') }})
|
||||
|
||||
- alert: ContainerFailed
|
||||
expr:
|
||||
(
|
||||
docker_container_cpu_used_total
|
||||
/
|
||||
docker_container_cpu_capacity_total
|
||||
) * 100
|
||||
> 30
|
||||
for: 0m
|
||||
labels:
|
||||
severity: critical
|
||||
annotations:
|
||||
summary: >-
|
||||
Container Docker utilise beaucoup de CPU
|
||||
(instance {{ raw('$labels.instance') }}, container {{ raw('$labels.name') }},
|
||||
value {{ raw('$value | printf "%.1f"'') }})
|
||||
- alert: ContainerFailed
|
||||
expr:
|
||||
(
|
||||
docker_container_cpu_used_total
|
||||
/
|
||||
docker_container_cpu_capacity_total
|
||||
) * 100
|
||||
> 30
|
||||
for: 0m
|
||||
labels:
|
||||
severity: critical
|
||||
annotations:
|
||||
summary: >-
|
||||
Container Docker utilise beaucoup de CPU
|
||||
(instance {{ raw('$labels.instance') }}, container {{ raw('$labels.name') }},
|
||||
value {{ raw('$value | printf "%.1f"') }})
|
||||
|
||||
...
|
||||
|
|
Loading…
Reference in a new issue