Compare commits

...

6 Commits

@ -5,17 +5,21 @@ prometheus__scraping_bird:
port: 9324 port: 9324
prometheus__rules_bird: prometheus__rules_bird:
- record: bird:protocol_up:bgp - record: bird:protocol_up:bgp_all
expr: expr:
label_replace( label_replace(
bird_protocol_up{proto="BGP",} bird_protocol_up{proto="BGP"},
unless bird_protocol_up{
proto="BGP",
name=~"^(viarezo|isp[12]|rezel)[46]$"
},
"group", "$1", "group", "$1",
"instance", "^([^0-9\\.]+)-[0-9]+.*" "instance", "^([^0-9\\.]+)-[0-9]+.*"
) )
# FIXME: these sessions are still being installed and are not monitored yet.
# The rule keeps every series of bird:protocol_up:bgp_all except the ones
# with group="edge" whose name matches the regex below.
- record: bird:protocol_up:bgp
  expr:
    bird:protocol_up:bgp_all
    unless bird:protocol_up:bgp_all{
      group="edge",
      name=~"^(viarezo|isp[12]|rezel)[46]$"
    }
# Sessions qui ne sont volontairement pas redondées # Sessions qui ne sont volontairement pas redondées
# au sein d'un groupe # au sein d'un groupe
- record: bird:protocol_up:bgp:non_redundant - record: bird:protocol_up:bgp:non_redundant
@ -35,10 +39,10 @@ prometheus__rules_bird:
( (
count by (group, name) ( count by (group, name) (
bird:protocol_up:bgp:redundant{state="Established"} bird:protocol_up:bgp:redundant{state="Established"}
) or ( ) + (
count by (group, name) ( count by (group, name) (
bird:protocol_up:bgp:redundant{state!="Established"} bird:protocol_up:bgp:redundant{state!="Established"} * 0
) * 0 )
) )
) < 2 ) < 2
for: 0m for: 0m
@ -53,10 +57,10 @@ prometheus__rules_bird:
( (
count by (group, name) ( count by (group, name) (
bird:protocol_up:bgp{state="Established"} bird:protocol_up:bgp{state="Established"}
) or ( ) + (
count by (group, name) ( count by (group, name) (
bird:protocol_up:bgp{state!="Established"} bird:protocol_up:bgp{state!="Established"} * 0
) * 0 )
) )
) == 0 ) == 0
for: 0m for: 0m
@ -65,6 +69,7 @@ prometheus__rules_bird:
annotations: annotations:
Session: !unsafe "{{ $labels.name }}" Session: !unsafe "{{ $labels.name }}"
Group: !unsafe "{{ $labels.group }}" Group: !unsafe "{{ $labels.group }}"
# TODO: warning pour redondant ?
- alert: BirdBGPNoExportedPrefixRedundant - alert: BirdBGPNoExportedPrefixRedundant
expr: expr:
bird_protocol_prefix_export_count{ bird_protocol_prefix_export_count{

@ -1,7 +1,7 @@
--- ---
prometheus__rules_common: prometheus__rules_common:
- alert: CollectorDown - alert: CollectorDown
expr: > expr:
up == 0 up == 0
for: 3m for: 3m
labels: labels:

@ -14,7 +14,7 @@ prometheus__rules_keepalived:
keepalived_vrrp_state{ keepalived_vrrp_state{
keepalived_vvrp_state="master" keepalived_vvrp_state="master"
}[1m] }[1m]
) > 1 ) > 0
for: 0m for: 0m
labels: labels:
severity: warning severity: warning

@ -58,7 +58,8 @@ prometheus__rules_quanta:
- alert: QuantaTemp - alert: QuantaTemp
expr: expr:
0.5 * snAgentTempValue > 45 0.5 * snAgentTempValue > 45
for: 0m for: 10m
keep_firing_for: 30m
labels: labels:
severity: warning severity: warning
annotations: annotations:
@ -67,7 +68,8 @@ prometheus__rules_quanta:
- alert: QuantaTemp - alert: QuantaTemp
expr: expr:
0.5 * snAgentTempValue > 60 0.5 * snAgentTempValue > 60
for: 0m for: 10m
keep_firing_for: 30m
labels: labels:
severity: critical severity: critical
annotations: annotations:

@ -44,4 +44,48 @@ prometheus__rules_switch:
ErrorRate: !unsafe '{{ printf "%.2f" $value }} %' ErrorRate: !unsafe '{{ printf "%.2f" $value }} %'
Interface: !unsafe "{{ $labels.ifName }} Interface: !unsafe "{{ $labels.ifName }}
{{ if $labels.ifAlias }}- {{ $labels.ifAlias }}{{ end }}" {{ if $labels.ifAlias }}- {{ $labels.ifAlias }}{{ end }}"
# Warning level: inbound byte rate (5m rate of ifHCInOctets) expressed as a
# percentage of ifHighSpeed * 1000000 / 8, above 50.
# NOTE(review): presumably ifHighSpeed is in Mbit/s, which makes the
# denominator a capacity in bytes per second -- confirm against the exporter.
- alert: SwitchInLinkUsage
  expr:
    100 * rate(ifHCInOctets[5m])
    / (ifHighSpeed * 1000000 / 8) > 50
  # The condition must hold for 5m before firing; once firing, the alert is
  # kept for 10m after the condition clears.
  for: 5m
  keep_firing_for: 10m
  labels:
    severity: warning
  annotations:
    # $value is the percentage computed by expr, printed with two decimals.
    Usage: !unsafe '{{ printf "%.2f" $value }} %'
    # Interface name, followed by "- <alias>" only when ifAlias is non-empty.
    Interface: !unsafe "{{ $labels.ifName }}
      {{ if $labels.ifAlias }}- {{ $labels.ifAlias }}{{ end }}"
# Critical level: same inbound usage percentage as the warning rule of the
# same name, with the threshold raised to 80.
# NOTE(review): presumably ifHighSpeed is in Mbit/s, which makes the
# denominator a capacity in bytes per second -- confirm against the exporter.
- alert: SwitchInLinkUsage
  expr:
    100 * rate(ifHCInOctets[5m])
    / (ifHighSpeed * 1000000 / 8) > 80
  # The condition must hold for 5m before firing; once firing, the alert is
  # kept for 10m after the condition clears.
  for: 5m
  keep_firing_for: 10m
  labels:
    severity: critical
  annotations:
    # $value is the percentage computed by expr, printed with two decimals.
    Usage: !unsafe '{{ printf "%.2f" $value }} %'
    # Interface name, followed by "- <alias>" only when ifAlias is non-empty.
    Interface: !unsafe "{{ $labels.ifName }}
      {{ if $labels.ifAlias }}- {{ $labels.ifAlias }}{{ end }}"
# Warning level: outbound byte rate (5m rate of ifHCOutOctets) expressed as a
# percentage of ifHighSpeed * 1000000 / 8, above 50.
# NOTE(review): presumably ifHighSpeed is in Mbit/s, which makes the
# denominator a capacity in bytes per second -- confirm against the exporter.
- alert: SwitchOutLinkUsage
  expr:
    100 * rate(ifHCOutOctets[5m])
    / (ifHighSpeed * 1000000 / 8) > 50
  # The condition must hold for 5m before firing; once firing, the alert is
  # kept for 10m after the condition clears.
  for: 5m
  keep_firing_for: 10m
  labels:
    severity: warning
  annotations:
    # $value is the percentage computed by expr, printed with two decimals.
    Usage: !unsafe '{{ printf "%.2f" $value }} %'
    # Interface name, followed by "- <alias>" only when ifAlias is non-empty.
    Interface: !unsafe "{{ $labels.ifName }}
      {{ if $labels.ifAlias }}- {{ $labels.ifAlias }}{{ end }}"
# Critical level: outbound byte rate (5m rate of ifHCOutOctets) expressed as a
# percentage of ifHighSpeed * 1000000 / 8, above 80.
# NOTE(review): presumably ifHighSpeed is in Mbit/s, which makes the
# denominator a capacity in bytes per second -- confirm against the exporter.
- alert: SwitchOutLinkUsage
  expr:
    100 * rate(ifHCOutOctets[5m])
    / (ifHighSpeed * 1000000 / 8) > 80
  # The condition must hold for 5m before firing; once firing, the alert is
  # kept for 10m after the condition clears.
  for: 5m
  keep_firing_for: 10m
  labels:
    # The 80 % threshold is the critical tier, mirroring SwitchInLinkUsage;
    # it was previously labelled "warning", which made it indistinguishable
    # from the 50 % rule of the same name.
    severity: critical
  annotations:
    # $value is the percentage computed by expr, printed with two decimals.
    Usage: !unsafe '{{ printf "%.2f" $value }} %'
    # Interface name, followed by "- <alias>" only when ifAlias is non-empty.
    Interface: !unsafe "{{ $labels.ifName }}
      {{ if $labels.ifAlias }}- {{ $labels.ifAlias }}{{ end }}"
... ...

@ -420,6 +420,18 @@ knotd__zones:
ff-1.core.sw: ff-1.core.sw:
#- 2a09:6840:207::1:1 #- 2a09:6840:207::1:1
- 10.207.1.1 - 10.207.1.1
# Host entries added to knotd__zones: each name maps to a list of addresses.
# In every entry the IPv6 item is commented out, so only the IPv4 address
# is active.
ff-2.core.sw:
#- 2a09:6840:207::1:2
- 10.207.1.2
fl-1.core.sw:
#- 2a09:6840:207::1:3
- 10.207.1.3
fl-2.core.sw:
#- 2a09:6840:207::1:4
- 10.207.1.4
fd-1.core.sw:
#- 2a09:6840:207::1:5
- 10.207.1.5
gk-1.core.sw: gk-1.core.sw:
#- 2a09:6840:207::2:1 #- 2a09:6840:207::2:1
- 10.207.2.1 - 10.207.2.1

@ -5,6 +5,10 @@ eb-1.acs.sw.infra.auro.re
[quanta] [quanta]
ff-1.core.sw.infra.auro.re ff-1.core.sw.infra.auro.re
ff-2.core.sw.infra.auro.re
fl-1.core.sw.infra.auro.re
fl-2.core.sw.infra.auro.re
fd-1.core.sw.infra.auro.re
gk-1.core.sw.infra.auro.re gk-1.core.sw.infra.auro.re
ec-1.core.sw.infra.auro.re ec-1.core.sw.infra.auro.re
r3-1.core.sw.infra.auro.re r3-1.core.sw.infra.auro.re

Loading…
Cancel
Save