Compare commits

...

3 Commits

@ -16,7 +16,7 @@ prometheus__rules_node:
labels: labels:
severity: warning severity: warning
annotations: annotations:
FreeMemory: !unsafe "{{ $value | humanizePercentage }} %" FreeMemory: !unsafe "{{ $value | humanizePercentage }}"
- alert: HostSwapIsFillingUp - alert: HostSwapIsFillingUp
expr: expr:
( (
@ -29,7 +29,7 @@ prometheus__rules_node:
labels: labels:
severity: critical severity: critical
annotations: annotations:
UsedSwap: !unsafe "{{ $value | humanizePercentage }} %" UsedSwap: !unsafe "{{ $value | humanizePercentage }}"
- alert: HostPhysicalComponentTooHot - alert: HostPhysicalComponentTooHot
expr: expr:
node_hwmon_temp_celsius > 79 node_hwmon_temp_celsius > 79
@ -103,7 +103,7 @@ prometheus__rules_node:
severity: critical severity: critical
annotations: annotations:
Mountpoint: !unsafe "{{ $labels.mountpoint }}" Mountpoint: !unsafe "{{ $labels.mountpoint }}"
FreeSpace: !unsafe "{{ $value | humanizePercentage }} %" FreeSpace: !unsafe "{{ $value | humanizePercentage }}"
- alert: HostConntrackLimit - alert: HostConntrackLimit
expr: expr:
( (
@ -114,7 +114,7 @@ prometheus__rules_node:
labels: labels:
severity: warning severity: warning
annotations: annotations:
Filled: !unsafe "{{ $value | humanizePercentage }} %" Filled: !unsafe "{{ $value | humanizePercentage }}"
- alert: HostClockSkew - alert: HostClockSkew
expr: expr:
( (
@ -149,7 +149,7 @@ prometheus__rules_node:
severity: warning severity: warning
annotations: annotations:
Mountpoint: !unsafe "{{ $labels.mountpoint }}" Mountpoint: !unsafe "{{ $labels.mountpoint }}"
FreeInodes: !unsafe "{{ $value | humanizePercentage }} %" FreeInodes: !unsafe "{{ $value | humanizePercentage }}"
- alert: CpuUsage - alert: CpuUsage
expr: expr:
( (
@ -161,7 +161,7 @@ prometheus__rules_node:
labels: labels:
severity: warning severity: warning
annotations: annotations:
Usage: !unsafe "{{ $value | humanizePercentage }} %" Usage: !unsafe "{{ $value | humanizePercentage }}"
- alert: SystemdServiceFailed - alert: SystemdServiceFailed
expr: expr:
node_systemd_unit_state{state="failed"} == 1 node_systemd_unit_state{state="failed"} == 1
@ -196,5 +196,5 @@ prometheus__rules_node:
severity: warning severity: warning
annotations: annotations:
Disk: !unsafe "{{ $labels.disk }}" Disk: !unsafe "{{ $labels.disk }}"
Steal: !unsafe "{{ $value | humanizePercentage }} %" Steal: !unsafe "{{ $value | humanizePercentage }}"
... ...

@ -28,7 +28,7 @@ prometheus__rules_switch:
labels: labels:
severity: warning severity: warning
annotations: annotations:
ErrorRate: !unsafe "{{ $value | humanizePercentage }} %" ErrorRate: !unsafe "{{ $value | humanizePercentage }}"
Interface: !unsafe "{{ $labels.ifName }} Interface: !unsafe "{{ $labels.ifName }}
{{ if $labels.ifAlias }}- {{ $labels.ifAlias }}{{ end }}" {{ if $labels.ifAlias }}- {{ $labels.ifAlias }}{{ end }}"
- alert: SwitchOutErrors - alert: SwitchOutErrors
@ -41,7 +41,7 @@ prometheus__rules_switch:
labels: labels:
severity: warning severity: warning
annotations: annotations:
ErrorRate: !unsafe "{{ $value | humanizePercentage }} %" ErrorRate: !unsafe "{{ $value | humanizePercentage }}"
Interface: !unsafe "{{ $labels.ifName }} Interface: !unsafe "{{ $labels.ifName }}
{{ if $labels.ifAlias }}- {{ $labels.ifAlias }}{{ end }}" {{ if $labels.ifAlias }}- {{ $labels.ifAlias }}{{ end }}"
- alert: SwitchInLinkUsage - alert: SwitchInLinkUsage
@ -52,7 +52,7 @@ prometheus__rules_switch:
labels: labels:
severity: warning severity: warning
annotations: annotations:
Usage: !unsafe "{{ $value | humanizePercentage }} %" Usage: !unsafe "{{ $value | humanizePercentage }}"
Interface: !unsafe "{{ $labels.ifName }} Interface: !unsafe "{{ $labels.ifName }}
{{ if $labels.ifAlias }}- {{ $labels.ifAlias }}{{ end }}" {{ if $labels.ifAlias }}- {{ $labels.ifAlias }}{{ end }}"
- alert: SwitchInLinkUsage - alert: SwitchInLinkUsage
@ -63,7 +63,7 @@ prometheus__rules_switch:
labels: labels:
severity: critical severity: critical
annotations: annotations:
Usage: !unsafe "{{ $value | humanizePercentage }} %" Usage: !unsafe "{{ $value | humanizePercentage }}"
Interface: !unsafe "{{ $labels.ifName }} Interface: !unsafe "{{ $labels.ifName }}
{{ if $labels.ifAlias }}- {{ $labels.ifAlias }}{{ end }}" {{ if $labels.ifAlias }}- {{ $labels.ifAlias }}{{ end }}"
- alert: SwitchOutLinkUsage - alert: SwitchOutLinkUsage
@ -74,7 +74,7 @@ prometheus__rules_switch:
labels: labels:
severity: warning severity: warning
annotations: annotations:
Usage: !unsafe "{{ $value | humanizePercentage }} %" Usage: !unsafe "{{ $value | humanizePercentage }}"
Interface: !unsafe "{{ $labels.ifName }} Interface: !unsafe "{{ $labels.ifName }}
{{ if $labels.ifAlias }}- {{ $labels.ifAlias }}{{ end }}" {{ if $labels.ifAlias }}- {{ $labels.ifAlias }}{{ end }}"
- alert: SwitchOutLinkUsage - alert: SwitchOutLinkUsage
@ -85,7 +85,7 @@ prometheus__rules_switch:
labels: labels:
severity: warning severity: warning
annotations: annotations:
Usage: !unsafe "{{ $value | humanizePercentage }} %" Usage: !unsafe "{{ $value | humanizePercentage }}"
Interface: !unsafe "{{ $labels.ifName }} Interface: !unsafe "{{ $labels.ifName }}
{{ if $labels.ifAlias }}- {{ $labels.ifAlias }}{{ end }}" {{ if $labels.ifAlias }}- {{ $labels.ifAlias }}{{ end }}"
... ...

@ -2,6 +2,8 @@
prometheus_snmp__modules_quanta: prometheus_snmp__modules_quanta:
auth: auth:
community: "{{ vault_snmp_quanta_community }}" community: "{{ vault_snmp_quanta_community }}"
timeout: 60s
retries: 3
walk: walk:
- interfaces - interfaces
- ifXTable - ifXTable
@ -27,6 +29,8 @@ prometheus_snmp__modules_quanta:
- dot3CollTable - dot3CollTable
- lldpLocChassisId - lldpLocChassisId
- lldpRemTable - lldpRemTable
- lldpLocPortTable
- dot1dBasePort
lookups: lookups:
- source_indexes: - source_indexes:
- ifIndex - ifIndex
@ -59,6 +63,14 @@ prometheus_snmp__modules_quanta:
- source_indexes: - source_indexes:
- dot3StatsIndex - dot3StatsIndex
lookup: ifName lookup: ifName
- source_indexes:
- lldpRemTimeMark
- lldpRemLocalPortNum
- lldpRemIndex
lookup: lldpRemChassisId
#- source_indexes:
# - lldpLocPortNum
# lookup: lldpLocPortIdSubtype
overrides: overrides:
ifIndex: ifIndex:
ignore: true ignore: true
@ -106,4 +118,8 @@ prometheus_snmp__modules_quanta:
ignore: true ignore: true
dot3StatsDuplexStatus: dot3StatsDuplexStatus:
type: EnumAsStateSet type: EnumAsStateSet
lldpLocPortIdSubtype:
type: EnumAsInfo
lldpRemPortIdSubtype:
type: EnumAsInfo
... ...

Loading…
Cancel
Save