Skip to content
Snippets Groups Projects
Verified Commit 15e2d18b authored by Christian Heusel's avatar Christian Heusel :rocket:
Browse files

Merge branch 'disable-oom-alert-on-build-machines' into 'master'

prometheus: Move the OOM alert for build hosts to a longer timeframe

See merge request !908
parents f7078b51 10475a62
No related branches found
No related tags found
1 merge request: !908 prometheus: Move the OOM alert for build hosts to a longer timeframe
Pipeline #116214 passed
......@@ -21,7 +21,7 @@ groups:
description: "Swap is filling up (>80%)\n VALUE = {{ $value }}\n LABELS: {{ $labels }}"
- alert: HostOutOfMemory
expr: node_memory_MemAvailable_bytes / node_memory_MemTotal_bytes * 100 < 10
expr: node_memory_MemAvailable_bytes{instance!~"build.archlinux.org",instance!~"repro3.pkgbuild.com",instance!~"repro2.pkgbuild.com"} / node_memory_MemTotal_bytes * 100 < 10
for: 5m
labels:
severity: warning
......@@ -29,6 +29,15 @@ groups:
summary: "Host out of memory (instance {{ $labels.instance }})"
description: "Node memory is filling up (< 10% left)\n VALUE = {{ $value }}\n LABELS: {{ $labels }}"
- alert: BuildHostOutOfMemory
  # Select only the build hosts. PromQL regex matching uses the `=~`
  # operator, and multiple matchers on the same label are ANDed together,
  # so the hosts are combined into one alternation instead of being listed
  # as separate matchers (which no single instance could satisfy).
  # The host patterns are the same ones HostOutOfMemory excludes with `!~`,
  # keeping the two alerts complementary.
  expr: node_memory_MemAvailable_bytes{instance=~"build.archlinux.org|repro3.pkgbuild.com|repro2.pkgbuild.com"} / node_memory_MemTotal_bytes * 100 < 10
  # The condition must hold continuously for 12h before the alert fires.
  for: 12h
  labels:
    severity: warning
  annotations:
    summary: "Build host out of memory for a long time (instance {{ $labels.instance }})"
    description: "Node memory is filling up (< 10% left)\n VALUE = {{ $value }}\n LABELS: {{ $labels }}"
- alert: HostMemoryUnderMemoryPressure
expr: rate(node_vmstat_pgmajfault[1m]) > 1000
for: 5m
......
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment