From acf63fd300777f377a947bf2539ca0972cbed81b Mon Sep 17 00:00:00 2001
From: Alexandre Iooss
Date: Mon, 28 Dec 2020 12:54:12 +0100
Subject: [PATCH] Change memory formula in prometheus

---
Review notes (text between the "---" line and the diffstat is not part of
the commit message and is dropped when the patch is applied):

* The OutOfMemory expression now adds PageTables, VmallocUsed, SwapCached
  and Slab to MemFree + Cached + Buffers before dividing by MemTotal, so
  those counters are treated as free memory. The alert still fires when
  the resulting percentage stays below 10 for 5m.
* NOTE(review): per the added comment, the intent is to alert on memory
  used by applications only. Presumably part of Slab and PageTables is
  not reclaimable by the kernel -- confirm this is the wanted signal.
* NOTE(review): line breaks and indentation in this patch were
  reconstructed from a single-line copy; check the context lines against
  the target file before applying.

 roles/prometheus/templates/prometheus/alert.rules.yml.j2 | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/roles/prometheus/templates/prometheus/alert.rules.yml.j2 b/roles/prometheus/templates/prometheus/alert.rules.yml.j2
index 8df9288f..477ed057 100644
--- a/roles/prometheus/templates/prometheus/alert.rules.yml.j2
+++ b/roles/prometheus/templates/prometheus/alert.rules.yml.j2
@@ -16,8 +16,9 @@ groups:
       summary: "{{ $labels.instance }} ({{ $labels.job }}) est invisible depuis plus de 3 minutes !"
 
   # Alert for out of memory
+  # Do not take into account memory not used by apps
   - alert: OutOfMemory
-    expr: (node_memory_MemFree_bytes + node_memory_Cached_bytes + node_memory_Buffers_bytes) / node_memory_MemTotal_bytes * 100 < 10
+    expr: (node_memory_MemFree_bytes + node_memory_Cached_bytes + node_memory_Buffers_bytes + node_memory_PageTables_bytes + node_memory_VmallocUsed_bytes + node_memory_SwapCached_bytes + node_memory_Slab_bytes) / node_memory_MemTotal_bytes * 100 < 10
     for: 5m
     labels:
       severity: warning