# Patch summary (text before the first "diff --git" header is not part of any hunk).
#
# File 1: creates changelogs/unreleased/212882-add-cpu-mem-charts.yml, a
#         five-line changelog entry for merge request 33532.
# File 2: extends config/prometheus/self_monitoring_default.yml with a new
#         'Resource usage' panel group, inserted ahead of the existing
#         'Web Service' group. It holds two line charts:
#           * "Memory usage" - 100 * (1 - available / total), where "available"
#             is node_memory_MemAvailable_bytes, or else the sum of the
#             MemFree, Buffers, Cached and Slab series.
#           * "CPU usage"    - 100 * average over (mode, cpu) of
#             (1 - irate of idle node_cpu_seconds_total over a 5m window).
#
# Hunk bookkeeping: file 1 adds 5 lines (+1,5); file 2 keeps 6 context lines
# and adds 21 lines, blank separators included (-1,6 +1,27).
#
# NOTE(review): this patch was recovered from a copy whose newlines and leading
# whitespace had been collapsed. The YAML indentation inside the hunks below is
# a reconstruction - confirm it against the original patch (the "index" blob
# hashes only match the exact original bytes) before applying.
diff --git a/changelogs/unreleased/212882-add-cpu-mem-charts.yml b/changelogs/unreleased/212882-add-cpu-mem-charts.yml
new file mode 100644
index 0000000000000000000000000000000000000000..52e645cead787b8d72745f032907e63f98bdf641
--- /dev/null
+++ b/changelogs/unreleased/212882-add-cpu-mem-charts.yml
@@ -0,0 +1,5 @@
+---
+title: Add CPU, memory usage charts to self monitoring default dashboard
+merge_request: 33532
+author:
+type: changed
diff --git a/config/prometheus/self_monitoring_default.yml b/config/prometheus/self_monitoring_default.yml
index dc2361fb3bc5cb1a50b88e440dd69467446c9727..53b47274ecd718431afd1f9e0eca1fb99326f869 100644
--- a/config/prometheus/self_monitoring_default.yml
+++ b/config/prometheus/self_monitoring_default.yml
@@ -1,6 +1,27 @@
 dashboard: 'Default dashboard'
 priority: 1
 panel_groups:
+
+- group: 'Resource usage'
+  panels:
+    - title: "Memory usage"
+      type: "line-chart"
+      y_label: "% memory used"
+      metrics:
+        - id: node_memory_usage_percentage
+          query_range: '(1 - (node_memory_MemAvailable_bytes or node_memory_MemFree_bytes + node_memory_Buffers_bytes + node_memory_Cached_bytes + node_memory_Slab_bytes) / node_memory_MemTotal_bytes) * 100'
+          unit: "%"
+          label: instance
+
+    - title: "CPU usage"
+      type: "line-chart"
+      y_label: "% CPU used"
+      metrics:
+        - id: node_cpu_usage_percentage
+          query_range: '(avg without (mode,cpu) (1 - irate(node_cpu_seconds_total{mode="idle"}[5m]))) * 100'
+          unit: "%"
+          label: instance
+
 - group: Web Service
   panels:
   - title: Web Service - Error Ratio