From 2988e9caf2087ee13ae0ce3559fd71b597b577ec Mon Sep 17 00:00:00 2001
From: brandonbutler
Date: Wed, 13 Mar 2024 02:25:47 +0000
Subject: [PATCH] Add resource allocation metric alerts

---
Reviewer notes (free-form text placed here is neither part of the commit
message nor part of the diff):

* Bumps the chart version from 0.1.6 to 0.1.7 and appends two alerts to
  the PrometheusRule template, just before the closing "end" action.
* ProxmoxCPUAllocationHigh is raised when
  100 * (proxmox_node_cpus_allocated / proxmox_node_cpus_total)
  stays above 90 for 5m.
* ProxmoxMemoryAllocationHigh is raised when
  100 * (proxmox_node_memory_allocated_bytes / proxmox_node_memory_total_bytes)
  stays above 90 for 5m.
* The annotations wrap the alert placeholders in a Helm printf "..."
  call so that Helm emits the inner double-brace expression as literal
  text instead of trying to evaluate it at chart render time.
* The summaries pipe $value through "humanize" so the percentage is
  shown rounded rather than as a raw float.
* NOTE(review): this patch was recovered from a copy whose line breaks
  and indentation had been collapsed. The column positions of the YAML
  lines below (rule entries at four spaces) are an assumption; confirm
  them against the existing rules in prometheusrule.yaml before applying.
* NOTE(review): the From header carries no e-mail address in the
  recovered copy; add one if your tooling requires it.

 chart/proxmox-exporter/Chart.yaml             |  2 +-
 .../templates/prometheusrule.yaml             | 19 +++++++++++++++++++
 2 files changed, 20 insertions(+), 1 deletion(-)

diff --git a/chart/proxmox-exporter/Chart.yaml b/chart/proxmox-exporter/Chart.yaml
index 70e7d87..5c1e79f 100644
--- a/chart/proxmox-exporter/Chart.yaml
+++ b/chart/proxmox-exporter/Chart.yaml
@@ -15,7 +15,7 @@ type: application
 # This is the chart version. This version number should be incremented each time you make changes
 # to the chart and its templates, including the app version.
 # Versions are expected to follow Semantic Versioning (https://semver.org/)
-version: 0.1.6
+version: 0.1.7
 
 # This is the version number of the application being deployed. This version number should be
 # incremented each time you make changes to the application. Versions are not expected to
diff --git a/chart/proxmox-exporter/templates/prometheusrule.yaml b/chart/proxmox-exporter/templates/prometheusrule.yaml
index 5c00d33..8ca7d8f 100644
--- a/chart/proxmox-exporter/templates/prometheusrule.yaml
+++ b/chart/proxmox-exporter/templates/prometheusrule.yaml
@@ -122,4 +122,23 @@ spec:
       for: 5m
       labels:
         severity: warning
+
+    - alert: ProxmoxCPUAllocationHigh
+      annotations:
+        summary: Proxmox node {{ printf "{{ $labels.node }}" }} has {{ printf "{{ $value | humanize }}" }}% of its CPU allocated to guests
+        description: It is recommended to keep more of your node's CPU unallocated for use by PVE and other server applications your Proxmox node runs
+      expr: |
+        100 * (proxmox_node_cpus_allocated / proxmox_node_cpus_total) > 90
+      for: 5m
+      labels:
+        severity: critical
+    - alert: ProxmoxMemoryAllocationHigh
+      annotations:
+        summary: Proxmox node {{ printf "{{ $labels.node }}" }} has {{ printf "{{ $value | humanize }}" }}% of its memory allocated to guests
+        description: It is recommended to keep more of your node's memory unallocated for use by PVE and other server applications your Proxmox node runs
+      expr: |
+        100 * (proxmox_node_memory_allocated_bytes / proxmox_node_memory_total_bytes) > 90
+      for: 5m
+      labels:
+        severity: critical
 {{- end }}