From e632c03547161544c97145133d54d45e6cabda00 Mon Sep 17 00:00:00 2001
From: Chi Wai Chan
Date: Mon, 10 Mar 2025 17:25:25 +0800
Subject: [PATCH] Add alert rules for missing metrics

Metrics can be missing due to cache expiration or connectivity issue
between the exporter and OpenStack APIs. Also see issue [1]

[1]: https://github.com/canonical/openstack-exporter-operator/issues/130

Change-Id: I081b7d6f704953ef3360ab6bbed20dcb2c59ec9f
Signed-off-by: Chi Wai Chan
---
Reviewer notes (text between the "---" line above and the diff below is
not part of the commit message):
  * The hunk appends a second rule group, OpenStackMetrics, holding one
    rule, OpenStackMetricsMissing, labelled severity: critical.
  * The rule expression is absent_over_time() over a [5m] range of every
    series whose name matches openstack_(.+)_up.
  * The rule has no "for:" clause; the 5-minute window comes only from
    the [5m] range selector.
  * NOTE(review): the indentation of the three context lines and the
    position of the line break inside the new description block scalar
    were restored by inference - confirm against the target file before
    applying.

 .../src/prometheus_alert_rules/general.yaml | 12 ++++++++++++
 1 file changed, 12 insertions(+)

diff --git a/charms/openstack-exporter-k8s/src/prometheus_alert_rules/general.yaml b/charms/openstack-exporter-k8s/src/prometheus_alert_rules/general.yaml
index 21c8a471..f01cb57a 100644
--- a/charms/openstack-exporter-k8s/src/prometheus_alert_rules/general.yaml
+++ b/charms/openstack-exporter-k8s/src/prometheus_alert_rules/general.yaml
@@ -14,3 +14,15 @@ groups:
       summary: OpenStack Services Down
       description: |
         The OpenStack service {{ $labels.service }} is down
+- name: OpenStackMetrics
+  rules:
+  - alert: OpenStackMetricsMissing
+    expr: |
+      absent_over_time({__name__=~"openstack_(.+)_up"}[5m])
+    labels:
+      severity: critical
+    annotations:
+      summary: OpenStack Metrics Missing
+      description: |
+        All OpenStack metrics are missing for over 5 minutes. This could be due to the
+        connectivity issue of the OpenStack APIs, or the cache of the metrics has expired.