summaryrefslogtreecommitdiffstats
path: root/monitoring
diff options
context:
space:
mode:
author: Vallari Agrawal <val.agl002@gmail.com> 2024-10-08 23:07:48 +0200
committer: Vallari Agrawal <vallari.agrawal@ibm.com> 2024-11-11 12:53:03 +0100
commit: f02e3128441f5bba95c6173d2acb61baa4111d01 (patch)
tree: 7c2704d67da733653b69a8ca8a42b7fedddddf59 /monitoring
parent: Merge pull request #60626 from ivoalmeida/carbon-version-update (diff)
download: ceph-f02e3128441f5bba95c6173d2acb61baa4111d01.tar.xz
download: ceph-f02e3128441f5bba95c6173d2acb61baa4111d01.zip
monitoring: add 2 nvmeof alerts to prometheus_alerts.yaml
- `NVMeoFMissingListener`: trigger if a gateway has no listener for a subsystem that has listeners on other gateways
- `NVMeoFZeroListenerSubsystem`: trigger if a subsystem has no listeners

Signed-off-by: Vallari Agrawal <vallari.agrawal@ibm.com>
Diffstat (limited to 'monitoring')
-rw-r--r-- monitoring/ceph-mixin/prometheus_alerts.yml 18
1 file changed, 18 insertions, 0 deletions
diff --git a/monitoring/ceph-mixin/prometheus_alerts.yml b/monitoring/ceph-mixin/prometheus_alerts.yml
index ba6a6ded0a3..805ecb1188a 100644
--- a/monitoring/ceph-mixin/prometheus_alerts.yml
+++ b/monitoring/ceph-mixin/prometheus_alerts.yml
@@ -837,6 +837,24 @@ groups:
labels:
severity: "warning"
type: "ceph_default"
+ - alert: "NVMeoFMissingListener"
+ annotations:
+ description: "For every subsystem, each gateway should have a listener to balance traffic between gateways."
+ summary: "No listener added for {{ $labels.instance }} NVMe-oF Gateway to {{ $labels.nqn }} subsystem"
+ expr: "ceph_nvmeof_subsystem_listener_count == 0 and on(nqn) sum(ceph_nvmeof_subsystem_listener_count) by (nqn) > 0"
+ for: "10m"
+ labels:
+ severity: "warning"
+ type: "ceph_default"
+ - alert: "NVMeoFZeroListenerSubsystem"
+ annotations:
+ description: "NVMeoF gateway configuration incomplete; one of the subsystems have zero listeners."
+ summary: "No listeners added to {{ $labels.nqn }} subsystem"
+ expr: "sum(ceph_nvmeof_subsystem_listener_count) by (nqn) == 0"
+ for: "10m"
+ labels:
+ severity: "warning"
+ type: "ceph_default"
- alert: "NVMeoFHighHostCPU"
annotations:
description: "High CPU on a gateway host can lead to CPU contention and performance degradation"