Files
git.stella-ops.org/devops/services/exporter/alerts.yaml
2025-12-26 18:11:06 +02:00

43 lines
1.4 KiB
YAML

# Prometheus-style alerting rules for the exporter service.
# One rule group ("exporter") containing four alerts; every alert carries
# a `severity` label and `team: devops`.
groups:
  - name: exporter
    rules:
      # Fires when the 5m per-second rate of processed jobs stays below 1
      # for 10 minutes.
      # NOTE(review): there is no aggregation, so the condition is evaluated
      # per time series, and it yields nothing if the metric is absent --
      # confirm whether a complete stall should also alert.
      - alert: ExporterThroughputLow
        expr: rate(exporter_jobs_processed_total[5m]) < 1
        for: 10m
        labels:
          severity: warning
          team: devops
        annotations:
          summary: "Exporter throughput low"
          description: "Processed <1 job/s over last 5m (current {{ $value }})."

      # Fires when the ratio of the failed-job rate to the processed-job rate
      # (both over 5m) stays above 0.02 for 5 minutes.
      # NOTE(review): assumes both counters expose matching label sets so the
      # division pairs series one-to-one -- confirm against the exporter.
      - alert: ExporterFailuresHigh
        expr: rate(exporter_jobs_failed_total[5m]) / rate(exporter_jobs_processed_total[5m]) > 0.02
        for: 5m
        labels:
          severity: critical
          team: devops
        annotations:
          summary: "Exporter failure rate >2%"
          description: "Failure rate {{ $value | humanizePercentage }} over last 5m."

      # Fires when the 0.95 quantile estimated from the job-duration histogram
      # buckets (5m rate, summed over every label except `le`) stays above 3
      # for 5 minutes.
      - alert: ExporterLatencyP95High
        expr: histogram_quantile(0.95, sum(rate(exporter_job_duration_seconds_bucket[5m])) by (le)) > 3
        for: 5m
        labels:
          severity: warning
          team: devops
        annotations:
          summary: "Exporter job p95 latency high"
          description: "Job p95 latency {{ $value }}s over last 5m (threshold 3s)."

      # Fires when the queue-depth value stays above 500 for 10 minutes.
      - alert: ExporterQueueDepthHigh
        expr: exporter_queue_depth > 500
        for: 10m
        labels:
          severity: warning
          team: devops
        annotations:
          summary: "Exporter queue depth high"
          description: "Queue depth {{ $value }} exceeds 500 for >10m."