# Original listing metadata: YAML, 32 lines, 1.4 KiB.
---
# Prometheus alerting rules for the Zastava runtime service.
#
# Every rule carries a `service: zastava-runtime` label plus a `severity`
# label, and provides `summary` / `description` annotations for responders.
groups:
  - name: zastava-runtime
    # Rules in this group are evaluated every 30 seconds.
    interval: 30s
    rules:
      # Observer event flow has stopped.
      # `sum(rate(...)) == 0` only matches while the series still exists; if
      # the metric disappears entirely (e.g. no target is being scraped) the
      # left-hand side is an empty vector and would never fire, so the
      # `absent()` branch covers that case as well.
      - alert: ZastavaRuntimeEventsSilent
        expr: >-
          sum(rate(zastava_runtime_events_total[10m])) == 0
          or absent(zastava_runtime_events_total)
        for: 15m
        labels:
          severity: warning
          service: zastava-runtime
        annotations:
          summary: "Observer events stalled"
          description: >-
            No runtime events emitted in the last 15 minutes.
            Check observer DaemonSet health and container runtime mounts.

      # p95 latency of calls to the runtime backend is too high.
      # The histogram is recorded in milliseconds (`_ms_bucket`), so the
      # threshold is expressed in milliseconds too: 750, matching the summary.
      - alert: ZastavaRuntimeBackendLatencyHigh
        expr: histogram_quantile(0.95, sum by (le) (rate(zastava_runtime_backend_latency_ms_bucket[5m]))) > 750
        for: 10m
        labels:
          severity: critical
          service: zastava-runtime
        annotations:
          summary: "Runtime backend latency p95 above 750 ms"
          description: >-
            Latency to Scanner runtime APIs is elevated.
            Inspect Scanner.WebService readiness, Authority OpTok issuance,
            and cluster network.

      # Admission webhook is denying an unusual number of pods.
      # `rate()` yields a per-second value; multiplying by 60 converts it to
      # denies per minute so the threshold matches the description below.
      - alert: ZastavaAdmissionDenySpike
        expr: sum(rate(zastava_admission_decisions_total{decision="deny"}[5m])) * 60 > 20
        for: 5m
        labels:
          severity: warning
          service: zastava-runtime
        annotations:
          summary: "Admission webhook denies exceeding threshold"
          description: >-
            Webhook is denying more than 20 pod admissions per minute.
            Confirm policy verdicts and consider fail-open exception for
            impacted namespaces.