# Source listing metadata (from the file viewer): YAML, 32 lines, 1.4 KiB
# Alerting rule groups (Prometheus rule-file layout: groups -> rules).
groups:
  # Single group holding the rules labelled `service: zastava-runtime`.
  - name: zastava-runtime
    # Evaluation interval for every rule in this group.
    interval: 30s
    rules:
      # Fires when the aggregate runtime event rate has been zero for 15m.
      # `sum(rate(...))` yields an empty result (not 0) when no series exists
      # at all, so `absent(...)` is OR-ed in to also cover the case where the
      # metric has disappeared entirely.
      - alert: ZastavaRuntimeEventsSilent
        expr: >-
          sum(rate(zastava_runtime_events_total[10m])) == 0
          or absent(zastava_runtime_events_total)
        for: 15m
        labels:
          severity: warning
          service: zastava-runtime
        annotations:
          summary: "Observer events stalled"
          description: "No runtime events emitted in the last 15 minutes. Check observer DaemonSet health and container runtime mounts."
      # Fires when the p95 backend latency stays above 750 ms for 10m.
      # The histogram is named `..._latency_ms_bucket`, so the quantile is in
      # milliseconds and the threshold must be 750 (not 0.75) to match the
      # "750 ms" stated in the summary.
      - alert: ZastavaRuntimeBackendLatencyHigh
        expr: histogram_quantile(0.95, sum by (le) (rate(zastava_runtime_backend_latency_ms_bucket[5m]))) > 750
        for: 10m
        labels:
          severity: critical
          service: zastava-runtime
        annotations:
          summary: "Runtime backend latency p95 above 750 ms"
          description: "Latency to Scanner runtime APIs is elevated. Inspect Scanner.WebService readiness, Authority OpTok issuance, and cluster network."
      # Fires when admission denials exceed 20 per minute for 5m.
      # `rate()` returns a per-second value; it is multiplied by 60 so the
      # comparison uses the per-minute unit stated in the description.
      - alert: ZastavaAdmissionDenySpike
        expr: sum(rate(zastava_admission_decisions_total{decision="deny"}[5m])) * 60 > 20
        for: 5m
        labels:
          severity: warning
          service: zastava-runtime
        annotations:
          summary: "Admission webhook denies exceeding threshold"
          description: "Webhook is denying more than 20 pod admissions per minute. Confirm policy verdicts and consider fail-open exception for impacted namespaces."