---
# Prometheus alerting rules for the "symbols" scrape job (Symbols.Server).
# Both alerts carry `service: symbols` so they can be routed together.
groups:
  - name: symbols-availability
    rules:
      # Fires when the `up` series for job "symbols" has been 0 for
      # 5 consecutive minutes.
      - alert: SymbolsDown
        expr: up{job="symbols"} == 0
        for: 5m
        labels:
          severity: page
          service: symbols
        annotations:
          summary: "Symbols.Server instance is down"
          description: "symbols scrape target has been down for 5 minutes"

      # Fires when the per-second rate of 5xx responses (status matching
      # "5..") over a 5-minute window stays above zero for 2 minutes.
      # NOTE(review): the threshold is `> 0`, so any 5xx traffic in the
      # window satisfies the condition; the expression is also evaluated
      # per matching series rather than aggregated. If the intent is an
      # error *ratio* alert, consider dividing by the total request rate
      # and using a non-zero threshold -- confirm with the service owners.
      - alert: SymbolsErrorRateHigh
        expr: rate(http_requests_total{job="symbols",status=~"5.."}[5m]) > 0
        for: 2m
        labels:
          severity: critical
          service: symbols
        annotations:
          summary: "Symbols.Server error rate is elevated"
          description: "5xx responses detected for Symbols.Server"