---
# Prometheus alerting rules for the functional-scaffold service.
# Each rule fires only after its `expr` has held continuously for the
# duration given in `for`.
groups:
  - name: functional_scaffold_alerts
    # Evaluation interval for every rule in this group.
    interval: 30s
    rules:
      # Per-second rate of requests labelled status="error", averaged over
      # 5 minutes, above 0.05 requests/sec.
      # NOTE(review): the description reads `$labels.endpoint`; confirm that
      # http_requests_total carries an `endpoint` label.
      - alert: HighErrorRate
        expr: rate(http_requests_total{status="error"}[5m]) > 0.05
        for: 5m
        labels:
          severity: warning
        annotations:
          summary: "High error rate detected"
          description: "Error rate is {{ $value }} requests/sec for {{ $labels.endpoint }}"

      # 95th-percentile request duration, estimated from the histogram
      # buckets over 5 minutes, above 1 second.
      # NOTE(review): the description reads `$labels.endpoint`; confirm that
      # the bucket series carry an `endpoint` label.
      - alert: HighLatency
        expr: histogram_quantile(0.95, rate(http_request_duration_seconds_bucket[5m])) > 1
        for: 5m
        labels:
          severity: warning
        annotations:
          summary: "High latency detected"
          description: "P95 latency is {{ $value }}s for {{ $labels.endpoint }}"

      # The scrape target for job "functional-scaffold" reports up == 0.
      # This matches only targets that exist and fail their scrape; it does
      # not fire if the `up` series is absent altogether.
      - alert: ServiceDown
        expr: up{job="functional-scaffold"} == 0
        for: 1m
        labels:
          severity: critical
        annotations:
          summary: "Service is down"
          description: "FunctionalScaffold service has been down for more than 1 minute"

      # Container memory usage above 90% of its configured limit.
      # The `> 0` filter on the divisor drops limit series whose value is 0
      # (commonly reported for containers with no memory limit); without it
      # the ratio would be +Inf and the alert would fire spuriously.
      - alert: HighMemoryUsage
        expr: >-
          container_memory_usage_bytes{container="functional-scaffold"}
          / (container_spec_memory_limit_bytes{container="functional-scaffold"} > 0)
          > 0.9
        for: 5m
        labels:
          severity: warning
        annotations:
          summary: "High memory usage"
          description: "Memory usage is {{ $value | humanizePercentage }} of limit"