| - alert: LokiRequestErrors |
| {{ $labels.job }} {{ $labels.route }} is experiencing {{ printf "%.2f" $value }}% errors. |
| 100 * sum(rate(loki_request_duration_seconds_count{status_code=~"5.."}[2m])) by (namespace, job, route) / |
| sum(rate(loki_request_duration_seconds_count[2m])) by (namespace, job, route) > 10 |
| - alert: LokiRequestPanics |
| {{ $labels.job }} is experiencing an increase of {{ printf "%.2f" $value }} panics over the last 10m. |
| sum(increase(loki_panic_total[10m])) by (namespace, job) > 0 |
| - alert: LokiRequestLatency |
| {{ $labels.job }} {{ $labels.route }} is experiencing {{ printf "%.2f" $value }}s 99th percentile latency. |
| namespace_job_route:loki_request_duration_seconds:99quantile{route!~"(?i).*tail.*"} > 1 |
| - alert: LokiTooManyCompactorsRunning |
| {{ $labels.cluster }} {{ $labels.namespace }} has had {{ printf "%.0f" $value }} compactors running for more than 5m. Only one compactor should run at a time. |
| sum(loki_boltdb_shipper_compactor_running) by (namespace, cluster) > 1 |
| - name: 'loki_canaries_alerts' |
| - alert: 'LokiCanaryLatency' |
| {{ $labels.job }} is experiencing {{ printf "%.2f" $value }}s 99th percentile latency. |
| histogram_quantile(0.99, sum(rate(loki_canary_response_latency_seconds_bucket[5m])) by (le, namespace, job)) > 5 |