|
6 | 6 | rules: [
|
7 | 7 | {
|
8 | 8 | alert: 'LokiRequestErrors',
|
9 |
| - expr: std.strReplace(||| |
10 |
| - 100 * sum(rate(loki_request_duration_seconds_count{status_code=~"5.."}[2m])) by (cluster, namespace, job, route) |
| 9 | + expr: ||| |
| 10 | + 100 * sum(rate(loki_request_duration_seconds_count{status_code=~"5.."}[2m])) by (%(group_by_cluster)s, job, route) |
11 | 11 | /
|
12 |
| - sum(rate(loki_request_duration_seconds_count[2m])) by (cluster, namespace, job, route) |
| 12 | + sum(rate(loki_request_duration_seconds_count[2m])) by (%(group_by_cluster)s, job, route) |
13 | 13 | > 10
|
14 |
| - |||, 'cluster', $._config.per_cluster_label), |
| 14 | + ||| % $._config, |
15 | 15 | 'for': '15m',
|
16 | 16 | labels: {
|
17 | 17 | severity: 'critical',
|
|
26 | 26 | {
|
27 | 27 | alert: 'LokiRequestPanics',
|
28 | 28 | expr: |||
|
29 |
| - sum(increase(loki_panic_total[10m])) by (%s, namespace, job) > 0 |
30 |
| - ||| % $._config.per_cluster_label, |
| 29 | + sum(increase(loki_panic_total[10m])) by (%(group_by_cluster)s, job) > 0 |
| 30 | + ||| % $._config, |
31 | 31 | labels: {
|
32 | 32 | severity: 'critical',
|
33 | 33 | },
|
|
41 | 41 | {
|
42 | 42 | alert: 'LokiRequestLatency',
|
43 | 43 | expr: |||
|
44 |
| - %s_namespace_job_route:loki_request_duration_seconds:99quantile{route!~"(?i).*tail.*|/schedulerpb.SchedulerForQuerier/QuerierLoop"} > 1 |
45 |
| - ||| % $._config.per_cluster_label, |
| 44 | + %(group_prefix_jobs)s_route:loki_request_duration_seconds:99quantile{route!~"(?i).*tail.*|/schedulerpb.SchedulerForQuerier/QuerierLoop"} > 1 |
| 45 | + ||| % $._config, |
46 | 46 | 'for': '15m',
|
47 | 47 | labels: {
|
48 | 48 | severity: 'critical',
|
|
57 | 57 | {
|
58 | 58 | alert: 'LokiTooManyCompactorsRunning',
|
59 | 59 | expr: |||
|
60 |
| - sum(loki_boltdb_shipper_compactor_running) by (%s, namespace) > 1 |
61 |
| - ||| % $._config.per_cluster_label, |
| 60 | + sum(loki_boltdb_shipper_compactor_running) by (%(group_by_cluster)s) > 1 |
| 61 | + ||| % $._config, |
62 | 62 | 'for': '5m',
|
63 | 63 | labels: {
|
64 | 64 | severity: 'warning',
|
|
0 commit comments