1
0
Fork 0
mirror of https://github.com/monitoring-mixins/website.git synced 2024-12-14 11:37:31 +00:00

assets,site/content: daily assets regeneration

This commit is contained in:
github-actions[bot] 2020-10-29 03:26:42 +00:00
parent 0cf29f33c3
commit a38aa71564
2 changed files with 120 additions and 97 deletions

View file

@ -308,7 +308,7 @@ groups:
summary: Thanos Store has high latency for store series gate requests.
expr: |
(
histogram_quantile(0.9, sum by (job, le) (rate(thanos_bucket_store_series_gate_duration_seconds_bucket{job=~"thanos-store.*"}[5m]))) > 2
histogram_quantile(0.99, sum by (job, le) (rate(thanos_bucket_store_series_gate_duration_seconds_bucket{job=~"thanos-store.*"}[5m]))) > 2
and
sum by (job) (rate(thanos_bucket_store_series_gate_duration_seconds_count{job=~"thanos-store.*"}[5m])) > 0
)
@ -337,7 +337,7 @@ groups:
summary: Thanos Store is having high latency for bucket operations.
expr: |
(
histogram_quantile(0.9, sum by (job, le) (rate(thanos_objstore_bucket_operation_duration_seconds_bucket{job=~"thanos-store.*"}[5m]))) > 2
histogram_quantile(0.99, sum by (job, le) (rate(thanos_objstore_bucket_operation_duration_seconds_bucket{job=~"thanos-store.*"}[5m]))) > 2
and
sum by (job) (rate(thanos_objstore_bucket_operation_duration_seconds_count{job=~"thanos-store.*"}[5m])) > 0
)
@ -483,8 +483,56 @@ groups:
for: 3m
labels:
severity: critical
- name: thanos-bucket-replicate.rules
rules:
- alert: ThanosBucketReplicateIsDown
annotations:
description: Thanos Replicate has disappeared from Prometheus target discovery.
summary: Thanos Replicate has disappeared from Prometheus target discovery.
expr: |
absent(up{job=~"thanos-bucket-replicate.*"})
for: 5m
labels:
severity: critical
- alert: ThanosBucketReplicateErrorRate
annotations:
description: Thanos Replicate failing to run, {{ $value | humanize }}% of attempts
failed.
summary: Thanose Replicate is failing to run.
expr: |
(
sum(rate(thanos_replicate_replication_runs_total{result="error", job=~"thanos-bucket-replicate.*"}[5m]))
/ on (namespace) group_left
sum(rate(thanos_replicate_replication_runs_total{job=~"thanos-bucket-replicate.*"}[5m]))
) * 100 >= 10
for: 5m
labels:
severity: critical
- alert: ThanosBucketReplicateRunLatency
annotations:
description: Thanos Replicate {{$labels.job}} has a 99th percentile latency
of {{ $value }} seconds for the replicate operations.
summary: Thanos Replicate has a high latency for replicate operations.
expr: |
(
histogram_quantile(0.99, sum by (job, le) (rate(thanos_replicate_replication_run_duration_seconds_bucket{job=~"thanos-bucket-replicate.*"}[5m]))) > 20
and
sum by (job) (rate(thanos_replicate_replication_run_duration_seconds_bucket{job=~"thanos-bucket-replicate.*"}[5m])) > 0
)
for: 5m
labels:
severity: critical
- name: thanos-component-absent.rules
rules:
- alert: ThanosBucketReplicateIsDown
annotations:
description: ThanosBucketReplicate has disappeared from Prometheus target discovery.
summary: thanos component has disappeared from Prometheus target discovery.
expr: |
absent(up{job=~"thanos-bucket-replicate.*"} == 1)
for: 5m
labels:
severity: critical
- alert: ThanosCompactIsDown
annotations:
description: ThanosCompact has disappeared from Prometheus target discovery.
@ -539,42 +587,3 @@ groups:
for: 5m
labels:
severity: critical
- name: thanos-bucket-replicate.rules
rules:
- alert: ThanosBucketReplicateIsDown
annotations:
description: Thanos Replicate has disappeared from Prometheus target discovery.
summary: Thanos Replicate has disappeared from Prometheus target discovery.
expr: |
absent(up{job=~"thanos-bucket-replicate.*"})
for: 5m
labels:
severity: critical
- alert: ThanosBucketReplicateErrorRate
annotations:
description: Thanos Replicate failing to run, {{ $value | humanize }}% of attempts
failed.
summary: Thanose Replicate is failing to run.
expr: |
(
sum(rate(thanos_replicate_replication_runs_total{result="error", job=~"thanos-bucket-replicate.*"}[5m]))
/ on (namespace) group_left
sum(rate(thanos_replicate_replication_runs_total{job=~"thanos-bucket-replicate.*"}[5m]))
) * 100 >= 10
for: 5m
labels:
severity: critical
- alert: ThanosBucketReplicateRunLatency
annotations:
description: Thanos Replicate {{$labels.job}} has a 99th percentile latency
of {{ $value }} seconds for the replicate operations.
summary: Thanos Replicate has a high latency for replicate operations.
expr: |
(
histogram_quantile(0.9, sum by (job, le) (rate(thanos_replicate_replication_run_duration_seconds_bucket{job=~"thanos-bucket-replicate.*"}[5m]))) > 20
and
sum by (job) (rate(thanos_replicate_replication_run_duration_seconds_bucket{job=~"thanos-bucket-replicate.*"}[5m])) > 0
)
for: 5m
labels:
severity: critical

View file

@ -436,7 +436,7 @@ annotations:
summary: Thanos Store has high latency for store series gate requests.
expr: |
(
histogram_quantile(0.9, sum by (job, le) (rate(thanos_bucket_store_series_gate_duration_seconds_bucket{job=~"thanos-store.*"}[5m]))) > 2
histogram_quantile(0.99, sum by (job, le) (rate(thanos_bucket_store_series_gate_duration_seconds_bucket{job=~"thanos-store.*"}[5m]))) > 2
and
sum by (job) (rate(thanos_bucket_store_series_gate_duration_seconds_count{job=~"thanos-store.*"}[5m])) > 0
)
@ -475,7 +475,7 @@ annotations:
summary: Thanos Store is having high latency for bucket operations.
expr: |
(
histogram_quantile(0.9, sum by (job, le) (rate(thanos_objstore_bucket_operation_duration_seconds_bucket{job=~"thanos-store.*"}[5m]))) > 2
histogram_quantile(0.99, sum by (job, le) (rate(thanos_objstore_bucket_operation_duration_seconds_bucket{job=~"thanos-store.*"}[5m]))) > 2
and
sum by (job) (rate(thanos_objstore_bucket_operation_duration_seconds_count{job=~"thanos-store.*"}[5m])) > 0
)
@ -682,8 +682,76 @@ labels:
severity: critical
{{< /code >}}
### thanos-bucket-replicate.rules
##### ThanosBucketReplicateIsDown
{{< code lang="yaml" >}}
alert: ThanosBucketReplicateIsDown
annotations:
description: Thanos Replicate has disappeared from Prometheus target discovery.
summary: Thanos Replicate has disappeared from Prometheus target discovery.
expr: |
absent(up{job=~"thanos-bucket-replicate.*"})
for: 5m
labels:
severity: critical
{{< /code >}}
##### ThanosBucketReplicateErrorRate
{{< code lang="yaml" >}}
alert: ThanosBucketReplicateErrorRate
annotations:
description: Thanos Replicate failing to run, {{ $value | humanize }}% of attempts
failed.
summary: Thanose Replicate is failing to run.
expr: |
(
sum(rate(thanos_replicate_replication_runs_total{result="error", job=~"thanos-bucket-replicate.*"}[5m]))
/ on (namespace) group_left
sum(rate(thanos_replicate_replication_runs_total{job=~"thanos-bucket-replicate.*"}[5m]))
) * 100 >= 10
for: 5m
labels:
severity: critical
{{< /code >}}
##### ThanosBucketReplicateRunLatency
{{< code lang="yaml" >}}
alert: ThanosBucketReplicateRunLatency
annotations:
description: Thanos Replicate {{$labels.job}} has a 99th percentile latency of {{
$value }} seconds for the replicate operations.
summary: Thanos Replicate has a high latency for replicate operations.
expr: |
(
histogram_quantile(0.99, sum by (job, le) (rate(thanos_replicate_replication_run_duration_seconds_bucket{job=~"thanos-bucket-replicate.*"}[5m]))) > 20
and
sum by (job) (rate(thanos_replicate_replication_run_duration_seconds_bucket{job=~"thanos-bucket-replicate.*"}[5m])) > 0
)
for: 5m
labels:
severity: critical
{{< /code >}}
### thanos-component-absent.rules
##### ThanosBucketReplicateIsDown
{{< code lang="yaml" >}}
alert: ThanosBucketReplicateIsDown
annotations:
description: ThanosBucketReplicate has disappeared from Prometheus target discovery.
summary: thanos component has disappeared from Prometheus target discovery.
expr: |
absent(up{job=~"thanos-bucket-replicate.*"} == 1)
for: 5m
labels:
severity: critical
{{< /code >}}
##### ThanosCompactIsDown
{{< code lang="yaml" >}}
@ -768,60 +836,6 @@ labels:
severity: critical
{{< /code >}}
### thanos-bucket-replicate.rules
##### ThanosBucketReplicateIsDown
{{< code lang="yaml" >}}
alert: ThanosBucketReplicateIsDown
annotations:
description: Thanos Replicate has disappeared from Prometheus target discovery.
summary: Thanos Replicate has disappeared from Prometheus target discovery.
expr: |
absent(up{job=~"thanos-bucket-replicate.*"})
for: 5m
labels:
severity: critical
{{< /code >}}
##### ThanosBucketReplicateErrorRate
{{< code lang="yaml" >}}
alert: ThanosBucketReplicateErrorRate
annotations:
description: Thanos Replicate failing to run, {{ $value | humanize }}% of attempts
failed.
summary: Thanose Replicate is failing to run.
expr: |
(
sum(rate(thanos_replicate_replication_runs_total{result="error", job=~"thanos-bucket-replicate.*"}[5m]))
/ on (namespace) group_left
sum(rate(thanos_replicate_replication_runs_total{job=~"thanos-bucket-replicate.*"}[5m]))
) * 100 >= 10
for: 5m
labels:
severity: critical
{{< /code >}}
##### ThanosBucketReplicateRunLatency
{{< code lang="yaml" >}}
alert: ThanosBucketReplicateRunLatency
annotations:
description: Thanos Replicate {{$labels.job}} has a 99th percentile latency of {{
$value }} seconds for the replicate operations.
summary: Thanos Replicate has a high latency for replicate operations.
expr: |
(
histogram_quantile(0.9, sum by (job, le) (rate(thanos_replicate_replication_run_duration_seconds_bucket{job=~"thanos-bucket-replicate.*"}[5m]))) > 20
and
sum by (job) (rate(thanos_replicate_replication_run_duration_seconds_bucket{job=~"thanos-bucket-replicate.*"}[5m])) > 0
)
for: 5m
labels:
severity: critical
{{< /code >}}
## Recording rules
{{< panel style="warning" >}}