mirror of
https://github.com/monitoring-mixins/website.git
synced 2024-12-15 17:50:48 +00:00
assets,site/content: daily assets regeneration
This commit is contained in:
parent
e579b5940a
commit
4f3c29e307
3 changed files with 128 additions and 14 deletions
|
@ -59,7 +59,7 @@
|
||||||
"steppedLine": false,
|
"steppedLine": false,
|
||||||
"targets": [
|
"targets": [
|
||||||
{
|
{
|
||||||
"expr": "sum(cortex_alertmanager_alerts{cluster=~\"$cluster\", job=~\"($namespace)/alertmanager\"})",
|
"expr": "sum(cluster_job_pod:cortex_alertmanager_alerts:sum{cluster=~\"$cluster\", job=~\"($namespace)/alertmanager\"})",
|
||||||
"format": "time_series",
|
"format": "time_series",
|
||||||
"instant": true,
|
"instant": true,
|
||||||
"intervalFactor": 2,
|
"intervalFactor": 2,
|
||||||
|
@ -135,7 +135,7 @@
|
||||||
"steppedLine": false,
|
"steppedLine": false,
|
||||||
"targets": [
|
"targets": [
|
||||||
{
|
{
|
||||||
"expr": "sum(cortex_alertmanager_silences{cluster=~\"$cluster\", job=~\"($namespace)/alertmanager\"})",
|
"expr": "sum(cluster_job_pod:cortex_alertmanager_silences:sum{cluster=~\"$cluster\", job=~\"($namespace)/alertmanager\"})",
|
||||||
"format": "time_series",
|
"format": "time_series",
|
||||||
"instant": true,
|
"instant": true,
|
||||||
"intervalFactor": 2,
|
"intervalFactor": 2,
|
||||||
|
@ -298,7 +298,7 @@
|
||||||
"steppedLine": false,
|
"steppedLine": false,
|
||||||
"targets": [
|
"targets": [
|
||||||
{
|
{
|
||||||
"expr": "sum(rate(cortex_alertmanager_alerts_received_total{cluster=~\"$cluster\", job=~\"($namespace)/alertmanager\"}[$__rate_interval]))\n-\nsum(rate(cortex_alertmanager_alerts_invalid_total{cluster=~\"$cluster\", job=~\"($namespace)/alertmanager\"}[$__rate_interval]))\n",
|
"expr": "sum(cluster_job:cortex_alertmanager_alerts_received_total:rate5m{cluster=~\"$cluster\", job=~\"($namespace)/alertmanager\"})\n-\nsum(cluster_job:cortex_alertmanager_alerts_invalid_total:rate5m{cluster=~\"$cluster\", job=~\"($namespace)/alertmanager\"})\n",
|
||||||
"format": "time_series",
|
"format": "time_series",
|
||||||
"interval": "15s",
|
"interval": "15s",
|
||||||
"intervalFactor": 2,
|
"intervalFactor": 2,
|
||||||
|
@ -307,7 +307,7 @@
|
||||||
"step": 10
|
"step": 10
|
||||||
},
|
},
|
||||||
{
|
{
|
||||||
"expr": "sum(rate(cortex_alertmanager_alerts_invalid_total{cluster=~\"$cluster\", job=~\"($namespace)/alertmanager\"}[$__rate_interval]))",
|
"expr": "sum(cluster_job:cortex_alertmanager_alerts_invalid_total:rate5m{cluster=~\"$cluster\", job=~\"($namespace)/alertmanager\"})",
|
||||||
"format": "time_series",
|
"format": "time_series",
|
||||||
"interval": "15s",
|
"interval": "15s",
|
||||||
"intervalFactor": 2,
|
"intervalFactor": 2,
|
||||||
|
@ -396,7 +396,7 @@
|
||||||
"steppedLine": false,
|
"steppedLine": false,
|
||||||
"targets": [
|
"targets": [
|
||||||
{
|
{
|
||||||
"expr": "sum(rate(cortex_alertmanager_notifications_total{cluster=~\"$cluster\", job=~\"($namespace)/alertmanager\"}[$__rate_interval]))\n-\nsum(rate(cortex_alertmanager_notifications_failed_total{cluster=~\"$cluster\", job=~\"($namespace)/alertmanager\"}[$__rate_interval]))\n",
|
"expr": "sum(cluster_job_integration:cortex_alertmanager_notifications_total:rate5m{cluster=~\"$cluster\", job=~\"($namespace)/alertmanager\"})\n-\nsum(cluster_job_integration:cortex_alertmanager_notifications_failed_total:rate5m{cluster=~\"$cluster\", job=~\"($namespace)/alertmanager\"})\n",
|
||||||
"format": "time_series",
|
"format": "time_series",
|
||||||
"interval": "15s",
|
"interval": "15s",
|
||||||
"intervalFactor": 2,
|
"intervalFactor": 2,
|
||||||
|
@ -405,7 +405,7 @@
|
||||||
"step": 10
|
"step": 10
|
||||||
},
|
},
|
||||||
{
|
{
|
||||||
"expr": "sum(rate(cortex_alertmanager_notifications_failed_total{cluster=~\"$cluster\", job=~\"($namespace)/alertmanager\"}[$__rate_interval]))",
|
"expr": "sum(cluster_job_integration:cortex_alertmanager_notifications_failed_total:rate5m{cluster=~\"$cluster\", job=~\"($namespace)/alertmanager\"})",
|
||||||
"format": "time_series",
|
"format": "time_series",
|
||||||
"interval": "15s",
|
"interval": "15s",
|
||||||
"intervalFactor": 2,
|
"intervalFactor": 2,
|
||||||
|
@ -482,7 +482,7 @@
|
||||||
"steppedLine": false,
|
"steppedLine": false,
|
||||||
"targets": [
|
"targets": [
|
||||||
{
|
{
|
||||||
"expr": "(\nsum(rate(cortex_alertmanager_notifications_total{cluster=~\"$cluster\", job=~\"($namespace)/alertmanager\"}[$__rate_interval])) by(integration)\n-\nsum(rate(cortex_alertmanager_notifications_failed_total{cluster=~\"$cluster\", job=~\"($namespace)/alertmanager\"}[$__rate_interval])) by(integration)\n) > 0\nor on () vector(0)\n",
|
"expr": "(\nsum(cluster_job_integration:cortex_alertmanager_notifications_total:rate5m{cluster=~\"$cluster\", job=~\"($namespace)/alertmanager\"}) by(integration)\n-\nsum(cluster_job_integration:cortex_alertmanager_notifications_failed_total:rate5m{cluster=~\"$cluster\", job=~\"($namespace)/alertmanager\"}) by(integration)\n) > 0\nor on () vector(0)\n",
|
||||||
"format": "time_series",
|
"format": "time_series",
|
||||||
"interval": "15s",
|
"interval": "15s",
|
||||||
"intervalFactor": 2,
|
"intervalFactor": 2,
|
||||||
|
@ -491,7 +491,7 @@
|
||||||
"step": 10
|
"step": 10
|
||||||
},
|
},
|
||||||
{
|
{
|
||||||
"expr": "sum(rate(cortex_alertmanager_notifications_failed_total{cluster=~\"$cluster\", job=~\"($namespace)/alertmanager\"}[$__rate_interval])) by(integration)",
|
"expr": "sum(cluster_job_integration:cortex_alertmanager_notifications_failed_total:rate5m{cluster=~\"$cluster\", job=~\"($namespace)/alertmanager\"}) by(integration)",
|
||||||
"format": "time_series",
|
"format": "time_series",
|
||||||
"interval": "15s",
|
"interval": "15s",
|
||||||
"intervalFactor": 2,
|
"intervalFactor": 2,
|
||||||
|
@ -1689,7 +1689,7 @@
|
||||||
"steppedLine": false,
|
"steppedLine": false,
|
||||||
"targets": [
|
"targets": [
|
||||||
{
|
{
|
||||||
"expr": "sum by(pod) (cortex_alertmanager_alerts{cluster=~\"$cluster\", job=~\"($namespace)/alertmanager\"})",
|
"expr": "sum by(pod) (cluster_job_pod:cortex_alertmanager_alerts:sum{cluster=~\"$cluster\", job=~\"($namespace)/alertmanager\"})",
|
||||||
"format": "time_series",
|
"format": "time_series",
|
||||||
"interval": "15s",
|
"interval": "15s",
|
||||||
"intervalFactor": 2,
|
"intervalFactor": 2,
|
||||||
|
@ -1766,7 +1766,7 @@
|
||||||
"steppedLine": false,
|
"steppedLine": false,
|
||||||
"targets": [
|
"targets": [
|
||||||
{
|
{
|
||||||
"expr": "sum by(pod) (cortex_alertmanager_silences{cluster=~\"$cluster\", job=~\"($namespace)/alertmanager\"})",
|
"expr": "sum by(pod) (cluster_job_pod:cortex_alertmanager_silences:sum{cluster=~\"$cluster\", job=~\"($namespace)/alertmanager\"})",
|
||||||
"format": "time_series",
|
"format": "time_series",
|
||||||
"interval": "15s",
|
"interval": "15s",
|
||||||
"intervalFactor": 2,
|
"intervalFactor": 2,
|
||||||
|
@ -2377,7 +2377,7 @@
|
||||||
"steppedLine": false,
|
"steppedLine": false,
|
||||||
"targets": [
|
"targets": [
|
||||||
{
|
{
|
||||||
"expr": "sum(rate(cortex_alertmanager_state_replication_total{cluster=~\"$cluster\", job=~\"($namespace)/alertmanager\"}[$__rate_interval]))\n-\nsum(rate(cortex_alertmanager_state_replication_failed_total{cluster=~\"$cluster\", job=~\"($namespace)/alertmanager\"}[$__rate_interval]))\n",
|
"expr": "sum(cluster_job:cortex_alertmanager_state_replication_total:rate5m{cluster=~\"$cluster\", job=~\"($namespace)/alertmanager\"})\n-\nsum(cluster_job:cortex_alertmanager_state_replication_failed_total:rate5m{cluster=~\"$cluster\", job=~\"($namespace)/alertmanager\"})\n",
|
||||||
"format": "time_series",
|
"format": "time_series",
|
||||||
"interval": "15s",
|
"interval": "15s",
|
||||||
"intervalFactor": 2,
|
"intervalFactor": 2,
|
||||||
|
@ -2386,7 +2386,7 @@
|
||||||
"step": 10
|
"step": 10
|
||||||
},
|
},
|
||||||
{
|
{
|
||||||
"expr": "sum(rate(cortex_alertmanager_state_replication_failed_total{cluster=~\"$cluster\", job=~\"($namespace)/alertmanager\"}[$__rate_interval]))",
|
"expr": "sum(cluster_job:cortex_alertmanager_state_replication_failed_total:rate5m{cluster=~\"$cluster\", job=~\"($namespace)/alertmanager\"})",
|
||||||
"format": "time_series",
|
"format": "time_series",
|
||||||
"interval": "15s",
|
"interval": "15s",
|
||||||
"intervalFactor": 2,
|
"intervalFactor": 2,
|
||||||
|
@ -2463,7 +2463,7 @@
|
||||||
"steppedLine": false,
|
"steppedLine": false,
|
||||||
"targets": [
|
"targets": [
|
||||||
{
|
{
|
||||||
"expr": "sum(rate(cortex_alertmanager_partial_state_merges_total{cluster=~\"$cluster\", job=~\"($namespace)/alertmanager\"}[$__rate_interval]))\n-\nsum(rate(cortex_alertmanager_partial_state_merges_failed_total{cluster=~\"$cluster\", job=~\"($namespace)/alertmanager\"}[$__rate_interval]))\n",
|
"expr": "sum(cluster_job:cortex_alertmanager_partial_state_merges_total:rate5m{cluster=~\"$cluster\", job=~\"($namespace)/alertmanager\"})\n-\nsum(cluster_job:cortex_alertmanager_partial_state_merges_failed_total:rate5m{cluster=~\"$cluster\", job=~\"($namespace)/alertmanager\"})\n",
|
||||||
"format": "time_series",
|
"format": "time_series",
|
||||||
"interval": "15s",
|
"interval": "15s",
|
||||||
"intervalFactor": 2,
|
"intervalFactor": 2,
|
||||||
|
@ -2472,7 +2472,7 @@
|
||||||
"step": 10
|
"step": 10
|
||||||
},
|
},
|
||||||
{
|
{
|
||||||
"expr": "sum(rate(cortex_alertmanager_partial_state_merges_failed_total{cluster=~\"$cluster\", job=~\"($namespace)/alertmanager\"}[$__rate_interval]))",
|
"expr": "sum(cluster_job:cortex_alertmanager_partial_state_merges_failed_total:rate5m{cluster=~\"$cluster\", job=~\"($namespace)/alertmanager\"})",
|
||||||
"format": "time_series",
|
"format": "time_series",
|
||||||
"interval": "15s",
|
"interval": "15s",
|
||||||
"intervalFactor": 2,
|
"intervalFactor": 2,
|
||||||
|
|
|
@ -659,3 +659,35 @@ groups:
|
||||||
labels:
|
labels:
|
||||||
reason: memory_usage
|
reason: memory_usage
|
||||||
record: cluster_namespace_deployment_reason:required_replicas:count
|
record: cluster_namespace_deployment_reason:required_replicas:count
|
||||||
|
- name: cortex_alertmanager_rules
|
||||||
|
rules:
|
||||||
|
- expr: |
|
||||||
|
sum by (cluster, job, pod) (cortex_alertmanager_alerts)
|
||||||
|
record: cluster_job_pod:cortex_alertmanager_alerts:sum
|
||||||
|
- expr: |
|
||||||
|
sum by (cluster, job, pod) (cortex_alertmanager_silences)
|
||||||
|
record: cluster_job_pod:cortex_alertmanager_silences:sum
|
||||||
|
- expr: |
|
||||||
|
sum by (cluster, job) (rate(cortex_alertmanager_alerts_received_total[5m]))
|
||||||
|
record: cluster_job:cortex_alertmanager_alerts_received_total:rate5m
|
||||||
|
- expr: |
|
||||||
|
sum by (cluster, job) (rate(cortex_alertmanager_alerts_invalid_total[5m]))
|
||||||
|
record: cluster_job:cortex_alertmanager_alerts_invalid_total:rate5m
|
||||||
|
- expr: |
|
||||||
|
sum by (cluster, job, integration) (rate(cortex_alertmanager_notifications_total[5m]))
|
||||||
|
record: cluster_job_integration:cortex_alertmanager_notifications_total:rate5m
|
||||||
|
- expr: |
|
||||||
|
sum by (cluster, job, integration) (rate(cortex_alertmanager_notifications_failed_total[5m]))
|
||||||
|
record: cluster_job_integration:cortex_alertmanager_notifications_failed_total:rate5m
|
||||||
|
- expr: |
|
||||||
|
sum by (cluster, job) (rate(cortex_alertmanager_state_replication_total[5m]))
|
||||||
|
record: cluster_job:cortex_alertmanager_state_replication_total:rate5m
|
||||||
|
- expr: |
|
||||||
|
sum by (cluster, job) (rate(cortex_alertmanager_state_replication_failed_total[5m]))
|
||||||
|
record: cluster_job:cortex_alertmanager_state_replication_failed_total:rate5m
|
||||||
|
- expr: |
|
||||||
|
sum by (cluster, job) (rate(cortex_alertmanager_partial_state_merges_total[5m]))
|
||||||
|
record: cluster_job:cortex_alertmanager_partial_state_merges_total:rate5m
|
||||||
|
- expr: |
|
||||||
|
sum by (cluster, job) (rate(cortex_alertmanager_partial_state_merges_failed_total[5m]))
|
||||||
|
record: cluster_job:cortex_alertmanager_partial_state_merges_failed_total:rate5m
|
||||||
|
|
|
@ -2446,6 +2446,88 @@ labels:
|
||||||
record: cluster_namespace_deployment_reason:required_replicas:count
|
record: cluster_namespace_deployment_reason:required_replicas:count
|
||||||
{{< /code >}}
|
{{< /code >}}
|
||||||
|
|
||||||
|
### cortex_alertmanager_rules
|
||||||
|
|
||||||
|
##### cluster_job_pod:cortex_alertmanager_alerts:sum
|
||||||
|
|
||||||
|
{{< code lang="yaml" >}}
|
||||||
|
expr: |
|
||||||
|
sum by (cluster, job, pod) (cortex_alertmanager_alerts)
|
||||||
|
record: cluster_job_pod:cortex_alertmanager_alerts:sum
|
||||||
|
{{< /code >}}
|
||||||
|
|
||||||
|
##### cluster_job_pod:cortex_alertmanager_silences:sum
|
||||||
|
|
||||||
|
{{< code lang="yaml" >}}
|
||||||
|
expr: |
|
||||||
|
sum by (cluster, job, pod) (cortex_alertmanager_silences)
|
||||||
|
record: cluster_job_pod:cortex_alertmanager_silences:sum
|
||||||
|
{{< /code >}}
|
||||||
|
|
||||||
|
##### cluster_job:cortex_alertmanager_alerts_received_total:rate5m
|
||||||
|
|
||||||
|
{{< code lang="yaml" >}}
|
||||||
|
expr: |
|
||||||
|
sum by (cluster, job) (rate(cortex_alertmanager_alerts_received_total[5m]))
|
||||||
|
record: cluster_job:cortex_alertmanager_alerts_received_total:rate5m
|
||||||
|
{{< /code >}}
|
||||||
|
|
||||||
|
##### cluster_job:cortex_alertmanager_alerts_invalid_total:rate5m
|
||||||
|
|
||||||
|
{{< code lang="yaml" >}}
|
||||||
|
expr: |
|
||||||
|
sum by (cluster, job) (rate(cortex_alertmanager_alerts_invalid_total[5m]))
|
||||||
|
record: cluster_job:cortex_alertmanager_alerts_invalid_total:rate5m
|
||||||
|
{{< /code >}}
|
||||||
|
|
||||||
|
##### cluster_job_integration:cortex_alertmanager_notifications_total:rate5m
|
||||||
|
|
||||||
|
{{< code lang="yaml" >}}
|
||||||
|
expr: |
|
||||||
|
sum by (cluster, job, integration) (rate(cortex_alertmanager_notifications_total[5m]))
|
||||||
|
record: cluster_job_integration:cortex_alertmanager_notifications_total:rate5m
|
||||||
|
{{< /code >}}
|
||||||
|
|
||||||
|
##### cluster_job_integration:cortex_alertmanager_notifications_failed_total:rate5m
|
||||||
|
|
||||||
|
{{< code lang="yaml" >}}
|
||||||
|
expr: |
|
||||||
|
sum by (cluster, job, integration) (rate(cortex_alertmanager_notifications_failed_total[5m]))
|
||||||
|
record: cluster_job_integration:cortex_alertmanager_notifications_failed_total:rate5m
|
||||||
|
{{< /code >}}
|
||||||
|
|
||||||
|
##### cluster_job:cortex_alertmanager_state_replication_total:rate5m
|
||||||
|
|
||||||
|
{{< code lang="yaml" >}}
|
||||||
|
expr: |
|
||||||
|
sum by (cluster, job) (rate(cortex_alertmanager_state_replication_total[5m]))
|
||||||
|
record: cluster_job:cortex_alertmanager_state_replication_total:rate5m
|
||||||
|
{{< /code >}}
|
||||||
|
|
||||||
|
##### cluster_job:cortex_alertmanager_state_replication_failed_total:rate5m
|
||||||
|
|
||||||
|
{{< code lang="yaml" >}}
|
||||||
|
expr: |
|
||||||
|
sum by (cluster, job) (rate(cortex_alertmanager_state_replication_failed_total[5m]))
|
||||||
|
record: cluster_job:cortex_alertmanager_state_replication_failed_total:rate5m
|
||||||
|
{{< /code >}}
|
||||||
|
|
||||||
|
##### cluster_job:cortex_alertmanager_partial_state_merges_total:rate5m
|
||||||
|
|
||||||
|
{{< code lang="yaml" >}}
|
||||||
|
expr: |
|
||||||
|
sum by (cluster, job) (rate(cortex_alertmanager_partial_state_merges_total[5m]))
|
||||||
|
record: cluster_job:cortex_alertmanager_partial_state_merges_total:rate5m
|
||||||
|
{{< /code >}}
|
||||||
|
|
||||||
|
##### cluster_job:cortex_alertmanager_partial_state_merges_failed_total:rate5m
|
||||||
|
|
||||||
|
{{< code lang="yaml" >}}
|
||||||
|
expr: |
|
||||||
|
sum by (cluster, job) (rate(cortex_alertmanager_partial_state_merges_failed_total[5m]))
|
||||||
|
record: cluster_job:cortex_alertmanager_partial_state_merges_failed_total:rate5m
|
||||||
|
{{< /code >}}
|
||||||
|
|
||||||
## Dashboards
|
## Dashboards
|
||||||
Following dashboards are generated from mixins and hosted on github:
|
Following dashboards are generated from mixins and hosted on github:
|
||||||
|
|
||||||
|
|
Loading…
Reference in a new issue