1
0
Fork 0
mirror of https://github.com/monitoring-mixins/website.git synced 2024-12-14 11:37:31 +00:00

assets,site/content: daily assets regeneration

This commit is contained in:
github-actions[bot] 2021-01-06 03:45:40 +00:00
parent 267cb741c5
commit fcebd26f4e
8 changed files with 612 additions and 34 deletions

View file

@ -432,6 +432,23 @@ groups:
for: 5m
labels:
severity: critical
- alert: CortexBucketIndexNotUpdated
annotations:
message: Cortex bucket index for tenant {{ $labels.user }} in {{ $labels.namespace
}} has not been updated since {{ $value | humanizeDuration }}.
expr: |
min by(namespace, user) (time() - cortex_bucket_index_last_successful_update_timestamp_seconds) > 7200
labels:
severity: critical
- alert: CortexTenantHasPartialBlocks
annotations:
message: Cortex tenant {{ $labels.user }} in {{ $labels.namespace }} has {{
$value }} partial blocks.
expr: |
max by(namespace, user) (cortex_bucket_blocks_partials_count) > 0
for: 6h
labels:
severity: warning
- name: cortex_compactor_alerts
rules:
- alert: CortexCompactorHasNotSuccessfullyCleanedUpBlocks

View file

@ -614,7 +614,7 @@
"format": "time_series",
"interval": "1m",
"intervalFactor": 2,
"legendFormat": "{{instance}}",
"legendFormat": "{{pod}}",
"legendLink": null,
"step": 10
}

View file

@ -242,11 +242,11 @@
"steppedLine": false,
"targets": [
{
"expr": "sum by(instance) (go_memstats_heap_inuse_bytes{cluster=~\"$cluster\", job=~\"($namespace)/compactor\"})",
"expr": "sum by(pod) (go_memstats_heap_inuse_bytes{cluster=~\"$cluster\", job=~\"($namespace)/compactor\"})",
"format": "time_series",
"interval": "1m",
"intervalFactor": 2,
"legendFormat": "{{instance}}",
"legendFormat": "{{pod}}",
"legendLink": null,
"step": 10
}
@ -497,7 +497,7 @@
"steppedLine": false,
"targets": [
{
"expr": "sum by(instance, device) (rate(node_disk_written_bytes_total[$__rate_interval])) + ignoring(pod) group_right() (label_replace(count by(pod, instance, device) (container_fs_writes_bytes_total{cluster=~\"$cluster\", namespace=~\"$namespace\",container=\"compactor\",device!~\".*sda.*\"}), \"device\", \"$1\", \"device\", \"/dev/(.*)\") * 0)\n",
"expr": "sum by(pod, device) (rate(node_disk_written_bytes_total[$__rate_interval])) + ignoring(pod) group_right() (label_replace(count by(pod, device) (container_fs_writes_bytes_total{cluster=~\"$cluster\", namespace=~\"$namespace\",container=\"compactor\",device!~\".*sda.*\"}), \"device\", \"$1\", \"device\", \"/dev/(.*)\") * 0)\n",
"format": "time_series",
"interval": "1m",
"intervalFactor": 2,
@ -574,7 +574,7 @@
"steppedLine": false,
"targets": [
{
"expr": "sum by(instance, device) (rate(node_disk_read_bytes_total[$__rate_interval])) + ignoring(pod) group_right() (label_replace(count by(pod, instance, device) (container_fs_writes_bytes_total{cluster=~\"$cluster\", namespace=~\"$namespace\",container=\"compactor\",device!~\".*sda.*\"}), \"device\", \"$1\", \"device\", \"/dev/(.*)\") * 0)\n",
"expr": "sum by(pod, device) (rate(node_disk_read_bytes_total[$__rate_interval])) + ignoring(pod) group_right() (label_replace(count by(pod, device) (container_fs_writes_bytes_total{cluster=~\"$cluster\", namespace=~\"$namespace\",container=\"compactor\",device!~\".*sda.*\"}), \"device\", \"$1\", \"device\", \"/dev/(.*)\") * 0)\n",
"format": "time_series",
"interval": "1m",
"intervalFactor": 2,

View file

@ -172,7 +172,7 @@
"format": "time_series",
"interval": "1m",
"intervalFactor": 2,
"legendFormat": "{{instance}}",
"legendFormat": "{{pod}}",
"legendLink": null,
"step": 10
}

View file

@ -252,7 +252,7 @@
"format": "time_series",
"interval": "1m",
"intervalFactor": 2,
"legendFormat": "{{cluster}} / {{namespace}} / {{instance}}",
"legendFormat": "{{cluster}} / {{namespace}} / {{pod}}",
"legendLink": null,
"step": 10
}
@ -436,7 +436,7 @@
"format": "time_series",
"interval": "1m",
"intervalFactor": 2,
"legendFormat": "{{cluster}} / {{namespace}} / {{instance}}",
"legendFormat": "{{cluster}} / {{namespace}} / {{pod}}",
"legendLink": null,
"step": 10
}
@ -2361,6 +2361,297 @@
"span": 4,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "max(cortex_bucket_index_loaded{cluster=~\"$cluster\", job=~\"($namespace)/(querier|cortex$)\"})",
"format": "time_series",
"interval": "1m",
"intervalFactor": 2,
"legendFormat": "Max",
"legendLink": null,
"step": 10
},
{
"expr": "min(cortex_bucket_index_loaded{cluster=~\"$cluster\", job=~\"($namespace)/(querier|cortex$)\"})",
"format": "time_series",
"interval": "1m",
"intervalFactor": 2,
"legendFormat": "Min",
"legendLink": null,
"step": 10
},
{
"expr": "avg(cortex_bucket_index_loaded{cluster=~\"$cluster\", job=~\"($namespace)/(querier|cortex$)\"})",
"format": "time_series",
"interval": "1m",
"intervalFactor": 2,
"legendFormat": "Average",
"legendLink": null,
"step": 10
}
],
"thresholds": [ ],
"timeFrom": null,
"timeShift": null,
"title": "Bucket indexes loaded (per querier)",
"tooltip": {
"shared": true,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": [ ]
},
"yaxes": [
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": 0,
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
]
},
{
"aliasColors": {
"failed": "#E24D42",
"successful": "#7EB26D"
},
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "$datasource",
"fill": 10,
"id": 28,
"legend": {
"avg": false,
"current": false,
"max": false,
"min": false,
"show": true,
"total": false,
"values": false
},
"lines": true,
"linewidth": 0,
"links": [ ],
"nullPointMode": "null as zero",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [ ],
"spaceLength": 10,
"span": 4,
"stack": true,
"steppedLine": false,
"targets": [
{
"expr": "sum(rate(cortex_bucket_index_loads_total{cluster=~\"$cluster\", job=~\"($namespace)/(querier|cortex$)\"}[$__rate_interval])) - sum(rate(cortex_bucket_index_load_failures_total{cluster=~\"$cluster\", job=~\"($namespace)/(querier|cortex$)\"}[$__rate_interval]))",
"format": "time_series",
"interval": "1m",
"intervalFactor": 2,
"legendFormat": "successful",
"legendLink": null,
"step": 10
},
{
"expr": "sum(rate(cortex_bucket_index_load_failures_total{cluster=~\"$cluster\", job=~\"($namespace)/(querier|cortex$)\"}[$__rate_interval]))",
"format": "time_series",
"interval": "1m",
"intervalFactor": 2,
"legendFormat": "failed",
"legendLink": null,
"step": 10
}
],
"thresholds": [ ],
"timeFrom": null,
"timeShift": null,
"title": "Bucket indexes load / sec",
"tooltip": {
"shared": true,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": [ ]
},
"yaxes": [
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": 0,
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
]
},
{
"aliasColors": { },
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "$datasource",
"fill": 1,
"id": 29,
"legend": {
"avg": false,
"current": false,
"max": false,
"min": false,
"show": true,
"total": false,
"values": false
},
"lines": true,
"linewidth": 1,
"links": [ ],
"nullPointMode": "null as zero",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [ ],
"spaceLength": 10,
"span": 4,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "histogram_quantile(0.99, sum(rate(cortex_bucket_index_load_duration_seconds_bucket{cluster=~\"$cluster\", job=~\"($namespace)/(querier|cortex$)\"}[$__interval])) by (le)) * 1e3",
"format": "time_series",
"interval": "1m",
"intervalFactor": 2,
"legendFormat": "99th Percentile",
"refId": "A",
"step": 10
},
{
"expr": "histogram_quantile(0.50, sum(rate(cortex_bucket_index_load_duration_seconds_bucket{cluster=~\"$cluster\", job=~\"($namespace)/(querier|cortex$)\"}[$__interval])) by (le)) * 1e3",
"format": "time_series",
"interval": "1m",
"intervalFactor": 2,
"legendFormat": "50th Percentile",
"refId": "B",
"step": 10
},
{
"expr": "sum(rate(cortex_bucket_index_load_duration_seconds_sum{cluster=~\"$cluster\", job=~\"($namespace)/(querier|cortex$)\"}[$__interval])) * 1e3 / sum(rate(cortex_bucket_index_load_duration_seconds_count{cluster=~\"$cluster\", job=~\"($namespace)/(querier|cortex$)\"}[$__interval]))",
"format": "time_series",
"interval": "1m",
"intervalFactor": 2,
"legendFormat": "Average",
"refId": "C",
"step": 10
}
],
"thresholds": [ ],
"timeFrom": null,
"timeShift": null,
"title": "Bucket indexes load latency",
"tooltip": {
"shared": true,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": [ ]
},
"yaxes": [
{
"format": "ms",
"label": null,
"logBase": 1,
"max": null,
"min": 0,
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
]
}
],
"repeat": null,
"repeatIteration": null,
"repeatRowId": null,
"showTitle": true,
"title": "",
"titleSize": "h6"
},
{
"collapse": false,
"height": "250px",
"panels": [
{
"aliasColors": { },
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "$datasource",
"fill": 1,
"id": 30,
"legend": {
"avg": false,
"current": false,
"max": false,
"min": false,
"show": true,
"total": false,
"values": false
},
"lines": true,
"linewidth": 1,
"links": [ ],
"nullPointMode": "null as zero",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [ ],
"spaceLength": 10,
"span": 4,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "sum(rate(cortex_bucket_store_series_blocks_queried_sum{component=\"store-gateway\",cluster=~\"$cluster\", job=~\"($namespace)/(store-gateway|cortex$)\"}[$__rate_interval]))",
@ -2415,7 +2706,7 @@
"dashes": false,
"datasource": "$datasource",
"fill": 10,
"id": 28,
"id": 31,
"legend": {
"avg": false,
"current": false,
@ -2492,7 +2783,7 @@
"dashes": false,
"datasource": "$datasource",
"fill": 10,
"id": 29,
"id": 32,
"legend": {
"avg": false,
"current": false,
@ -2567,7 +2858,7 @@
"repeatIteration": null,
"repeatRowId": null,
"showTitle": true,
"title": "Store-gateway - Blocks",
"title": "Store-gateway - Blocks storage",
"titleSize": "h6"
},
{
@ -2581,7 +2872,7 @@
"dashes": false,
"datasource": "$datasource",
"fill": 1,
"id": 30,
"id": 33,
"legend": {
"avg": false,
"current": false,
@ -2676,7 +2967,7 @@
"dashes": false,
"datasource": "$datasource",
"fill": 1,
"id": 31,
"id": 34,
"legend": {
"avg": false,
"current": false,
@ -2771,7 +3062,7 @@
"dashes": false,
"datasource": "$datasource",
"fill": 1,
"id": 32,
"id": 35,
"legend": {
"avg": false,
"current": false,
@ -2860,7 +3151,7 @@
"dashes": false,
"datasource": "$datasource",
"fill": 1,
"id": 33,
"id": 36,
"legend": {
"avg": false,
"current": false,
@ -2889,7 +3180,7 @@
"format": "time_series",
"interval": "1m",
"intervalFactor": 2,
"legendFormat": "{{instance}}",
"legendFormat": "{{pod}}",
"legendLink": null,
"step": 10
}
@ -2940,7 +3231,7 @@
"dashes": false,
"datasource": "$datasource",
"fill": 10,
"id": 34,
"id": 37,
"legend": {
"avg": false,
"current": false,
@ -3029,7 +3320,7 @@
"dashes": false,
"datasource": "$datasource",
"fill": 10,
"id": 35,
"id": 38,
"legend": {
"avg": false,
"current": false,
@ -3127,7 +3418,7 @@
"dashes": false,
"datasource": "$datasource",
"fill": 1,
"id": 36,
"id": 39,
"legend": {
"avg": false,
"current": false,
@ -3156,7 +3447,7 @@
"format": "time_series",
"interval": "1m",
"intervalFactor": 2,
"legendFormat": "{{instance}}",
"legendFormat": "{{pod}}",
"legendLink": null,
"step": 10
}
@ -3204,7 +3495,7 @@
"dashes": false,
"datasource": "$datasource",
"fill": 1,
"id": 37,
"id": 40,
"legend": {
"avg": false,
"current": false,

View file

@ -471,7 +471,7 @@
"format": "time_series",
"interval": "1m",
"intervalFactor": 2,
"legendFormat": "{{instance}}-creation",
"legendFormat": "{{pod}}-creation",
"legendLink": null,
"step": 10
},
@ -480,7 +480,7 @@
"format": "time_series",
"interval": "1m",
"intervalFactor": 2,
"legendFormat": "{{instance}}-deletion",
"legendFormat": "{{pod}}-deletion",
"legendLink": null,
"step": 10
}
@ -557,7 +557,7 @@
"format": "time_series",
"interval": "1m",
"intervalFactor": 2,
"legendFormat": "{{instance}}-creation",
"legendFormat": "{{pod}}-creation",
"legendLink": null,
"step": 10
},
@ -566,7 +566,7 @@
"format": "time_series",
"interval": "1m",
"intervalFactor": 2,
"legendFormat": "{{instance}}-deletion",
"legendFormat": "{{pod}}-deletion",
"legendLink": null,
"step": 10
}

View file

@ -616,7 +616,7 @@
"dashLength": 10,
"dashes": false,
"datasource": "$datasource",
"description": "Shows rate of execution for all meta files from blocks in the bucket into the memory.",
"description": "Shows deletion rate of blocks already marked for deletion.",
"fill": 10,
"id": 8,
"legend": {
@ -641,6 +641,249 @@
"span": 4,
"stack": true,
"steppedLine": false,
"targets": [
{
"expr": "sum(rate(thanos_compact_blocks_cleaned_total{namespace=\"$namespace\",job=~\"$job\"}[$interval])) by (job)",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "Blocks cleanup {{job}}",
"legendLink": null,
"step": 10
}
],
"thresholds": [ ],
"timeFrom": null,
"timeShift": null,
"title": "Deletion Rate",
"tooltip": {
"shared": false,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": [ ]
},
"yaxes": [
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": 0,
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
]
},
{
"aliasColors": { },
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "$datasource",
"description": "Shows deletion failures rate of blocks already marked for deletion.",
"fill": 1,
"id": 9,
"legend": {
"avg": false,
"current": false,
"max": false,
"min": false,
"show": true,
"total": false,
"values": false
},
"lines": true,
"linewidth": 1,
"links": [ ],
"nullPointMode": "null as zero",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [ ],
"spaceLength": 10,
"span": 4,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "sum(rate(thanos_compact_block_cleanup_failures_total{namespace=\"$namespace\",job=~\"$job\"}[$interval])) by (job)",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "Blocks cleanup failures {{job}}",
"legendLink": null,
"step": 10
}
],
"thresholds": [ ],
"timeFrom": null,
"timeShift": null,
"title": "Deletion Error Rate",
"tooltip": {
"shared": false,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": [ ]
},
"yaxes": [
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": 0,
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
]
},
{
"aliasColors": { },
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "$datasource",
"description": "Shows rate at which blocks are marked for deletion (from GC and retention policy).",
"fill": 1,
"id": 10,
"legend": {
"avg": false,
"current": false,
"max": false,
"min": false,
"show": true,
"total": false,
"values": false
},
"lines": true,
"linewidth": 1,
"links": [ ],
"nullPointMode": "null as zero",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [ ],
"spaceLength": 10,
"span": 4,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "sum(rate(thanos_compact_blocks_marked_for_deletion_total{namespace=\"$namespace\",job=~\"$job\"}[$interval])) by (job)",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "Blocks marked {{job}}",
"legendLink": null,
"step": 10
}
],
"thresholds": [ ],
"timeFrom": null,
"timeShift": null,
"title": "Marking Rate",
"tooltip": {
"shared": false,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": [ ]
},
"yaxes": [
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": 0,
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
]
}
],
"repeat": null,
"repeatIteration": null,
"repeatRowId": null,
"showTitle": true,
"title": "Blocks deletion",
"titleSize": "h6"
},
{
"collapse": false,
"height": "250px",
"panels": [
{
"aliasColors": { },
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "$datasource",
"description": "Shows rate of execution for all meta files from blocks in the bucket into the memory.",
"fill": 10,
"id": 11,
"legend": {
"avg": false,
"current": false,
"max": false,
"min": false,
"show": true,
"total": false,
"values": false
},
"lines": true,
"linewidth": 0,
"links": [ ],
"nullPointMode": "null as zero",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [ ],
"spaceLength": 10,
"span": 4,
"stack": true,
"steppedLine": false,
"targets": [
{
"expr": "sum(rate(thanos_blocks_meta_syncs_total{namespace=\"$namespace\",job=~\"$job\"}[$interval])) by (job)",
@ -697,7 +940,7 @@
"datasource": "$datasource",
"description": "Shows ratio of errors compared to the total number of executed meta file sync.",
"fill": 10,
"id": 9,
"id": 12,
"legend": {
"avg": false,
"current": false,
@ -774,7 +1017,7 @@
"datasource": "$datasource",
"description": "Shows how long has it taken to execute meta file sync, in quantiles.",
"fill": 1,
"id": 10,
"id": 13,
"legend": {
"avg": false,
"current": false,
@ -879,7 +1122,7 @@
"datasource": "$datasource",
"description": "Shows rate of execution for operations against the bucket.",
"fill": 10,
"id": 11,
"id": 14,
"legend": {
"avg": false,
"current": false,
@ -958,7 +1201,7 @@
"datasource": "$datasource",
"description": "Shows ratio of errors compared to the total number of executed operations against the bucket.",
"fill": 10,
"id": 12,
"id": 15,
"legend": {
"avg": false,
"current": false,
@ -1035,7 +1278,7 @@
"datasource": "$datasource",
"description": "Shows how long has it taken to execute operations against the bucket, in quantiles.",
"fill": 1,
"id": 13,
"id": 16,
"legend": {
"avg": false,
"current": false,
@ -1139,7 +1382,7 @@
"dashes": false,
"datasource": "$datasource",
"fill": 1,
"id": 14,
"id": 17,
"legend": {
"avg": false,
"current": false,
@ -1255,7 +1498,7 @@
"dashes": false,
"datasource": "$datasource",
"fill": 1,
"id": 15,
"id": 18,
"legend": {
"avg": false,
"current": false,
@ -1331,7 +1574,7 @@
"dashes": false,
"datasource": "$datasource",
"fill": 1,
"id": 16,
"id": 19,
"legend": {
"avg": false,
"current": false,

View file

@ -653,6 +653,33 @@ labels:
severity: critical
{{< /code >}}
##### CortexBucketIndexNotUpdated
{{< code lang="yaml" >}}
alert: CortexBucketIndexNotUpdated
annotations:
message: Cortex bucket index for tenant {{ $labels.user }} in {{ $labels.namespace
}} has not been updated since {{ $value | humanizeDuration }}.
expr: |
min by(namespace, user) (time() - cortex_bucket_index_last_successful_update_timestamp_seconds) > 7200
labels:
severity: critical
{{< /code >}}
##### CortexTenantHasPartialBlocks
{{< code lang="yaml" >}}
alert: CortexTenantHasPartialBlocks
annotations:
message: Cortex tenant {{ $labels.user }} in {{ $labels.namespace }} has {{ $value
}} partial blocks.
expr: |
max by(namespace, user) (cortex_bucket_blocks_partials_count) > 0
for: 6h
labels:
severity: warning
{{< /code >}}
### cortex_compactor_alerts
##### CortexCompactorHasNotSuccessfullyCleanedUpBlocks