1
0
Fork 0
mirror of https://github.com/monitoring-mixins/website.git synced 2024-12-14 11:37:31 +00:00

assets,site/content: daily assets regeneration

This commit is contained in:
github-actions[bot] 2024-10-25 03:33:09 +00:00
parent c989764d94
commit 6825ac3a6f
191 changed files with 39171 additions and 56331 deletions

View file

@ -183,7 +183,6 @@
"y": 0
},
"id": 3,
"interval": "1m",
"options": {
"legend": {
"calcs": [ ],
@ -203,6 +202,7 @@
},
"expr": "rate(mssql_batch_requests_total{job=~\"$job\", instance=~\"$instance\"}[$__rate_interval])",
"format": "time_series",
"interval": "1m",
"intervalFactor": 2,
"legendFormat": "{{instance}}"
}
@ -275,7 +275,6 @@
"y": 8
},
"id": 4,
"interval": "1m",
"options": {
"legend": {
"calcs": [ ],
@ -293,8 +292,9 @@
"datasource": {
"uid": "${prometheus_datasource}"
},
"expr": "increase(mssql_kill_connection_errors_total{job=~\"$job\", instance=~\"$instance\"}[$__rate_interval])",
"expr": "increase(mssql_kill_connection_errors_total{job=~\"$job\", instance=~\"$instance\"}[$__rate_interval:])",
"format": "time_series",
"interval": "1m",
"intervalFactor": 2,
"legendFormat": "{{instance}}"
}
@ -367,7 +367,6 @@
"y": 8
},
"id": 5,
"interval": "1m",
"options": {
"legend": {
"calcs": [ ],
@ -387,6 +386,7 @@
},
"expr": "rate(mssql_deadlocks_total{job=~\"$job\", instance=~\"$instance\"}[$__rate_interval])",
"format": "time_series",
"interval": "1m",
"intervalFactor": 2,
"legendFormat": "{{instance}}"
}
@ -758,7 +758,6 @@
"y": 41
},
"id": 11,
"interval": "1m",
"options": {
"legend": {
"calcs": [ ],
@ -776,8 +775,9 @@
"datasource": {
"uid": "${prometheus_datasource}"
},
"expr": "increase(mssql_io_stall_seconds_total{job=~\"$job\", instance=~\"$instance\", db=~\"$database\", operation=\"write\"}[$__rate_interval])",
"expr": "increase(mssql_io_stall_seconds_total{job=~\"$job\", instance=~\"$instance\", db=~\"$database\", operation=\"write\"}[$__rate_interval:])",
"format": "time_series",
"interval": "1m",
"intervalFactor": 2,
"legendFormat": "{{instance}} - {{db}}"
}
@ -846,7 +846,6 @@
"y": 41
},
"id": 12,
"interval": "1m",
"options": {
"legend": {
"calcs": [ ],
@ -864,8 +863,9 @@
"datasource": {
"uid": "${prometheus_datasource}"
},
"expr": "increase(mssql_io_stall_seconds_total{job=~\"$job\", instance=~\"$instance\", db=~\"$database\", operation=\"read\"}[$__rate_interval])",
"expr": "increase(mssql_io_stall_seconds_total{job=~\"$job\", instance=~\"$instance\", db=~\"$database\", operation=\"read\"}[$__rate_interval:])",
"format": "time_series",
"interval": "1m",
"intervalFactor": 2,
"legendFormat": "{{instance}} - {{db}}"
}
@ -938,7 +938,6 @@
"y": 49
},
"id": 13,
"interval": "1m",
"options": {
"legend": {
"calcs": [ ],
@ -956,8 +955,9 @@
"datasource": {
"uid": "${prometheus_datasource}"
},
"expr": "increase(mssql_log_growths_total{job=~\"$job\", instance=~\"$instance\", db=~\"$database\"}[$__rate_interval])",
"expr": "increase(mssql_log_growths_total{job=~\"$job\", instance=~\"$instance\", db=~\"$database\"}[$__rate_interval:])",
"format": "time_series",
"interval": "1m",
"intervalFactor": 2,
"legendFormat": "{{instance}} - {{db}}"
}

View file

@ -363,7 +363,6 @@
"y": 8
},
"id": 5,
"interval": "1m",
"options": {
"legend": {
"calcs": [ ],
@ -381,8 +380,9 @@
"datasource": {
"uid": "${prometheus_datasource}"
},
"expr": "increase(mssql_page_fault_count_total{job=~\"$job\", instance=~\"$instance\"}[$__rate_interval])",
"expr": "increase(mssql_page_fault_count_total{job=~\"$job\", instance=~\"$instance\"}[$__rate_interval:])",
"format": "time_series",
"interval": "1m",
"intervalFactor": 2,
"legendFormat": "{{instance}}"
}

View file

@ -142,17 +142,19 @@
},
"gridPos": {
"h": 6,
"w": 24
"w": 24,
"x": 0,
"y": 0
},
"id": 1,
"interval": "30s",
"maxDataPoints": 100,
"options": {
"tooltip": {
"mode": "multi",
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -182,7 +184,9 @@
},
"gridPos": {
"h": 18,
"w": 24
"w": 24,
"x": 0,
"y": 18
},
"id": 2,
"options": {
@ -192,7 +196,7 @@
"showTime": false,
"wrapLogMessage": true
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -207,7 +211,7 @@
}
],
"refresh": "1m",
"schemaVersion": 36,
"schemaVersion": 39,
"tags": [
"aerospike-mixin"
],

View file

@ -36,7 +36,7 @@ groups:
(
rate(alertmanager_notifications_failed_total{job="alertmanager"}[5m])
/
rate(alertmanager_notifications_total{job="alertmanager"}[5m])
ignoring (reason) group_left rate(alertmanager_notifications_total{job="alertmanager"}[5m])
)
> 0.01
for: 5m
@ -53,7 +53,7 @@ groups:
min by (job, integration) (
rate(alertmanager_notifications_failed_total{job="alertmanager", integration=~`.*`}[5m])
/
rate(alertmanager_notifications_total{job="alertmanager", integration=~`.*`}[5m])
ignoring (reason) group_left rate(alertmanager_notifications_total{job="alertmanager", integration=~`.*`}[5m])
)
> 0.01
for: 5m
@ -70,7 +70,7 @@ groups:
min by (job, integration) (
rate(alertmanager_notifications_failed_total{job="alertmanager", integration!~`.*`}[5m])
/
rate(alertmanager_notifications_total{job="alertmanager", integration!~`.*`}[5m])
ignoring (reason) group_left rate(alertmanager_notifications_total{job="alertmanager", integration!~`.*`}[5m])
)
> 0.01
for: 5m

View file

@ -142,17 +142,19 @@
},
"gridPos": {
"h": 6,
"w": 24
"w": 24,
"x": 0,
"y": 0
},
"id": 1,
"interval": "30s",
"maxDataPoints": 100,
"options": {
"tooltip": {
"mode": "multi",
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -182,7 +184,9 @@
},
"gridPos": {
"h": 18,
"w": 24
"w": 24,
"x": 0,
"y": 18
},
"id": 2,
"options": {
@ -192,7 +196,7 @@
"showTime": false,
"wrapLogMessage": true
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -207,7 +211,7 @@
}
],
"refresh": "1m",
"schemaVersion": 36,
"schemaVersion": 39,
"tags": [
"apache-activemq-mixin"
],

View file

@ -1264,6 +1264,28 @@
"type": "query",
"useTags": false
},
{
"allValue": ".*",
"current": { },
"datasource": {
"uid": "${prometheus_datasource}"
},
"hide": 2,
"includeAll": true,
"label": "Cluster",
"multi": true,
"name": "cluster",
"options": [ ],
"query": "label_values(airflow_scheduler_tasks_executable{job=~\"$job\"}, cluster)",
"refresh": 2,
"regex": "",
"sort": 0,
"tagValuesQuery": "",
"tags": [ ],
"tagsQuery": "",
"type": "query",
"useTags": false
},
{
"allValue": ".+",
"current": { },

View file

@ -1475,7 +1475,7 @@
"uid": "${loki_datasource}"
},
"editorMode": "code",
"expr": "{job=~\"$job\", couchdb_cluster=~\"$couchdb_cluster\", instance=~\"$instance\", filename=\"/var/log/couchdb/couchdb.log\"} |~ \"$log_level\"",
"expr": "{job=~\"$job\", couchdb_cluster=~\"$couchdb_cluster\", instance=~\"$instance\"} |= `` | (filename=~\"/var/log/couchdb/couchdb.log\" or log_type=\"couchdb\") |~ \"$log_level\"",
"queryType": "range",
"refId": "A"
}

View file

@ -344,7 +344,7 @@
"uid": "${loki_datasource}"
},
"editorMode": "code",
"expr": "{job=~\"$job\", hadoop_cluster=~\"$hadoop_cluster\", instance=~\"$instance\", filename=~\".*/hadoop/logs/.*-datanode.*.log\"} |= ``",
"expr": "{job=~\"$job\", instance=~\"$instance\", hadoop_cluster=~\"$hadoop_cluster\"} |= `` | (filename=~\".*/hadoop/logs/.*-datanode.*.log\" or log_type=\"datanode\")",
"queryType": "range",
"refId": "A"
}
@ -406,6 +406,28 @@
"type": "query",
"useTags": false
},
{
"allValue": ".*",
"current": { },
"datasource": {
"uid": "${prometheus_datasource}"
},
"hide": 2,
"includeAll": true,
"label": "Cluster",
"multi": true,
"name": "cluster",
"options": [ ],
"query": "label_values(hadoop_datanode_ramdiskblocksevictedwithoutread{job=~\"$job\"}, cluster)",
"refresh": 2,
"regex": "",
"sort": 0,
"tagValuesQuery": "",
"tags": [ ],
"tagsQuery": "",
"type": "query",
"useTags": false
},
{
"allValue": ".+",
"current": { },

View file

@ -839,7 +839,7 @@
"uid": "${loki_datasource}"
},
"editorMode": "code",
"expr": "{job=~\"$job\", hadoop_cluster=~\"$hadoop_cluster\", instance=~\"$instance\", filename=~\".*/hadoop/logs/.*-namenode.*.log\"} |= ``",
"expr": "{job=~\"$job\", instance=~\"$instance\", hadoop_cluster=~\"$hadoop_cluster\"} |= `` | (filename=~\".*/hadoop/logs/.*-namenode.*.log\" or log_type=\"namenode\")",
"queryType": "range",
"refId": "A"
}
@ -901,6 +901,28 @@
"type": "query",
"useTags": false
},
{
"allValue": ".*",
"current": { },
"datasource": {
"uid": "${prometheus_datasource}"
},
"hide": 2,
"includeAll": true,
"label": "Cluster",
"multi": true,
"name": "cluster",
"options": [ ],
"query": "label_values(hadoop_namenode_blockstotal{job=~\"$job\"}, cluster)",
"refresh": 2,
"regex": "",
"sort": 0,
"tagValuesQuery": "",
"tags": [ ],
"tagsQuery": "",
"type": "query",
"useTags": false
},
{
"allValue": ".+",
"current": { },

View file

@ -1596,7 +1596,7 @@
"uid": "${loki_datasource}"
},
"editorMode": "code",
"expr": "{job=~\"$job\", hadoop_cluster=~\"$hadoop_cluster\", instance=~\"$instance\", filename=~\".*/hadoop/logs/.*-nodemanager.*.log\"} |= ``",
"expr": "{job=~\"$job\", instance=~\"$instance\", hadoop_cluster=~\"$hadoop_cluster\"} |= `` | (filename=~\".*/hadoop/logs/.*-nodemanager.*.log\" or log_type=\"nodemanager\")",
"queryType": "range",
"refId": "A"
}
@ -1658,6 +1658,28 @@
"type": "query",
"useTags": false
},
{
"allValue": ".*",
"current": { },
"datasource": {
"uid": "${prometheus_datasource}"
},
"hide": 2,
"includeAll": true,
"label": "Cluster",
"multi": true,
"name": "cluster",
"options": [ ],
"query": "label_values(hadoop_nodemanager_availablegb{job=~\"$job\"}, cluster)",
"refresh": 2,
"regex": "",
"sort": 0,
"tagValuesQuery": "",
"tags": [ ],
"tagsQuery": "",
"type": "query",
"useTags": false
},
{
"allValue": ".+",
"current": { },

View file

@ -907,7 +907,7 @@
"uid": "${loki_datasource}"
},
"editorMode": "code",
"expr": "{job=~\"$job\", hadoop_cluster=~\"$hadoop_cluster\", instance=~\"$instance\", filename=~\".*/hadoop/logs/.*-resourcemanager.*.log\"} |= ``",
"expr": "{job=~\"$job\", instance=~\"$instance\", hadoop_cluster=~\"$hadoop_cluster\"} |= `` | (filename=~\".*/hadoop/logs/.*-resourcemanager.*.log\" or log_type=\"resourcemanager\")",
"queryType": "range",
"refId": "A"
}
@ -969,6 +969,28 @@
"type": "query",
"useTags": false
},
{
"allValue": ".*",
"current": { },
"datasource": {
"uid": "${prometheus_datasource}"
},
"hide": 2,
"includeAll": true,
"label": "Cluster",
"multi": true,
"name": "cluster",
"options": [ ],
"query": "label_values(hadoop_resourcemanager_activeapplications{job=~\"$job\"}, cluster)",
"refresh": 2,
"regex": "",
"sort": 0,
"tagValuesQuery": "",
"tags": [ ],
"tagsQuery": "",
"type": "query",
"useTags": false
},
{
"allValue": ".+",
"current": { },

View file

@ -142,17 +142,19 @@
},
"gridPos": {
"h": 6,
"w": 24
"w": 24,
"x": 0,
"y": 0
},
"id": 1,
"interval": "30s",
"maxDataPoints": 100,
"options": {
"tooltip": {
"mode": "multi",
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -182,7 +184,9 @@
},
"gridPos": {
"h": 18,
"w": 24
"w": 24,
"x": 0,
"y": 18
},
"id": 2,
"options": {
@ -192,7 +196,7 @@
"showTime": false,
"wrapLogMessage": true
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -207,7 +211,7 @@
}
],
"refresh": "1m",
"schemaVersion": 36,
"schemaVersion": 39,
"tags": [
"apache-hbase-mixin"
],

View file

@ -1473,7 +1473,7 @@
"uid": "${loki_datasource}"
},
"editorMode": "code",
"expr": "{job=~\"$job\", filename=~\"/var/log/mesos/master/.*\", mesos_cluster=~\"$mesos_cluster\"} |= ``",
"expr": "{job=~\"$job\", instance=~\"$instance\", mesos_cluster=~\"$mesos_cluster\"} |= `` | (filename=~\"/var/log/mesos/master/.*\" or log_type=\"master\")",
"queryType": "range",
"refId": "A"
}
@ -1509,7 +1509,7 @@
"uid": "${loki_datasource}"
},
"editorMode": "code",
"expr": "{job=~\"$job\", filename=~\"/var/log/mesos/agent/.*\", mesos_cluster=~\"$mesos_cluster\"} |= ``",
"expr": "{job=~\"$job\", instance=~\"$instance\", mesos_cluster=~\"$mesos_cluster\"} |= `` | (filename=~\"/var/log/mesos/agent/.*\" or log_type=\"agent\")",
"queryType": "range",
"refId": "A"
}
@ -1571,6 +1571,28 @@
"type": "query",
"useTags": false
},
{
"allValue": ".*",
"current": { },
"datasource": {
"uid": "${prometheus_datasource}"
},
"hide": 2,
"includeAll": true,
"label": "Cluster",
"multi": true,
"name": "cluster",
"options": [ ],
"query": "label_values(mesos_exporter_build_info{job=~\"$job\"}, cluster)",
"refresh": 2,
"regex": "",
"sort": 0,
"tagValuesQuery": "",
"tags": [ ],
"tagsQuery": "",
"type": "query",
"useTags": false
},
{
"allValue": ".+",
"current": { },
@ -1583,7 +1605,7 @@
"multi": true,
"name": "instance",
"options": [ ],
"query": "label_values(mesos_exporter_build_info{job=~\"$job\", instance=~\"$instance\"}, instance)",
"query": "label_values(mesos_exporter_build_info{job=~\"$job\"}, instance)",
"refresh": 2,
"regex": "",
"sort": 1,

View file

@ -142,17 +142,19 @@
},
"gridPos": {
"h": 6,
"w": 24
"w": 24,
"x": 0,
"y": 0
},
"id": 1,
"interval": "30s",
"maxDataPoints": 100,
"options": {
"tooltip": {
"mode": "multi",
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -182,7 +184,9 @@
},
"gridPos": {
"h": 18,
"w": 24
"w": 24,
"x": 0,
"y": 18
},
"id": 2,
"options": {
@ -192,7 +196,7 @@
"showTime": false,
"wrapLogMessage": true
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -207,7 +211,7 @@
}
],
"refresh": "1m",
"schemaVersion": 36,
"schemaVersion": 39,
"tags": [
"apache-solr-mixin"
],

View file

@ -1807,7 +1807,7 @@
"multi": true,
"name": "cluster",
"options": [ ],
"query": "label_values(cassandra_cache_size{job=~\"$job\"}, cluster)",
"query": "label_values(solr_metrics_core_errors_total{job=~\"$job\"}, cluster)",
"refresh": 2,
"regex": "",
"sort": 0,

View file

@ -1303,7 +1303,7 @@
"multi": true,
"name": "cluster",
"options": [ ],
"query": "label_values(cassandra_cache_size{job=~\"$job\"}, cluster)",
"query": "label_values(solr_metrics_core_errors_total{job=~\"$job\"}, cluster)",
"refresh": 2,
"regex": "",
"sort": 0,

View file

@ -8,7 +8,7 @@ groups:
80 percent.
summary: The instance has a CPU usage higher than the configured threshold.
expr: |
sum by (job, instance) (jvm_process_cpu_load{job=~"integrations/tomcat"}) > 80
sum by (job,instance) (jvm_process_cpu_load{job=~"integrations/tomcat"}) > 80
for: 5m
labels:
severity: critical
@ -19,7 +19,7 @@ groups:
of 80 percent.
summary: The instance has a higher memory usage than the configured threshold.
expr: |
sum(jvm_memory_usage_used_bytes{job=~"integrations/tomcat"}) by (job, instance) / sum(jvm_physical_memory_bytes{job=~"integrations/tomcat"}) by (job, instance) * 100 > 80
sum(jvm_memory_usage_used_bytes{job=~"integrations/tomcat"}) by (job,instance) / sum(jvm_physical_memory_bytes{job=~"integrations/tomcat"}) by (job,instance) * 100 > 80
for: 5m
labels:
severity: critical
@ -30,7 +30,7 @@ groups:
the threshold of 5 percent.
summary: There are a high number of request errors.
expr: |
sum by (job, instance) (increase(tomcat_errorcount_total[5m]) / increase(tomcat_requestcount_total[5m]) * 100) > 5
sum by (job,instance) (increase(tomcat_errorcount_total{job=~"integrations/tomcat"}[5m]) / increase(tomcat_requestcount_total{job=~"integrations/tomcat"}[5m]) * 100) > 5
for: 5m
labels:
severity: critical
@ -41,7 +41,7 @@ groups:
300ms.
summary: The processing time has been moderately high.
expr: |
sum by (job, instance) (increase(tomcat_processingtime_total[5m]) / increase(tomcat_requestcount_total[5m])) > 300
sum by (job,instance) (increase(tomcat_processingtime_total{job=~"integrations/tomcat"}[5m]) / increase(tomcat_requestcount_total{job=~"integrations/tomcat"}[5m])) > 300
for: 5m
labels:
severity: warning

View file

@ -370,7 +370,7 @@
"datasource": {
"uid": "${prometheus_datasource}"
},
"expr": "sum(rate(tomcat_servlet_requestcount_total{instance=~\"$instance\", job=~\"$job\", module=~\"$host$context\", servlet=~\"$servlet\"}[$__rate_interval])) by (job, instance)",
"expr": "sum(rate(tomcat_servlet_requestcount_total{job=~\"$job\", instance=~\"$instance\", module=~\"$host$context\", servlet=~\"$servlet\"}[$__rate_interval])) by (job, instance)",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "{{instance}} - total requests"
@ -379,7 +379,7 @@
"datasource": {
"uid": "${prometheus_datasource}"
},
"expr": "sum(rate(tomcat_servlet_errorcount_total{instance=~\"$instance\", job=~\"$job\", module=~\"$host$context\", servlet=~\"$servlet\"}[$__rate_interval])) by (job, instance)",
"expr": "sum(rate(tomcat_servlet_errorcount_total{job=~\"$job\", instance=~\"$instance\", module=~\"$host$context\", servlet=~\"$servlet\"}[$__rate_interval])) by (job, instance)",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "{{instance}} - total errors"
@ -388,7 +388,7 @@
"datasource": {
"uid": "${prometheus_datasource}"
},
"expr": "rate(tomcat_servlet_requestcount_total{instance=~\"$instance\", job=~\"$job\", module=~\"$host$context\", servlet=~\"$servlet\"}[$__rate_interval])",
"expr": "rate(tomcat_servlet_requestcount_total{job=~\"$job\", instance=~\"$instance\", module=~\"$host$context\", servlet=~\"$servlet\"}[$__rate_interval])",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "{{instance}} - {{module}}{{servlet}} - requests"
@ -397,7 +397,7 @@
"datasource": {
"uid": "${prometheus_datasource}"
},
"expr": "rate(tomcat_servlet_errorcount_total{instance=~\"$instance\", job=~\"$job\", module=~\"$host$context\", servlet=~\"$servlet\"}[$__rate_interval])",
"expr": "rate(tomcat_servlet_errorcount_total{job=~\"$job\", instance=~\"$instance\", module=~\"$host$context\", servlet=~\"$servlet\"}[$__rate_interval])",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "{{instance}} - {{module}}{{servlet}} - errors"
@ -488,7 +488,7 @@
"datasource": {
"uid": "${prometheus_datasource}"
},
"expr": "sum(increase(tomcat_servlet_processingtime_total{instance=~\"$instance\", job=~\"$job\", module=~\"$host$context\", servlet=~\"$servlet\"}[$__interval:] offset -$__interval) / clamp_min(increase(tomcat_servlet_requestcount_total{instance=~\"$instance\", job=~\"$job\", module=~\"$host$context\", servlet=~\"$servlet\"}[$__interval:] offset -$__interval), 1)) by (job, instance)",
"expr": "sum(increase(tomcat_servlet_processingtime_total{job=~\"$job\", instance=~\"$instance\", module=~\"$host$context\", servlet=~\"$servlet\"}[$__interval:] offset -$__interval) / clamp_min(increase(tomcat_servlet_requestcount_total{job=~\"$job\", instance=~\"$instance\", module=~\"$host$context\", servlet=~\"$servlet\"}[$__interval:] offset -$__interval), 1)) by (job, instance)",
"format": "time_series",
"interval": "1m",
"intervalFactor": 2,
@ -498,7 +498,7 @@
"datasource": {
"uid": "${prometheus_datasource}"
},
"expr": "increase(tomcat_servlet_processingtime_total{instance=~\"$instance\", job=~\"$job\", module=~\"$host$context\", servlet=~\"$servlet\"}[$__interval:] offset -$__interval) / clamp_min(increase(tomcat_servlet_requestcount_total{instance=~\"$instance\", job=~\"$job\", module=~\"$host$context\", servlet=~\"$servlet\"}[$__interval:] offset -$__interval), 1)",
"expr": "increase(tomcat_servlet_processingtime_total{job=~\"$job\", instance=~\"$instance\", module=~\"$host$context\", servlet=~\"$servlet\"}[$__interval:] offset -$__interval) / clamp_min(increase(tomcat_servlet_requestcount_total{job=~\"$job\", instance=~\"$instance\", module=~\"$host$context\", servlet=~\"$servlet\"}[$__interval:] offset -$__interval), 1)",
"format": "time_series",
"interval": "1m",
"intervalFactor": 2,
@ -551,6 +551,28 @@
"type": "query",
"useTags": false
},
{
"allValue": ".*",
"current": { },
"datasource": {
"uid": "${prometheus_datasource}"
},
"hide": 2,
"includeAll": true,
"label": "Cluster",
"multi": true,
"name": "cluster",
"options": [ ],
"query": "label_values(tomcat_bytesreceived_total{job=~\"$job\"}, cluster)",
"refresh": 2,
"regex": "",
"sort": 0,
"tagValuesQuery": "",
"tags": [ ],
"tagsQuery": "",
"type": "query",
"useTags": false
},
{
"allValue": "",
"current": { },
@ -563,7 +585,7 @@
"multi": false,
"name": "instance",
"options": [ ],
"query": "label_values(tomcat_bytesreceived_total, instance)",
"query": "label_values(tomcat_bytesreceived_total{job=~\"$job\"}, instance)",
"refresh": 1,
"regex": "",
"sort": 0,
@ -585,7 +607,7 @@
"multi": true,
"name": "host",
"options": [ ],
"query": "label_values(tomcat_session_sessioncounter_total{instance=~\"$instance\"}, host)",
"query": "label_values(tomcat_session_sessioncounter_total{job=~\"$job\"}, host)",
"refresh": 1,
"regex": "",
"sort": 0,
@ -607,7 +629,7 @@
"multi": true,
"name": "context",
"options": [ ],
"query": "label_values(tomcat_session_sessioncounter_total{host=~\"$host\"}, context)",
"query": "label_values(tomcat_session_sessioncounter_total{job=~\"$job\", host=~\"$host\"}, context)",
"refresh": 1,
"regex": "",
"sort": 0,
@ -629,7 +651,7 @@
"multi": true,
"name": "servlet",
"options": [ ],
"query": "label_values(tomcat_servlet_requestcount_total{module=~\"$host$context\"}, servlet)",
"query": "label_values(tomcat_servlet_requestcount_total{job=~\"$job\", module=~\"$host$context\"}, servlet)",
"refresh": 1,
"regex": "",
"sort": 0,

View file

@ -813,7 +813,7 @@
"uid": "${loki_datasource}"
},
"editorMode": "code",
"expr": "{filename=~\"/var/log/tomcat.*/catalina.out|/opt/tomcat/logs/catalina.out|/Program Files/Apache Software Foundation/Tomcat .*..*/logs/catalina.out\",job=~\"$job\", instance=~\"$instance\"} |= ``",
"expr": "{job=~\"$job\", instance=~\"$instance\"} |= `` | (filename=~\"/var/log/tomcat.*/catalina.out|/opt/tomcat/logs/catalina.out|/Program Files/Apache Software Foundation/Tomcat .*..*/logs/catalina.out\" or log_type=\"catalina.out\")",
"queryType": "range",
"refId": "A"
}
@ -876,19 +876,19 @@
"useTags": false
},
{
"allValue": "",
"allValue": ".*",
"current": { },
"datasource": {
"uid": "${prometheus_datasource}"
},
"hide": 0,
"includeAll": false,
"label": "Instance",
"multi": false,
"name": "instance",
"hide": 2,
"includeAll": true,
"label": "Cluster",
"multi": true,
"name": "cluster",
"options": [ ],
"query": "label_values(tomcat_bytesreceived_total, instance)",
"refresh": 1,
"query": "label_values(tomcat_bytesreceived_total{job=~\"$job\"}, cluster)",
"refresh": 2,
"regex": "",
"sort": 0,
"tagValuesQuery": "",
@ -898,7 +898,29 @@
"useTags": false
},
{
"allValue": "",
"allValue": ".+",
"current": { },
"datasource": {
"uid": "${prometheus_datasource}"
},
"hide": 0,
"includeAll": true,
"label": "Instance",
"multi": true,
"name": "instance",
"options": [ ],
"query": "label_values(tomcat_bytesreceived_total{job=~\"$job\"}, instance)",
"refresh": 2,
"regex": "",
"sort": 1,
"tagValuesQuery": "",
"tags": [ ],
"tagsQuery": "",
"type": "query",
"useTags": false
},
{
"allValue": ".+",
"current": { },
"datasource": {
"uid": "${prometheus_datasource}"
@ -909,7 +931,7 @@
"multi": true,
"name": "protocol",
"options": [ ],
"query": "label_values(tomcat_bytesreceived_total, protocol)",
"query": "label_values(tomcat_bytesreceived_total{job=~\"$job\"}, protocol)",
"refresh": 1,
"regex": "",
"sort": 0,
@ -920,7 +942,7 @@
"useTags": false
},
{
"allValue": "",
"allValue": ".+",
"current": { },
"datasource": {
"uid": "${prometheus_datasource}"
@ -931,7 +953,7 @@
"multi": true,
"name": "port",
"options": [ ],
"query": "label_values(tomcat_bytesreceived_total, port)",
"query": "label_values(tomcat_bytesreceived_total{job=~\"$job\"}, port)",
"refresh": 1,
"regex": "",
"sort": 0,

View file

@ -1,7 +1,7 @@
{
"__inputs": [ ],
"__requires": [ ],
"description": "A dashboard that monitors the Blackbox-exporter. It is created using the blackbox-exporter-mixin for the the (blackbox-exporter)[https://github.com/prometheus/blackbox-exporter].",
"description": "A dashboard that monitors the Blackbox-exporter. It is created using the [blackbox-exporter-mixin](https://github.com/adinhodovic/blackbox-exporter-mixin) for the [blackbox-exporter](https://github.com/prometheus/blackbox_exporter).",
"editable": true,
"panels": [
{
@ -70,7 +70,7 @@
},
"textMode": "value_and_name"
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -120,7 +120,7 @@
]
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -173,7 +173,7 @@
]
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -222,7 +222,7 @@
]
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -259,7 +259,7 @@
]
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -326,7 +326,7 @@
]
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -379,7 +379,7 @@
]
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -437,7 +437,7 @@
]
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -491,7 +491,7 @@
]
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -542,7 +542,7 @@
},
"textMode": "name"
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -590,7 +590,7 @@
"colorMode": "background",
"graphMode": "none"
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -643,7 +643,7 @@
]
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -681,7 +681,7 @@
]
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -720,7 +720,7 @@
]
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -757,7 +757,7 @@
]
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -808,7 +808,7 @@
"sort": "desc"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -871,7 +871,7 @@
"sort": "desc"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -894,7 +894,7 @@
"type": "timeseries"
}
],
"schemaVersion": 36,
"schemaVersion": 39,
"tags": [
"blackbox-exporter",
"blackbox-exporter-mixin"

File diff suppressed because it is too large Load diff

File diff suppressed because it is too large Load diff

View file

@ -19,7 +19,7 @@ groups:
This may cause problems for Pod scheduling
summary: API calls to Cilium Agent API to create or update Endpoints are failing.
expr: sum(rate(cilium_k8s_client_api_calls_total{method=~"(PUT|POST|PATCH)", endpoint="endpoint",return_code!~"2[0-9][0-9]"}[5m]))
by (pod, method, return_code)
by (pod, method, return_code) > 0
for: 5m
labels:
severity: warning
@ -31,7 +31,7 @@ groups:
summary: Cilium Endpoint API endpoint rate limiter is reporting errors while
doing endpoint create.
expr: sum(rate(cilium_api_limiter_processed_requests_total{api_call=~"endpoint-create",
outcome="fail"}[1m])) by (pod, api_call)
outcome="fail"}[1m])) by (pod, api_call) > 0
for: 5m
labels:
severity: info
@ -43,7 +43,7 @@ groups:
This could indicate issues with Ciliums ability to create endpoints which can result in failure to schedule Kubernetes Pods.
summary: API calls to Cilium Endpoints API are failing due to server errors.
expr: sum(rate(cilium_agent_api_process_time_seconds_count{return_code=~"5[0-9][0-9]",
path="/v1/endpoint"}[5m])) by (pod, return_code)
path="/v1/endpoint"}[5m])) by (pod, return_code) > 0
for: 5m
labels:
severity: warning
@ -133,7 +133,7 @@ groups:
error rate for response code: {{$labels.response_code}} on endpoint {{$labels.endpoint}}.'
summary: Cilium Agent API on Pod is experiencing a high error rate.
expr: sum(rate(cilium_k8s_client_api_calls_total{endpoint!="metrics",return_code!~"2[0-9][0-9]"}[5m]))
by (pod, endpoint, return_code)
by (pod, endpoint, return_code) > 0
for: 5m
labels:
severity: info
@ -224,3 +224,52 @@ groups:
for: 15m
labels:
severity: info
- name: Cilium Clustermesh
rules:
- alert: CiliumAgentRemoteClusterNotReady
annotations:
description: Agent can't mesh with {{$labels.target_cluster}}
summary: Agent can't mesh with remote cluster.
expr: count(cilium_clustermesh_remote_cluster_readiness_status < 1) by (source_cluster,
target_cluster) > 0
for: 5m
labels:
severity: critical
- alert: CiliumAgentRemoteClusterFailing
annotations:
description: Agent fails to mesh with {{$labels.target_cluster}}
summary: Agent fails to mesh with remote cluster.
expr: sum(rate(cilium_clustermesh_remote_cluster_failures[5m])) by (source_cluster,
target_cluster) > 0
for: 5m
labels:
severity: critical
- name: Cilium Kvstoremesh
rules:
- alert: CiliumKvstoremeshRemoteClusterNotReady
annotations:
description: Kvstoremesh can't mesh with {{$labels.target_cluster}}
summary: Kvstoremesh can't mesh with remote cluster.
expr: count(cilium_kvstoremesh_remote_cluster_readiness_status < 1) by (source_cluster,
target_cluster) > 0
for: 5m
labels:
severity: critical
- alert: CiliumKvstoremeshRemoteClusterFailing
annotations:
description: Kvstoremesh fails to mesh with {{$labels.target_cluster}}
summary: Kvstoremesh fails to mesh with remote cluster.
expr: sum(rate(cilium_kvstoremesh_remote_cluster_failures[5m])) by (source_cluster,
target_cluster) > 0
for: 5m
labels:
severity: critical
- alert: CiliumKvstoremeshErrors
annotations:
description: Kvstoremesh in {{$labels.source_cluster}} is reporting kvstore sync errors.
summary: Kvstoremesh is failing to synchronize with the kvstore.
expr: sum(rate(cilium_kvstoremesh_kvstore_sync_errors_total[5m])) by (source_cluster)
> 0
for: 5m
labels:
severity: critical

View file

@ -142,17 +142,19 @@
},
"gridPos": {
"h": 6,
"w": 24
"w": 24,
"x": 0,
"y": 0
},
"id": 1,
"interval": "30s",
"maxDataPoints": 100,
"options": {
"tooltip": {
"mode": "multi",
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -182,7 +184,9 @@
},
"gridPos": {
"h": 18,
"w": 24
"w": 24,
"x": 0,
"y": 18
},
"id": 2,
"options": {
@ -192,7 +196,7 @@
"showTime": false,
"wrapLogMessage": true
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -207,7 +211,7 @@
}
],
"refresh": "1m",
"schemaVersion": 36,
"schemaVersion": 39,
"tags": [
"clickhouse-mixin"
],

View file

@ -1,699 +0,0 @@
{
"annotations": {
"list": [ ]
},
"editable": true,
"gnetId": null,
"graphTooltip": 0,
"hideControls": false,
"links": [ ],
"refresh": "10s",
"rows": [
{
"collapse": false,
"height": "100px",
"panels": [
{
"aliasColors": { },
"bars": false,
"colorBackground": true,
"colors": [
"#d44a3a",
"rgba(237, 129, 40, 0.89)",
"#299c46"
],
"dashLength": 10,
"dashes": false,
"datasource": "$datasource",
"fill": 1,
"format": "none",
"id": 1,
"legend": {
"avg": false,
"current": false,
"max": false,
"min": false,
"show": true,
"total": false,
"values": false
},
"lines": true,
"linewidth": 1,
"links": [ ],
"nullPointMode": "null as zero",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"repeat": "instance",
"seriesOverrides": [ ],
"spaceLength": 10,
"span": 12,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "consul_up{job=~\"$job\",instance=~\"$instance\"}",
"format": "time_series",
"instant": true,
"refId": "A"
}
],
"thresholds": "0.5,0.5",
"timeFrom": null,
"timeShift": null,
"title": "$instance",
"tooltip": {
"shared": true,
"sort": 2,
"value_type": "individual"
},
"type": "singlestat",
"valueMaps": [
{
"op": "=",
"text": "DOWN",
"value": "0"
},
{
"op": "=",
"text": "UP",
"value": "1"
}
],
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": [ ]
},
"yaxes": [
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": 0,
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
]
}
],
"repeat": null,
"repeatIteration": null,
"repeatRowId": null,
"showTitle": false,
"title": "Up",
"titleSize": "h6"
},
{
"collapse": false,
"height": "100px",
"panels": [
{
"aliasColors": { },
"bars": false,
"colorBackground": true,
"colors": [
"rgba(237, 129, 40, 0.89)",
"rgba(237, 129, 40, 0.89)",
"#299c46"
],
"dashLength": 10,
"dashes": false,
"datasource": "$datasource",
"fill": 1,
"format": "none",
"id": 2,
"legend": {
"avg": false,
"current": false,
"max": false,
"min": false,
"show": true,
"total": false,
"values": false
},
"lines": true,
"linewidth": 1,
"links": [ ],
"nullPointMode": "null as zero",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"repeat": "instance",
"seriesOverrides": [ ],
"spaceLength": 10,
"span": 12,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "(rate(consul_raft_leader_lastcontact_count{job=~\"$job\",instance=~\"$instance\"}[$__rate_interval]) > bool 0)\n or\n(consul_up{job=~\"$job\",instance=~\"$instance\"} == bool 0)\n",
"format": "time_series",
"instant": true,
"refId": "A"
}
],
"thresholds": "0.5,0.5",
"timeFrom": null,
"timeShift": null,
"title": "$instance",
"tooltip": {
"shared": true,
"sort": 2,
"value_type": "individual"
},
"type": "singlestat",
"valueMaps": [
{
"op": "=",
"text": "FOLLOWER",
"value": "0"
},
{
"op": "=",
"text": "LEADER",
"value": "1"
}
],
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": [ ]
},
"yaxes": [
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": 0,
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
]
}
],
"repeat": null,
"repeatIteration": null,
"repeatRowId": null,
"showTitle": false,
"title": "Leader",
"titleSize": "h6"
},
{
"collapse": false,
"height": "100px",
"panels": [
{
"aliasColors": { },
"bars": false,
"colorBackground": true,
"colors": [
"#d44a3a",
"rgba(237, 129, 40, 0.89)",
"#299c46"
],
"dashLength": 10,
"dashes": false,
"datasource": "$datasource",
"fill": 1,
"format": "none",
"id": 3,
"legend": {
"avg": false,
"current": false,
"max": false,
"min": false,
"show": true,
"total": false,
"values": false
},
"lines": true,
"linewidth": 1,
"links": [ ],
"nullPointMode": "null as zero",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"repeat": "instance",
"seriesOverrides": [ ],
"spaceLength": 10,
"span": 12,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "consul_raft_leader{job=~\"$job\",instance=~\"$instance\"}",
"format": "time_series",
"instant": true,
"refId": "A"
}
],
"thresholds": "0.5,0.5",
"timeFrom": null,
"timeShift": null,
"title": "$instance",
"tooltip": {
"shared": true,
"sort": 2,
"value_type": "individual"
},
"type": "singlestat",
"valueMaps": [
{
"op": "=",
"text": "NO LEADER",
"value": "0"
},
{
"op": "=",
"text": "HAS LEADER",
"value": "1"
}
],
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": [ ]
},
"yaxes": [
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": 0,
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
]
}
],
"repeat": null,
"repeatIteration": null,
"repeatRowId": null,
"showTitle": false,
"title": "Has Leader",
"titleSize": "h6"
},
{
"collapse": false,
"height": "100px",
"panels": [
{
"aliasColors": { },
"bars": false,
"colorBackground": true,
"colors": [
"#d44a3a",
"rgba(237, 129, 40, 0.89)",
"#299c46"
],
"dashLength": 10,
"dashes": false,
"datasource": "$datasource",
"fill": 1,
"format": "none",
"id": 4,
"legend": {
"avg": false,
"current": false,
"max": false,
"min": false,
"show": true,
"total": false,
"values": false
},
"lines": true,
"linewidth": 1,
"links": [ ],
"nullPointMode": "null as zero",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"repeat": "instance",
"seriesOverrides": [ ],
"spaceLength": 10,
"span": 12,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "consul_raft_peers{job=~\"$job\",instance=~\"$instance\"}",
"format": "time_series",
"instant": true,
"refId": "A"
}
],
"thresholds": "1,2",
"timeFrom": null,
"timeShift": null,
"title": "$instance",
"tooltip": {
"shared": true,
"sort": 2,
"value_type": "individual"
},
"type": "singlestat",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": [ ]
},
"yaxes": [
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": 0,
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
]
}
],
"repeat": null,
"repeatIteration": null,
"repeatRowId": null,
"showTitle": false,
"title": "# Peers",
"titleSize": "h6"
},
{
"collapse": false,
"height": "250px",
"panels": [
{
"aliasColors": { },
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "$datasource",
"fill": 10,
"id": 5,
"legend": {
"avg": false,
"current": false,
"max": false,
"min": false,
"show": true,
"total": false,
"values": false
},
"lines": true,
"linewidth": 0,
"links": [ ],
"nullPointMode": "null as zero",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [ ],
"spaceLength": 10,
"span": 6,
"stack": true,
"steppedLine": false,
"targets": [
{
"expr": "sum(rate(consul_http_request_count{job=~\"$job\"}[$__rate_interval])) by (instance)",
"format": "time_series",
"legendFormat": "{{instance}}",
"legendLink": null
}
],
"thresholds": [ ],
"timeFrom": null,
"timeShift": null,
"title": "QPS",
"tooltip": {
"shared": true,
"sort": 2,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": [ ]
},
"yaxes": [
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": 0,
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
]
},
{
"aliasColors": { },
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "$datasource",
"fill": 1,
"id": 6,
"legend": {
"avg": false,
"current": false,
"max": false,
"min": false,
"show": true,
"total": false,
"values": false
},
"lines": true,
"linewidth": 1,
"links": [ ],
"nullPointMode": "null as zero",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [ ],
"spaceLength": 10,
"span": 6,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "max(consul_http_request{job=~\"$job\", quantile=\"0.99\"}) by (instance)",
"format": "time_series",
"legendFormat": "99th Percentile",
"legendLink": "{{instance}}"
},
{
"expr": "max(consul_http_request{job=~\"$job\", quantile=\"0.5\"}) by (instance)",
"format": "time_series",
"legendFormat": "50th Percentile",
"legendLink": "{{instance}}"
},
{
"expr": "sum(rate(consul_http_request{job=~\"$job\"}[$__rate_interval])) by (instance) / sum(rate(consul_http_request{job=~\"$job\"}[$__rate_interval])) by (instance)",
"format": "time_series",
"legendFormat": "Average",
"legendLink": null
}
],
"thresholds": [ ],
"timeFrom": null,
"timeShift": null,
"title": "Latency",
"tooltip": {
"shared": true,
"sort": 2,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": [ ]
},
"yaxes": [
{
"format": "ms",
"label": null,
"logBase": 1,
"max": null,
"min": 0,
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
]
}
],
"repeat": null,
"repeatIteration": null,
"repeatRowId": null,
"showTitle": true,
"title": "Consul Server",
"titleSize": "h6"
}
],
"schemaVersion": 14,
"style": "dark",
"tags": [ ],
"templating": {
"list": [
{
"current": {
"text": "default",
"value": "default"
},
"hide": 0,
"label": "Data source",
"name": "datasource",
"options": [ ],
"query": "prometheus",
"refresh": 1,
"regex": "",
"type": "datasource"
},
{
"allValue": ".+",
"current": {
"selected": true,
"text": "All",
"value": "$__all"
},
"datasource": "$datasource",
"hide": 0,
"includeAll": true,
"label": "job",
"multi": true,
"name": "job",
"options": [ ],
"query": "label_values(consul_up, job)",
"refresh": 1,
"regex": "",
"sort": 2,
"tagValuesQuery": "",
"tags": [ ],
"tagsQuery": "",
"type": "query",
"useTags": false
},
{
"allValue": ".+",
"current": {
"selected": true,
"text": "All",
"value": "$__all"
},
"datasource": "$datasource",
"hide": 0,
"includeAll": true,
"label": "instance",
"multi": true,
"name": "instance",
"options": [ ],
"query": "label_values(consul_up{job=~\"$job\"}, instance)",
"refresh": 1,
"regex": "",
"sort": 2,
"tagValuesQuery": "",
"tags": [ ],
"tagsQuery": "",
"type": "query",
"useTags": false
}
]
},
"time": {
"from": "now-1h",
"to": "now"
},
"timepicker": {
"refresh_intervals": [
"5s",
"10s",
"30s",
"1m",
"5m",
"15m",
"30m",
"1h",
"2h",
"1d"
],
"time_options": [
"5m",
"15m",
"1h",
"6h",
"12h",
"24h",
"2d",
"7d",
"30d"
]
},
"timezone": "utc",
"title": "Consul Overview",
"uid": "f71ad233ae18512edec190eee2558346",
"version": 0
}

View file

@ -33,18 +33,6 @@ groups:
for: 15m
labels:
severity: warning
- alert: CortexTableSyncFailure
annotations:
message: |
{{ $labels.job }} is experiencing {{ printf "%.2f" $value }}% errors syncing tables.
expr: |
100 * rate(cortex_table_manager_sync_duration_seconds_count{status_code!~"2.."}[15m])
/
rate(cortex_table_manager_sync_duration_seconds_count[15m])
> 10
for: 30m
labels:
severity: critical
- alert: CortexQueriesIncorrect
annotations:
message: |
@ -113,26 +101,6 @@ groups:
changes(process_start_time_seconds{job=~".+(cortex|ingester.*)"}[30m]) >= 2
labels:
severity: warning
- alert: CortexTransferFailed
annotations:
message: |
{{ $labels.job }}/{{ $labels.instance }} transfer failed.
expr: |
max_over_time(cortex_shutdown_duration_seconds_count{op="transfer",status!="success"}[15m])
for: 5m
labels:
severity: critical
- alert: CortexOldChunkInMemory
annotations:
message: |
{{ $labels.job }}/{{ $labels.instance }} has very old unflushed chunk in memory.
expr: |
(time() - cortex_oldest_unflushed_chunk_timestamp_seconds > 36000)
and
(cortex_oldest_unflushed_chunk_timestamp_seconds > 0)
for: 5m
labels:
severity: warning
- alert: CortexKVStoreFailure
annotations:
message: |
@ -224,48 +192,6 @@ groups:
for: 5m
labels:
severity: critical
- name: cortex_wal_alerts
rules:
- alert: CortexWALCorruption
annotations:
message: |
{{ $labels.job }}/{{ $labels.instance }} has a corrupted WAL or checkpoint.
expr: |
increase(cortex_ingester_wal_corruptions_total[5m]) > 0
labels:
severity: critical
- alert: CortexCheckpointCreationFailed
annotations:
message: |
{{ $labels.job }}/{{ $labels.instance }} failed to create checkpoint.
expr: |
increase(cortex_ingester_checkpoint_creations_failed_total[10m]) > 0
labels:
severity: warning
- alert: CortexCheckpointCreationFailed
annotations:
message: |
{{ $labels.job }}/{{ $labels.instance }} is failing to create checkpoint.
expr: |
increase(cortex_ingester_checkpoint_creations_failed_total[1h]) > 1
labels:
severity: critical
- alert: CortexCheckpointDeletionFailed
annotations:
message: |
{{ $labels.job }}/{{ $labels.instance }} failed to delete checkpoint.
expr: |
increase(cortex_ingester_checkpoint_deletions_failed_total[10m]) > 0
labels:
severity: warning
- alert: CortexCheckpointDeletionFailed
annotations:
message: |
{{ $labels.instance }} is failing to delete checkpoint.
expr: |
increase(cortex_ingester_checkpoint_deletions_failed_total[2h]) > 1
labels:
severity: critical
- name: cortex-rollout-alerts
rules:
- alert: CortexRolloutStuck
@ -314,29 +240,12 @@ groups:
severity: warning
- name: cortex-provisioning
rules:
- alert: CortexProvisioningMemcachedTooSmall
annotations:
message: |
Chunk memcached cluster in {{ $labels.cluster }}/{{ $labels.namespace }} is too small, should be at least {{ printf "%.2f" $value }}GB.
expr: |
(
4 *
sum by (cluster, namespace) (cortex_ingester_memory_series * cortex_ingester_chunk_size_bytes_sum / cortex_ingester_chunk_size_bytes_count)
/ 1e9
)
>
(
sum by (cluster, namespace) (memcached_limit_bytes{job=~".+/memcached"}) / 1e9
)
for: 15m
labels:
severity: warning
- alert: CortexProvisioningTooManyActiveSeries
annotations:
message: |
The number of in-memory series per ingester in {{ $labels.cluster }}/{{ $labels.namespace }} is too high.
expr: |
avg by (cluster, namespace) (cortex_ingester_memory_series) > 1.6e6
avg by (cluster, namespace) (cortex_ingester_memory_series) > 3.2e6
for: 2h
labels:
severity: warning
@ -345,7 +254,7 @@ groups:
message: |
Ingesters in {{ $labels.cluster }}/{{ $labels.namespace }} ingest too many samples per second.
expr: |
avg by (cluster, namespace) (rate(cortex_ingester_ingested_samples_total[1m])) > 80e3
avg by (cluster, namespace) (rate(cortex_ingester_ingested_samples_total[1m])) > 160e3
for: 15m
labels:
severity: warning

File diff suppressed because it is too large Load diff

View file

@ -27,30 +27,40 @@
"height": "250px",
"panels": [
{
"aliasColors": { },
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "$datasource",
"fill": 1,
"id": 1,
"legend": {
"avg": false,
"current": false,
"max": false,
"min": false,
"show": true,
"total": false,
"values": false
"fieldConfig": {
"defaults": {
"custom": {
"drawStyle": "line",
"fillOpacity": 1,
"lineWidth": 1,
"pointSize": 5,
"showPoints": "never",
"spanNulls": false,
"stacking": {
"group": "A",
"mode": "none"
}
},
"thresholds": {
"mode": "absolute",
"steps": [ ]
},
"unit": "short"
},
"overrides": [ ]
},
"lines": true,
"linewidth": 1,
"id": 1,
"links": [ ],
"nullPointMode": "null as zero",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"options": {
"legend": {
"showLegend": true
},
"tooltip": {
"mode": "single",
"sort": "none"
}
},
"seriesOverrides": [
{
"alias": "limit",
@ -58,89 +68,64 @@
"fill": 0
}
],
"spaceLength": 10,
"span": 4,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "sum by(pod) (rate(container_cpu_usage_seconds_total{cluster=~\"$cluster\", namespace=~\"$namespace\",container=~\"compactor\"}[$__rate_interval]))",
"format": "time_series",
"interval": "15s",
"intervalFactor": 2,
"legendFormat": "{{pod}}",
"legendLink": null,
"step": 10
"legendLink": null
},
{
"expr": "min(container_spec_cpu_quota{cluster=~\"$cluster\", namespace=~\"$namespace\",container=~\"compactor\"} / container_spec_cpu_period{cluster=~\"$cluster\", namespace=~\"$namespace\",container=~\"compactor\"})",
"format": "time_series",
"interval": "15s",
"intervalFactor": 2,
"legendFormat": "limit",
"legendLink": null,
"step": 10
"legendLink": null
}
],
"thresholds": [ ],
"timeFrom": null,
"timeShift": null,
"title": "CPU",
"tooltip": {
"sort": 2
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": [ ]
},
"yaxes": [
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": 0,
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
]
"type": "timeseries"
},
{
"aliasColors": { },
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "$datasource",
"fill": 1,
"id": 2,
"legend": {
"avg": false,
"current": false,
"max": false,
"min": false,
"show": true,
"total": false,
"values": false
"fieldConfig": {
"defaults": {
"custom": {
"drawStyle": "line",
"fillOpacity": 1,
"lineWidth": 1,
"pointSize": 5,
"showPoints": "never",
"spanNulls": false,
"stacking": {
"group": "A",
"mode": "none"
}
},
"thresholds": {
"mode": "absolute",
"steps": [ ]
},
"unit": "bytes"
},
"overrides": [ ]
},
"lines": true,
"linewidth": 1,
"id": 2,
"links": [ ],
"nullPointMode": "null as zero",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"options": {
"legend": {
"showLegend": true
},
"tooltip": {
"mode": "single",
"sort": "none"
}
},
"seriesOverrides": [
{
"alias": "limit",
@ -148,45 +133,28 @@
"fill": 0
}
],
"spaceLength": 10,
"span": 4,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "max by(pod) (container_memory_working_set_bytes{cluster=~\"$cluster\", namespace=~\"$namespace\",container=~\"compactor\"})",
"format": "time_series",
"interval": "15s",
"intervalFactor": 2,
"legendFormat": "{{pod}}",
"legendLink": null,
"step": 10
"legendLink": null
},
{
"expr": "min(container_spec_memory_limit_bytes{cluster=~\"$cluster\", namespace=~\"$namespace\",container=~\"compactor\"} > 0)",
"format": "time_series",
"interval": "15s",
"intervalFactor": 2,
"legendFormat": "limit",
"legendLink": null,
"step": 10
"legendLink": null
}
],
"thresholds": [ ],
"timeFrom": null,
"timeShift": null,
"title": "Memory (workingset)",
"tooltip": {
"sort": 2
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": [ ]
},
"type": "timeseries",
"yaxes": [
{
"format": "bytes",
@ -207,61 +175,55 @@
]
},
{
"aliasColors": { },
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "$datasource",
"fill": 1,
"id": 3,
"legend": {
"avg": false,
"current": false,
"max": false,
"min": false,
"show": true,
"total": false,
"values": false
"fieldConfig": {
"defaults": {
"custom": {
"drawStyle": "line",
"fillOpacity": 1,
"lineWidth": 1,
"pointSize": 5,
"showPoints": "never",
"spanNulls": false,
"stacking": {
"group": "A",
"mode": "none"
}
},
"thresholds": {
"mode": "absolute",
"steps": [ ]
},
"unit": "bytes"
},
"overrides": [ ]
},
"lines": true,
"linewidth": 1,
"id": 3,
"links": [ ],
"nullPointMode": "null as zero",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [ ],
"spaceLength": 10,
"options": {
"legend": {
"showLegend": true
},
"tooltip": {
"mode": "single",
"sort": "none"
}
},
"span": 4,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "sum by(pod) (go_memstats_heap_inuse_bytes{cluster=~\"$cluster\", job=~\"($namespace)/compactor.*\"})",
"format": "time_series",
"interval": "15s",
"intervalFactor": 2,
"legendFormat": "{{pod}}",
"legendLink": null,
"step": 10
"legendLink": null
}
],
"thresholds": [ ],
"timeFrom": null,
"timeShift": null,
"title": "Memory (go heap inuse)",
"tooltip": {
"sort": 2
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": [ ]
},
"type": "timeseries",
"yaxes": [
{
"format": "bytes",
@ -294,63 +256,55 @@
"height": "250px",
"panels": [
{
"aliasColors": { },
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "$datasource",
"fieldConfig": {
"defaults": {
"custom": {
"drawStyle": "line",
"fillOpacity": 1,
"lineWidth": 1,
"pointSize": 5,
"showPoints": "never",
"spanNulls": false,
"stacking": {
"group": "A",
"mode": "none"
}
},
"thresholds": {
"mode": "absolute",
"steps": [ ]
},
"unit": "Bps"
},
"overrides": [ ]
},
"fill": 10,
"id": 4,
"legend": {
"avg": false,
"current": false,
"max": false,
"min": false,
"show": true,
"total": false,
"values": false
},
"lines": true,
"linewidth": 0,
"links": [ ],
"nullPointMode": "null as zero",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [ ],
"spaceLength": 10,
"options": {
"legend": {
"showLegend": true
},
"tooltip": {
"mode": "single",
"sort": "none"
}
},
"span": 6,
"stack": true,
"steppedLine": false,
"targets": [
{
"expr": "sum by(pod) (rate(container_network_receive_bytes_total{cluster=~\"$cluster\", namespace=~\"$namespace\",pod=~\"compactor.*\"}[$__rate_interval]))",
"format": "time_series",
"interval": "15s",
"intervalFactor": 2,
"legendFormat": "{{pod}}",
"legendLink": null,
"step": 10
"legendLink": null
}
],
"thresholds": [ ],
"timeFrom": null,
"timeShift": null,
"title": "Receive Bandwidth",
"tooltip": {
"shared": false,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": [ ]
},
"type": "timeseries",
"yaxes": [
{
"format": "Bps",
@ -371,63 +325,55 @@
]
},
{
"aliasColors": { },
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "$datasource",
"fieldConfig": {
"defaults": {
"custom": {
"drawStyle": "line",
"fillOpacity": 1,
"lineWidth": 1,
"pointSize": 5,
"showPoints": "never",
"spanNulls": false,
"stacking": {
"group": "A",
"mode": "none"
}
},
"thresholds": {
"mode": "absolute",
"steps": [ ]
},
"unit": "Bps"
},
"overrides": [ ]
},
"fill": 10,
"id": 5,
"legend": {
"avg": false,
"current": false,
"max": false,
"min": false,
"show": true,
"total": false,
"values": false
},
"lines": true,
"linewidth": 0,
"links": [ ],
"nullPointMode": "null as zero",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [ ],
"spaceLength": 10,
"options": {
"legend": {
"showLegend": true
},
"tooltip": {
"mode": "single",
"sort": "none"
}
},
"span": 6,
"stack": true,
"steppedLine": false,
"targets": [
{
"expr": "sum by(pod) (rate(container_network_transmit_bytes_total{cluster=~\"$cluster\", namespace=~\"$namespace\",pod=~\"compactor.*\"}[$__rate_interval]))",
"format": "time_series",
"interval": "15s",
"intervalFactor": 2,
"legendFormat": "{{pod}}",
"legendLink": null,
"step": 10
"legendLink": null
}
],
"thresholds": [ ],
"timeFrom": null,
"timeShift": null,
"title": "Transmit Bandwidth",
"tooltip": {
"shared": false,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": [ ]
},
"type": "timeseries",
"yaxes": [
{
"format": "Bps",
@ -460,63 +406,55 @@
"height": "250px",
"panels": [
{
"aliasColors": { },
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "$datasource",
"fieldConfig": {
"defaults": {
"custom": {
"drawStyle": "line",
"fillOpacity": 1,
"lineWidth": 1,
"pointSize": 5,
"showPoints": "never",
"spanNulls": false,
"stacking": {
"group": "A",
"mode": "none"
}
},
"thresholds": {
"mode": "absolute",
"steps": [ ]
},
"unit": "Bps"
},
"overrides": [ ]
},
"fill": 10,
"id": 6,
"legend": {
"avg": false,
"current": false,
"max": false,
"min": false,
"show": true,
"total": false,
"values": false
},
"lines": true,
"linewidth": 0,
"links": [ ],
"nullPointMode": "null as zero",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [ ],
"spaceLength": 10,
"options": {
"legend": {
"showLegend": true
},
"tooltip": {
"mode": "single",
"sort": "none"
}
},
"span": 4,
"stack": true,
"steppedLine": false,
"targets": [
{
"expr": "sum by(instance, pod, device) (\n rate(\n node_disk_written_bytes_total[$__rate_interval]\n )\n)\n+\nignoring(pod) group_right() (\n label_replace(\n count by(\n instance,\n pod,\n device\n )\n (\n container_fs_writes_bytes_total{\n cluster=~\"$cluster\", namespace=~\"$namespace\",\n container=\"compactor\",\n device!~\".*sda.*\"\n }\n ),\n \"device\",\n \"$1\",\n \"device\",\n \"/dev/(.*)\"\n ) * 0\n)\n\n",
"format": "time_series",
"interval": "15s",
"intervalFactor": 2,
"legendFormat": "{{pod}} - {{device}}",
"legendLink": null,
"step": 10
"legendLink": null
}
],
"thresholds": [ ],
"timeFrom": null,
"timeShift": null,
"title": "Disk Writes",
"tooltip": {
"shared": false,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": [ ]
},
"type": "timeseries",
"yaxes": [
{
"format": "Bps",
@ -537,63 +475,55 @@
]
},
{
"aliasColors": { },
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "$datasource",
"fieldConfig": {
"defaults": {
"custom": {
"drawStyle": "line",
"fillOpacity": 1,
"lineWidth": 1,
"pointSize": 5,
"showPoints": "never",
"spanNulls": false,
"stacking": {
"group": "A",
"mode": "none"
}
},
"thresholds": {
"mode": "absolute",
"steps": [ ]
},
"unit": "Bps"
},
"overrides": [ ]
},
"fill": 10,
"id": 7,
"legend": {
"avg": false,
"current": false,
"max": false,
"min": false,
"show": true,
"total": false,
"values": false
},
"lines": true,
"linewidth": 0,
"links": [ ],
"nullPointMode": "null as zero",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [ ],
"spaceLength": 10,
"options": {
"legend": {
"showLegend": true
},
"tooltip": {
"mode": "single",
"sort": "none"
}
},
"span": 4,
"stack": true,
"steppedLine": false,
"targets": [
{
"expr": "sum by(instance, pod, device) (\n rate(\n node_disk_read_bytes_total[$__rate_interval]\n )\n) + ignoring(pod) group_right() (\n label_replace(\n count by(\n instance,\n pod,\n device\n )\n (\n container_fs_writes_bytes_total{\n cluster=~\"$cluster\", namespace=~\"$namespace\",\n container=\"compactor\",\n device!~\".*sda.*\"\n }\n ),\n \"device\",\n \"$1\",\n \"device\",\n \"/dev/(.*)\"\n ) * 0\n)\n\n",
"format": "time_series",
"interval": "15s",
"intervalFactor": 2,
"legendFormat": "{{pod}} - {{device}}",
"legendLink": null,
"step": 10
"legendLink": null
}
],
"thresholds": [ ],
"timeFrom": null,
"timeShift": null,
"title": "Disk Reads",
"tooltip": {
"shared": false,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": [ ]
},
"type": "timeseries",
"yaxes": [
{
"format": "Bps",
@ -614,63 +544,52 @@
]
},
{
"aliasColors": { },
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "$datasource",
"fill": 1,
"id": 8,
"legend": {
"avg": false,
"current": false,
"max": false,
"min": false,
"show": true,
"total": false,
"values": false
"fieldConfig": {
"defaults": {
"custom": {
"drawStyle": "line",
"fillOpacity": 1,
"lineWidth": 1,
"pointSize": 5,
"showPoints": "never",
"spanNulls": false,
"stacking": {
"group": "A",
"mode": "none"
}
},
"thresholds": {
"mode": "absolute",
"steps": [ ]
},
"unit": "percentunit"
},
"overrides": [ ]
},
"lines": true,
"linewidth": 1,
"id": 8,
"links": [ ],
"nullPointMode": "null as zero",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [ ],
"spaceLength": 10,
"options": {
"legend": {
"showLegend": true
},
"tooltip": {
"mode": "single",
"sort": "none"
}
},
"span": 4,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "max by(persistentvolumeclaim) (\n kubelet_volume_stats_used_bytes{cluster=~\"$cluster\", namespace=~\"$namespace\"} /\n kubelet_volume_stats_capacity_bytes{cluster=~\"$cluster\", namespace=~\"$namespace\"}\n)\nand\ncount by(persistentvolumeclaim) (\n kube_persistentvolumeclaim_labels{\n cluster=~\"$cluster\", namespace=~\"$namespace\",\n label_name=\"compactor\"\n }\n)\n",
"format": "time_series",
"interval": "15s",
"intervalFactor": 2,
"legendFormat": "{{persistentvolumeclaim}}",
"legendLink": null,
"step": 10
"legendLink": null
}
],
"thresholds": [ ],
"timeFrom": null,
"timeShift": null,
"title": "Disk Space Utilization",
"tooltip": {
"shared": false,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": [ ]
},
"type": "timeseries",
"yaxes": [
{
"format": "percentunit",
@ -712,7 +631,7 @@
"value": "default"
},
"hide": 0,
"label": null,
"label": "Data source",
"name": "datasource",
"options": [ ],
"query": "prometheus",

File diff suppressed because it is too large Load diff

View file

@ -27,81 +27,55 @@
"height": "250px",
"panels": [
{
"aliasColors": { },
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "$datasource",
"fieldConfig": {
"defaults": {
"custom": {
"drawStyle": "line",
"fillOpacity": 1,
"lineWidth": 1,
"pointSize": 5,
"showPoints": "never",
"spanNulls": false,
"stacking": {
"group": "A",
"mode": "none"
}
},
"thresholds": {
"mode": "absolute",
"steps": [ ]
},
"unit": "instances"
},
"overrides": [ ]
},
"fill": 10,
"id": 1,
"legend": {
"avg": false,
"current": false,
"max": false,
"min": false,
"show": true,
"total": false,
"values": false
},
"lines": true,
"linewidth": 0,
"links": [ ],
"nullPointMode": "null as zero",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [ ],
"spaceLength": 10,
"options": {
"legend": {
"showLegend": true
},
"tooltip": {
"mode": "single",
"sort": "none"
}
},
"span": 12,
"stack": true,
"steppedLine": false,
"targets": [
{
"expr": "count(cortex_config_hash{cluster=~\"$cluster\", namespace=~\"$namespace\"}) by (sha256)",
"format": "time_series",
"interval": "15s",
"intervalFactor": 2,
"legendFormat": "sha256:{{sha256}}",
"legendLink": null,
"step": 10
"legendLink": null
}
],
"thresholds": [ ],
"timeFrom": null,
"timeShift": null,
"title": "Startup config file hashes",
"tooltip": {
"shared": false,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": [ ]
},
"yaxes": [
{
"format": "instances",
"label": null,
"logBase": 1,
"max": null,
"min": 0,
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
]
"type": "timeseries"
}
],
"repeat": null,
@ -116,81 +90,55 @@
"height": "250px",
"panels": [
{
"aliasColors": { },
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "$datasource",
"fieldConfig": {
"defaults": {
"custom": {
"drawStyle": "line",
"fillOpacity": 1,
"lineWidth": 1,
"pointSize": 5,
"showPoints": "never",
"spanNulls": false,
"stacking": {
"group": "A",
"mode": "none"
}
},
"thresholds": {
"mode": "absolute",
"steps": [ ]
},
"unit": "instances"
},
"overrides": [ ]
},
"fill": 10,
"id": 2,
"legend": {
"avg": false,
"current": false,
"max": false,
"min": false,
"show": true,
"total": false,
"values": false
},
"lines": true,
"linewidth": 0,
"links": [ ],
"nullPointMode": "null as zero",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [ ],
"spaceLength": 10,
"options": {
"legend": {
"showLegend": true
},
"tooltip": {
"mode": "single",
"sort": "none"
}
},
"span": 12,
"stack": true,
"steppedLine": false,
"targets": [
{
"expr": "count(cortex_runtime_config_hash{cluster=~\"$cluster\", namespace=~\"$namespace\"}) by (sha256)",
"format": "time_series",
"interval": "15s",
"intervalFactor": 2,
"legendFormat": "sha256:{{sha256}}",
"legendLink": null,
"step": 10
"legendLink": null
}
],
"thresholds": [ ],
"timeFrom": null,
"timeShift": null,
"title": "Runtime config file hashes",
"tooltip": {
"shared": false,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": [ ]
},
"yaxes": [
{
"format": "instances",
"label": null,
"logBase": 1,
"max": null,
"min": 0,
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
]
"type": "timeseries"
}
],
"repeat": null,
@ -214,7 +162,7 @@
"value": "default"
},
"hide": 0,
"label": null,
"label": "Data source",
"name": "datasource",
"options": [ ],
"query": "prometheus",

File diff suppressed because it is too large Load diff

File diff suppressed because it is too large Load diff

File diff suppressed because it is too large Load diff

File diff suppressed because it is too large Load diff

View file

@ -49,195 +49,142 @@
"height": "400px",
"panels": [
{
"aliasColors": { },
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "$datasource",
"fill": 1,
"id": 2,
"legend": {
"avg": false,
"current": false,
"max": false,
"min": false,
"show": true,
"total": false,
"values": false
"fieldConfig": {
"defaults": {
"custom": {
"drawStyle": "line",
"fillOpacity": 1,
"lineWidth": 1,
"pointSize": 5,
"showPoints": "never",
"spanNulls": false,
"stacking": {
"group": "A",
"mode": "none"
}
},
"thresholds": {
"mode": "absolute",
"steps": [ ]
},
"unit": "short"
},
"overrides": [
{
"matcher": {
"id": "byName",
"options": "__name__"
},
"properties": [
{
"id": "custom.hidden",
"value": true
}
]
},
{
"matcher": {
"id": "byName",
"options": "Time"
},
"properties": [
{
"id": "custom.hidden",
"value": true
}
]
},
{
"matcher": {
"id": "byName",
"options": "cluster"
},
"properties": [
{
"id": "displayName",
"value": "Cluster"
}
]
},
{
"matcher": {
"id": "byName",
"options": "namespace"
},
"properties": [
{
"id": "displayName",
"value": "Namespace"
}
]
},
{
"matcher": {
"id": "byName",
"options": "deployment"
},
"properties": [
{
"id": "displayName",
"value": "Service"
}
]
},
{
"matcher": {
"id": "byName",
"options": "reason"
},
"properties": [
{
"id": "displayName",
"value": "Reason"
}
]
},
{
"matcher": {
"id": "byName",
"options": "Value"
},
"properties": [
{
"id": "displayName",
"value": "Required Replicas"
}
]
}
]
},
"lines": true,
"linewidth": 1,
"id": 2,
"links": [ ],
"nullPointMode": "null as zero",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [ ],
"options": {
"legend": {
"showLegend": true
},
"tooltip": {
"mode": "single",
"sort": "none"
}
},
"sort": {
"col": 0,
"desc": false
},
"spaceLength": 10,
"span": 12,
"stack": false,
"steppedLine": false,
"styles": [
{
"alias": "Time",
"dateFormat": "YYYY-MM-DD HH:mm:ss",
"pattern": "Time",
"type": "hidden"
},
{
"alias": "Required Replicas",
"colorMode": null,
"colors": [ ],
"dateFormat": "YYYY-MM-DD HH:mm:ss",
"decimals": 0,
"link": false,
"linkTargetBlank": false,
"linkTooltip": "Drill down",
"linkUrl": "",
"pattern": "Value",
"thresholds": [ ],
"type": "number",
"unit": "short"
},
{
"alias": "Cluster",
"colorMode": null,
"colors": [ ],
"dateFormat": "YYYY-MM-DD HH:mm:ss",
"decimals": 2,
"link": false,
"linkTargetBlank": false,
"linkTooltip": "Drill down",
"linkUrl": "",
"pattern": "__name__",
"thresholds": [ ],
"type": "hidden",
"unit": "short"
},
{
"alias": "Cluster",
"colorMode": null,
"colors": [ ],
"dateFormat": "YYYY-MM-DD HH:mm:ss",
"decimals": 2,
"link": false,
"linkTargetBlank": false,
"linkTooltip": "Drill down",
"linkUrl": "",
"pattern": "cluster",
"thresholds": [ ],
"type": "number",
"unit": "short"
},
{
"alias": "Service",
"colorMode": null,
"colors": [ ],
"dateFormat": "YYYY-MM-DD HH:mm:ss",
"decimals": 2,
"link": false,
"linkTargetBlank": false,
"linkTooltip": "Drill down",
"linkUrl": "",
"pattern": "deployment",
"thresholds": [ ],
"type": "number",
"unit": "short"
},
{
"alias": "Namespace",
"colorMode": null,
"colors": [ ],
"dateFormat": "YYYY-MM-DD HH:mm:ss",
"decimals": 2,
"link": false,
"linkTargetBlank": false,
"linkTooltip": "Drill down",
"linkUrl": "",
"pattern": "namespace",
"thresholds": [ ],
"type": "number",
"unit": "short"
},
{
"alias": "Reason",
"colorMode": null,
"colors": [ ],
"dateFormat": "YYYY-MM-DD HH:mm:ss",
"decimals": 2,
"link": false,
"linkTargetBlank": false,
"linkTooltip": "Drill down",
"linkUrl": "",
"pattern": "reason",
"thresholds": [ ],
"type": "number",
"unit": "short"
},
{
"alias": "",
"colorMode": null,
"colors": [ ],
"dateFormat": "YYYY-MM-DD HH:mm:ss",
"decimals": 2,
"pattern": "/.*/",
"thresholds": [ ],
"type": "string",
"unit": "short"
}
],
"targets": [
{
"expr": "sort_desc(\n cluster_namespace_deployment_reason:required_replicas:count{cluster=~\"$cluster\", namespace=~\"$namespace\"}\n > ignoring(reason) group_left\n cluster_namespace_deployment:actual_replicas:count{cluster=~\"$cluster\", namespace=~\"$namespace\"}\n)\n",
"format": "table",
"instant": true,
"intervalFactor": 2,
"legendFormat": "",
"refId": "A",
"step": 10
"refId": "A"
}
],
"thresholds": [ ],
"timeFrom": null,
"timeShift": null,
"title": "Workload-based scaling",
"tooltip": {
"shared": false,
"sort": 0,
"value_type": "individual"
},
"transform": "table",
"type": "table",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": [ ]
},
"yaxes": [
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": 0,
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
]
"type": "table"
}
],
"repeat": null,
@ -261,7 +208,7 @@
"value": "default"
},
"hide": 0,
"label": null,
"label": "Data source",
"name": "datasource",
"options": [ ],
"query": "prometheus",

View file

@ -171,7 +171,7 @@
"value": "default"
},
"hide": 0,
"label": null,
"label": "Data source",
"name": "datasource",
"options": [ ],
"query": "prometheus",

File diff suppressed because it is too large Load diff

File diff suppressed because it is too large Load diff

View file

@ -501,7 +501,7 @@ groups:
cortex_ingester_memory_series
)[24h:]
)
/ 1500000
/ 3000000
)
labels:
deployment: ingester
@ -510,7 +510,7 @@ groups:
- expr: |
ceil(
sum by (cluster, namespace) (cortex_overrides{limit_name="max_global_series_per_user"})
* 3 * 0.59999999999999998 / 1500000
* 3 * 0.59999999999999998 / 3000000
)
labels:
deployment: ingester

View file

@ -1 +1 @@
null
{}

View file

@ -1,754 +0,0 @@
{
"__inputs": [ ],
"__requires": [ ],
"annotations": {
"list": [ ]
},
"editable": false,
"gnetId": null,
"graphTooltip": 0,
"hideControls": false,
"id": null,
"links": [
{
"asDropdown": false,
"icon": "external link",
"includeVars": true,
"keepTime": true,
"tags": [
"docker"
],
"targetBlank": false,
"title": "Docker Dashboards",
"type": "dashboards",
"url": ""
}
],
"panels": [
{
"collapse": false,
"collapsed": false,
"gridPos": {
"h": 0,
"w": 0,
"x": 0,
"y": 2
},
"id": 2,
"panels": [ ],
"repeat": null,
"repeatIteration": null,
"repeatRowId": null,
"showTitle": true,
"title": "Overview",
"titleSize": "h6",
"type": "row"
},
{
"datasource": "$loki_datasource",
"description": "Total number of log lines including errors and warnings.",
"fieldConfig": {
"defaults": {
"links": [ ],
"mappings": [ ],
"thresholds": {
"mode": "absolute",
"steps": [
{
"color": "rgb(192, 216, 255)",
"value": 0
}
]
},
"unit": "short"
}
},
"gridPos": {
"h": 4,
"w": 4,
"x": 0,
"y": 2
},
"id": 3,
"links": [ ],
"options": {
"colorMode": "value",
"graphMode": "none",
"justifyMode": "auto",
"orientation": "auto",
"reduceOptions": {
"calcs": [
"sum"
],
"fields": "",
"values": false
},
"textMode": "auto"
},
"pluginVersion": "7",
"targets": [
{
"expr": "sum(count_over_time({job=~\"$job\", instance=~\"$instance\", container=~\"$container\"}[$__interval]))",
"legendFormat": "",
"refId": "A"
}
],
"title": "Total Log Lines",
"transparent": false,
"type": "stat"
},
{
"datasource": "$loki_datasource",
"description": "Total number of log lines of level: warning.",
"fieldConfig": {
"defaults": {
"links": [ ],
"mappings": [ ],
"thresholds": {
"mode": "absolute",
"steps": [
{
"color": "rgb(255, 152, 48)",
"value": 0
}
]
},
"unit": "short"
}
},
"gridPos": {
"h": 4,
"w": 4,
"x": 4,
"y": 2
},
"id": 4,
"links": [ ],
"options": {
"colorMode": "value",
"graphMode": "none",
"justifyMode": "auto",
"orientation": "auto",
"reduceOptions": {
"calcs": [
"sum"
],
"fields": "",
"values": false
},
"textMode": "auto"
},
"pluginVersion": "7",
"targets": [
{
"expr": "sum(count_over_time({job=~\"$job\", instance=~\"$instance\", container=~\"$container\"} |= \"Warning\" [$__interval]))",
"legendFormat": "",
"refId": "A"
}
],
"title": "Warnings",
"transparent": false,
"type": "stat"
},
{
"datasource": "$loki_datasource",
"description": "Total number of log lines of level: error.",
"fieldConfig": {
"defaults": {
"links": [ ],
"mappings": [ ],
"thresholds": {
"mode": "absolute",
"steps": [
{
"color": "rgb(242, 73, 92)",
"value": 0
}
]
},
"unit": "short"
}
},
"gridPos": {
"h": 4,
"w": 4,
"x": 8,
"y": 2
},
"id": 5,
"links": [ ],
"options": {
"colorMode": "value",
"graphMode": "none",
"justifyMode": "auto",
"orientation": "auto",
"reduceOptions": {
"calcs": [
"sum"
],
"fields": "",
"values": false
},
"textMode": "auto"
},
"pluginVersion": "7",
"targets": [
{
"expr": "sum(count_over_time({job=~\"$job\", instance=~\"$instance\", container=~\"$container\"} |= \"Error\" [$__interval]))",
"legendFormat": "",
"refId": "A"
}
],
"title": "Errors",
"transparent": false,
"type": "stat"
},
{
"datasource": "$loki_datasource",
"description": "Percentage of log lines with level: Error out of total log lines.",
"fieldConfig": {
"defaults": {
"links": [ ],
"mappings": [ ],
"thresholds": {
"mode": "absolute",
"steps": [
{
"color": "rgb(255, 166, 176)",
"value": 0
},
{
"color": "rgb(255, 115, 131)",
"value": 25
},
{
"color": "rgb(196, 22, 42)",
"value": 50
}
]
},
"unit": "percent"
}
},
"gridPos": {
"h": 4,
"w": 4,
"x": 12,
"y": 2
},
"id": 6,
"links": [ ],
"options": {
"colorMode": "value",
"graphMode": "none",
"justifyMode": "auto",
"orientation": "auto",
"reduceOptions": {
"calcs": [
"lastNotNull"
],
"fields": "",
"values": false
},
"textMode": "auto"
},
"pluginVersion": "7",
"targets": [
{
"expr": "sum( count_over_time({job=~\"$job\", instance=~\"$instance\", container=~\"$container\"} |= \"Error\" [$__interval]) ) / sum( count_over_time({job=~\"$job\", instance=~\"$instance\", container=~\"$container\"} [$__interval]) )",
"legendFormat": "",
"refId": "A"
}
],
"title": "Error Percentage",
"transparent": false,
"type": "stat"
},
{
"datasource": "$loki_datasource",
"description": "Total number of bytes for log lines including errors and warnings.",
"fieldConfig": {
"defaults": {
"links": [ ],
"mappings": [ ],
"thresholds": {
"mode": "absolute",
"steps": [
{
"color": "rgb(184, 119, 217)",
"value": 0
}
]
},
"unit": "bytes"
}
},
"gridPos": {
"h": 4,
"w": 4,
"x": 16,
"y": 2
},
"id": 7,
"links": [ ],
"options": {
"colorMode": "value",
"graphMode": "none",
"justifyMode": "auto",
"orientation": "auto",
"reduceOptions": {
"calcs": [
"sum"
],
"fields": "",
"values": false
},
"textMode": "auto"
},
"pluginVersion": "7",
"targets": [
{
"expr": "sum(bytes_over_time({job=~\"$job\", instance=~\"$instance\", container=~\"$container\"} [$__interval]))",
"legendFormat": "",
"refId": "A"
}
],
"title": "Bytes Used",
"transparent": false,
"type": "stat"
},
{
"datasource": {
"type": "loki",
"uid": "${loki_datasource}"
},
"fieldConfig": {
"defaults": {
"color": {
"mode": "fixed"
},
"custom": {
"axisLabel": "",
"axisPlacement": "auto",
"axisSoftMin": 0,
"fillOpacity": 50,
"gradientMode": "none",
"hideFrom": {
"legend": false,
"tooltip": false,
"viz": false
},
"lineWidth": 1,
"scaleDistribution": {
"type": "linear"
}
},
"mappings": [ ],
"thresholds": {
"mode": "absolute",
"steps": [
{
"color": "green",
"value": null
}
]
},
"unit": "short"
},
"overrides": [
{
"matcher": {
"id": "byFrameRefID",
"options": "A"
},
"properties": [
{
"id": "displayName",
"value": "Lines"
},
{
"id": "color",
"value": {
"fixedColor": "super-light-blue",
"mode": "fixed"
}
}
]
},
{
"matcher": {
"id": "byFrameRefID",
"options": "B"
},
"properties": [
{
"id": "displayName",
"value": "Warnings"
},
{
"id": "color",
"value": {
"fixedColor": "orange",
"mode": "fixed"
}
}
]
},
{
"matcher": {
"id": "byFrameRefID",
"options": "C"
},
"properties": [
{
"id": "displayName",
"value": "Errors"
},
{
"id": "color",
"value": {
"fixedColor": "red",
"mode": "fixed"
}
}
]
}
]
},
"gridPos": {
"h": 6,
"w": 24,
"x": 0,
"y": 6
},
"id": 8,
"interval": "10s",
"maxDataPoints": 25,
"options": {
"barRadius": 0.25,
"barWidth": 0.69999999999999996,
"groupWidth": 0.5,
"legend": {
"calcs": [ ],
"displayMode": "list",
"placement": "bottom"
},
"orientation": "auto",
"showValue": "never",
"stacking": "none",
"tooltip": {
"mode": "multi",
"sort": "none"
},
"xTickLabelRotation": 0,
"xTickLabelSpacing": 100
},
"targets": [
{
"datasource": {
"type": "loki",
"uid": "${loki_datasource}"
},
"expr": "sum(count_over_time({job=~\"$job\", instance=~\"$instance\", container=~\"$container\"}[$__interval]))",
"refId": "A"
},
{
"datasource": {
"type": "loki",
"uid": "${loki_datasource}"
},
"expr": "sum(count_over_time({job=~\"$job\", instance=~\"$instance\", container=~\"$container\"} |= \"Warning\" [$__interval]))",
"hide": false,
"refId": "B"
},
{
"datasource": {
"type": "loki",
"uid": "${loki_datasource}"
},
"expr": "sum(count_over_time({job=~\"$job\", instance=~\"$instance\", container=~\"$container\"} |= \"Error\" [$__interval]))",
"hide": false,
"refId": "C"
}
],
"title": "Historical Logs / Warnings / Errors",
"type": "barchart"
},
{
"collapse": true,
"collapsed": true,
"gridPos": {
"h": 0,
"w": 0,
"x": 0,
"y": 12
},
"id": 9,
"panels": [
{
"datasource": "$loki_datasource",
"gridPos": {
"h": 8,
"w": 24,
"x": 0,
"y": 12
},
"id": 10,
"options": {
"showLabels": false,
"showTime": true,
"sortOrder": "Descending",
"wrapLogMessage": true
},
"span": 12,
"targets": [
{
"expr": "{job=~\"$job\", instance=~\"$instance\", container=~\"$container\"} |= \"Error\"",
"legendFormat": "",
"refId": "A"
}
],
"timeFrom": null,
"timeShift": null,
"title": "Errors",
"type": "logs"
}
],
"repeat": null,
"repeatIteration": null,
"repeatRowId": null,
"showTitle": true,
"title": "Errors",
"titleSize": "h6",
"type": "row"
},
{
"collapse": true,
"collapsed": true,
"gridPos": {
"h": 0,
"w": 0,
"x": 0,
"y": 20
},
"id": 11,
"panels": [
{
"datasource": "$loki_datasource",
"gridPos": {
"h": 8,
"w": 24,
"x": 0,
"y": 20
},
"id": 12,
"options": {
"showLabels": false,
"showTime": true,
"sortOrder": "Descending",
"wrapLogMessage": true
},
"span": 12,
"targets": [
{
"expr": "{job=~\"$job\", instance=~\"$instance\", container=~\"$container\"} |= \"Warning\"",
"legendFormat": "",
"refId": "A"
}
],
"timeFrom": null,
"timeShift": null,
"title": "Warnings",
"type": "logs"
}
],
"repeat": null,
"repeatIteration": null,
"repeatRowId": null,
"showTitle": true,
"title": "Warnings",
"titleSize": "h6",
"type": "row"
},
{
"collapse": true,
"collapsed": true,
"gridPos": {
"h": 0,
"w": 0,
"x": 0,
"y": 28
},
"id": 13,
"panels": [
{
"datasource": "$loki_datasource",
"gridPos": {
"h": 8,
"w": 24,
"x": 0,
"y": 28
},
"id": 14,
"options": {
"showLabels": false,
"showTime": true,
"sortOrder": "Descending",
"wrapLogMessage": true
},
"span": 12,
"targets": [
{
"expr": "{job=~\"$job\", instance=~\"$instance\", container=~\"$container\"}",
"legendFormat": "",
"refId": "A"
}
],
"timeFrom": null,
"timeShift": null,
"title": "Full Log File",
"type": "logs"
}
],
"repeat": null,
"repeatIteration": null,
"repeatRowId": null,
"showTitle": true,
"title": "Complete Log File",
"titleSize": "h6",
"type": "row"
}
],
"refresh": "1m",
"rows": [ ],
"schemaVersion": 14,
"style": "dark",
"tags": [
"docker"
],
"templating": {
"list": [
{
"current": {
"text": "default",
"value": "default"
},
"hide": 0,
"label": "Prometheus Data Source",
"name": "prometheus_datasource",
"options": [ ],
"query": "prometheus",
"refresh": 1,
"regex": "",
"type": "datasource"
},
{
"current": {
"text": "default",
"value": "default"
},
"hide": 0,
"label": "Loki Data Source",
"name": "loki_datasource",
"options": [ ],
"query": "loki",
"refresh": 1,
"regex": "",
"type": "datasource"
},
{
"allValue": ".+",
"current": { },
"datasource": "$prometheus_datasource",
"hide": 0,
"includeAll": true,
"label": "Job",
"multi": true,
"name": "job",
"options": [ ],
"query": "label_values(machine_scrape_error, job)",
"refresh": 1,
"regex": "",
"sort": 1,
"tagValuesQuery": "",
"tags": [ ],
"tagsQuery": "",
"type": "query",
"useTags": false
},
{
"allValue": ".+",
"current": { },
"datasource": "$prometheus_datasource",
"hide": 0,
"includeAll": true,
"label": "Instance",
"multi": true,
"name": "instance",
"options": [ ],
"query": "label_values(machine_scrape_error{job=~\"$job\"}, instance)",
"refresh": 1,
"regex": "",
"sort": 1,
"tagValuesQuery": "",
"tags": [ ],
"tagsQuery": "",
"type": "query",
"useTags": false
},
{
"allValue": ".+",
"current": { },
"datasource": "$prometheus_datasource",
"hide": 0,
"includeAll": true,
"label": "Container",
"multi": true,
"name": "container",
"options": [ ],
"query": "label_values(container_last_seen{job=~\"$job\", instance=~\"$instance\"}, name)",
"refresh": 1,
"regex": "",
"sort": 1,
"tagValuesQuery": "",
"tags": [ ],
"tagsQuery": "",
"type": "query",
"useTags": false
}
]
},
"time": {
"from": "now-1h",
"to": "now"
},
"timepicker": {
"refresh_intervals": [
"5s",
"10s",
"30s",
"1m",
"5m",
"15m",
"30m",
"1h",
"2h",
"1d"
],
"time_options": [
"5m",
"15m",
"1h",
"6h",
"12h",
"24h",
"2d",
"7d",
"30d"
]
},
"timezone": "default",
"title": "Docker Logs",
"uid": "integration-docker-logs",
"version": 0
}

File diff suppressed because it is too large Load diff

View file

@ -1 +1 @@
null
{}

View file

@ -150,7 +150,7 @@ groups:
quota as the writes to etcd will be disabled when it is full.'
summary: etcd cluster database is running full.
expr: |
(last_over_time(etcd_mvcc_db_total_size_in_bytes[5m]) / last_over_time(etcd_server_quota_backend_bytes[5m]))*100 > 95
(last_over_time(etcd_mvcc_db_total_size_in_bytes{job=~".*etcd.*"}[5m]) / last_over_time(etcd_server_quota_backend_bytes{job=~".*etcd.*"}[5m]))*100 > 95
for: 10m
labels:
severity: critical
@ -162,7 +162,7 @@ groups:
be disruptive.'
summary: etcd cluster database growing very fast.
expr: |
predict_linear(etcd_mvcc_db_total_size_in_bytes[4h], 4*60*60) > etcd_server_quota_backend_bytes
predict_linear(etcd_mvcc_db_total_size_in_bytes{job=~".*etcd.*"}[4h], 4*60*60) > etcd_server_quota_backend_bytes{job=~".*etcd.*"}
for: 10m
labels:
severity: warning
@ -176,7 +176,7 @@ groups:
summary: etcd database size in use is less than 50% of the actual allocated
storage.
expr: |
(last_over_time(etcd_mvcc_db_total_size_in_use_in_bytes[5m]) / last_over_time(etcd_mvcc_db_total_size_in_bytes[5m])) < 0.5 and etcd_mvcc_db_total_size_in_use_in_bytes > 104857600
(last_over_time(etcd_mvcc_db_total_size_in_use_in_bytes{job=~".*etcd.*"}[5m]) / last_over_time(etcd_mvcc_db_total_size_in_bytes{job=~".*etcd.*"}[5m])) < 0.5 and etcd_mvcc_db_total_size_in_use_in_bytes{job=~".*etcd.*"} > 104857600
for: 10m
labels:
severity: warning

File diff suppressed because it is too large Load diff

View file

@ -819,7 +819,7 @@
"useTags": false
},
{
"allValue": "",
"allValue": ".+",
"current": { },
"datasource": {
"uid": "${prometheus_datasource}"

View file

@ -6,8 +6,8 @@ groups:
message: '{{ $labels.namespace }}/{{ $labels.job }}/{{ $labels.handler }} is
experiencing {{ $value | humanize }}% errors'
expr: |
100 * namespace_job_handler_statuscode:grafana_http_request_duration_seconds_count:rate5m{handler!~"/api/datasources/proxy/:id.*|/api/ds/query|/api/tsdb/query", status_code=~"5.."}
/ ignoring (status_code)
100 * sum without (status_code) (namespace_job_handler_statuscode:grafana_http_request_duration_seconds_count:rate5m{handler!~"/api/datasources/proxy/:id.*|/api/ds/query|/api/tsdb/query", status_code=~"5.."})
/
sum without (status_code) (namespace_job_handler_statuscode:grafana_http_request_duration_seconds_count:rate5m{handler!~"/api/datasources/proxy/:id.*|/api/ds/query|/api/tsdb/query"})
> 50
for: 5m

View file

@ -438,7 +438,6 @@
}
],
"schemaVersion": 30,
"style": "dark",
"tags": [ ],
"templating": {
"list": [

View file

@ -6,7 +6,7 @@ groups:
description: HAProxy {{$labels.job}} on {{$labels.instance}} is dropping logs.
summary: HAProxy is dropping logs.
expr: rate(haproxy_process_dropped_logs_total[5m]) != 0
for: 5s
for: 10m
labels:
severity: critical
- alert: HAProxyBackendCheckFlapping
@ -15,7 +15,7 @@ groups:
has flapping checks.
summary: HAProxy backend checks are flapping.
expr: rate(haproxy_backend_check_up_down_total[5m]) != 0
for: 1m
for: 10m
labels:
severity: critical
- alert: HAProxyServerCheckFlapping
@ -24,6 +24,6 @@ groups:
has flapping checks.
summary: HAProxy server checks are flapping.
expr: rate(haproxy_server_check_up_down_total[5m]) != 0
for: 1m
for: 10m
labels:
severity: critical

View file

@ -1445,7 +1445,7 @@
"uid": "${loki_datasource}"
},
"editorMode": "code",
"expr": "{job=~\"$job\", filename=~\"/var/mqm/qmgrs/.*/errors/.*LOG\", qmgr=~\"$qmgr\"} |= ``",
"expr": "{job=~\"$job\", qmgr=~\"$qmgr\"} |= `` | (filename=~\"/var/mqm/qmgrs/.*/errors/.*LOG\" or log_type=\"mq-qmgr-error\")",
"queryType": "range",
"refId": "A"
}

View file

@ -142,17 +142,19 @@
},
"gridPos": {
"h": 6,
"w": 24
"w": 24,
"x": 0,
"y": 0
},
"id": 1,
"interval": "30s",
"maxDataPoints": 100,
"options": {
"tooltip": {
"mode": "multi",
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -182,7 +184,9 @@
},
"gridPos": {
"h": 18,
"w": 24
"w": 24,
"x": 0,
"y": 18
},
"id": 2,
"options": {
@ -192,7 +196,7 @@
"showTime": false,
"wrapLogMessage": true
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -207,7 +211,7 @@
}
],
"refresh": "1m",
"schemaVersion": 36,
"schemaVersion": 39,
"tags": [
"influxdb-mixin"
],

View file

@ -147,17 +147,19 @@
},
"gridPos": {
"h": 6,
"w": 24
"w": 24,
"x": 0,
"y": 0
},
"id": 1,
"interval": "30s",
"maxDataPoints": 100,
"options": {
"tooltip": {
"mode": "multi",
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -187,7 +189,9 @@
},
"gridPos": {
"h": 18,
"w": 24
"w": 24,
"x": 0,
"y": 18
},
"id": 2,
"options": {
@ -197,7 +201,7 @@
"showTime": false,
"wrapLogMessage": false
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -212,7 +216,7 @@
}
],
"refresh": "1m",
"schemaVersion": 36,
"schemaVersion": 39,
"tags": [
"istio"
],

View file

@ -56,7 +56,7 @@
"options": {
"graphMode": "none"
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -105,7 +105,7 @@
"options": {
"graphMode": "none"
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -154,7 +154,7 @@
"options": {
"graphMode": "none"
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -222,7 +222,7 @@
"options": {
"graphMode": "none"
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -271,7 +271,7 @@
"options": {
"graphMode": "none"
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -320,7 +320,7 @@
"options": {
"graphMode": "none"
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -372,7 +372,7 @@
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -442,7 +442,7 @@
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -543,7 +543,7 @@
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -693,7 +693,7 @@
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -787,7 +787,7 @@
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -1123,7 +1123,7 @@
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -1183,7 +1183,7 @@
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {

View file

@ -72,7 +72,7 @@
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -122,7 +122,7 @@
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -177,7 +177,7 @@
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -231,7 +231,7 @@
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -338,7 +338,7 @@
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -482,7 +482,7 @@
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -537,7 +537,7 @@
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -591,7 +591,7 @@
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -657,7 +657,7 @@
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -707,7 +707,7 @@
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -762,7 +762,7 @@
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -816,7 +816,7 @@
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -923,7 +923,7 @@
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -1067,7 +1067,7 @@
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -1122,7 +1122,7 @@
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -1176,7 +1176,7 @@
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {

View file

@ -72,7 +72,7 @@
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -122,7 +122,7 @@
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -177,7 +177,7 @@
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -231,7 +231,7 @@
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -338,7 +338,7 @@
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -482,7 +482,7 @@
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -537,7 +537,7 @@
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -591,7 +591,7 @@
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -657,7 +657,7 @@
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -707,7 +707,7 @@
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -762,7 +762,7 @@
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -816,7 +816,7 @@
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -923,7 +923,7 @@
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -1067,7 +1067,7 @@
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -1122,7 +1122,7 @@
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {
@ -1176,7 +1176,7 @@
"sort": "desc"
}
},
"pluginVersion": "v10.0.0",
"pluginVersion": "v11.0.0",
"targets": [
{
"datasource": {

View file

@ -3,16 +3,18 @@ groups:
rules:
- alert: JaegerAgentUDPPacketsBeingDropped
annotations:
message: |
description: |
{{ $labels.job }} {{ $labels.instance }} is dropping {{ printf "%.2f" $value }} UDP packets per second.
summary: Jaeger agent is dropping UDP packets.
expr: rate(jaeger_agent_thrift_udp_server_packets_dropped_total[1m]) > 1
for: 15m
labels:
severity: warning
- alert: JaegerAgentHTTPServerErrs
annotations:
message: |
description: |
{{ $labels.job }} {{ $labels.instance }} is experiencing {{ printf "%.2f" $value }}% HTTP errors.
summary: Jaeger agent is experiencing HTTP errors.
expr: 100 * sum(rate(jaeger_agent_http_server_errors_total[1m])) by (instance,
job, namespace) / sum(rate(jaeger_agent_http_server_total[1m])) by (instance,
job, namespace)> 1
@ -21,8 +23,9 @@ groups:
severity: warning
- alert: JaegerClientSpansDropped
annotations:
message: |
description: |
service {{ $labels.job }} {{ $labels.instance }} is dropping {{ printf "%.2f" $value }}% spans.
summary: Jaeger client is dropping spans.
expr: 100 * sum(rate(jaeger_reporter_spans{result=~"dropped|err"}[1m])) by (instance,
job, namespace) / sum(rate(jaeger_reporter_spans[1m])) by (instance, job, namespace)>
1
@ -31,8 +34,9 @@ groups:
severity: warning
- alert: JaegerAgentSpansDropped
annotations:
message: |
description: |
agent {{ $labels.job }} {{ $labels.instance }} is dropping {{ printf "%.2f" $value }}% spans.
summary: Jaeger agent is dropping spans.
expr: 100 * sum(rate(jaeger_agent_reporter_batches_failures_total[1m])) by (instance,
job, namespace) / sum(rate(jaeger_agent_reporter_batches_submitted_total[1m]))
by (instance, job, namespace)> 1
@ -41,16 +45,18 @@ groups:
severity: warning
- alert: JaegerCollectorQueueNotDraining
annotations:
message: |
description: |
collector {{ $labels.job }} {{ $labels.instance }} is not able to drain the queue.
summary: Jaeger collector is not able to drain the queue.
expr: avg_over_time(jaeger_collector_queue_length[10m]) > 1000
for: 15m
labels:
severity: warning
- alert: JaegerCollectorDroppingSpans
annotations:
message: |
description: |
collector {{ $labels.job }} {{ $labels.instance }} is dropping {{ printf "%.2f" $value }}% spans.
summary: Jaeger collector is dropping spans.
expr: 100 * sum(rate(jaeger_collector_spans_dropped_total[1m])) by (instance,
job, namespace) / sum(rate(jaeger_collector_spans_received_total[1m])) by (instance,
job, namespace)> 1
@ -59,8 +65,9 @@ groups:
severity: warning
- alert: JaegerSamplingUpdateFailing
annotations:
message: |
description: |
{{ $labels.job }} {{ $labels.instance }} is failing {{ printf "%.2f" $value }}% in updating sampling policies.
summary: Jaeger's sampling update is failing.
expr: 100 * sum(rate(jaeger_sampler_queries{result="err"}[1m])) by (instance,
job, namespace) / sum(rate(jaeger_sampler_queries[1m])) by (instance, job, namespace)>
1
@ -69,8 +76,9 @@ groups:
severity: warning
- alert: JaegerCollectorPersistenceSlow
annotations:
message: |
description: |
{{ $labels.job }} {{ $labels.instance }} is slow at persisting spans.
summary: Jaeger collector is slow at persisting spans.
expr: histogram_quantile(0.99, sum by (le) (rate(jaeger_collector_save_latency_bucket[1m])))
> 0.5
for: 15m
@ -78,8 +86,9 @@ groups:
severity: warning
- alert: JaegerThrottlingUpdateFailing
annotations:
message: |
description: |
{{ $labels.job }} {{ $labels.instance }} is failing {{ printf "%.2f" $value }}% in updating throttling policies.
summary: Jaeger's throttling update is failing.
expr: 100 * sum(rate(jaeger_throttler_updates{result="err"}[1m])) by (instance,
job, namespace) / sum(rate(jaeger_throttler_updates[1m])) by (instance, job,
namespace)> 1
@ -88,8 +97,9 @@ groups:
severity: warning
- alert: JaegerQueryReqsFailing
annotations:
message: |
description: |
{{ $labels.job }} {{ $labels.instance }} is seeing {{ printf "%.2f" $value }}% query errors on {{ $labels.operation }}.
summary: Jaeger queries are failing.
expr: 100 * sum(rate(jaeger_query_requests_total{result="err"}[1m])) by (instance,
job, namespace) / sum(rate(jaeger_query_requests_total[1m])) by (instance, job,
namespace)> 1
@ -98,8 +108,9 @@ groups:
severity: warning
- alert: JaegerCassandraWritesFailing
annotations:
message: |
description: |
{{ $labels.job }} {{ $labels.instance }} is seeing {{ printf "%.2f" $value }}% query errors on {{ $labels.operation }}.
summary: Jaeger writes to Cassandra are failing.
expr: 100 * sum(rate(jaeger_cassandra_errors_total[1m])) by (instance, job, namespace)
/ sum(rate(jaeger_cassandra_attempts_total[1m])) by (instance, job, namespace)>
1
@ -108,8 +119,9 @@ groups:
severity: warning
- alert: JaegerCassandraReadsFailing
annotations:
message: |
description: |
{{ $labels.job }} {{ $labels.instance }} is seeing {{ printf "%.2f" $value }}% query errors on {{ $labels.operation }}.
summary: Jaeger reads from Cassandra are failing.
expr: 100 * sum(rate(jaeger_cassandra_read_errors_total[1m])) by (instance, job,
namespace) / sum(rate(jaeger_cassandra_read_attempts_total[1m])) by (instance,
job, namespace)> 1

View file

@ -50,7 +50,6 @@
{
"expr": "sum(rate(jaeger_query_requests_total{result=\"err\"}[1m]))",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "error",
"refId": "A",
"step": 10
@ -58,7 +57,6 @@
{
"expr": "sum(rate(jaeger_query_requests_total[1m])) - sum(rate(jaeger_query_requests_total{result=\"err\"}[1m]))",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "success",
"refId": "B",
"step": 10
@ -134,7 +132,6 @@
{
"expr": "histogram_quantile(0.99, sum(rate(jaeger_query_latency_bucket[1m])) by (le, instance))",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "{{instance}}",
"legendLink": null
}
@ -224,7 +221,6 @@
{
"expr": "sum(rate(jaeger_cassandra_read_errors_total[1m]))",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "error",
"refId": "A",
"step": 10
@ -232,7 +228,6 @@
{
"expr": "sum(rate(jaeger_cassandra_read_attempts_total[1m])) - sum(rate(jaeger_cassandra_read_errors_total[1m]))",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "success",
"refId": "B",
"step": 10
@ -308,7 +303,6 @@
{
"expr": "histogram_quantile(0.99, sum(rate(jaeger_cassandra_read_latency_ok_bucket[1m])) by (le, instance))",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "{{instance}}",
"legendLink": null
}
@ -369,7 +363,7 @@
"value": "default"
},
"hide": 0,
"label": "Data Source",
"label": "Data source",
"name": "datasource",
"options": [ ],
"query": "prometheus",

View file

@ -50,7 +50,6 @@
{
"expr": "sum(rate(jaeger_reporter_spans{result=~\"dropped|err\"}[1m]))",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "error",
"refId": "A",
"step": 10
@ -58,7 +57,6 @@
{
"expr": "sum(rate(jaeger_reporter_spans[1m])) - sum(rate(jaeger_reporter_spans{result=~\"dropped|err\"}[1m]))",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "success",
"refId": "B",
"step": 10
@ -134,7 +132,6 @@
{
"expr": "sum(rate(jaeger_reporter_spans{result=~\"dropped|err\"}[1m])) by (namespace) / scalar(sum(rate(jaeger_reporter_spans[1m])))",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "{{namespace}}",
"legendLink": null
}
@ -224,7 +221,6 @@
{
"expr": "sum(rate(jaeger_agent_reporter_batches_failures_total[1m]))",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "error",
"refId": "A",
"step": 10
@ -232,7 +228,6 @@
{
"expr": "sum(rate(jaeger_agent_reporter_batches_submitted_total[1m])) - sum(rate(jaeger_agent_reporter_batches_failures_total[1m]))",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "success",
"refId": "B",
"step": 10
@ -308,7 +303,6 @@
{
"expr": "sum(rate(jaeger_agent_reporter_batches_failures_total[1m])) by (cluster) / scalar(sum(rate(jaeger_agent_reporter_batches_submitted_total[1m])))",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "{{cluster}}",
"legendLink": null
}
@ -398,7 +392,6 @@
{
"expr": "sum(rate(jaeger_collector_spans_dropped_total[1m]))",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "error",
"refId": "A",
"step": 10
@ -406,7 +399,6 @@
{
"expr": "sum(rate(jaeger_collector_spans_received_total[1m])) - sum(rate(jaeger_collector_spans_dropped_total[1m]))",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "success",
"refId": "B",
"step": 10
@ -482,7 +474,6 @@
{
"expr": "sum(rate(jaeger_collector_spans_dropped_total[1m])) by (instance) / scalar(sum(rate(jaeger_collector_spans_received_total[1m])))",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "{{instance}}",
"legendLink": null
}
@ -569,7 +560,6 @@
{
"expr": "sum by (svc) (rate(jaeger_collector_traces_saved_by_svc_total[1m]))",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "{{svc}}",
"legendLink": null
}
@ -644,7 +634,6 @@
{
"expr": "sum by (svc) (rate(jaeger_collector_spans_saved_by_svc_total[1m]))",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "{{svc}}",
"legendLink": null
}
@ -731,7 +720,6 @@
{
"expr": "jaeger_collector_queue_length",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "{{instance}}",
"legendLink": null
}
@ -806,7 +794,6 @@
{
"expr": "histogram_quantile(0.95, sum(rate(jaeger_collector_in_queue_latency_bucket[1m])) by (le, instance))",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "{{instance}}",
"legendLink": null
}
@ -896,7 +883,6 @@
{
"expr": "sum(rate(jaeger_cassandra_errors_total[1m]))",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "error",
"refId": "A",
"step": 10
@ -904,7 +890,6 @@
{
"expr": "sum(rate(jaeger_cassandra_attempts_total[1m])) - sum(rate(jaeger_cassandra_errors_total[1m]))",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "success",
"refId": "B",
"step": 10
@ -980,7 +965,6 @@
{
"expr": "histogram_quantile(0.95, sum by (job, le) (rate(jaeger_collector_save_latency_bucket[1m])))",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "{{job}}",
"legendLink": null
}
@ -1041,7 +1025,7 @@
"value": "default"
},
"hide": 0,
"label": "Data Source",
"label": "Data source",
"name": "datasource",
"options": [ ],
"query": "prometheus",

File diff suppressed because it is too large Load diff

View file

@ -1,14 +1 @@
groups:
- name: jvm
rules:
- alert: JvmMemoryFillingUp
annotations:
description: JVM memory usage is at {{ printf "%.0f" $value }} percent over
the last 5 minutes on {{$labels.instance}}, which is above the threshold of
80%.
summary: JVM memory filling up.
expr: |
jvm_memory_bytes_used / jvm_memory_bytes_max{area="heap"} > 0.8
for: 5m
labels:
severity: warning
null

View file

@ -1,577 +0,0 @@
{
"__inputs": [
{
"description": "A prometheus datasource with JMX Exporter scraping",
"label": "Data Source",
"name": "datasource",
"pluginId": "prometheus",
"pluginName": "Prometheus",
"type": "datasource"
}
],
"__requires": [
{
"id": "grafana",
"name": "Grafana",
"type": "grafana",
"version": "4.5.0-pre1"
},
{
"id": "graph",
"name": "Graph",
"type": "panel",
"version": ""
},
{
"id": "prometheus",
"name": "Prometheus",
"type": "datasource",
"version": "1.0.0"
}
],
"annotations": {
"list": [ ]
},
"description": "Dashboard for JVM metrics with Prometheus / JMX Exporter",
"editable": true,
"gnetId": 3066,
"graphTooltip": 0,
"hideControls": false,
"id": null,
"links": [ ],
"refresh": "30s",
"rows": [
{
"collapse": false,
"height": 250,
"panels": [
{
"aliasColors": { },
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "${datasource}",
"fill": 1,
"id": 2,
"legend": {
"alignAsTable": true,
"avg": true,
"current": true,
"max": true,
"min": true,
"rightSide": true,
"show": true,
"total": false,
"values": true
},
"lines": true,
"linewidth": 1,
"links": [ ],
"nullPointMode": "null",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"repeat": null,
"seriesOverrides": [ ],
"spaceLength": 10,
"span": 12,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "jvm_memory_bytes_used{job=~\"$job\", instance=~\"$instance\"}",
"format": "time_series",
"interval": "",
"legendFormat": "{{area}} memory [{{instance}}]",
"metric": "jvm_memory_bytes_used",
"refId": "A",
"step": 5
}
],
"thresholds": [ ],
"timeFrom": null,
"timeShift": null,
"title": "Memory used",
"tooltip": {
"shared": true,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": [ ]
},
"yaxes": [
{
"format": "bytes",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": true
}
]
}
],
"repeat": null,
"repeatIteration": null,
"repeatRowId": null,
"showTitle": false,
"title": "Dashboard Row",
"titleSize": "h6"
},
{
"collapse": false,
"height": 250,
"panels": [
{
"aliasColors": { },
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "${datasource}",
"fill": 1,
"id": 3,
"legend": {
"avg": false,
"current": false,
"max": false,
"min": false,
"show": true,
"total": false,
"values": false
},
"lines": true,
"linewidth": 1,
"links": [ ],
"nullPointMode": "null",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [ ],
"spaceLength": 10,
"span": 6,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "jvm_threads_current{job=~\"$job\", instance=~\"$instance\"}",
"format": "time_series",
"legendFormat": "current [{{instance}}]",
"metric": "jvm_threads_current",
"refId": "A",
"step": 10
},
{
"expr": "jvm_threads_daemon{job=~\"$job\", instance=~\"$instance\"}",
"format": "time_series",
"legendFormat": "daemon [{{instance}}]",
"metric": "jvm_threads_daemon",
"refId": "B",
"step": 10
}
],
"thresholds": [ ],
"timeFrom": null,
"timeShift": null,
"title": "Threads used",
"tooltip": {
"shared": true,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": [ ]
},
"yaxes": [
{
"decimals": 0,
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": true
}
]
},
{
"aliasColors": { },
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "${datasource}",
"fill": 1,
"id": 4,
"legend": {
"avg": false,
"current": false,
"max": false,
"min": false,
"show": true,
"total": false,
"values": false
},
"lines": true,
"linewidth": 1,
"links": [ ],
"nullPointMode": "null",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [ ],
"spaceLength": 10,
"span": 6,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "jvm_classes_loaded{job=~\"$job\", instance=~\"$instance\"}",
"format": "time_series",
"interval": "",
"legendFormat": "loaded [{{instance}}]",
"metric": "jvm_classes_loaded",
"refId": "A",
"step": 10
}
],
"thresholds": [ ],
"timeFrom": null,
"timeShift": null,
"title": "Class loading",
"tooltip": {
"shared": true,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": [ ]
},
"yaxes": [
{
"decimals": 0,
"format": "short",
"label": "",
"logBase": 1,
"max": null,
"min": null,
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": true
}
]
}
],
"repeat": null,
"repeatIteration": null,
"repeatRowId": null,
"showTitle": false,
"title": "Dashboard Row",
"titleSize": "h6"
},
{
"collapse": false,
"height": 250,
"panels": [
{
"aliasColors": { },
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "${datasource}",
"fill": 1,
"id": 5,
"legend": {
"avg": false,
"current": false,
"max": false,
"min": false,
"show": true,
"total": false,
"values": false
},
"lines": true,
"linewidth": 1,
"links": [ ],
"nullPointMode": "null",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [ ],
"spaceLength": 10,
"span": 6,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "rate(jvm_gc_collection_seconds_sum{job=~\"$job\", instance=~\"$instance\"}[$__rate_interval])",
"format": "time_series",
"interval": "",
"legendFormat": "{{gc}} [{{instance}}]",
"metric": "jvm_gc_collection_seconds_sum",
"refId": "A",
"step": 10
}
],
"thresholds": [ ],
"timeFrom": null,
"timeShift": null,
"title": "GC time rate",
"tooltip": {
"shared": true,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": [ ]
},
"yaxes": [
{
"format": "s",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": true
}
]
},
{
"aliasColors": { },
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "${datasource}",
"fill": 1,
"id": 6,
"legend": {
"avg": false,
"current": false,
"max": false,
"min": false,
"show": true,
"total": false,
"values": false
},
"lines": true,
"linewidth": 1,
"links": [ ],
"nullPointMode": "null",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [ ],
"spaceLength": 10,
"span": 6,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "jvm_gc_collection_seconds_count{job=~\"$job\", instance=~\"$instance\"}",
"format": "time_series",
"interval": "",
"legendFormat": "{{gc}} [{{instance}}]",
"metric": "",
"refId": "A",
"step": 10
}
],
"thresholds": [ ],
"timeFrom": null,
"timeShift": null,
"title": "GC count",
"tooltip": {
"shared": true,
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": [ ]
},
"yaxes": [
{
"decimals": 0,
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": true
}
]
}
],
"repeat": null,
"repeatIteration": null,
"repeatRowId": null,
"showTitle": false,
"title": "Dashboard Row",
"titleSize": "h6"
}
],
"schemaVersion": 14,
"style": "dark",
"tags": [
"JVM",
"prometheus"
],
"templating": {
"list": [
{
"current": { },
"hide": 0,
"includeAll": false,
"label": "Data Source",
"multi": false,
"name": "datasource",
"options": [ ],
"query": "prometheus",
"queryValue": "",
"refresh": 1,
"regex": "",
"skipUrlSync": false,
"type": "datasource"
},
{
"allValue": ".+",
"current": { },
"datasource": "${datasource}",
"hide": 0,
"includeAll": true,
"label": "job",
"multi": true,
"name": "job",
"options": [ ],
"query": "label_values(jvm_memory_bytes_used,job)",
"refresh": 1,
"regex": "",
"sort": 0,
"tagValuesQuery": "",
"tags": [ ],
"tagsQuery": "",
"type": "query",
"useTags": false
},
{
"allValue": ".+",
"current": { },
"datasource": "${datasource}",
"hide": 0,
"includeAll": true,
"label": "instance",
"multi": true,
"name": "instance",
"options": [ ],
"query": "label_values(jvm_memory_bytes_used{job=~\"$job\"},instance)",
"refresh": 1,
"regex": "",
"sort": 0,
"tagValuesQuery": "",
"tags": [ ],
"tagsQuery": "",
"type": "query",
"useTags": false
}
]
},
"time": {
"from": "now-30m",
"to": "now"
},
"timepicker": {
"refresh_intervals": [
"5s",
"10s",
"30s",
"1m",
"5m",
"15m",
"30m",
"1h",
"2h",
"1d"
],
"time_options": [
"5m",
"15m",
"1h",
"6h",
"12h",
"24h",
"2d",
"7d",
"30d"
]
},
"timezone": "",
"title": "JVM overview - Prometheus",
"uid": "1602068683-1",
"version": 12
}

View file

@ -1 +1 @@
null
{}

View file

@ -1,101 +1 @@
groups:
- name: Kafka_Alerts
rules:
- alert: KafkaOfflinePartitonCount
annotations:
description: Kafka cluster {{ $labels.kafka_cluster }} has {{ $value }} offline
partitions. After successful leader election, if the leader for partition
dies, then the partition moves to the OfflinePartition state. Offline partitions
are not available for reading and writing. Restart the brokers, if needed,
and check the logs for errors.
summary: Kafka has offline partitions.
expr: sum without(instance) (kafka_controller_kafkacontroller_offlinepartitionscount{job="integrations/kafka"})
> 0
for: 5m
labels:
severity: critical
- alert: KafkaUnderReplicatedPartitionCount
annotations:
description: Kafka instance {{ $labels.instance }} in cluster {{ $labels.kafka_cluster
}} has {{ $value }} under replicated partitions
summary: Kafka has under replicated partitions.
expr: |
sum without() (kafka_server_replicamanager_underreplicatedpartitions{job="integrations/kafka"}) > 0
for: 5m
labels:
severity: critical
- alert: KafkaActiveController
annotations:
description: Kafka cluster {{ $labels.kafka_cluster }} has {{ $value }} broker(s)
reporting as the active controller in the last 5 minute interval. During steady
state there should be only one active controller per cluster.
summary: Kafka has no active controller.
expr: sum without(instance) (kafka_controller_kafkacontroller_activecontrollercount{job="integrations/kafka"})
!= 1
for: 5m
labels:
severity: critical
- alert: KafkaUncleanLeaderElection
annotations:
description: Kafka cluster {{ $labels.kafka_cluster }} has {{ $value }} unclean
partition leader elections reported in the last 5 minute interval. When unclean
leader election is held among out-of-sync replicas, there is a possibility
of data loss if any messages were not synced prior to the loss of the former
leader. So if the number of unclean elections is greater than 0, investigate
broker logs to determine why leaders were re-elected, and look for WARN or
ERROR messages. Consider setting the broker configuration parameter unclean.leader.election.enable
to false so that a replica outside of the set of in-sync replicas is never
elected leader.
summary: Kafka has unclean leader elections.
expr: max without(instance) (rate(kafka_controller_controllerstats_uncleanleaderelectionspersec{job="integrations/kafka"}[5m]))
!= 0
for: 5m
labels:
severity: critical
- alert: KafkaISRExpandRate
annotations:
description: Kafka instance {{ $labels.instance }} in cluster {{ $labels.kafka_cluster
}} ISR is expanding by {{ $value }} per second. If a broker goes down, ISR
for some of the partitions shrink. When that broker is up again, ISRs are
expanded once the replicas are fully caught up. Other than that, the expected
value for ISR expansion rate is 0. If ISR is expanding and shrinking frequently,
adjust Allowed replica lag.
summary: Kafka ISR Expansion Rate is expanding.
expr: |
sum without() (rate(kafka_server_replicamanager_isrexpandspersec{job="integrations/kafka"}[5m])) != 0
for: 5m
labels:
severity: warning
- alert: KafkaISRShrinkRate
annotations:
description: Kafka instance {{ $labels.instance }} in cluster {{ $labels.kafka_cluster
}} ISR is shrinking by {{ $value }} per second. If a broker goes down, ISR
for some of the partitions shrink. When that broker is up again, ISRs are
expanded once the replicas are fully caught up. Other than that, the expected
value for ISR shrink rate is 0. If ISR is expanding and shrinking frequently,
adjust Allowed replica lag.
summary: Kafka ISR Expansion Rate is shrinking.
expr: |
sum without() (rate(kafka_server_replicamanager_isrshrinkspersec{job="integrations/kafka"}[5m])) != 0
for: 5m
labels:
severity: warning
- alert: KafkaBrokerCount
annotations:
description: Kafka cluster {{ $labels.kafka_cluster }} broker count is 0.
summary: Kafka has no Brokers online.
expr: count without(instance) (kafka_server_kafkaserver_brokerstate{job="integrations/kafka"})
== 0
for: 5m
labels:
severity: critical
- alert: KafkaZookeeperSyncConnect
annotations:
description: Kafka instance {{ $labels.instance }} in cluster {{ $labels.kafka_cluster
}} Zookeeper Sync Disconnected.
summary: Kafka Zookeeper Sync Disconnected.
expr: |
avg without() (kafka_server_sessionexpirelistener_zookeepersyncconnectspersec{job="integrations/kafka"}) < 0
for: 5m
labels:
severity: warning
null

File diff suppressed because it is too large Load diff

File diff suppressed because it is too large Load diff

View file

@ -1,833 +0,0 @@
{
"annotations": {
"list": [
{
"builtIn": 1,
"datasource": {
"type": "datasource",
"uid": "grafana"
},
"enable": true,
"hide": true,
"iconColor": "rgba(0, 211, 255, 1)",
"name": "Annotations & Alerts",
"target": {
"limit": 100,
"matchAny": false,
"tags": [ ],
"type": "dashboard"
},
"type": "dashboard"
}
]
},
"description": "Kafka lag overview",
"editable": true,
"fiscalYearStartMonth": 0,
"gnetId": 7589,
"graphTooltip": 0,
"id": 52,
"links": [ ],
"liveNow": false,
"panels": [
{
"datasource": {
"uid": "${datasource}"
},
"fieldConfig": {
"defaults": {
"color": {
"mode": "palette-classic"
},
"custom": {
"axisCenteredZero": false,
"axisColorMode": "text",
"axisLabel": "",
"axisPlacement": "auto",
"barAlignment": 0,
"drawStyle": "line",
"fillOpacity": 0,
"gradientMode": "none",
"hideFrom": {
"legend": false,
"tooltip": false,
"viz": false
},
"lineInterpolation": "linear",
"lineWidth": 1,
"pointSize": 5,
"scaleDistribution": {
"type": "linear"
},
"showPoints": "never",
"spanNulls": true,
"stacking": {
"group": "A",
"mode": "none"
},
"thresholdsStyle": {
"mode": "off"
}
},
"mappings": [ ],
"min": 0,
"thresholds": {
"mode": "absolute",
"steps": [
{
"color": "green",
"value": null
},
{
"color": "red",
"value": 80
}
]
},
"unit": "short"
},
"overrides": [ ]
},
"gridPos": {
"h": 10,
"w": 12,
"x": 0,
"y": 0
},
"id": 14,
"links": [ ],
"options": {
"legend": {
"calcs": [
"lastNotNull",
"max"
],
"displayMode": "table",
"placement": "bottom",
"showLegend": true,
"width": 480
},
"tooltip": {
"mode": "multi",
"sort": "none"
}
},
"pluginVersion": "9.2.7",
"targets": [
{
"datasource": {
"uid": "${datasource}"
},
"exemplar": true,
"expr": "sum(rate(kafka_topic_partition_current_offset{job=\"integrations/kafka\",job=~\"$job\",kafka_cluster=~\"$kafka_cluster\",instance=~\"$instance\", topic=~\"$topic\"}[$__rate_interval])) by (topic)",
"format": "time_series",
"interval": "",
"intervalFactor": 1,
"legendFormat": "{{topic}}",
"refId": "B"
}
],
"title": "Message in per second",
"type": "timeseries"
},
{
"datasource": {
"uid": "${datasource}"
},
"fieldConfig": {
"defaults": {
"color": {
"mode": "palette-classic"
},
"custom": {
"axisCenteredZero": false,
"axisColorMode": "text",
"axisLabel": "",
"axisPlacement": "auto",
"barAlignment": 0,
"drawStyle": "line",
"fillOpacity": 0,
"gradientMode": "none",
"hideFrom": {
"legend": false,
"tooltip": false,
"viz": false
},
"lineInterpolation": "linear",
"lineWidth": 1,
"pointSize": 5,
"scaleDistribution": {
"type": "linear"
},
"showPoints": "never",
"spanNulls": true,
"stacking": {
"group": "A",
"mode": "none"
},
"thresholdsStyle": {
"mode": "off"
}
},
"mappings": [ ],
"thresholds": {
"mode": "absolute",
"steps": [
{
"color": "green",
"value": null
},
{
"color": "red",
"value": 80
}
]
},
"unit": "short"
},
"overrides": [ ]
},
"gridPos": {
"h": 10,
"w": 12,
"x": 12,
"y": 0
},
"id": 16,
"links": [ ],
"options": {
"legend": {
"calcs": [
"lastNotNull",
"max"
],
"displayMode": "table",
"placement": "bottom",
"showLegend": true,
"width": 480
},
"tooltip": {
"mode": "multi",
"sort": "none"
}
},
"pluginVersion": "9.2.7",
"targets": [
{
"datasource": {
"uid": "${datasource}"
},
"exemplar": true,
"expr": "sum(increase(kafka_topic_partition_current_offset{job=\"integrations/kafka\",job=~\"$job\",kafka_cluster=~\"$kafka_cluster\",instance=~\"$instance\", topic=~\"$topic\"}[5m])/5) by (topic)",
"format": "time_series",
"interval": "",
"intervalFactor": 1,
"legendFormat": "{{topic}}",
"refId": "A"
}
],
"title": "Message in per minute",
"type": "timeseries"
},
{
"datasource": {
"uid": "$datasource"
},
"fieldConfig": {
"defaults": {
"color": {
"mode": "palette-classic"
},
"custom": {
"axisCenteredZero": false,
"axisColorMode": "text",
"axisLabel": "",
"axisPlacement": "auto",
"barAlignment": 0,
"drawStyle": "line",
"fillOpacity": 10,
"gradientMode": "none",
"hideFrom": {
"legend": false,
"tooltip": false,
"viz": false
},
"lineInterpolation": "linear",
"lineWidth": 1,
"pointSize": 5,
"scaleDistribution": {
"type": "linear"
},
"showPoints": "never",
"spanNulls": false,
"stacking": {
"group": "A",
"mode": "none"
},
"thresholdsStyle": {
"mode": "off"
}
},
"mappings": [ ],
"thresholds": {
"mode": "absolute",
"steps": [
{
"color": "green",
"value": null
},
{
"color": "red",
"value": 80
}
]
},
"unit": "short"
},
"overrides": [ ]
},
"gridPos": {
"h": 10,
"w": 12,
"x": 0,
"y": 10
},
"id": 20,
"options": {
"legend": {
"calcs": [
"lastNotNull",
"max"
],
"displayMode": "table",
"placement": "bottom",
"showLegend": true
},
"tooltip": {
"mode": "multi",
"sort": "none"
}
},
"pluginVersion": "9.2.7",
"targets": [
{
"datasource": {
"uid": "$datasource"
},
"exemplar": true,
"expr": "sum(rate(kafka_consumergroup_current_offset{job=\"integrations/kafka\",job=~\"$job\",kafka_cluster=~\"$kafka_cluster\",instance=~\"$instance\", topic=~\"$topic\"}[$__rate_interval])) by (consumergroup, topic)",
"interval": "",
"legendFormat": "{{consumergroup}} (topic: {{topic}})",
"refId": "A"
}
],
"title": "Message consume per second",
"type": "timeseries"
},
{
"datasource": {
"uid": "${datasource}"
},
"fieldConfig": {
"defaults": {
"color": {
"mode": "palette-classic"
},
"custom": {
"axisCenteredZero": false,
"axisColorMode": "text",
"axisLabel": "",
"axisPlacement": "auto",
"barAlignment": 0,
"drawStyle": "line",
"fillOpacity": 0,
"gradientMode": "none",
"hideFrom": {
"legend": false,
"tooltip": false,
"viz": false
},
"lineInterpolation": "linear",
"lineWidth": 1,
"pointSize": 5,
"scaleDistribution": {
"type": "linear"
},
"showPoints": "never",
"spanNulls": true,
"stacking": {
"group": "A",
"mode": "none"
},
"thresholdsStyle": {
"mode": "off"
}
},
"mappings": [ ],
"thresholds": {
"mode": "absolute",
"steps": [
{
"color": "green",
"value": null
},
{
"color": "red",
"value": 80
}
]
},
"unit": "short"
},
"overrides": [ ]
},
"gridPos": {
"h": 10,
"w": 12,
"x": 12,
"y": 10
},
"id": 18,
"links": [ ],
"options": {
"legend": {
"calcs": [
"lastNotNull",
"max"
],
"displayMode": "table",
"placement": "bottom",
"showLegend": true,
"width": 480
},
"tooltip": {
"mode": "multi",
"sort": "none"
}
},
"pluginVersion": "9.2.7",
"targets": [
{
"datasource": {
"uid": "${datasource}"
},
"exemplar": true,
"expr": "sum(increase(kafka_consumergroup_current_offset{job=\"integrations/kafka\",job=~\"$job\",kafka_cluster=~\"$kafka_cluster\",instance=~\"$instance\", topic=~\"$topic\"}[5m])/5) by (consumergroup, topic)",
"format": "time_series",
"interval": "",
"intervalFactor": 1,
"legendFormat": "{{consumergroup}} (topic: {{topic}})",
"refId": "A"
}
],
"title": "Message consume per minute",
"type": "timeseries"
},
{
"datasource": {
"uid": "$datasource"
},
"fieldConfig": {
"defaults": {
"color": {
"mode": "palette-classic"
},
"custom": {
"axisCenteredZero": false,
"axisColorMode": "text",
"axisLabel": "",
"axisPlacement": "auto",
"barAlignment": 0,
"drawStyle": "line",
"fillOpacity": 10,
"gradientMode": "none",
"hideFrom": {
"legend": false,
"tooltip": false,
"viz": false
},
"lineInterpolation": "linear",
"lineWidth": 1,
"pointSize": 5,
"scaleDistribution": {
"type": "linear"
},
"showPoints": "never",
"spanNulls": false,
"stacking": {
"group": "A",
"mode": "none"
},
"thresholdsStyle": {
"mode": "off"
}
},
"mappings": [ ],
"thresholds": {
"mode": "absolute",
"steps": [
{
"color": "green",
"value": null
},
{
"color": "red",
"value": 80
}
]
},
"unit": "short"
},
"overrides": [ ]
},
"gridPos": {
"h": 10,
"w": 12,
"x": 0,
"y": 20
},
"id": 22,
"options": {
"legend": {
"calcs": [
"lastNotNull",
"max"
],
"displayMode": "table",
"placement": "bottom",
"showLegend": true
},
"tooltip": {
"mode": "multi",
"sort": "none"
}
},
"pluginVersion": "9.2.7",
"targets": [
{
"datasource": {
"uid": "$datasource"
},
"exemplar": true,
"expr": "avg(kafka_consumer_lag_millis{job=\"integrations/kafka\",job=~\"$job\",kafka_cluster=~\"$kafka_cluster\",instance=~\"$instance\", topic=~\"$topic\"}/1000) by (consumergroup, topic)",
"interval": "",
"legendFormat": "{{consumergroup}} (topic: {{topic}})",
"refId": "A"
}
],
"title": "Lag by consumer group in seconds",
"type": "timeseries"
},
{
"datasource": {
"uid": "${datasource}"
},
"fieldConfig": {
"defaults": {
"color": {
"mode": "palette-classic"
},
"custom": {
"axisCenteredZero": false,
"axisColorMode": "text",
"axisLabel": "",
"axisPlacement": "auto",
"barAlignment": 0,
"drawStyle": "line",
"fillOpacity": 0,
"gradientMode": "none",
"hideFrom": {
"legend": false,
"tooltip": false,
"viz": false
},
"lineInterpolation": "linear",
"lineWidth": 1,
"pointSize": 5,
"scaleDistribution": {
"type": "linear"
},
"showPoints": "never",
"spanNulls": true,
"stacking": {
"group": "A",
"mode": "none"
},
"thresholdsStyle": {
"mode": "off"
}
},
"mappings": [ ],
"min": 0,
"thresholds": {
"mode": "absolute",
"steps": [
{
"color": "green",
"value": null
},
{
"color": "red",
"value": 80
}
]
},
"unit": "short"
},
"overrides": [ ]
},
"gridPos": {
"h": 10,
"w": 12,
"x": 12,
"y": 20
},
"id": 12,
"links": [ ],
"options": {
"legend": {
"calcs": [
"lastNotNull",
"max"
],
"displayMode": "table",
"placement": "bottom",
"showLegend": true,
"width": 480
},
"tooltip": {
"mode": "multi",
"sort": "desc"
}
},
"pluginVersion": "9.2.7",
"targets": [
{
"datasource": {
"uid": "${datasource}"
},
"exemplar": true,
"expr": "avg(kafka_consumergroup_uncommitted_offsets{job=\"integrations/kafka\",job=~\"$job\",kafka_cluster=~\"$kafka_cluster\",instance=~\"$instance\", topic=~\"$topic\"}) by (consumergroup, topic)",
"format": "time_series",
"instant": false,
"interval": "",
"intervalFactor": 1,
"legendFormat": "{{consumergroup}} (topic: {{topic}})",
"refId": "A"
}
],
"title": "Lag by consumer group",
"type": "timeseries"
},
{
"datasource": {
"type": "prometheus",
"uid": "$datasource"
},
"fieldConfig": {
"defaults": {
"color": {
"mode": "palette-classic"
},
"custom": {
"axisCenteredZero": false,
"axisColorMode": "text",
"axisLabel": "",
"axisPlacement": "auto",
"fillOpacity": 80,
"gradientMode": "none",
"hideFrom": {
"legend": false,
"tooltip": false,
"viz": false
},
"lineWidth": 1,
"scaleDistribution": {
"type": "linear"
}
},
"mappings": [ ],
"thresholds": {
"mode": "absolute",
"steps": [
{
"color": "green",
"value": null
}
]
}
},
"overrides": [ ]
},
"gridPos": {
"h": 6,
"w": 24,
"x": 0,
"y": 30
},
"id": 8,
"links": [ ],
"options": {
"barRadius": 0,
"barWidth": 0.84999999999999998,
"groupWidth": 0.69999999999999996,
"legend": {
"calcs": [ ],
"displayMode": "list",
"placement": "bottom",
"showLegend": false
},
"orientation": "auto",
"showValue": "auto",
"stacking": "none",
"tooltip": {
"mode": "single",
"sort": "none"
},
"xTickLabelRotation": 0,
"xTickLabelSpacing": 0
},
"pluginVersion": "9.2.7",
"targets": [
{
"datasource": {
"uid": "$datasource"
},
"exemplar": true,
"expr": "sum by(topic) (kafka_topic_partitions{job=\"integrations/kafka\",job=~\"$job\",kafka_cluster=~\"$kafka_cluster\",instance=~\"$instance\", topic=~\"$topic\"})",
"format": "table",
"instant": true,
"interval": "",
"intervalFactor": 1,
"legendFormat": "{{topic}}",
"refId": "A"
}
],
"title": "Partitions per topic",
"type": "barchart"
}
],
"refresh": "30s",
"schemaVersion": 37,
"style": "dark",
"tags": [
"kafka-integration"
],
"templating": {
"list": [
{
"label": "Data source",
"name": "datasource",
"query": "prometheus",
"type": "datasource"
},
{
"allValue": ".+",
"datasource": {
"type": "prometheus",
"uid": "${datasource}"
},
"includeAll": true,
"label": "Job",
"multi": true,
"name": "job",
"query": "label_values(kafka_topic_partition_current_offset{job=\"integrations/kafka\"}, job)",
"refresh": 2,
"sort": 1,
"type": "query"
},
{
"allValue": ".+",
"datasource": {
"type": "prometheus",
"uid": "${datasource}"
},
"includeAll": true,
"label": "Kafka_cluster",
"multi": true,
"name": "kafka_cluster",
"query": "label_values(kafka_topic_partition_current_offset{job=\"integrations/kafka\",job=~\"$job\"}, kafka_cluster)",
"refresh": 2,
"sort": 1,
"type": "query"
},
{
"allValue": ".+",
"datasource": {
"type": "prometheus",
"uid": "${datasource}"
},
"includeAll": true,
"label": "Instance",
"multi": true,
"name": "instance",
"query": "label_values(kafka_topic_partition_current_offset{job=\"integrations/kafka\",job=~\"$job\",kafka_cluster=~\"$kafka_cluster\"}, instance)",
"refresh": 2,
"sort": 1,
"type": "query"
},
{
"allValue": ".+",
"current": {
"selected": false,
"text": "All",
"value": "$__all"
},
"datasource": {
"uid": "${datasource}"
},
"definition": "label_values(kafka_topic_partition_current_offset{job=\"integrations/kafka\",job=~\"$job\",kafka_cluster=~\"$kafka_cluster\",instance=~\"$instance\", topic!='__consumer_offsets',topic!='--kafka'}, topic)",
"hide": 0,
"includeAll": true,
"label": "Topic",
"multi": true,
"name": "topic",
"options": [ ],
"query": {
"query": "label_values(kafka_topic_partition_current_offset{job=\"integrations/kafka\",job=~\"$job\",kafka_cluster=~\"$kafka_cluster\",instance=~\"$instance\", topic!='__consumer_offsets',topic!='--kafka'}, topic)",
"refId": "StandardVariableQuery"
},
"refresh": 2,
"regex": "",
"skipUrlSync": false,
"sort": 1,
"tagValuesQuery": "",
"type": "query",
"useTags": false
}
]
},
"time": {
"from": "now-1h",
"to": "now"
},
"timepicker": {
"refresh_intervals": [
"5s",
"10s",
"30s",
"1m",
"5m",
"15m",
"30m",
"1h",
"2h",
"1d"
],
"time_options": [
"5m",
"15m",
"1h",
"6h",
"12h",
"24h",
"2d",
"7d",
"30d"
]
},
"timezone": "browser",
"title": "Kafka lag overview",
"uid": "jwPKIsniz",
"version": 6
}

File diff suppressed because it is too large Load diff

View file

@ -1,750 +0,0 @@
{
"annotations": {
"list": [
{
"builtIn": 1,
"datasource": {
"type": "datasource",
"uid": "grafana"
},
"enable": true,
"hide": true,
"iconColor": "rgba(0, 211, 255, 1)",
"name": "Annotations & Alerts",
"type": "dashboard"
}
]
},
"editable": true,
"fiscalYearStartMonth": 0,
"graphTooltip": 0,
"id": 4,
"links": [ ],
"liveNow": false,
"panels": [
{
"datasource": {
"uid": "${datasource}"
},
"fieldConfig": {
"defaults": {
"color": {
"mode": "palette-classic"
},
"custom": {
"axisBorderShow": false,
"axisCenteredZero": false,
"axisColorMode": "text",
"axisLabel": "",
"axisPlacement": "auto",
"barAlignment": 0,
"drawStyle": "line",
"fillOpacity": 10,
"gradientMode": "none",
"hideFrom": {
"legend": false,
"tooltip": false,
"viz": false
},
"insertNulls": false,
"lineInterpolation": "linear",
"lineWidth": 1,
"pointSize": 5,
"scaleDistribution": {
"type": "linear"
},
"showPoints": "never",
"spanNulls": false,
"stacking": {
"group": "A",
"mode": "none"
},
"thresholdsStyle": {
"mode": "off"
}
},
"mappings": [ ],
"min": 0,
"thresholds": {
"mode": "absolute",
"steps": [
{
"color": "green",
"value": null
},
{
"color": "red",
"value": 80
}
]
},
"unit": "short"
},
"overrides": [ ]
},
"gridPos": {
"h": 9,
"w": 24,
"x": 0,
"y": 0
},
"id": 2,
"options": {
"legend": {
"calcs": [
"mean",
"lastNotNull",
"max"
],
"displayMode": "table",
"placement": "right",
"showLegend": true
},
"tooltip": {
"mode": "multi",
"sort": "none"
}
},
"pluginVersion": "10.2.3",
"targets": [
{
"datasource": {
"uid": "${datasource}"
},
"expr": "sum without(instance) (rate(kafka_server_brokertopicmetrics_messagesinpersec{job=\"integrations/kafka\",job=~\"$job\",cluster=~\"$cluster\",kafka_cluster=~\"$kafka_cluster\",instance=~\"$instance\",topic=~\"$topic\"}[$__rate_interval]))",
"interval": "",
"legendFormat": "{{topic}}",
"refId": "A"
}
],
"title": "Messages In",
"type": "timeseries"
},
{
"datasource": {
"uid": "${datasource}"
},
"fieldConfig": {
"defaults": {
"color": {
"mode": "palette-classic"
},
"custom": {
"axisBorderShow": false,
"axisCenteredZero": false,
"axisColorMode": "text",
"axisLabel": "",
"axisPlacement": "auto",
"barAlignment": 0,
"drawStyle": "line",
"fillOpacity": 10,
"gradientMode": "none",
"hideFrom": {
"legend": false,
"tooltip": false,
"viz": false
},
"insertNulls": false,
"lineInterpolation": "linear",
"lineWidth": 1,
"pointSize": 5,
"scaleDistribution": {
"type": "linear"
},
"showPoints": "never",
"spanNulls": false,
"stacking": {
"group": "A",
"mode": "none"
},
"thresholdsStyle": {
"mode": "off"
}
},
"mappings": [ ],
"thresholds": {
"mode": "absolute",
"steps": [
{
"color": "green",
"value": null
},
{
"color": "red",
"value": 80
}
]
},
"unit": "binBps"
},
"overrides": [ ]
},
"gridPos": {
"h": 9,
"w": 12,
"x": 0,
"y": 9
},
"id": 3,
"options": {
"legend": {
"calcs": [
"mean",
"lastNotNull",
"max"
],
"displayMode": "table",
"placement": "bottom",
"showLegend": true
},
"tooltip": {
"mode": "multi",
"sort": "none"
}
},
"pluginVersion": "10.2.3",
"targets": [
{
"datasource": {
"uid": "${datasource}"
},
"expr": "sum without(instance) (rate(kafka_server_brokertopicmetrics_bytesinpersec{job=\"integrations/kafka\",job=~\"$job\",cluster=~\"$cluster\",kafka_cluster=~\"$kafka_cluster\",instance=~\"$instance\",topic=~\"$topic\"}[$__rate_interval]))",
"interval": "",
"legendFormat": "{{topic}}",
"refId": "A"
}
],
"title": "Bytes In",
"type": "timeseries"
},
{
"datasource": {
"uid": "${datasource}"
},
"fieldConfig": {
"defaults": {
"color": {
"mode": "palette-classic"
},
"custom": {
"axisBorderShow": false,
"axisCenteredZero": false,
"axisColorMode": "text",
"axisLabel": "",
"axisPlacement": "auto",
"barAlignment": 0,
"drawStyle": "line",
"fillOpacity": 10,
"gradientMode": "none",
"hideFrom": {
"legend": false,
"tooltip": false,
"viz": false
},
"insertNulls": false,
"lineInterpolation": "linear",
"lineWidth": 1,
"pointSize": 5,
"scaleDistribution": {
"type": "linear"
},
"showPoints": "never",
"spanNulls": false,
"stacking": {
"group": "A",
"mode": "none"
},
"thresholdsStyle": {
"mode": "off"
}
},
"mappings": [ ],
"thresholds": {
"mode": "absolute",
"steps": [
{
"color": "green",
"value": null
},
{
"color": "red",
"value": 80
}
]
},
"unit": "binBps"
},
"overrides": [ ]
},
"gridPos": {
"h": 9,
"w": 12,
"x": 12,
"y": 9
},
"id": 4,
"options": {
"legend": {
"calcs": [
"mean",
"lastNotNull",
"max"
],
"displayMode": "table",
"placement": "bottom",
"showLegend": true
},
"tooltip": {
"mode": "multi",
"sort": "none"
}
},
"pluginVersion": "10.2.3",
"targets": [
{
"datasource": {
"uid": "${datasource}"
},
"expr": "sum without(instance) (rate(kafka_server_brokertopicmetrics_bytesoutpersec{job=\"integrations/kafka\",job=~\"$job\",cluster=~\"$cluster\",kafka_cluster=~\"$kafka_cluster\",instance=~\"$instance\",topic=~\"$topic\"}[$__rate_interval]))",
"interval": "",
"legendFormat": "{{topic}}",
"refId": "A"
}
],
"title": "Bytes Out",
"type": "timeseries"
},
{
"datasource": {
"uid": "${datasource}"
},
"description": "",
"fieldConfig": {
"defaults": {
"custom": {
"cellOptions": {
"type": "auto"
},
"filterable": false,
"inspect": false
},
"mappings": [ ],
"thresholds": {
"mode": "absolute",
"steps": [
{
"color": "green",
"value": null
},
{
"color": "red",
"value": 80
}
]
}
},
"overrides": [
{
"matcher": {
"id": "byName",
"options": "partition"
},
"properties": [
{
"id": "custom.width",
"value": 103
}
]
},
{
"matcher": {
"id": "byName",
"options": "offset"
},
"properties": [
{
"id": "custom.width",
"value": 226
}
]
}
]
},
"gridPos": {
"h": 8,
"w": 12,
"x": 0,
"y": 18
},
"id": 6,
"options": {
"cellHeight": "sm",
"footer": {
"countRows": false,
"fields": "",
"reducer": [
"sum"
],
"show": false
},
"showHeader": true,
"sortBy": [
{
"desc": false,
"displayName": "partition"
}
]
},
"pluginVersion": "10.2.3",
"targets": [
{
"datasource": {
"uid": "${datasource}"
},
"expr": "kafka_log_log_logstartoffset{job=\"integrations/kafka\",job=~\"$job\",cluster=~\"$cluster\",kafka_cluster=~\"$kafka_cluster\",instance=~\"$instance\",topic=~\"$topic\"}",
"format": "table",
"instant": true,
"interval": "",
"legendFormat": "",
"refId": "A"
}
],
"title": "Start Offset",
"transformations": [
{
"id": "organize",
"options": {
"excludeByName": {
"Time": true,
"__name__": true,
"env": true,
"instance": false,
"job": true
},
"indexByName": {
"Time": 0,
"Value": 7,
"__name__": 1,
"env": 2,
"instance": 3,
"job": 4,
"partition": 6,
"topic": 5
},
"renameByName": {
"Value": "offset"
}
}
}
],
"type": "table"
},
{
"datasource": {
"uid": "${datasource}"
},
"description": "",
"fieldConfig": {
"defaults": {
"custom": {
"cellOptions": {
"type": "auto"
},
"filterable": false,
"inspect": false
},
"mappings": [ ],
"thresholds": {
"mode": "absolute",
"steps": [
{
"color": "green",
"value": null
},
{
"color": "red",
"value": 80
}
]
}
},
"overrides": [
{
"matcher": {
"id": "byName",
"options": "partition"
},
"properties": [
{
"id": "custom.width",
"value": 103
}
]
},
{
"matcher": {
"id": "byName",
"options": "offset"
},
"properties": [
{
"id": "custom.width",
"value": 226
}
]
}
]
},
"gridPos": {
"h": 8,
"w": 12,
"x": 12,
"y": 18
},
"id": 7,
"options": {
"cellHeight": "sm",
"footer": {
"countRows": false,
"fields": "",
"reducer": [
"sum"
],
"show": false
},
"showHeader": true,
"sortBy": [
{
"desc": false,
"displayName": "partition"
}
]
},
"pluginVersion": "10.2.3",
"targets": [
{
"datasource": {
"uid": "${datasource}"
},
"expr": "kafka_log_log_logendoffset{job=\"integrations/kafka\",job=~\"$job\",cluster=~\"$cluster\",kafka_cluster=~\"$kafka_cluster\",instance=~\"$instance\",topic=~\"$topic\"}",
"format": "table",
"instant": true,
"interval": "",
"legendFormat": "",
"refId": "A"
}
],
"title": "End Offset",
"transformations": [
{
"id": "organize",
"options": {
"excludeByName": {
"Time": true,
"__name__": true,
"env": true,
"instance": false,
"job": true
},
"indexByName": {
"Time": 0,
"Value": 7,
"__name__": 1,
"env": 2,
"instance": 3,
"job": 4,
"partition": 6,
"topic": 5
},
"renameByName": {
"Value": "offset"
}
}
}
],
"type": "table"
}
],
"refresh": "30s",
"schemaVersion": 39,
"tags": [
"kafka-integration"
],
"templating": {
"list": [
{
"current": {
"selected": false,
"text": "default",
"value": "default"
},
"hide": 0,
"includeAll": false,
"label": "Data source",
"multi": false,
"name": "datasource",
"options": [ ],
"query": "prometheus",
"refresh": 1,
"regex": "",
"skipUrlSync": false,
"type": "datasource"
},
{
"allValue": ".+",
"current": {
"selected": false,
"text": [
"All"
],
"value": [
"$__all"
]
},
"datasource": {
"type": "prometheus",
"uid": "${datasource}"
},
"definition": "",
"hide": 0,
"includeAll": true,
"label": "Job",
"multi": true,
"name": "job",
"options": [ ],
"query": "label_values(kafka_log_log_size{job=\"integrations/kafka\"}, job)",
"refresh": 2,
"regex": "",
"skipUrlSync": false,
"sort": 1,
"type": "query"
},
{
"allValue": ".*",
"current": {
"selected": false,
"text": [
"All"
],
"value": [
"$__all"
]
},
"datasource": {
"uid": "$datasource"
},
"definition": "",
"hide": 0,
"includeAll": true,
"label": "Cluster",
"multi": true,
"name": "cluster",
"options": [ ],
"query": "label_values(kafka_server_kafkaserver_brokerstate{job=~\"$job\"}, cluster)",
"refresh": 2,
"regex": "",
"skipUrlSync": false,
"sort": 1,
"tagValuesQuery": "",
"tagsQuery": "",
"type": "query",
"useTags": false
},
{
"allValue": ".+",
"current": {
"selected": false,
"text": [
"All"
],
"value": [
"$__all"
]
},
"datasource": {
"type": "prometheus",
"uid": "${datasource}"
},
"definition": "",
"hide": 0,
"includeAll": true,
"label": "Kafka_cluster",
"multi": true,
"name": "kafka_cluster",
"options": [ ],
"query": "label_values(kafka_log_log_size{job=\"integrations/kafka\",job=~\"$job\"}, kafka_cluster)",
"refresh": 2,
"regex": "",
"skipUrlSync": false,
"sort": 1,
"type": "query"
},
{
"allValue": ".+",
"current": {
"selected": false,
"text": [
"All"
],
"value": [
"$__all"
]
},
"datasource": {
"type": "prometheus",
"uid": "${datasource}"
},
"definition": "",
"hide": 0,
"includeAll": true,
"label": "Instance",
"multi": true,
"name": "instance",
"options": [ ],
"query": "label_values(kafka_log_log_size{job=\"integrations/kafka\",job=~\"$job\",kafka_cluster=~\"$kafka_cluster\"}, instance)",
"refresh": 2,
"regex": "",
"skipUrlSync": false,
"sort": 1,
"type": "query"
},
{
"allValue": ".+",
"current": {
"selected": false,
"text": "All",
"value": "$__all"
},
"datasource": {
"uid": "${datasource}"
},
"definition": "label_values(kafka_log_log_size{job=\"integrations/kafka\",job=~\"$job\",cluster=~\"$cluster\",kafka_cluster=~\"$kafka_cluster\",instance=~\"$instance\"},topic)",
"hide": 0,
"includeAll": true,
"label": "Topic name",
"multi": true,
"name": "topic",
"options": [ ],
"query": "label_values(kafka_log_log_size{job=\"integrations/kafka\",job=~\"$job\",cluster=~\"$cluster\",kafka_cluster=~\"$kafka_cluster\",instance=~\"$instance\"},topic)",
"refresh": 2,
"regex": "",
"skipUrlSync": false,
"sort": 0,
"tagValuesQuery": "",
"tagsQuery": "",
"type": "query",
"useTags": false
}
]
},
"time": {
"from": "now-30m",
"to": "now"
},
"timepicker": { },
"timezone": "",
"title": "Kafka Topics",
"uid": "vQT4b1-Mz",
"version": 2,
"weekStart": ""
}

File diff suppressed because it is too large Load diff

File diff suppressed because it is too large Load diff

View file

@ -1 +1 @@
null
{}

View file

@ -115,7 +115,7 @@ groups:
summary: StatefulSet update has not been rolled out.
expr: |
(
max without (revision) (
max by(namespace, statefulset, job, cluster) (
kube_statefulset_status_current_revision{job="kube-state-metrics"}
unless
kube_statefulset_status_update_revision{job="kube-state-metrics"}
@ -514,9 +514,9 @@ groups:
runbook_url: https://github.com/kubernetes-monitoring/kubernetes-mixin/tree/master/runbook.md#alert-name-kubeapierrorbudgetburn
summary: The API server is burning too much error budget.
expr: |
sum(apiserver_request:burnrate1h) > (14.40 * 0.01000)
and
sum(apiserver_request:burnrate5m) > (14.40 * 0.01000)
sum by(cluster) (apiserver_request:burnrate1h) > (14.40 * 0.01000)
and on(cluster)
sum by(cluster) (apiserver_request:burnrate5m) > (14.40 * 0.01000)
for: 2m
labels:
long: 1h
@ -528,9 +528,9 @@ groups:
runbook_url: https://github.com/kubernetes-monitoring/kubernetes-mixin/tree/master/runbook.md#alert-name-kubeapierrorbudgetburn
summary: The API server is burning too much error budget.
expr: |
sum(apiserver_request:burnrate6h) > (6.00 * 0.01000)
and
sum(apiserver_request:burnrate30m) > (6.00 * 0.01000)
sum by(cluster) (apiserver_request:burnrate6h) > (6.00 * 0.01000)
and on(cluster)
sum by(cluster) (apiserver_request:burnrate30m) > (6.00 * 0.01000)
for: 15m
labels:
long: 6h
@ -542,9 +542,9 @@ groups:
runbook_url: https://github.com/kubernetes-monitoring/kubernetes-mixin/tree/master/runbook.md#alert-name-kubeapierrorbudgetburn
summary: The API server is burning too much error budget.
expr: |
sum(apiserver_request:burnrate1d) > (3.00 * 0.01000)
and
sum(apiserver_request:burnrate2h) > (3.00 * 0.01000)
sum by(cluster) (apiserver_request:burnrate1d) > (3.00 * 0.01000)
and on(cluster)
sum by(cluster) (apiserver_request:burnrate2h) > (3.00 * 0.01000)
for: 1h
labels:
long: 1d
@ -556,9 +556,9 @@ groups:
runbook_url: https://github.com/kubernetes-monitoring/kubernetes-mixin/tree/master/runbook.md#alert-name-kubeapierrorbudgetburn
summary: The API server is burning too much error budget.
expr: |
sum(apiserver_request:burnrate3d) > (1.00 * 0.01000)
and
sum(apiserver_request:burnrate6h) > (1.00 * 0.01000)
sum by(cluster) (apiserver_request:burnrate3d) > (1.00 * 0.01000)
and on(cluster)
sum by(cluster) (apiserver_request:burnrate6h) > (1.00 * 0.01000)
for: 3h
labels:
long: 3d
@ -573,7 +573,7 @@ groups:
runbook_url: https://github.com/kubernetes-monitoring/kubernetes-mixin/tree/master/runbook.md#alert-name-kubeclientcertificateexpiration
summary: Client certificate is about to expire.
expr: |
apiserver_client_certificate_expiration_seconds_count{job="kube-apiserver"} > 0 and on(job) histogram_quantile(0.01, sum by (job, le) (rate(apiserver_client_certificate_expiration_seconds_bucket{job="kube-apiserver"}[5m]))) < 604800
apiserver_client_certificate_expiration_seconds_count{job="kube-apiserver"} > 0 and on(cluster, job) histogram_quantile(0.01, sum by (cluster, job, le) (rate(apiserver_client_certificate_expiration_seconds_bucket{job="kube-apiserver"}[5m]))) < 604800
for: 5m
labels:
severity: warning
@ -584,7 +584,7 @@ groups:
runbook_url: https://github.com/kubernetes-monitoring/kubernetes-mixin/tree/master/runbook.md#alert-name-kubeclientcertificateexpiration
summary: Client certificate is about to expire.
expr: |
apiserver_client_certificate_expiration_seconds_count{job="kube-apiserver"} > 0 and on(job) histogram_quantile(0.01, sum by (job, le) (rate(apiserver_client_certificate_expiration_seconds_bucket{job="kube-apiserver"}[5m]))) < 86400
apiserver_client_certificate_expiration_seconds_count{job="kube-apiserver"} > 0 and on(cluster, job) histogram_quantile(0.01, sum by (cluster, job, le) (rate(apiserver_client_certificate_expiration_seconds_bucket{job="kube-apiserver"}[5m]))) < 86400
for: 5m
labels:
severity: critical
@ -628,7 +628,7 @@ groups:
summary: The kubernetes apiserver has terminated {{ $value | humanizePercentage
}} of its incoming requests.
expr: |
sum(rate(apiserver_request_terminations_total{job="kube-apiserver"}[10m])) / ( sum(rate(apiserver_request_total{job="kube-apiserver"}[10m])) + sum(rate(apiserver_request_terminations_total{job="kube-apiserver"}[10m])) ) > 0.20
sum by(cluster) (rate(apiserver_request_terminations_total{job="kube-apiserver"}[10m])) / ( sum by(cluster) (rate(apiserver_request_total{job="kube-apiserver"}[10m])) + sum by(cluster) (rate(apiserver_request_terminations_total{job="kube-apiserver"}[10m])) ) > 0.20
for: 5m
labels:
severity: warning

View file

@ -1,5 +1,18 @@
{
"editable": false,
"links": [
{
"asDropdown": true,
"includeVars": true,
"keepTime": true,
"tags": [
"kubernetes-mixin"
],
"targetBlank": false,
"title": "Kubernetes",
"type": "dashboards"
}
],
"panels": [
{
"datasource": {
@ -17,7 +30,7 @@
"options": {
"content": "The SLO (service level objective) and other metrics displayed on this dashboard are for informational purposes only."
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"title": "Notice",
"type": "text"
},
@ -41,7 +54,7 @@
},
"id": 2,
"interval": "1m",
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -87,7 +100,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -121,7 +134,7 @@
},
"id": 4,
"interval": "1m",
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -219,7 +232,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -263,7 +276,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -306,7 +319,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -340,7 +353,7 @@
},
"id": 8,
"interval": "1m",
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -438,7 +451,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -482,7 +495,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -525,7 +538,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -568,7 +581,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -611,7 +624,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -657,7 +670,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -699,7 +712,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -742,7 +755,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -784,7 +797,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -800,7 +813,7 @@
}
],
"refresh": "10s",
"schemaVersion": 36,
"schemaVersion": 39,
"tags": [
"kubernetes-mixin"
],

View file

@ -1,5 +1,18 @@
{
"editable": false,
"links": [
{
"asDropdown": true,
"includeVars": true,
"keepTime": true,
"tags": [
"kubernetes-mixin"
],
"targetBlank": false,
"title": "Kubernetes",
"type": "dashboards"
}
],
"panels": [
{
"datasource": {
@ -33,14 +46,14 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sum by (namespace) (rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval]))",
"expr": "sum by (namespace) (\n rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n",
"legendFormat": "__auto"
}
],
@ -79,14 +92,14 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sum by (namespace) (rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval]))",
"expr": "sum by (namespace) (\n rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n",
"legendFormat": "__auto"
}
],
@ -150,14 +163,14 @@
"y": 9
},
"id": 3,
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sum by (namespace) (rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval]))",
"expr": "sum by (namespace) (\n rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n",
"format": "table",
"instant": true
},
@ -166,7 +179,7 @@
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sum by (namespace) (rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval]))",
"expr": "sum by (namespace) (\n rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n",
"format": "table",
"instant": true
},
@ -175,7 +188,7 @@
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "avg by (namespace) (rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval]))",
"expr": "avg by (namespace) (\n rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n",
"format": "table",
"instant": true
},
@ -184,7 +197,7 @@
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "avg by (namespace) (rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval]))",
"expr": "avg by (namespace) (\n rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n",
"format": "table",
"instant": true
},
@ -193,7 +206,7 @@
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sum by (namespace) (rate(container_network_receive_packets_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval]))",
"expr": "sum by (namespace) (\n rate(container_network_receive_packets_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n",
"format": "table",
"instant": true
},
@ -202,7 +215,7 @@
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sum by (namespace) (rate(container_network_transmit_packets_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval]))",
"expr": "sum by (namespace) (\n rate(container_network_transmit_packets_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n",
"format": "table",
"instant": true
},
@ -211,7 +224,7 @@
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sum by (namespace) (rate(container_network_receive_packets_dropped_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval]))",
"expr": "sum by (namespace) (\n rate(container_network_receive_packets_dropped_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n",
"format": "table",
"instant": true
},
@ -220,7 +233,7 @@
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sum by (namespace) (rate(container_network_transmit_packets_dropped_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval]))",
"expr": "sum by (namespace) (\n rate(container_network_transmit_packets_dropped_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n",
"format": "table",
"instant": true
}
@ -315,14 +328,14 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "avg by (namespace) (rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval]))",
"expr": "avg by (namespace) (\n rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n",
"legendFormat": "__auto"
}
],
@ -361,14 +374,14 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "avg by (namespace) (rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval]))",
"expr": "avg by (namespace) (\n rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n",
"legendFormat": "__auto"
}
],
@ -407,14 +420,14 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sum by (namespace) (rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval]))",
"expr": "sum by (namespace) (\n rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n",
"legendFormat": "__auto"
}
],
@ -453,14 +466,14 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sum by (namespace) (rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval]))",
"expr": "sum by (namespace) (\n rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n",
"legendFormat": "__auto"
}
],
@ -499,14 +512,14 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sum by (namespace) (rate(container_network_receive_packets_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval]))",
"expr": "sum by (namespace) (\n rate(container_network_receive_packets_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n",
"legendFormat": "__auto"
}
],
@ -545,14 +558,14 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sum by (namespace) (rate(container_network_transmit_packets_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval]))",
"expr": "sum by (namespace) (\n rate(container_network_transmit_packets_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n",
"legendFormat": "__auto"
}
],
@ -591,14 +604,14 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sum by (namespace) (rate(container_network_receive_packets_dropped_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval]))",
"expr": "sum by (namespace) (\n rate(container_network_receive_packets_dropped_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n",
"legendFormat": "__auto"
}
],
@ -637,14 +650,14 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sum by (namespace) (rate(container_network_transmit_packets_dropped_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval]))",
"expr": "sum by (namespace) (\n rate(container_network_transmit_packets_dropped_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n",
"legendFormat": "__auto"
}
],
@ -683,14 +696,14 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sum by (instance) (rate(node_netstat_Tcp_RetransSegs{cluster=\"$cluster\"}[$__rate_interval]) / rate(node_netstat_Tcp_OutSegs{cluster=\"$cluster\"}[$__rate_interval]))",
"expr": "sum by (instance) (\n rate(node_netstat_Tcp_RetransSegs{cluster=\"$cluster\"}[$__rate_interval]) / rate(node_netstat_Tcp_OutSegs{cluster=\"$cluster\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n",
"legendFormat": "__auto"
}
],
@ -729,14 +742,14 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sum by (instance) (rate(node_netstat_TcpExt_TCPSynRetrans{cluster=\"$cluster\"}[$__rate_interval]) / rate(node_netstat_Tcp_RetransSegs{cluster=\"$cluster\"}[$__rate_interval]))",
"expr": "sum by (instance) (\n rate(node_netstat_TcpExt_TCPSynRetrans{cluster=\"$cluster\"}[$__rate_interval]) / rate(node_netstat_Tcp_RetransSegs{cluster=\"$cluster\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n",
"legendFormat": "__auto"
}
],
@ -745,7 +758,7 @@
}
],
"refresh": "10s",
"schemaVersion": 36,
"schemaVersion": 39,
"tags": [
"kubernetes-mixin"
],

View file

@ -1,5 +1,18 @@
{
"editable": false,
"links": [
{
"asDropdown": true,
"includeVars": true,
"keepTime": true,
"tags": [
"kubernetes-mixin"
],
"targetBlank": false,
"title": "Kubernetes",
"type": "dashboards"
}
],
"panels": [
{
"datasource": {
@ -22,7 +35,7 @@
"options": {
"colorMode": "none"
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -73,7 +86,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -124,7 +137,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -175,7 +188,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -226,7 +239,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -301,7 +314,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -352,7 +365,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -403,7 +416,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -454,7 +467,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -505,7 +518,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -521,7 +534,7 @@
}
],
"refresh": "10s",
"schemaVersion": 36,
"schemaVersion": 39,
"tags": [
"kubernetes-mixin"
],

View file

@ -1,5 +1,18 @@
{
"editable": false,
"links": [
{
"asDropdown": true,
"includeVars": true,
"keepTime": true,
"tags": [
"kubernetes-mixin"
],
"targetBlank": false,
"title": "Kubernetes",
"type": "dashboards"
}
],
"panels": [
{
"datasource": {
@ -8,7 +21,7 @@
},
"fieldConfig": {
"defaults": {
"unit": "none"
"unit": "percentunit"
}
},
"gridPos": {
@ -22,7 +35,7 @@
"options": {
"colorMode": "none"
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -57,7 +70,7 @@
"options": {
"colorMode": "none"
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -92,7 +105,7 @@
"options": {
"colorMode": "none"
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -127,7 +140,7 @@
"options": {
"colorMode": "none"
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -162,7 +175,7 @@
"options": {
"colorMode": "none"
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -197,7 +210,7 @@
"options": {
"colorMode": "none"
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -247,7 +260,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -306,7 +319,7 @@
"y": 12
},
"id": 8,
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -463,7 +476,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -558,7 +571,7 @@
"y": 24
},
"id": 10,
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -735,7 +748,7 @@
"y": 30
},
"id": 11,
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -879,7 +892,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -930,7 +943,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -981,7 +994,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -1032,7 +1045,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -1083,7 +1096,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -1134,7 +1147,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -1185,7 +1198,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -1236,7 +1249,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -1287,7 +1300,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -1338,7 +1351,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -1409,7 +1422,7 @@
"y": 96
},
"id": 22,
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -1518,7 +1531,7 @@
}
],
"refresh": "10s",
"schemaVersion": 36,
"schemaVersion": 39,
"tags": [
"kubernetes-mixin"
],

View file

@ -1,5 +1,18 @@
{
"editable": false,
"links": [
{
"asDropdown": true,
"includeVars": true,
"keepTime": true,
"tags": [
"kubernetes-mixin"
],
"targetBlank": false,
"title": "Kubernetes",
"type": "dashboards"
}
],
"panels": [
{
"datasource": {
@ -22,7 +35,7 @@
"options": {
"colorMode": "none"
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -57,7 +70,7 @@
"options": {
"colorMode": "none"
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -92,7 +105,7 @@
"options": {
"colorMode": "none"
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -127,7 +140,7 @@
"options": {
"colorMode": "none"
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -229,7 +242,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -244,7 +257,7 @@
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "scalar(kube_resourcequota{cluster=\"$cluster\", namespace=\"$namespace\", type=\"hard\",resource=\"requests.cpu\"})",
"expr": "scalar(max(kube_resourcequota{cluster=\"$cluster\", namespace=\"$namespace\", type=\"hard\",resource=\"requests.cpu\"}))",
"legendFormat": "quota - requests"
},
{
@ -252,7 +265,7 @@
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "scalar(kube_resourcequota{cluster=\"$cluster\", namespace=\"$namespace\", type=\"hard\",resource=\"limits.cpu\"})",
"expr": "scalar(max(kube_resourcequota{cluster=\"$cluster\", namespace=\"$namespace\", type=\"hard\",resource=\"limits.cpu\"}))",
"legendFormat": "quota - limits"
}
],
@ -304,7 +317,7 @@
"y": 14
},
"id": 6,
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -487,7 +500,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -502,7 +515,7 @@
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "scalar(kube_resourcequota{cluster=\"$cluster\", namespace=\"$namespace\", type=\"hard\",resource=\"requests.memory\"})",
"expr": "scalar(max(kube_resourcequota{cluster=\"$cluster\", namespace=\"$namespace\", type=\"hard\",resource=\"requests.memory\"}))",
"legendFormat": "quota - requests"
},
{
@ -510,7 +523,7 @@
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "scalar(kube_resourcequota{cluster=\"$cluster\", namespace=\"$namespace\", type=\"hard\",resource=\"limits.memory\"})",
"expr": "scalar(max(kube_resourcequota{cluster=\"$cluster\", namespace=\"$namespace\", type=\"hard\",resource=\"limits.memory\"}))",
"legendFormat": "quota - limits"
}
],
@ -565,7 +578,7 @@
"y": 28
},
"id": 8,
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -755,7 +768,7 @@
"y": 35
},
"id": 9,
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -899,7 +912,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -950,7 +963,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -1001,7 +1014,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -1052,7 +1065,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -1103,7 +1116,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -1154,7 +1167,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -1205,7 +1218,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -1256,7 +1269,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -1327,7 +1340,7 @@
"y": 70
},
"id": 18,
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -1436,7 +1449,7 @@
}
],
"refresh": "10s",
"schemaVersion": 36,
"schemaVersion": 39,
"tags": [
"kubernetes-mixin"
],

View file

@ -1,5 +1,18 @@
{
"editable": false,
"links": [
{
"asDropdown": true,
"includeVars": true,
"keepTime": true,
"tags": [
"kubernetes-mixin"
],
"targetBlank": false,
"title": "Kubernetes",
"type": "dashboards"
}
],
"panels": [
{
"datasource": {
@ -81,14 +94,14 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sum(kube_node_status_capacity{cluster=\"$cluster\", node=~\"$node\", resource=\"cpu\"})",
"expr": "sum(kube_node_status_capacity{cluster=\"$cluster\", job=\"kube-state-metrics\", node=~\"$node\", resource=\"cpu\"})",
"legendFormat": "max capacity"
},
{
@ -148,7 +161,7 @@
"y": 6
},
"id": 2,
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -310,14 +323,14 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sum(kube_node_status_capacity{cluster=\"$cluster\", node=~\"$node\", resource=\"memory\"})",
"expr": "sum(kube_node_status_capacity{cluster=\"$cluster\", job=\"kube-state-metrics\", node=~\"$node\", resource=\"memory\"})",
"legendFormat": "max capacity"
},
{
@ -380,7 +393,7 @@
"y": 18
},
"id": 4,
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -496,7 +509,7 @@
}
],
"refresh": "10s",
"schemaVersion": 36,
"schemaVersion": 39,
"tags": [
"kubernetes-mixin"
],

View file

@ -1,5 +1,18 @@
{
"editable": false,
"links": [
{
"asDropdown": true,
"includeVars": true,
"keepTime": true,
"tags": [
"kubernetes-mixin"
],
"targetBlank": false,
"title": "Kubernetes",
"type": "dashboards"
}
],
"panels": [
{
"datasource": {
@ -89,7 +102,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -195,7 +208,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -237,7 +250,7 @@
"y": 14
},
"id": 3,
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -420,7 +433,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -481,7 +494,7 @@
"y": 28
},
"id": 5,
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -651,7 +664,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -702,7 +715,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -753,7 +766,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -804,7 +817,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -855,7 +868,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -906,7 +919,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -957,7 +970,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -1016,7 +1029,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -1075,7 +1088,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -1126,7 +1139,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -1180,7 +1193,7 @@
"y": 70
},
"id": 16,
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -1289,7 +1302,7 @@
}
],
"refresh": "10s",
"schemaVersion": 36,
"schemaVersion": 39,
"tags": [
"kubernetes-mixin"
],

View file

@ -1,5 +1,18 @@
{
"editable": false,
"links": [
{
"asDropdown": true,
"includeVars": true,
"keepTime": true,
"tags": [
"kubernetes-mixin"
],
"targetBlank": false,
"title": "Kubernetes",
"type": "dashboards"
}
],
"panels": [
{
"datasource": {
@ -37,7 +50,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -96,7 +109,7 @@
"y": 7
},
"id": 2,
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -227,7 +240,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -289,7 +302,7 @@
"y": 21
},
"id": 4,
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -440,7 +453,7 @@
"y": 28
},
"id": 5,
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -584,7 +597,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -635,7 +648,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -686,7 +699,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -737,7 +750,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -788,7 +801,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -839,7 +852,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -890,7 +903,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -941,7 +954,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -957,7 +970,7 @@
}
],
"refresh": "10s",
"schemaVersion": 36,
"schemaVersion": 39,
"tags": [
"kubernetes-mixin"
],

View file

@ -1,5 +1,18 @@
{
"editable": false,
"links": [
{
"asDropdown": true,
"includeVars": true,
"keepTime": true,
"tags": [
"kubernetes-mixin"
],
"targetBlank": false,
"title": "Kubernetes",
"type": "dashboards"
}
],
"panels": [
{
"datasource": {
@ -89,7 +102,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -104,7 +117,7 @@
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "scalar(kube_resourcequota{cluster=\"$cluster\", namespace=\"$namespace\", type=\"hard\",resource=\"requests.cpu\"})",
"expr": "scalar(max(kube_resourcequota{cluster=\"$cluster\", namespace=\"$namespace\", type=\"hard\",resource=~\"requests.cpu|cpu\"}))",
"legendFormat": "quota - requests"
},
{
@ -112,7 +125,7 @@
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "scalar(kube_resourcequota{cluster=\"$cluster\", namespace=\"$namespace\", type=\"hard\",resource=\"limits.cpu\"})",
"expr": "scalar(max(kube_resourcequota{cluster=\"$cluster\", namespace=\"$namespace\", type=\"hard\",resource=~\"limits.cpu\"}))",
"legendFormat": "quota - limits"
}
],
@ -176,7 +189,7 @@
"y": 7
},
"id": 2,
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -384,7 +397,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -399,7 +412,7 @@
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "scalar(kube_resourcequota{cluster=\"$cluster\", namespace=\"$namespace\", type=\"hard\",resource=\"requests.memory\"})",
"expr": "scalar(max(kube_resourcequota{cluster=\"$cluster\", namespace=\"$namespace\", type=\"hard\",resource=~\"requests.memory|memory\"}))",
"legendFormat": "quota - requests"
},
{
@ -407,7 +420,7 @@
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "scalar(kube_resourcequota{cluster=\"$cluster\", namespace=\"$namespace\", type=\"hard\",resource=\"limits.memory\"})",
"expr": "scalar(max(kube_resourcequota{cluster=\"$cluster\", namespace=\"$namespace\", type=\"hard\",resource=~\"limits.memory\"}))",
"legendFormat": "quota - limits"
}
],
@ -474,7 +487,7 @@
"y": 21
},
"id": 4,
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -650,7 +663,7 @@
"y": 28
},
"id": 5,
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -794,7 +807,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -845,7 +858,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -896,7 +909,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -947,7 +960,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -998,7 +1011,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -1049,7 +1062,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -1100,7 +1113,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -1151,7 +1164,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -1167,7 +1180,7 @@
}
],
"refresh": "10s",
"schemaVersion": 36,
"schemaVersion": 39,
"tags": [
"kubernetes-mixin"
],

View file

@ -1,5 +1,18 @@
{
"editable": false,
"links": [
{
"asDropdown": true,
"includeVars": true,
"keepTime": true,
"tags": [
"kubernetes-mixin"
],
"targetBlank": false,
"title": "Kubernetes",
"type": "dashboards"
}
],
"panels": [
{
"datasource": {
@ -22,7 +35,7 @@
"options": {
"colorMode": "none"
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -57,7 +70,7 @@
"options": {
"colorMode": "none"
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -92,7 +105,7 @@
"options": {
"colorMode": "none"
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -127,7 +140,7 @@
"options": {
"colorMode": "none"
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -162,7 +175,7 @@
"options": {
"colorMode": "none"
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -197,7 +210,7 @@
"options": {
"colorMode": "none"
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -248,7 +261,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -299,7 +312,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -350,7 +363,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -401,7 +414,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -460,7 +473,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -519,7 +532,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -570,7 +583,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -621,7 +634,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -672,7 +685,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -723,7 +736,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -774,7 +787,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -825,7 +838,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -876,7 +889,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -927,7 +940,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -1002,7 +1015,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -1053,7 +1066,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -1104,7 +1117,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -1155,7 +1168,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -1171,7 +1184,7 @@
}
],
"refresh": "10s",
"schemaVersion": 36,
"schemaVersion": 39,
"tags": [
"kubernetes-mixin"
],

View file

@ -1,5 +1,18 @@
{
"editable": false,
"links": [
{
"asDropdown": true,
"includeVars": true,
"keepTime": true,
"tags": [
"kubernetes-mixin"
],
"targetBlank": false,
"title": "Kubernetes",
"type": "dashboards"
}
],
"panels": [
{
"datasource": {
@ -40,14 +53,14 @@
"y": 0
},
"id": 1,
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sum(rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval]))",
"expr": "sum (\n rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n",
"legendFormat": "__auto"
}
],
@ -93,14 +106,14 @@
"y": 0
},
"id": 2,
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sum(rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval]))",
"expr": "sum (\n rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n",
"legendFormat": "__auto"
}
],
@ -164,14 +177,14 @@
"y": 9
},
"id": 3,
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sum(rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])) by (pod)",
"expr": "sum by (pod) (\n rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n",
"format": "table",
"instant": true
},
@ -180,7 +193,7 @@
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sum(rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])) by (pod)",
"expr": "sum by (pod) (\n rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n",
"format": "table",
"instant": true
},
@ -189,7 +202,7 @@
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sum(rate(container_network_receive_packets_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])) by (pod)",
"expr": "sum by (pod) (\n rate(container_network_receive_packets_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n",
"format": "table",
"instant": true
},
@ -198,7 +211,7 @@
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sum(rate(container_network_transmit_packets_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])) by (pod)",
"expr": "sum by (pod) (\n rate(container_network_transmit_packets_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n",
"format": "table",
"instant": true
},
@ -207,7 +220,7 @@
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sum(rate(container_network_receive_packets_dropped_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])) by (pod)",
"expr": "sum by (pod) (\n rate(container_network_receive_packets_dropped_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n",
"format": "table",
"instant": true
},
@ -216,7 +229,7 @@
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sum(rate(container_network_transmit_packets_dropped_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])) by (pod)",
"expr": "sum by (pod) (\n rate(container_network_transmit_packets_dropped_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n",
"format": "table",
"instant": true
}
@ -303,14 +316,14 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sum(rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])) by (pod)",
"expr": "sum by (pod) (\n rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n",
"legendFormat": "__auto"
}
],
@ -349,14 +362,14 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sum(rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])) by (pod)",
"expr": "sum by (pod) (\n rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n",
"legendFormat": "__auto"
}
],
@ -395,14 +408,14 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sum(rate(container_network_receive_packets_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])) by (pod)",
"expr": "sum by (pod) (\n rate(container_network_receive_packets_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n",
"legendFormat": "__auto"
}
],
@ -441,14 +454,14 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sum(rate(container_network_transmit_packets_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])) by (pod)",
"expr": "sum by (pod) (\n rate(container_network_transmit_packets_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n",
"legendFormat": "__auto"
}
],
@ -487,14 +500,14 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sum by (namespace) (rate(container_network_receive_packets_dropped_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval]))",
"expr": "sum by (pod) (\n rate(container_network_receive_packets_dropped_total{cluster=\"$cluster\",namespace!=\"\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n",
"legendFormat": "__auto"
}
],
@ -533,14 +546,14 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sum(rate(container_network_transmit_packets_dropped_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])) by (pod)",
"expr": "sum by (pod) (\n rate(container_network_transmit_packets_dropped_total{cluster=\"$cluster\",namespace=~\"$namespace\"}[$__rate_interval])\n * on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n)\n",
"legendFormat": "__auto"
}
],
@ -549,7 +562,7 @@
}
],
"refresh": "10s",
"schemaVersion": 36,
"schemaVersion": 39,
"tags": [
"kubernetes-mixin"
],

View file

@ -1,5 +1,18 @@
{
"editable": false,
"links": [
{
"asDropdown": true,
"includeVars": true,
"keepTime": true,
"tags": [
"kubernetes-mixin"
],
"targetBlank": false,
"title": "Kubernetes",
"type": "dashboards"
}
],
"panels": [
{
"datasource": {
@ -26,14 +39,14 @@
"displayMode": "basic",
"showUnfilled": false
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sort_desc(sum(rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n",
"expr": "sort_desc(sum(rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n* on (cluster,namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n",
"legendFormat": "__auto"
}
],
@ -65,14 +78,14 @@
"displayMode": "basic",
"showUnfilled": false
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sort_desc(sum(rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n",
"expr": "sort_desc(sum(rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n* on (cluster,namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n",
"legendFormat": "__auto"
}
],
@ -136,14 +149,14 @@
"y": 9
},
"id": 3,
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sort_desc(sum(rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload, workload_type))\n",
"expr": "sort_desc(sum(rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod) kube_pod_info{cluster=\"$cluster\",namespace=\"$namespace\",host_network=\"false\"}\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload, workload_type))\n",
"format": "table",
"instant": true
},
@ -152,7 +165,7 @@
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sort_desc(sum(rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload, workload_type))\n",
"expr": "sort_desc(sum(rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod) kube_pod_info{cluster=\"$cluster\",namespace=\"$namespace\",host_network=\"false\"}\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload, workload_type))\n",
"format": "table",
"instant": true
},
@ -161,7 +174,7 @@
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sort_desc(avg(rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload, workload_type))\n",
"expr": "sort_desc(avg(rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod) kube_pod_info{cluster=\"$cluster\",namespace=\"$namespace\",host_network=\"false\"}\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload, workload_type))\n",
"format": "table",
"instant": true
},
@ -170,7 +183,7 @@
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sort_desc(avg(rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload, workload_type))\n",
"expr": "sort_desc(avg(rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod) kube_pod_info{cluster=\"$cluster\",namespace=\"$namespace\",host_network=\"false\"}\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload, workload_type))\n",
"format": "table",
"instant": true
},
@ -179,7 +192,7 @@
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sort_desc(sum(rate(container_network_receive_packets_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload, workload_type))\n",
"expr": "sort_desc(sum(rate(container_network_receive_packets_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod) kube_pod_info{cluster=\"$cluster\",namespace=\"$namespace\",host_network=\"false\"}\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload, workload_type))\n",
"format": "table",
"instant": true
},
@ -188,7 +201,7 @@
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sort_desc(sum(rate(container_network_transmit_packets_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload, workload_type))\n",
"expr": "sort_desc(sum(rate(container_network_transmit_packets_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod) kube_pod_info{cluster=\"$cluster\",namespace=\"$namespace\",host_network=\"false\"}\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload, workload_type))\n",
"format": "table",
"instant": true
},
@ -197,7 +210,7 @@
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sort_desc(sum(rate(container_network_receive_packets_dropped_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload, workload_type))\n",
"expr": "sort_desc(sum(rate(container_network_receive_packets_dropped_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod) kube_pod_info{cluster=\"$cluster\",namespace=\"$namespace\",host_network=\"false\"}\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload, workload_type))\n",
"format": "table",
"instant": true
},
@ -206,7 +219,7 @@
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sort_desc(sum(rate(container_network_transmit_packets_dropped_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload, workload_type))\n",
"expr": "sort_desc(sum(rate(container_network_transmit_packets_dropped_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod) kube_pod_info{cluster=\"$cluster\",namespace=\"$namespace\",host_network=\"false\"}\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload, workload_type))\n",
"format": "table",
"instant": true
}
@ -322,14 +335,14 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sort_desc(sum(rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n",
"expr": "sort_desc(sum(rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n* on (cluster,namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n",
"legendFormat": "__auto"
}
],
@ -373,14 +386,14 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sort_desc(sum(rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n",
"expr": "sort_desc(sum(rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n* on (cluster,namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n",
"legendFormat": "__auto"
}
],
@ -424,14 +437,14 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sort_desc(avg(rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n",
"expr": "sort_desc(avg(rate(container_network_receive_bytes_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n* on (cluster,namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n",
"legendFormat": "__auto"
}
],
@ -475,14 +488,14 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sort_desc(avg(rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n",
"expr": "sort_desc(avg(rate(container_network_transmit_bytes_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n* on (cluster,namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n",
"legendFormat": "__auto"
}
],
@ -526,14 +539,14 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sort_desc(sum(rate(container_network_receive_packets_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n",
"expr": "sort_desc(sum(rate(container_network_receive_packets_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n* on (cluster,namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n",
"legendFormat": "__auto"
}
],
@ -577,14 +590,14 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sort_desc(sum(rate(container_network_transmit_packets_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n",
"expr": "sort_desc(sum(rate(container_network_transmit_packets_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n* on (cluster,namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n",
"legendFormat": "__auto"
}
],
@ -628,14 +641,14 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sort_desc(sum(rate(container_network_receive_packets_dropped_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n",
"expr": "sort_desc(sum(rate(container_network_receive_packets_dropped_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n* on (cluster,namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n",
"legendFormat": "__auto"
}
],
@ -679,14 +692,14 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
"type": "prometheus",
"uid": "${datasource}"
},
"expr": "sort_desc(sum(rate(container_network_transmit_packets_dropped_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n",
"expr": "sort_desc(sum(rate(container_network_transmit_packets_dropped_total{cluster=\"$cluster\",namespace=\"$namespace\"}[$__rate_interval])\n* on (cluster,namespace,pod) group_left ()\n topk by (cluster,namespace,pod) (\n 1,\n max by (cluster,namespace,pod) (kube_pod_info{host_network=\"false\"})\n )\n* on (cluster,namespace,pod)\ngroup_left(workload,workload_type) namespace_workload_pod:kube_pod_owner:relabel{cluster=\"$cluster\",namespace=\"$namespace\", workload=~\".+\", workload_type=~\"$type\"}) by (workload))\n",
"legendFormat": "__auto"
}
],
@ -695,7 +708,7 @@
}
],
"refresh": "10s",
"schemaVersion": 36,
"schemaVersion": 39,
"tags": [
"kubernetes-mixin"
],

View file

@ -1,5 +1,18 @@
{
"editable": false,
"links": [
{
"asDropdown": true,
"includeVars": true,
"keepTime": true,
"tags": [
"kubernetes-mixin"
],
"targetBlank": false,
"title": "Kubernetes",
"type": "dashboards"
}
],
"panels": [
{
"datasource": {
@ -37,7 +50,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -99,7 +112,7 @@
},
"id": 2,
"interval": "1m",
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -149,7 +162,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -211,7 +224,7 @@
},
"id": 4,
"interval": "1m",
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -227,7 +240,7 @@
}
],
"refresh": "10s",
"schemaVersion": 36,
"schemaVersion": 39,
"tags": [
"kubernetes-mixin"
],

View file

@ -1,5 +1,18 @@
{
"editable": false,
"links": [
{
"asDropdown": true,
"includeVars": true,
"keepTime": true,
"tags": [
"kubernetes-mixin"
],
"targetBlank": false,
"title": "Kubernetes",
"type": "dashboards"
}
],
"panels": [
{
"datasource": {
@ -40,7 +53,7 @@
"y": 0
},
"id": 1,
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -93,7 +106,7 @@
"y": 0
},
"id": 2,
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -139,7 +152,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -185,7 +198,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -231,7 +244,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -277,7 +290,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -323,7 +336,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -369,7 +382,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -385,7 +398,7 @@
}
],
"refresh": "10s",
"schemaVersion": 36,
"schemaVersion": 39,
"tags": [
"kubernetes-mixin"
],

View file

@ -1,5 +1,18 @@
{
"editable": false,
"links": [
{
"asDropdown": true,
"includeVars": true,
"keepTime": true,
"tags": [
"kubernetes-mixin"
],
"targetBlank": false,
"title": "Kubernetes",
"type": "dashboards"
}
],
"panels": [
{
"datasource": {
@ -22,7 +35,7 @@
"options": {
"colorMode": "none"
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -73,7 +86,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -124,7 +137,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -175,7 +188,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -226,7 +239,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -277,7 +290,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -352,7 +365,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -403,7 +416,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -454,7 +467,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -505,7 +518,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -556,7 +569,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -572,7 +585,7 @@
}
],
"refresh": "10s",
"schemaVersion": 36,
"schemaVersion": 39,
"tags": [
"kubernetes-mixin"
],

View file

@ -1,5 +1,18 @@
{
"editable": false,
"links": [
{
"asDropdown": true,
"includeVars": true,
"keepTime": true,
"tags": [
"kubernetes-mixin"
],
"targetBlank": false,
"title": "Kubernetes",
"type": "dashboards"
}
],
"panels": [
{
"datasource": {
@ -22,7 +35,7 @@
"options": {
"colorMode": "none"
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -73,7 +86,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -148,7 +161,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -223,7 +236,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -298,7 +311,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -349,7 +362,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -400,7 +413,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -451,7 +464,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -502,7 +515,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -518,7 +531,7 @@
}
],
"refresh": "10s",
"schemaVersion": 36,
"schemaVersion": 39,
"tags": [
"kubernetes-mixin"
],

View file

@ -1,5 +1,18 @@
{
"editable": false,
"links": [
{
"asDropdown": true,
"includeVars": true,
"keepTime": true,
"tags": [
"kubernetes-mixin"
],
"targetBlank": false,
"title": "Kubernetes",
"type": "dashboards"
}
],
"panels": [
{
"datasource": {
@ -26,7 +39,7 @@
"displayMode": "basic",
"showUnfilled": false
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -65,7 +78,7 @@
"displayMode": "basic",
"showUnfilled": false
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -104,7 +117,7 @@
"displayMode": "basic",
"showUnfilled": false
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -143,7 +156,7 @@
"displayMode": "basic",
"showUnfilled": false
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -194,7 +207,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -245,7 +258,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -296,7 +309,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -347,7 +360,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -398,7 +411,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -449,7 +462,7 @@
"mode": "single"
}
},
"pluginVersion": "v10.4.0",
"pluginVersion": "v11.1.0",
"targets": [
{
"datasource": {
@ -465,7 +478,7 @@
}
],
"refresh": "10s",
"schemaVersion": 36,
"schemaVersion": 39,
"tags": [
"kubernetes-mixin"
],

View file

@ -15,18 +15,18 @@ groups:
labels:
verb: write
record: code:apiserver_request_total:increase30d
- expr: |
sum by (cluster, verb, scope) (increase(apiserver_request_sli_duration_seconds_count{job="kube-apiserver"}[1h]))
record: cluster_verb_scope:apiserver_request_sli_duration_seconds_count:increase1h
- expr: |
sum by (cluster, verb, scope) (avg_over_time(cluster_verb_scope:apiserver_request_sli_duration_seconds_count:increase1h[30d]) * 24 * 30)
record: cluster_verb_scope:apiserver_request_sli_duration_seconds_count:increase30d
- expr: |
sum by (cluster, verb, scope, le) (increase(apiserver_request_sli_duration_seconds_bucket[1h]))
record: cluster_verb_scope_le:apiserver_request_sli_duration_seconds_bucket:increase1h
- expr: |
sum by (cluster, verb, scope, le) (avg_over_time(cluster_verb_scope_le:apiserver_request_sli_duration_seconds_bucket:increase1h[30d]) * 24 * 30)
record: cluster_verb_scope_le:apiserver_request_sli_duration_seconds_bucket:increase30d
- expr: |
sum by (cluster, verb, scope) (cluster_verb_scope_le:apiserver_request_sli_duration_seconds_bucket:increase1h{le="+Inf"})
record: cluster_verb_scope:apiserver_request_sli_duration_seconds_count:increase1h
- expr: |
sum by (cluster, verb, scope) (cluster_verb_scope_le:apiserver_request_sli_duration_seconds_bucket:increase30d{le="+Inf"} * 24 * 30)
record: cluster_verb_scope:apiserver_request_sli_duration_seconds_count:increase30d
- expr: |
1 - (
(
@ -481,7 +481,7 @@ groups:
max by(cluster, namespace, pod, node) (kube_pod_info{node!=""})
)
record: node_namespace_pod_container:container_memory_swap
- name: k8s.rules.container_resource
- name: k8s.rules.container_memory_requests
rules:
- expr: |
kube_pod_container_resource_requests{resource="memory",job="kube-state-metrics"} * on (namespace, pod, cluster)
@ -500,6 +500,8 @@ groups:
)
)
record: namespace_memory:kube_pod_container_resource_requests:sum
- name: k8s.rules.container_cpu_requests
rules:
- expr: |
kube_pod_container_resource_requests{resource="cpu",job="kube-state-metrics"} * on (namespace, pod, cluster)
group_left() max by (namespace, pod, cluster) (
@ -517,6 +519,8 @@ groups:
)
)
record: namespace_cpu:kube_pod_container_resource_requests:sum
- name: k8s.rules.container_memory_limits
rules:
- expr: |
kube_pod_container_resource_limits{resource="memory",job="kube-state-metrics"} * on (namespace, pod, cluster)
group_left() max by (namespace, pod, cluster) (
@ -534,6 +538,8 @@ groups:
)
)
record: namespace_memory:kube_pod_container_resource_limits:sum
- name: k8s.rules.container_cpu_limits
rules:
- expr: |
kube_pod_container_resource_limits{resource="cpu",job="kube-state-metrics"} * on (namespace, pod, cluster)
group_left() max by (namespace, pod, cluster) (

View file

@ -3,28 +3,31 @@ groups:
rules:
- alert: LokiRequestErrors
annotations:
message: |
{{ $labels.job }} {{ $labels.route }} is experiencing {{ printf "%.2f" $value }}% errors.
description: |
{{ $labels.cluster }} {{ $labels.job }} {{ $labels.route }} is experiencing {{ printf "%.2f" $value }}% errors.
summary: Loki request error rate is high.
expr: |
100 * sum(rate(loki_request_duration_seconds_count{status_code=~"5.."}[2m])) by (namespace, job, route)
100 * sum(rate(loki_request_duration_seconds_count{status_code=~"5.."}[2m])) by (cluster, namespace, job, route)
/
sum(rate(loki_request_duration_seconds_count[2m])) by (namespace, job, route)
sum(rate(loki_request_duration_seconds_count[2m])) by (cluster, namespace, job, route)
> 10
for: 15m
labels:
severity: critical
- alert: LokiRequestPanics
annotations:
message: |
{{ $labels.job }} is experiencing {{ printf "%.2f" $value }}% increase of panics.
description: |
{{ $labels.cluster }} {{ $labels.job }} is experiencing {{ printf "%.2f" $value }}% increase of panics.
summary: Loki requests are causing code panics.
expr: |
sum(increase(loki_panic_total[10m])) by (namespace, job) > 0
sum(increase(loki_panic_total[10m])) by (cluster, namespace, job) > 0
labels:
severity: critical
- alert: LokiRequestLatency
annotations:
message: |
{{ $labels.job }} {{ $labels.route }} is experiencing {{ printf "%.2f" $value }}s 99th percentile latency.
description: |
{{ $labels.cluster }} {{ $labels.job }} {{ $labels.route }} is experiencing {{ printf "%.2f" $value }}s 99th percentile latency.
summary: Loki request error latency is high.
expr: |
cluster_namespace_job_route:loki_request_duration_seconds:99quantile{route!~"(?i).*tail.*|/schedulerpb.SchedulerForQuerier/QuerierLoop"} > 1
for: 15m
@ -32,10 +35,44 @@ groups:
severity: critical
- alert: LokiTooManyCompactorsRunning
annotations:
message: |
description: |
{{ $labels.cluster }} {{ $labels.namespace }} has had {{ printf "%.0f" $value }} compactors running for more than 5m. Only one compactor should run at a time.
summary: Loki deployment is running more than one compactor.
expr: |
sum(loki_boltdb_shipper_compactor_running) by (namespace, cluster) > 1
sum(loki_boltdb_shipper_compactor_running) by (cluster, namespace) > 1
for: 5m
labels:
severity: warning
- alert: LokiCompactorHasNotSuccessfullyRunCompaction
annotations:
description: |
{{ $labels.cluster }} {{ $labels.namespace }} has not run compaction in the last 3 hours since the last compaction. This may indicate a problem with the compactor.
summary: Loki compaction has not run in the last 3 hours since the last compaction.
expr: |
# The "last successful run" metric is updated even if the compactor owns no tenants,
# so this alert correctly doesn't fire if compactor has nothing to do.
min (
time() - (loki_boltdb_shipper_compact_tables_operation_last_successful_run_timestamp_seconds{} > 0)
)
by (cluster, namespace)
> 60 * 60 * 3
for: 1h
labels:
severity: critical
- alert: LokiCompactorHasNotSuccessfullyRunCompaction
annotations:
description: |
{{ $labels.cluster }} {{ $labels.namespace }} has not run compaction in the last 3h since startup. This may indicate a problem with the compactor.
summary: Loki compaction has not run in the last 3h since startup.
expr: |
# The "last successful run" metric is updated even if the compactor owns no tenants,
# so this alert correctly doesn't fire if compactor has nothing to do.
max(
max_over_time(
loki_boltdb_shipper_compact_tables_operation_last_successful_run_timestamp_seconds{}[3h]
)
) by (cluster, namespace)
== 0
for: 1h
labels:
severity: critical

File diff suppressed because it is too large Load diff

File diff suppressed because it is too large Load diff

File diff suppressed because it is too large Load diff

View file

@ -62,7 +62,6 @@
"expr": "sum(loki_compactor_pending_delete_requests_count{cluster=~\"$cluster\", namespace=~\"$namespace\"})",
"format": "time_series",
"instant": true,
"intervalFactor": 2,
"refId": "A"
}
],
@ -138,7 +137,6 @@
"expr": "max(loki_compactor_oldest_pending_delete_request_age_seconds{cluster=~\"$cluster\", namespace=~\"$namespace\"})",
"format": "time_series",
"instant": true,
"intervalFactor": 2,
"refId": "A"
}
],
@ -191,232 +189,145 @@
"height": "250px",
"panels": [
{
"aliasColors": { },
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "$datasource",
"fill": 1,
"id": 3,
"legend": {
"avg": false,
"current": false,
"max": false,
"min": false,
"show": true,
"total": false,
"values": false
"fieldConfig": {
"defaults": {
"custom": {
"drawStyle": "line",
"fillOpacity": 10,
"lineWidth": 1,
"pointSize": 5,
"showPoints": "never",
"spanNulls": false,
"stacking": {
"group": "A",
"mode": "none"
}
},
"thresholds": {
"mode": "absolute",
"steps": [ ]
},
"unit": "short"
},
"overrides": [ ]
},
"lines": true,
"linewidth": 1,
"id": 3,
"links": [ ],
"nullPointMode": "null as zero",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [ ],
"spaceLength": 10,
"options": {
"legend": {
"showLegend": true
},
"tooltip": {
"mode": "single",
"sort": "none"
}
},
"span": 4,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "(loki_compactor_delete_requests_received_total{cluster=~\"$cluster\", namespace=~\"$namespace\"} or on() vector(0)) - on () (loki_compactor_delete_requests_processed_total{cluster=~\"$cluster\", namespace=~\"$namespace\"} or on () vector(0))",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "in progress",
"legendLink": null,
"step": 10
"legendLink": null
}
],
"thresholds": [ ],
"timeFrom": null,
"timeShift": null,
"title": "# of Delete Requests (received - processed) ",
"tooltip": {
"shared": true,
"sort": 2,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": [ ]
},
"yaxes": [
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": 0,
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
]
"type": "timeseries"
},
{
"aliasColors": { },
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "$datasource",
"fill": 1,
"id": 4,
"legend": {
"avg": false,
"current": false,
"max": false,
"min": false,
"show": true,
"total": false,
"values": false
"fieldConfig": {
"defaults": {
"custom": {
"drawStyle": "line",
"fillOpacity": 10,
"lineWidth": 1,
"pointSize": 5,
"showPoints": "never",
"spanNulls": false,
"stacking": {
"group": "A",
"mode": "none"
}
},
"thresholds": {
"mode": "absolute",
"steps": [ ]
},
"unit": "short"
},
"overrides": [ ]
},
"lines": true,
"linewidth": 1,
"id": 4,
"links": [ ],
"nullPointMode": "null as zero",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [ ],
"spaceLength": 10,
"options": {
"legend": {
"showLegend": true
},
"tooltip": {
"mode": "single",
"sort": "none"
}
},
"span": 4,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "sum(increase(loki_compactor_delete_requests_received_total{cluster=~\"$cluster\", namespace=~\"$namespace\"}[1d]))",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "received",
"legendLink": null,
"step": 10
"legendLink": null
}
],
"thresholds": [ ],
"timeFrom": null,
"timeShift": null,
"title": "Delete Requests Received / Day",
"tooltip": {
"shared": true,
"sort": 2,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": [ ]
},
"yaxes": [
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": 0,
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
]
"type": "timeseries"
},
{
"aliasColors": { },
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "$datasource",
"fill": 1,
"id": 5,
"legend": {
"avg": false,
"current": false,
"max": false,
"min": false,
"show": true,
"total": false,
"values": false
"fieldConfig": {
"defaults": {
"custom": {
"drawStyle": "line",
"fillOpacity": 10,
"lineWidth": 1,
"pointSize": 5,
"showPoints": "never",
"spanNulls": false,
"stacking": {
"group": "A",
"mode": "none"
}
},
"thresholds": {
"mode": "absolute",
"steps": [ ]
},
"unit": "short"
},
"overrides": [ ]
},
"lines": true,
"linewidth": 1,
"id": 5,
"links": [ ],
"nullPointMode": "null as zero",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [ ],
"spaceLength": 10,
"options": {
"legend": {
"showLegend": true
},
"tooltip": {
"mode": "single",
"sort": "none"
}
},
"span": 4,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "sum(increase(loki_compactor_delete_requests_processed_total{cluster=~\"$cluster\", namespace=~\"$namespace\"}[1d]))",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "processed",
"legendLink": null,
"step": 10
"legendLink": null
}
],
"thresholds": [ ],
"timeFrom": null,
"timeShift": null,
"title": "Delete Requests Processed / Day",
"tooltip": {
"shared": true,
"sort": 2,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": [ ]
},
"yaxes": [
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": 0,
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
]
"type": "timeseries"
}
],
"repeat": null,
@ -431,232 +342,145 @@
"height": "250px",
"panels": [
{
"aliasColors": { },
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "$datasource",
"fill": 1,
"fieldConfig": {
"defaults": {
"custom": {
"drawStyle": "line",
"fillOpacity": 10,
"lineWidth": 1,
"pointSize": 5,
"showPoints": "never",
"spanNulls": false,
"stacking": {
"group": "A",
"mode": "none"
}
},
"thresholds": {
"mode": "absolute",
"steps": [ ]
},
"unit": "short"
},
"overrides": [ ]
},
"id": 6,
"legend": {
"avg": false,
"current": false,
"max": false,
"min": false,
"show": true,
"total": false,
"values": false
},
"lines": true,
"linewidth": 1,
"links": [ ],
"nullPointMode": "null as zero",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [ ],
"spaceLength": 10,
"options": {
"legend": {
"showLegend": true
},
"tooltip": {
"mode": "single",
"sort": "none"
}
},
"span": 4,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "node_namespace_pod_container:container_cpu_usage_seconds_total:sum_irate{cluster=~\"$cluster\", namespace=~\"$namespace\", container=\"compactor\"}",
"expr": "node_namespace_pod_container:container_cpu_usage_seconds_total:sum_irate{cluster=~\"$cluster\", namespace=~\"$namespace\", pod=~\"(compactor|(loki.*|enterprise-logs)-backend.*|loki-single-binary)\"}",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "{{pod}}",
"legendLink": null,
"step": 10
"legendLink": null
}
],
"thresholds": [ ],
"timeFrom": null,
"timeShift": null,
"title": "Compactor CPU usage",
"tooltip": {
"shared": true,
"sort": 2,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": [ ]
},
"yaxes": [
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": 0,
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
]
"type": "timeseries"
},
{
"aliasColors": { },
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "$datasource",
"fill": 1,
"id": 7,
"legend": {
"avg": false,
"current": false,
"max": false,
"min": false,
"show": true,
"total": false,
"values": false
"fieldConfig": {
"defaults": {
"custom": {
"drawStyle": "line",
"fillOpacity": 10,
"lineWidth": 1,
"pointSize": 5,
"showPoints": "never",
"spanNulls": false,
"stacking": {
"group": "A",
"mode": "none"
}
},
"thresholds": {
"mode": "absolute",
"steps": [ ]
},
"unit": "short"
},
"overrides": [ ]
},
"lines": true,
"linewidth": 1,
"id": 7,
"links": [ ],
"nullPointMode": "null as zero",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [ ],
"spaceLength": 10,
"options": {
"legend": {
"showLegend": true
},
"tooltip": {
"mode": "single",
"sort": "none"
}
},
"span": 4,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "go_memstats_heap_inuse_bytes{cluster=~\"$cluster\", namespace=~\"$namespace\", container=\"compactor\"} / 1024 / 1024 ",
"expr": "go_memstats_heap_inuse_bytes{cluster=~\"$cluster\", namespace=~\"$namespace\", pod=~\"(compactor|(loki.*|enterprise-logs)-backend.*|loki-single-binary)\"} / 1024 / 1024 ",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": " {{pod}} ",
"legendLink": null,
"step": 10
"legendLink": null
}
],
"thresholds": [ ],
"timeFrom": null,
"timeShift": null,
"title": "Compactor memory usage (MiB)",
"tooltip": {
"shared": true,
"sort": 2,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": [ ]
},
"yaxes": [
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": 0,
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
]
"type": "timeseries"
},
{
"aliasColors": { },
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "$datasource",
"fill": 1,
"id": 8,
"legend": {
"avg": false,
"current": false,
"max": false,
"min": false,
"show": true,
"total": false,
"values": false
"fieldConfig": {
"defaults": {
"custom": {
"drawStyle": "line",
"fillOpacity": 10,
"lineWidth": 1,
"pointSize": 5,
"showPoints": "never",
"spanNulls": false,
"stacking": {
"group": "A",
"mode": "none"
}
},
"thresholds": {
"mode": "absolute",
"steps": [ ]
},
"unit": "short"
},
"overrides": [ ]
},
"lines": true,
"linewidth": 1,
"id": 8,
"links": [ ],
"nullPointMode": "null as zero",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [ ],
"spaceLength": 10,
"options": {
"legend": {
"showLegend": true
},
"tooltip": {
"mode": "single",
"sort": "none"
}
},
"span": 4,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "loki_boltdb_shipper_compact_tables_operation_duration_seconds{cluster=~\"$cluster\", namespace=~\"$namespace\"}",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "{{pod}}",
"legendLink": null,
"step": 10
"legendLink": null
}
],
"thresholds": [ ],
"timeFrom": null,
"timeShift": null,
"title": "Compaction run duration (seconds)",
"tooltip": {
"shared": true,
"sort": 2,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": [ ]
},
"yaxes": [
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": 0,
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
]
"type": "timeseries"
}
],
"repeat": null,
@ -671,156 +495,98 @@
"height": "250px",
"panels": [
{
"aliasColors": { },
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "$datasource",
"fill": 1,
"id": 9,
"legend": {
"avg": false,
"current": false,
"max": false,
"min": false,
"show": true,
"total": false,
"values": false
"fieldConfig": {
"defaults": {
"custom": {
"drawStyle": "line",
"fillOpacity": 10,
"lineWidth": 1,
"pointSize": 5,
"showPoints": "never",
"spanNulls": false,
"stacking": {
"group": "A",
"mode": "none"
}
},
"thresholds": {
"mode": "absolute",
"steps": [ ]
},
"unit": "short"
},
"overrides": [ ]
},
"lines": true,
"linewidth": 1,
"id": 9,
"links": [ ],
"nullPointMode": "null as zero",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [ ],
"spaceLength": 10,
"options": {
"legend": {
"showLegend": true
},
"tooltip": {
"mode": "single",
"sort": "none"
}
},
"span": 6,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "sum(increase(loki_compactor_load_pending_requests_attempts_total{status=\"fail\", cluster=~\"$cluster\", namespace=~\"$namespace\"}[1h]))",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "failures",
"legendLink": null,
"step": 10
"legendLink": null
}
],
"thresholds": [ ],
"timeFrom": null,
"timeShift": null,
"title": "Failures in Loading Delete Requests / Hour",
"tooltip": {
"shared": true,
"sort": 2,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": [ ]
},
"yaxes": [
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": 0,
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
]
"type": "timeseries"
},
{
"aliasColors": { },
"bars": false,
"dashLength": 10,
"dashes": false,
"datasource": "$datasource",
"fill": 1,
"id": 10,
"legend": {
"avg": false,
"current": false,
"max": false,
"min": false,
"show": true,
"total": false,
"values": false
"fieldConfig": {
"defaults": {
"custom": {
"drawStyle": "line",
"fillOpacity": 10,
"lineWidth": 1,
"pointSize": 5,
"showPoints": "never",
"spanNulls": false,
"stacking": {
"group": "A",
"mode": "none"
}
},
"thresholds": {
"mode": "absolute",
"steps": [ ]
},
"unit": "short"
},
"overrides": [ ]
},
"lines": true,
"linewidth": 1,
"id": 10,
"links": [ ],
"nullPointMode": "null as zero",
"percentage": false,
"pointradius": 5,
"points": false,
"renderer": "flot",
"seriesOverrides": [ ],
"spaceLength": 10,
"options": {
"legend": {
"showLegend": true
},
"tooltip": {
"mode": "single",
"sort": "none"
}
},
"span": 6,
"stack": false,
"steppedLine": false,
"targets": [
{
"expr": "sum(rate(loki_compactor_deleted_lines{cluster=~\"$cluster\",job=~\"$namespace/compactor\"}[$__rate_interval])) by (user)",
"expr": "sum(rate(loki_compactor_deleted_lines{cluster=~\"$cluster\", namespace=~\"$namespace\", pod=~\"(compactor|(loki.*|enterprise-logs)-backend.*|loki-single-binary)\"}[$__rate_interval])) by (user)",
"format": "time_series",
"intervalFactor": 2,
"legendFormat": "{{user}}",
"legendLink": null,
"step": 10
"legendLink": null
}
],
"thresholds": [ ],
"timeFrom": null,
"timeShift": null,
"title": "Lines Deleted / Sec",
"tooltip": {
"shared": true,
"sort": 2,
"value_type": "individual"
},
"type": "graph",
"xaxis": {
"buckets": null,
"mode": "time",
"name": null,
"show": true,
"values": [ ]
},
"yaxes": [
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": 0,
"show": true
},
{
"format": "short",
"label": null,
"logBase": 1,
"max": null,
"min": null,
"show": false
}
]
"type": "timeseries"
}
],
"repeat": null,
@ -840,7 +606,7 @@
"span": 6,
"targets": [
{
"expr": "{cluster=~\"$cluster\", namespace=~\"$namespace\", container=\"compactor\"} |~ \"Started processing delete request|delete request for user marked as processed\" | logfmt | line_format \"{{.ts}} user={{.user}} delete_request_id={{.delete_request_id}} msg={{.msg}}\" ",
"expr": "{cluster=~\"$cluster\", namespace=~\"$namespace\", pod=~\"(compactor|(loki.*|enterprise-logs)-backend.*|loki-single-binary)\"} |~ \"Started processing delete request|delete request for user marked as processed\" | logfmt | line_format \"{{.ts}} user={{.user}} delete_request_id={{.delete_request_id}} msg={{.msg}}\" ",
"refId": "A"
}
],
@ -853,7 +619,7 @@
"span": 6,
"targets": [
{
"expr": "{cluster=~\"$cluster\", namespace=~\"$namespace\", container=\"compactor\"} |~ \"delete request for user added\" | logfmt | line_format \"{{.ts}} user={{.user}} query='{{.query}}'\"",
"expr": "{cluster=~\"$cluster\", namespace=~\"$namespace\", pod=~\"(compactor|(loki.*|enterprise-logs)-backend.*|loki-single-binary)\"} |~ \"delete request for user added\" | logfmt | line_format \"{{.ts}} user={{.user}} query='{{.query}}'\"",
"refId": "A"
}
],
@ -882,7 +648,7 @@
"value": "default"
},
"hide": 0,
"label": "Data Source",
"label": "Data source",
"name": "datasource",
"options": [ ],
"query": "prometheus",
@ -935,6 +701,16 @@
"tagsQuery": "",
"type": "query",
"useTags": false
},
{
"hide": 0,
"label": null,
"name": "loki_datasource",
"options": [ ],
"query": "loki",
"refresh": 1,
"regex": "",
"type": "datasource"
}
]
},

View file

@ -77,7 +77,7 @@
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"type": "timeseries",
"xaxis": {
"buckets": null,
"mode": "time",
@ -114,6 +114,11 @@
"dashLength": 10,
"dashes": false,
"datasource": "$datasource",
"fieldConfig": {
"defaults": {
"unit": "s"
}
},
"fill": 1,
"fillGradient": 0,
"gridPos": {
@ -164,7 +169,7 @@
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"type": "timeseries",
"xaxis": {
"buckets": null,
"mode": "time",
@ -236,7 +241,7 @@
"steppedLine": false,
"targets": [
{
"expr": "sum(rate(container_cpu_usage_seconds_total{cluster=\"$cluster\", namespace=\"$namespace\", pod=~\"$deployment.*\", pod=~\"$pod\", container=~\"$container\"}[5m]))",
"expr": "sum(rate(container_cpu_usage_seconds_total{cluster=\"$cluster\", namespace=\"$namespace\", pod=~\"$deployment.*\", pod=~\"$pod\", container=~\"$container\"}[$__rate_interval]))",
"refId": "A"
}
],
@ -250,7 +255,7 @@
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"type": "timeseries",
"xaxis": {
"buckets": null,
"mode": "time",
@ -287,6 +292,11 @@
"dashLength": 10,
"dashes": false,
"datasource": "$datasource",
"fieldConfig": {
"defaults": {
"unit": "bytes"
}
},
"fill": 1,
"fillGradient": 0,
"gridPos": {
@ -336,7 +346,7 @@
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"type": "timeseries",
"xaxis": {
"buckets": null,
"mode": "time",
@ -373,6 +383,11 @@
"dashLength": 10,
"dashes": false,
"datasource": "$datasource",
"fieldConfig": {
"defaults": {
"unit": "binBps"
}
},
"fill": 1,
"fillGradient": 0,
"gridPos": {
@ -408,7 +423,7 @@
"steppedLine": false,
"targets": [
{
"expr": "sum(rate(container_network_transmit_bytes_total{cluster=\"$cluster\", namespace=\"$namespace\", pod=~\"$deployment.*\", pod=~\"$pod\"}[5m]))",
"expr": "sum(rate(container_network_transmit_bytes_total{cluster=\"$cluster\", namespace=\"$namespace\", pod=~\"$deployment.*\", pod=~\"$pod\"}[$__rate_interval]))",
"refId": "A"
}
],
@ -422,7 +437,7 @@
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"type": "timeseries",
"xaxis": {
"buckets": null,
"mode": "time",
@ -459,6 +474,11 @@
"dashLength": 10,
"dashes": false,
"datasource": "$datasource",
"fieldConfig": {
"defaults": {
"unit": "binBps"
}
},
"fill": 1,
"fillGradient": 0,
"gridPos": {
@ -494,7 +514,7 @@
"steppedLine": false,
"targets": [
{
"expr": "sum(rate(container_network_receive_bytes_total{cluster=\"$cluster\", namespace=\"$namespace\", pod=~\"$deployment.*\", pod=~\"$pod\"}[5m]))",
"expr": "sum(rate(container_network_receive_bytes_total{cluster=\"$cluster\", namespace=\"$namespace\", pod=~\"$deployment.*\", pod=~\"$pod\"}[$__rate_interval]))",
"refId": "A"
}
],
@ -508,7 +528,7 @@
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"type": "timeseries",
"xaxis": {
"buckets": null,
"mode": "time",
@ -595,7 +615,7 @@
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"type": "timeseries",
"xaxis": {
"buckets": null,
"mode": "time",
@ -632,6 +652,11 @@
"dashLength": 10,
"dashes": false,
"datasource": "$datasource",
"fieldConfig": {
"defaults": {
"unit": "ops"
}
},
"fill": 1,
"fillGradient": 0,
"gridPos": {
@ -667,7 +692,7 @@
"steppedLine": false,
"targets": [
{
"expr": "sum(rate(promtail_custom_bad_words_total{cluster=\"$cluster\", exported_namespace=\"$namespace\", exported_pod=~\"$deployment.*\", exported_pod=~\"$pod\", container=~\"$container\"}[5m])) by (level)",
"expr": "sum(rate(promtail_custom_bad_words_total{cluster=\"$cluster\", exported_namespace=\"$namespace\", exported_pod=~\"$deployment.*\", exported_pod=~\"$pod\", container=~\"$container\"}[$__rate_interval])) by (level)",
"legendFormat": "{{level}}",
"refId": "A"
}
@ -682,7 +707,7 @@
"sort": 0,
"value_type": "individual"
},
"type": "graph",
"type": "timeseries",
"xaxis": {
"buckets": null,
"mode": "time",
@ -719,6 +744,11 @@
"dashLength": 10,
"dashes": false,
"datasource": "$loki_datasource",
"fieldConfig": {
"defaults": {
"unit": "ops"
}
},
"fill": 1,
"fillGradient": 0,
"gridPos": {
@ -771,7 +801,7 @@
"steppedLine": false,
"targets": [
{
"expr": "sum(rate({cluster=\"$cluster\", namespace=\"$namespace\", pod=~\"$deployment.*\", pod=~\"$pod\", container=~\"$container\" } |logfmt| level=\"$level\" |= \"$filter\" [5m])) by (level)",
"expr": "sum(rate({cluster=\"$cluster\", namespace=\"$namespace\", pod=~\"$deployment.*\", pod=~\"$pod\", container=~\"$container\" } |logfmt| level=\"$level\" |= \"$filter\" | __error__=\"\" [$__auto])) by (level)",
"intervalFactor": 3,
"legendFormat": "{{level}}",
"refId": "A"
@ -787,7 +817,7 @@
"sort": 2,
"value_type": "individual"
},
"type": "graph",
"type": "timeseries",
"xaxis": {
"buckets": null,
"mode": "time",
@ -861,7 +891,7 @@
"value": "default"
},
"hide": 0,
"label": "Data Source",
"label": "Data source",
"name": "datasource",
"options": [ ],
"query": "prometheus",

View file

@ -300,7 +300,8 @@
"value": 80
}
]
}
},
"unit": "s"
},
"overrides": [ ]
},
@ -600,7 +601,7 @@
"value": "default"
},
"hide": 0,
"label": "Data Source",
"label": "Data source",
"name": "datasource",
"options": [ ],
"query": "prometheus",

File diff suppressed because it is too large Load diff

File diff suppressed because it is too large Load diff

Some files were not shown because too many files have changed in this diff Show more