mirror of
https://github.com/monitoring-mixins/website.git
synced 2024-12-14 11:37:31 +00:00
1073 lines
34 KiB
JSON
1073 lines
34 KiB
JSON
{
|
|
"__inputs": [ ],
|
|
"__requires": [ ],
|
|
"annotations": {
|
|
"list": [ ]
|
|
},
|
|
"description": "",
|
|
"editable": false,
|
|
"gnetId": null,
|
|
"graphTooltip": 0,
|
|
"hideControls": false,
|
|
"id": null,
|
|
"links": [
|
|
{
|
|
"asDropdown": false,
|
|
"icon": "external link",
|
|
"includeVars": true,
|
|
"keepTime": true,
|
|
"tags": [
|
|
"apache-hadoop-mixin"
|
|
],
|
|
"targetBlank": false,
|
|
"title": "Other Apache Hadoop dashboards",
|
|
"type": "dashboards",
|
|
"url": ""
|
|
}
|
|
],
|
|
"panels": [
|
|
{
|
|
"datasource": {
|
|
"uid": "${prometheus_datasource}"
|
|
},
|
|
"description": "The number of Node Managers by state in the Hadoop ResourceManager.",
|
|
"fieldConfig": {
|
|
"defaults": {
|
|
"color": {
|
|
"mode": "thresholds"
|
|
},
|
|
"mappings": [ ],
|
|
"thresholds": {
|
|
"mode": "absolute",
|
|
"steps": [
|
|
{
|
|
"color": "green",
|
|
"value": null
|
|
}
|
|
]
|
|
}
|
|
},
|
|
"overrides": [ ]
|
|
},
|
|
"gridPos": {
|
|
"h": 9,
|
|
"w": 24,
|
|
"x": 0,
|
|
"y": 0
|
|
},
|
|
"id": 2,
|
|
"options": {
|
|
"displayMode": "gradient",
|
|
"minVizHeight": 10,
|
|
"minVizWidth": 0,
|
|
"orientation": "horizontal",
|
|
"reduceOptions": {
|
|
"calcs": [
|
|
"lastNotNull"
|
|
],
|
|
"fields": "",
|
|
"values": false
|
|
},
|
|
"showUnfilled": true,
|
|
"valueMode": "color"
|
|
},
|
|
"pluginVersion": "10.0.2-cloud.1.94a6f396",
|
|
"targets": [
|
|
{
|
|
"datasource": {
|
|
"uid": "${prometheus_datasource}"
|
|
},
|
|
"expr": "hadoop_resourcemanager_numactivenms{job=~\"$job\", instance=~\"$instance\", hadoop_cluster=~\"$hadoop_cluster\", name=\"ClusterMetrics\",}",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "active"
|
|
},
|
|
{
|
|
"datasource": {
|
|
"uid": "${prometheus_datasource}"
|
|
},
|
|
"expr": "hadoop_resourcemanager_numdecommissionednms{job=~\"$job\", instance=~\"$instance\", hadoop_cluster=~\"$hadoop_cluster\", name=\"ClusterMetrics\",}",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "decommissioned"
|
|
},
|
|
{
|
|
"datasource": {
|
|
"uid": "${prometheus_datasource}"
|
|
},
|
|
"expr": "hadoop_resourcemanager_numlostnms{job=~\"$job\", instance=~\"$instance\", hadoop_cluster=~\"$hadoop_cluster\", name=\"ClusterMetrics\"}",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "lost"
|
|
},
|
|
{
|
|
"datasource": {
|
|
"uid": "${prometheus_datasource}"
|
|
},
|
|
"expr": "hadoop_resourcemanager_numunhealthynms{job=~\"$job\", instance=~\"$instance\", hadoop_cluster=~\"$hadoop_cluster\", name=\"ClusterMetrics\"}",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "healthy"
|
|
},
|
|
{
|
|
"datasource": {
|
|
"uid": "${prometheus_datasource}"
|
|
},
|
|
"expr": "hadoop_resourcemanager_numrebootednms{job=~\"$job\", instance=~\"$instance\", hadoop_cluster=~\"$hadoop_cluster\", name=\"ClusterMetrics\"}",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "rebooted"
|
|
},
|
|
{
|
|
"datasource": {
|
|
"uid": "${prometheus_datasource}"
|
|
},
|
|
"expr": "hadoop_resourcemanager_numshutdownnms{job=~\"$job\", instance=~\"$instance\", hadoop_cluster=~\"$hadoop_cluster\", name=\"ClusterMetrics\"}",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "shutdown"
|
|
}
|
|
],
|
|
"title": "Node Managers state",
|
|
"type": "bargauge"
|
|
},
|
|
{
|
|
"collapsed": false,
|
|
"datasource": {
|
|
"uid": "${prometheus_datasource}"
|
|
},
|
|
"gridPos": {
|
|
"h": 1,
|
|
"w": 24,
|
|
"x": 0,
|
|
"y": 9
|
|
},
|
|
"id": 3,
|
|
"targets": [
|
|
{
|
|
"datasource": {
|
|
"uid": "${prometheus_datasource}"
|
|
},
|
|
"expr": "",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": ""
|
|
}
|
|
],
|
|
"title": "Applications",
|
|
"type": "row"
|
|
},
|
|
{
|
|
"datasource": {
|
|
"uid": "${prometheus_datasource}"
|
|
},
|
|
"description": "Number of applications by state for the Hadoop ResourceManager.",
|
|
"fieldConfig": {
|
|
"defaults": {
|
|
"color": {
|
|
"mode": "palette-classic"
|
|
},
|
|
"custom": {
|
|
"axisCenteredZero": false,
|
|
"axisColorMode": "text",
|
|
"axisLabel": "",
|
|
"axisPlacement": "auto",
|
|
"barAlignment": 0,
|
|
"drawStyle": "line",
|
|
"fillOpacity": 0,
|
|
"gradientMode": "none",
|
|
"hideFrom": {
|
|
"legend": false,
|
|
"tooltip": false,
|
|
"viz": false
|
|
},
|
|
"lineInterpolation": "linear",
|
|
"lineWidth": 1,
|
|
"pointSize": 5,
|
|
"scaleDistribution": {
|
|
"type": "linear"
|
|
},
|
|
"showPoints": "auto",
|
|
"spanNulls": false,
|
|
"stacking": {
|
|
"group": "A",
|
|
"mode": "none"
|
|
},
|
|
"thresholdsStyle": {
|
|
"mode": "off"
|
|
}
|
|
},
|
|
"mappings": [ ],
|
|
"thresholds": {
|
|
"mode": "absolute",
|
|
"steps": [
|
|
{
|
|
"color": "green",
|
|
"value": null
|
|
},
|
|
{
|
|
"color": "red",
|
|
"value": 80
|
|
}
|
|
]
|
|
}
|
|
},
|
|
"overrides": [ ]
|
|
},
|
|
"gridPos": {
|
|
"h": 8,
|
|
"w": 24,
|
|
"x": 0,
|
|
"y": 10
|
|
},
|
|
"id": 4,
|
|
"options": {
|
|
"legend": {
|
|
"calcs": [ ],
|
|
"displayMode": "list",
|
|
"placement": "bottom",
|
|
"showLegend": true
|
|
},
|
|
"tooltip": {
|
|
"mode": "multi",
|
|
"sort": "desc"
|
|
}
|
|
},
|
|
"targets": [
|
|
{
|
|
"datasource": {
|
|
"uid": "${prometheus_datasource}"
|
|
},
|
|
"expr": "hadoop_resourcemanager_appsrunning{job=~\"$job\", instance=~\"$instance\", hadoop_cluster=~\"$hadoop_cluster\", name=\"QueueMetrics\",q0=\"root\", q1=\"default\"}",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "running"
|
|
},
|
|
{
|
|
"datasource": {
|
|
"uid": "${prometheus_datasource}"
|
|
},
|
|
"expr": "hadoop_resourcemanager_appspending{job=~\"$job\", instance=~\"$instance\", hadoop_cluster=~\"$hadoop_cluster\", name=\"QueueMetrics\",q0=\"root\", q1=\"default\"}",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "pending"
|
|
},
|
|
{
|
|
"datasource": {
|
|
"uid": "${prometheus_datasource}"
|
|
},
|
|
"expr": "hadoop_resourcemanager_appskilled{job=~\"$job\", instance=~\"$instance\", hadoop_cluster=~\"$hadoop_cluster\", name=\"QueueMetrics\",q0=\"root\", q1=\"default\"}",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "killed"
|
|
},
|
|
{
|
|
"datasource": {
|
|
"uid": "${prometheus_datasource}"
|
|
},
|
|
"expr": "hadoop_resourcemanager_appssubmitted{job=~\"$job\", instance=~\"$instance\", hadoop_cluster=~\"$hadoop_cluster\", name=\"QueueMetrics\",q0=\"root\", q1=\"default\"}",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "submitted"
|
|
},
|
|
{
|
|
"datasource": {
|
|
"uid": "${prometheus_datasource}"
|
|
},
|
|
"expr": "hadoop_resourcemanager_appscompleted{job=~\"$job\", instance=~\"$instance\", hadoop_cluster=~\"$hadoop_cluster\", name=\"QueueMetrics\",q0=\"root\", q1=\"default\"}",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "completed"
|
|
},
|
|
{
|
|
"datasource": {
|
|
"uid": "${prometheus_datasource}"
|
|
},
|
|
"expr": "hadoop_resourcemanager_appsfailed{job=~\"$job\", instance=~\"$instance\", hadoop_cluster=~\"$hadoop_cluster\", name=\"QueueMetrics\",q0=\"root\", q1=\"default\"}",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "failed"
|
|
}
|
|
],
|
|
"title": "Applications state",
|
|
"type": "timeseries"
|
|
},
|
|
{
|
|
"datasource": {
|
|
"uid": "${prometheus_datasource}"
|
|
},
|
|
"description": "The available memory in the Hadoop ResourceManager.",
|
|
"fieldConfig": {
|
|
"defaults": {
|
|
"color": {
|
|
"mode": "palette-classic"
|
|
},
|
|
"custom": {
|
|
"axisCenteredZero": false,
|
|
"axisColorMode": "text",
|
|
"axisLabel": "",
|
|
"axisPlacement": "auto",
|
|
"barAlignment": 0,
|
|
"drawStyle": "line",
|
|
"fillOpacity": 0,
|
|
"gradientMode": "none",
|
|
"hideFrom": {
|
|
"legend": false,
|
|
"tooltip": false,
|
|
"viz": false
|
|
},
|
|
"lineInterpolation": "linear",
|
|
"lineWidth": 1,
|
|
"pointSize": 5,
|
|
"scaleDistribution": {
|
|
"type": "linear"
|
|
},
|
|
"showPoints": "auto",
|
|
"spanNulls": false,
|
|
"stacking": {
|
|
"group": "A",
|
|
"mode": "none"
|
|
},
|
|
"thresholdsStyle": {
|
|
"mode": "off"
|
|
}
|
|
},
|
|
"mappings": [ ],
|
|
"thresholds": {
|
|
"mode": "absolute",
|
|
"steps": [
|
|
{
|
|
"color": "green",
|
|
"value": null
|
|
}
|
|
]
|
|
},
|
|
"unit": "decmbytes"
|
|
},
|
|
"overrides": [ ]
|
|
},
|
|
"gridPos": {
|
|
"h": 6,
|
|
"w": 12,
|
|
"x": 0,
|
|
"y": 18
|
|
},
|
|
"id": 5,
|
|
"options": {
|
|
"legend": {
|
|
"calcs": [ ],
|
|
"displayMode": "list",
|
|
"placement": "bottom",
|
|
"showLegend": true
|
|
},
|
|
"tooltip": {
|
|
"mode": "multi",
|
|
"sort": "desc"
|
|
}
|
|
},
|
|
"targets": [
|
|
{
|
|
"datasource": {
|
|
"uid": "${prometheus_datasource}"
|
|
},
|
|
"expr": "hadoop_resourcemanager_allocatedmb{job=~\"$job\", instance=~\"$instance\", hadoop_cluster=~\"$hadoop_cluster\", name=\"QueueMetrics\",q0=\"root\", q1=\"default\"}",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "allocated"
|
|
},
|
|
{
|
|
"datasource": {
|
|
"uid": "${prometheus_datasource}"
|
|
},
|
|
"expr": "hadoop_resourcemanager_availablemb{job=~\"$job\", instance=~\"$instance\", hadoop_cluster=~\"$hadoop_cluster\", name=\"QueueMetrics\",q0=\"root\", q1=\"default\"}",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "available"
|
|
}
|
|
],
|
|
"title": "Available memory",
|
|
"type": "timeseries"
|
|
},
|
|
{
|
|
"datasource": {
|
|
"uid": "${prometheus_datasource}"
|
|
},
|
|
"description": "The available virtual cores in the Hadoop ResourceManager.",
|
|
"fieldConfig": {
|
|
"defaults": {
|
|
"color": {
|
|
"mode": "palette-classic"
|
|
},
|
|
"custom": {
|
|
"axisCenteredZero": false,
|
|
"axisColorMode": "text",
|
|
"axisLabel": "",
|
|
"axisPlacement": "auto",
|
|
"barAlignment": 0,
|
|
"drawStyle": "line",
|
|
"fillOpacity": 0,
|
|
"gradientMode": "none",
|
|
"hideFrom": {
|
|
"legend": false,
|
|
"tooltip": false,
|
|
"viz": false
|
|
},
|
|
"lineInterpolation": "linear",
|
|
"lineWidth": 1,
|
|
"pointSize": 5,
|
|
"scaleDistribution": {
|
|
"type": "linear"
|
|
},
|
|
"showPoints": "auto",
|
|
"spanNulls": false,
|
|
"stacking": {
|
|
"group": "A",
|
|
"mode": "none"
|
|
},
|
|
"thresholdsStyle": {
|
|
"mode": "off"
|
|
}
|
|
},
|
|
"mappings": [ ],
|
|
"thresholds": {
|
|
"mode": "absolute",
|
|
"steps": [
|
|
{
|
|
"color": "green",
|
|
"value": null
|
|
}
|
|
]
|
|
},
|
|
"unit": ""
|
|
},
|
|
"overrides": [ ]
|
|
},
|
|
"gridPos": {
|
|
"h": 6,
|
|
"w": 12,
|
|
"x": 12,
|
|
"y": 18
|
|
},
|
|
"id": 6,
|
|
"options": {
|
|
"legend": {
|
|
"calcs": [ ],
|
|
"displayMode": "list",
|
|
"placement": "bottom",
|
|
"showLegend": true
|
|
},
|
|
"tooltip": {
|
|
"mode": "multi",
|
|
"sort": "desc"
|
|
}
|
|
},
|
|
"targets": [
|
|
{
|
|
"datasource": {
|
|
"uid": "${prometheus_datasource}"
|
|
},
|
|
"expr": "hadoop_resourcemanager_availablevcores{job=~\"$job\", instance=~\"$instance\", hadoop_cluster=~\"$hadoop_cluster\", name=\"QueueMetrics\",q0=\"root\", q1=\"default\"}",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "available"
|
|
},
|
|
{
|
|
"datasource": {
|
|
"uid": "${prometheus_datasource}"
|
|
},
|
|
"expr": "hadoop_resourcemanager_allocatedvcores{job=~\"$job\", instance=~\"$instance\", hadoop_cluster=~\"$hadoop_cluster\", name=\"QueueMetrics\",q0=\"root\", q1=\"default\"}",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "allocated"
|
|
}
|
|
],
|
|
"title": "Available virtual cores",
|
|
"type": "timeseries"
|
|
},
|
|
{
|
|
"collapsed": false,
|
|
"datasource": {
|
|
"uid": "${prometheus_datasource}"
|
|
},
|
|
"gridPos": {
|
|
"h": 1,
|
|
"w": 24,
|
|
"x": 0,
|
|
"y": 24
|
|
},
|
|
"id": 7,
|
|
"targets": [
|
|
{
|
|
"datasource": {
|
|
"uid": "${prometheus_datasource}"
|
|
},
|
|
"expr": "",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": ""
|
|
}
|
|
],
|
|
"title": "JVM",
|
|
"type": "row"
|
|
},
|
|
{
|
|
"datasource": {
|
|
"uid": "${prometheus_datasource}"
|
|
},
|
|
"description": "The Heap and non-heap memory used for the ResourceManager.",
|
|
"fieldConfig": {
|
|
"defaults": {
|
|
"color": {
|
|
"mode": "palette-classic"
|
|
},
|
|
"custom": {
|
|
"axisCenteredZero": false,
|
|
"axisColorMode": "text",
|
|
"axisLabel": "",
|
|
"axisPlacement": "auto",
|
|
"barAlignment": 0,
|
|
"drawStyle": "line",
|
|
"fillOpacity": 0,
|
|
"gradientMode": "none",
|
|
"hideFrom": {
|
|
"legend": false,
|
|
"tooltip": false,
|
|
"viz": false
|
|
},
|
|
"lineInterpolation": "linear",
|
|
"lineWidth": 1,
|
|
"pointSize": 5,
|
|
"scaleDistribution": {
|
|
"type": "linear"
|
|
},
|
|
"showPoints": "auto",
|
|
"spanNulls": false,
|
|
"stacking": {
|
|
"group": "A",
|
|
"mode": "normal"
|
|
},
|
|
"thresholdsStyle": {
|
|
"mode": "off"
|
|
}
|
|
},
|
|
"mappings": [ ],
|
|
"thresholds": {
|
|
"mode": "absolute",
|
|
"steps": [
|
|
{
|
|
"color": "green",
|
|
"value": null
|
|
}
|
|
]
|
|
},
|
|
"unit": "decmbytes"
|
|
},
|
|
"overrides": [ ]
|
|
},
|
|
"gridPos": {
|
|
"h": 6,
|
|
"w": 12,
|
|
"x": 0,
|
|
"y": 25
|
|
},
|
|
"id": 8,
|
|
"options": {
|
|
"legend": {
|
|
"calcs": [ ],
|
|
"displayMode": "list",
|
|
"placement": "bottom",
|
|
"showLegend": true
|
|
},
|
|
"tooltip": {
|
|
"mode": "multi",
|
|
"sort": "desc"
|
|
}
|
|
},
|
|
"pluginVersion": "10.0.2-cloud.1.94a6f396",
|
|
"targets": [
|
|
{
|
|
"datasource": {
|
|
"uid": "${prometheus_datasource}"
|
|
},
|
|
"expr": "hadoop_resourcemanager_memheapusedm{name=\"JvmMetrics\", job=~\"$job\", instance=~\"$instance\", hadoop_cluster=~\"$hadoop_cluster\"}",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "heap"
|
|
},
|
|
{
|
|
"datasource": {
|
|
"uid": "${prometheus_datasource}"
|
|
},
|
|
"expr": "hadoop_resourcemanager_memnonheapusedm{name=\"JvmMetrics\", job=~\"$job\", instance=~\"$instance\", hadoop_cluster=~\"$hadoop_cluster\"}",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "nonheap"
|
|
}
|
|
],
|
|
"title": "Memory used",
|
|
"type": "timeseries"
|
|
},
|
|
{
|
|
"datasource": {
|
|
"uid": "${prometheus_datasource}"
|
|
},
|
|
"description": "The Heap and non-heap memory committed for the ResourceManager.",
|
|
"fieldConfig": {
|
|
"defaults": {
|
|
"color": {
|
|
"mode": "palette-classic"
|
|
},
|
|
"custom": {
|
|
"axisCenteredZero": false,
|
|
"axisColorMode": "text",
|
|
"axisLabel": "",
|
|
"axisPlacement": "auto",
|
|
"barAlignment": 0,
|
|
"drawStyle": "line",
|
|
"fillOpacity": 0,
|
|
"gradientMode": "none",
|
|
"hideFrom": {
|
|
"legend": false,
|
|
"tooltip": false,
|
|
"viz": false
|
|
},
|
|
"lineInterpolation": "linear",
|
|
"lineWidth": 1,
|
|
"pointSize": 5,
|
|
"scaleDistribution": {
|
|
"type": "linear"
|
|
},
|
|
"showPoints": "auto",
|
|
"spanNulls": false,
|
|
"stacking": {
|
|
"group": "A",
|
|
"mode": "none"
|
|
},
|
|
"thresholdsStyle": {
|
|
"mode": "off"
|
|
}
|
|
},
|
|
"mappings": [ ],
|
|
"thresholds": {
|
|
"mode": "absolute",
|
|
"steps": [
|
|
{
|
|
"color": "green",
|
|
"value": null
|
|
}
|
|
]
|
|
},
|
|
"unit": "decmbytes"
|
|
},
|
|
"overrides": [ ]
|
|
},
|
|
"gridPos": {
|
|
"h": 6,
|
|
"w": 12,
|
|
"x": 12,
|
|
"y": 25
|
|
},
|
|
"id": 9,
|
|
"options": {
|
|
"legend": {
|
|
"calcs": [ ],
|
|
"displayMode": "list",
|
|
"placement": "bottom",
|
|
"showLegend": true
|
|
},
|
|
"tooltip": {
|
|
"mode": "multi",
|
|
"sort": "desc"
|
|
}
|
|
},
|
|
"targets": [
|
|
{
|
|
"datasource": {
|
|
"uid": "${prometheus_datasource}"
|
|
},
|
|
"expr": "hadoop_resourcemanager_memheapcommittedm{name=\"JvmMetrics\", job=~\"$job\", instance=~\"$instance\", hadoop_cluster=~\"$hadoop_cluster\"}",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "heap"
|
|
},
|
|
{
|
|
"datasource": {
|
|
"uid": "${prometheus_datasource}"
|
|
},
|
|
"expr": "hadoop_resourcemanager_memnonheapcommittedm{name=\"JvmMetrics\", job=~\"$job\", instance=~\"$instance\", hadoop_cluster=~\"$hadoop_cluster\"}",
|
|
"format": "time_series",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "nonheap"
|
|
}
|
|
],
|
|
"title": "Memory committed",
|
|
"type": "timeseries"
|
|
},
|
|
{
|
|
"datasource": {
|
|
"uid": "${prometheus_datasource}"
|
|
},
|
|
"description": "The recent increase in the number of garbage collection events for the ResourceManager JVM.",
|
|
"fieldConfig": {
|
|
"defaults": {
|
|
"color": {
|
|
"mode": "palette-classic"
|
|
},
|
|
"custom": {
|
|
"axisCenteredZero": false,
|
|
"axisColorMode": "text",
|
|
"axisLabel": "",
|
|
"axisPlacement": "auto",
|
|
"barAlignment": 0,
|
|
"drawStyle": "line",
|
|
"fillOpacity": 0,
|
|
"gradientMode": "none",
|
|
"hideFrom": {
|
|
"legend": false,
|
|
"tooltip": false,
|
|
"viz": false
|
|
},
|
|
"lineInterpolation": "linear",
|
|
"lineWidth": 1,
|
|
"pointSize": 5,
|
|
"scaleDistribution": {
|
|
"type": "linear"
|
|
},
|
|
"showPoints": "auto",
|
|
"spanNulls": false,
|
|
"stacking": {
|
|
"group": "A",
|
|
"mode": "none"
|
|
},
|
|
"thresholdsStyle": {
|
|
"mode": "off"
|
|
}
|
|
},
|
|
"mappings": [ ],
|
|
"thresholds": {
|
|
"mode": "absolute",
|
|
"steps": [
|
|
{
|
|
"color": "green",
|
|
"value": null
|
|
}
|
|
]
|
|
},
|
|
"unit": ""
|
|
},
|
|
"overrides": [ ]
|
|
},
|
|
"gridPos": {
|
|
"h": 6,
|
|
"w": 12,
|
|
"x": 0,
|
|
"y": 31
|
|
},
|
|
"id": 10,
|
|
"options": {
|
|
"legend": {
|
|
"calcs": [ ],
|
|
"displayMode": "list",
|
|
"placement": "bottom",
|
|
"showLegend": true
|
|
},
|
|
"tooltip": {
|
|
"mode": "multi",
|
|
"sort": "desc"
|
|
}
|
|
},
|
|
"targets": [
|
|
{
|
|
"datasource": {
|
|
"uid": "${prometheus_datasource}"
|
|
},
|
|
"expr": "increase(hadoop_resourcemanager_gccount{job=~\"$job\", instance=~\"$instance\", hadoop_cluster=~\"$hadoop_cluster\"}[$__interval:])",
|
|
"format": "time_series",
|
|
"interval": "1m",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "{{hadoop_cluster}} - {{instance}}"
|
|
}
|
|
],
|
|
"title": "Garbage collection count",
|
|
"type": "timeseries"
|
|
},
|
|
{
|
|
"datasource": {
|
|
"uid": "${prometheus_datasource}"
|
|
},
|
|
"description": "The average duration for each garbage collection operation in the ResourceManager JVM.",
|
|
"fieldConfig": {
|
|
"defaults": {
|
|
"color": {
|
|
"mode": "palette-classic"
|
|
},
|
|
"custom": {
|
|
"axisCenteredZero": false,
|
|
"axisColorMode": "text",
|
|
"axisLabel": "",
|
|
"axisPlacement": "auto",
|
|
"barAlignment": 0,
|
|
"drawStyle": "line",
|
|
"fillOpacity": 0,
|
|
"gradientMode": "none",
|
|
"hideFrom": {
|
|
"legend": false,
|
|
"tooltip": false,
|
|
"viz": false
|
|
},
|
|
"lineInterpolation": "linear",
|
|
"lineWidth": 1,
|
|
"pointSize": 5,
|
|
"scaleDistribution": {
|
|
"type": "linear"
|
|
},
|
|
"showPoints": "auto",
|
|
"spanNulls": false,
|
|
"stacking": {
|
|
"group": "A",
|
|
"mode": "none"
|
|
},
|
|
"thresholdsStyle": {
|
|
"mode": "off"
|
|
}
|
|
},
|
|
"mappings": [ ],
|
|
"thresholds": {
|
|
"mode": "absolute",
|
|
"steps": [
|
|
{
|
|
"color": "green",
|
|
"value": null
|
|
}
|
|
]
|
|
},
|
|
"unit": "ms"
|
|
},
|
|
"overrides": [ ]
|
|
},
|
|
"gridPos": {
|
|
"h": 6,
|
|
"w": 12,
|
|
"x": 12,
|
|
"y": 31
|
|
},
|
|
"id": 11,
|
|
"options": {
|
|
"legend": {
|
|
"calcs": [ ],
|
|
"displayMode": "list",
|
|
"placement": "bottom",
|
|
"showLegend": true
|
|
},
|
|
"tooltip": {
|
|
"mode": "multi",
|
|
"sort": "desc"
|
|
}
|
|
},
|
|
"targets": [
|
|
{
|
|
"datasource": {
|
|
"uid": "${prometheus_datasource}"
|
|
},
|
|
"expr": "increase(hadoop_resourcemanager_gctimemillis{job=~\"$job\", instance=~\"$instance\", hadoop_cluster=~\"$hadoop_cluster\"}[$__interval:]) / clamp_min(increase(hadoop_resourcemanager_gccount{job=~\"$job\", instance=~\"$instance\", hadoop_cluster=~\"$hadoop_cluster\"}[$__interval:]), 1)",
|
|
"format": "time_series",
|
|
"interval": "1m",
|
|
"intervalFactor": 2,
|
|
"legendFormat": "{{hadoop_cluster}} - {{instance}}"
|
|
}
|
|
],
|
|
"title": "Average garbage collection time",
|
|
"type": "timeseries"
|
|
},
|
|
{
|
|
"datasource": {
|
|
"uid": "${loki_datasource}"
|
|
},
|
|
"description": "The ResourceManager logs.",
|
|
"gridPos": {
|
|
"h": 8,
|
|
"w": 24,
|
|
"x": 0,
|
|
"y": 37
|
|
},
|
|
"id": 12,
|
|
"options": {
|
|
"dedupStrategy": "none",
|
|
"enableLogDetails": true,
|
|
"prettifyLogMessage": false,
|
|
"showCommonLabels": false,
|
|
"showLabels": false,
|
|
"showTime": false,
|
|
"sortOrder": "Descending",
|
|
"wrapLogMessage": false
|
|
},
|
|
"targets": [
|
|
{
|
|
"datasource": {
|
|
"uid": "${loki_datasource}"
|
|
},
|
|
"editorMode": "code",
|
|
"expr": "{job=~\"$job\", instance=~\"$instance\", hadoop_cluster=~\"$hadoop_cluster\"} |= `` | (filename=~\".*/hadoop/logs/.*-resourcemanager.*.log\" or log_type=\"resourcemanager\")",
|
|
"queryType": "range",
|
|
"refId": "A"
|
|
}
|
|
],
|
|
"title": "ResourceManager logs",
|
|
"type": "logs"
|
|
}
|
|
],
|
|
"refresh": "1m",
|
|
"rows": [ ],
|
|
"schemaVersion": 14,
|
|
"style": "dark",
|
|
"tags": [
|
|
"apache-hadoop-mixin"
|
|
],
|
|
"templating": {
|
|
"list": [
|
|
{
|
|
"current": { },
|
|
"hide": 0,
|
|
"label": "Data Source",
|
|
"name": "prometheus_datasource",
|
|
"options": [ ],
|
|
"query": "prometheus",
|
|
"refresh": 1,
|
|
"regex": "",
|
|
"type": "datasource"
|
|
},
|
|
{
|
|
"current": { },
|
|
"hide": 0,
|
|
"label": "Loki Datasource",
|
|
"name": "loki_datasource",
|
|
"options": [ ],
|
|
"query": "loki",
|
|
"refresh": 1,
|
|
"regex": "",
|
|
"type": "datasource"
|
|
},
|
|
{
|
|
"allValue": ".+",
|
|
"current": { },
|
|
"datasource": {
|
|
"uid": "${prometheus_datasource}"
|
|
},
|
|
"hide": 0,
|
|
"includeAll": true,
|
|
"label": "Job",
|
|
"multi": true,
|
|
"name": "job",
|
|
"options": [ ],
|
|
"query": "label_values(hadoop_resourcemanager_activeapplications,job)",
|
|
"refresh": 2,
|
|
"regex": "",
|
|
"sort": 1,
|
|
"tagValuesQuery": "",
|
|
"tags": [ ],
|
|
"tagsQuery": "",
|
|
"type": "query",
|
|
"useTags": false
|
|
},
|
|
{
|
|
"allValue": ".*",
|
|
"current": { },
|
|
"datasource": {
|
|
"uid": "${prometheus_datasource}"
|
|
},
|
|
"hide": 2,
|
|
"includeAll": true,
|
|
"label": "Cluster",
|
|
"multi": true,
|
|
"name": "cluster",
|
|
"options": [ ],
|
|
"query": "label_values(hadoop_resourcemanager_activeapplications{job=~\"$job\"}, cluster)",
|
|
"refresh": 2,
|
|
"regex": "",
|
|
"sort": 0,
|
|
"tagValuesQuery": "",
|
|
"tags": [ ],
|
|
"tagsQuery": "",
|
|
"type": "query",
|
|
"useTags": false
|
|
},
|
|
{
|
|
"allValue": ".+",
|
|
"current": { },
|
|
"datasource": {
|
|
"uid": "${prometheus_datasource}"
|
|
},
|
|
"hide": 0,
|
|
"includeAll": true,
|
|
"label": "Instance",
|
|
"multi": true,
|
|
"name": "instance",
|
|
"options": [ ],
|
|
"query": "label_values(hadoop_resourcemanager_activeapplications{job=~\"$job\"}, instance)",
|
|
"refresh": 2,
|
|
"regex": "",
|
|
"sort": 1,
|
|
"tagValuesQuery": "",
|
|
"tags": [ ],
|
|
"tagsQuery": "",
|
|
"type": "query",
|
|
"useTags": false
|
|
},
|
|
{
|
|
"allValue": ".+",
|
|
"current": { },
|
|
"datasource": {
|
|
"uid": "${prometheus_datasource}"
|
|
},
|
|
"hide": 0,
|
|
"includeAll": true,
|
|
"label": "Hadoop cluster",
|
|
"multi": true,
|
|
"name": "hadoop_cluster",
|
|
"options": [ ],
|
|
"query": "label_values(hadoop_resourcemanager_activeapplications{job=~\"$job\"}, hadoop_cluster)",
|
|
"refresh": 2,
|
|
"regex": "",
|
|
"sort": 1,
|
|
"tagValuesQuery": "",
|
|
"tags": [ ],
|
|
"tagsQuery": "",
|
|
"type": "query",
|
|
"useTags": false
|
|
}
|
|
]
|
|
},
|
|
"time": {
|
|
"from": "now-1h",
|
|
"to": "now"
|
|
},
|
|
"timepicker": {
|
|
"refresh_intervals": [
|
|
"5s",
|
|
"10s",
|
|
"30s",
|
|
"1m",
|
|
"5m",
|
|
"15m",
|
|
"30m",
|
|
"1h",
|
|
"2h",
|
|
"1d"
|
|
],
|
|
"time_options": [
|
|
"5m",
|
|
"15m",
|
|
"1h",
|
|
"6h",
|
|
"12h",
|
|
"24h",
|
|
"2d",
|
|
"7d",
|
|
"30d"
|
|
]
|
|
},
|
|
"timezone": "default",
|
|
"title": "Apache Hadoop ResourceManager overview",
|
|
"uid": "apache-hadoop-resourcemanager-overview",
|
|
"version": 0
|
|
}
|