Path: blob/main/operations/observability/mixins/workspace/dashboards/node-problem-detector.json
2501 views
{
  "annotations": {
    "list": [
      {
        "builtIn": 1,
        "datasource": {
          "type": "datasource",
          "uid": "grafana"
        },
        "enable": true,
        "hide": true,
        "iconColor": "rgba(0, 211, 255, 1)",
        "name": "Annotations & Alerts",
        "target": {
          "limit": 100,
          "matchAny": false,
          "tags": [],
          "type": "dashboard"
        },
        "type": "dashboard"
      }
    ]
  },
  "description": "",
  "editable": true,
  "fiscalYearStartMonth": 0,
  "graphTooltip": 1,
  "id": 71,
  "links": [],
  "liveNow": false,
  "panels": [
    {
      "collapsed": false,
      "datasource": {
        "type": "datasource",
        "uid": "grafana"
      },
      "gridPos": {
        "h": 1,
        "w": 24,
        "x": 0,
        "y": 0
      },
      "id": 4,
      "panels": [],
      "targets": [
        {
          "datasource": {
            "type": "datasource",
            "uid": "grafana"
          },
          "refId": "A"
        }
      ],
      "title": "Totals",
      "type": "row"
    },
    {
      "datasource": {
        "type": "prometheus",
        "uid": "${datasource}"
      },
      "fieldConfig": {
        "defaults": {
          "color": {
            "mode": "palette-classic"
          },
          "custom": {
            "axisLabel": "",
            "axisPlacement": "auto",
            "barAlignment": 0,
            "drawStyle": "line",
            "fillOpacity": 0,
            "gradientMode": "none",
            "hideFrom": {
              "legend": false,
              "tooltip": false,
              "viz": false
            },
            "lineInterpolation": "linear",
            "lineWidth": 1,
            "pointSize": 5,
            "scaleDistribution": {
              "type": "linear"
            },
            "showPoints": "auto",
            "spanNulls": false,
            "stacking": {
              "group": "A",
              "mode": "none"
            },
            "thresholdsStyle": {
              "mode": "off"
            }
          },
          "mappings": [],
          "min": 0,
          "thresholds": {
            "mode": "absolute",
            "steps": [
              {
                "color": "green",
                "value": null
              },
              {
                "color": "red",
                "value": 80
              }
            ]
          }
        },
        "overrides": []
      },
      "gridPos": {
        "h": 6,
        "w": 8,
        "x": 0,
        "y": 1
      },
      "id": 40,
      "options": {
        "legend": {
          "calcs": [],
          "displayMode": "hidden",
          "placement": "bottom"
        },
        "tooltip": {
          "mode": "single",
          "sort": "none"
        }
      },
      "targets": [
        {
          "datasource": {
            "type": "prometheus",
            "uid": "${datasource}"
          },
          "exemplar": true,
          "expr": " sum(problem_gauge) by (node)",
          "interval": "",
          "legendFormat": "{{node}}",
          "refId": "A"
        }
      ],
      "title": "Problem affects a node",
      "type": "timeseries"
    },
    {
      "datasource": {
        "type": "prometheus",
        "uid": "${datasource}"
      },
      "fieldConfig": {
        "defaults": {
          "color": {
            "mode": "palette-classic"
          },
          "custom": {
            "axisLabel": "",
            "axisPlacement": "auto",
            "barAlignment": 0,
            "drawStyle": "line",
            "fillOpacity": 0,
            "gradientMode": "none",
            "hideFrom": {
              "legend": false,
              "tooltip": false,
              "viz": false
            },
            "lineInterpolation": "linear",
            "lineWidth": 1,
            "pointSize": 5,
            "scaleDistribution": {
              "type": "linear"
            },
            "showPoints": "auto",
            "spanNulls": false,
            "stacking": {
              "group": "A",
              "mode": "none"
            },
            "thresholdsStyle": {
              "mode": "off"
            }
          },
          "mappings": [],
          "min": 0,
          "thresholds": {
            "mode": "absolute",
            "steps": [
              {
                "color": "green",
                "value": null
              },
              {
                "color": "red",
                "value": 80
              }
            ]
          }
        },
        "overrides": []
      },
      "gridPos": {
        "h": 6,
        "w": 8,
        "x": 8,
        "y": 1
      },
      "id": 23,
      "options": {
        "legend": {
          "calcs": [],
          "displayMode": "hidden",
          "placement": "bottom"
        },
        "tooltip": {
          "mode": "single",
          "sort": "none"
        }
      },
      "targets": [
        {
          "datasource": {
            "type": "prometheus",
            "uid": "${datasource}"
          },
          "exemplar": true,
          "expr": "sum(rate(problem_counter[5m])) by (node)",
          "interval": "",
          "legendFormat": "{{node}}",
          "refId": "A"
        }
      ],
      "title": "Problem rates by node",
      "type": "timeseries"
    },
    {
      "datasource": {
        "type": "prometheus",
        "uid": "${datasource}"
      },
      "fieldConfig": {
        "defaults": {
          "color": {
            "mode": "palette-classic"
          },
          "custom": {
            "axisLabel": "",
            "axisPlacement": "auto",
            "barAlignment": 0,
            "drawStyle": "line",
            "fillOpacity": 0,
            "gradientMode": "none",
            "hideFrom": {
              "legend": false,
              "tooltip": false,
              "viz": false
            },
            "lineInterpolation": "linear",
            "lineWidth": 1,
            "pointSize": 5,
            "scaleDistribution": {
              "type": "linear"
            },
            "showPoints": "auto",
            "spanNulls": false,
            "stacking": {
              "group": "A",
              "mode": "none"
            },
            "thresholdsStyle": {
              "mode": "off"
            }
          },
          "mappings": [],
          "thresholds": {
            "mode": "absolute",
            "steps": [
              {
                "color": "green",
                "value": null
              },
              {
                "color": "red",
                "value": 80
              }
            ]
          }
        },
        "overrides": []
      },
      "gridPos": {
        "h": 6,
        "w": 8,
        "x": 16,
        "y": 1
      },
      "id": 2,
      "options": {
        "legend": {
          "calcs": [],
          "displayMode": "hidden",
          "placement": "bottom"
        },
        "tooltip": {
          "mode": "single",
          "sort": "none"
        }
      },
      "targets": [
        {
          "datasource": {
            "type": "prometheus",
            "uid": "${datasource}"
          },
          "exemplar": true,
          "expr": "sum(rate(problem_counter[5m]))",
          "interval": "",
          "legendFormat": "total",
          "refId": "A"
        }
      ],
      "title": "Problem rates",
      "type": "timeseries"
    },
    {
      "collapsed": false,
      "datasource": {
        "type": "datasource",
        "uid": "grafana"
      },
      "gridPos": {
        "h": 1,
        "w": 24,
        "x": 0,
        "y": 7
      },
      "id": 25,
      "panels": [],
      "targets": [
        {
          "datasource": {
            "type": "datasource",
            "uid": "grafana"
          },
          "refId": "A"
        }
      ],
      "title": "Gauges",
      "type": "row"
    },
    {
      "datasource": {
        "type": "prometheus",
        "uid": "${datasource}"
      },
      "fieldConfig": {
        "defaults": {
          "color": {
            "mode": "palette-classic"
          },
          "custom": {
            "axisLabel": "",
            "axisPlacement": "auto",
            "barAlignment": 0,
            "drawStyle": "line",
            "fillOpacity": 0,
            "gradientMode": "none",
            "hideFrom": {
              "legend": false,
              "tooltip": false,
              "viz": false
            },
            "lineInterpolation": "linear",
            "lineWidth": 1,
            "pointSize": 5,
            "scaleDistribution": {
              "type": "linear"
            },
            "showPoints": "auto",
            "spanNulls": false,
            "stacking": {
              "group": "A",
              "mode": "none"
            },
            "thresholdsStyle": {
              "mode": "off"
            }
          },
          "mappings": [],
          "thresholds": {
            "mode": "absolute",
            "steps": [
              {
                "color": "green",
                "value": null
              },
              {
                "color": "red",
                "value": 80
              }
            ]
          }
        },
        "overrides": []
      },
      "gridPos": {
        "h": 5,
        "w": 8,
        "x": 0,
        "y": 8
      },
      "id": 8,
      "maxPerRow": 4,
      "options": {
        "legend": {
          "calcs": [],
          "displayMode": "hidden",
          "placement": "bottom"
        },
        "tooltip": {
          "mode": "single",
          "sort": "none"
        }
      },
      "repeat": "problem_type",
      "repeatDirection": "h",
      "targets": [
        {
          "datasource": {
            "type": "prometheus",
            "uid": "${datasource}"
          },
          "exemplar": true,
          "expr": "sum(problem_gauge{type=~\"$problem_type\"})",
          "interval": "",
          "legendFormat": "$problem_type",
          "refId": "A"
        }
      ],
      "title": "Problem Type - $problem_type",
      "type": "timeseries"
    },
    {
      "collapsed": false,
      "datasource": {
        "type": "datasource",
        "uid": "grafana"
      },
      "gridPos": {
        "h": 1,
        "w": 24,
        "x": 0,
        "y": 13
      },
      "id": 6,
      "panels": [],
      "targets": [
        {
          "datasource": {
            "type": "datasource",
            "uid": "grafana"
          },
          "refId": "A"
        }
      ],
      "title": "Counters",
      "type": "row"
    },
    {
      "datasource": {
        "type": "prometheus",
        "uid": "${datasource}"
      },
      "fieldConfig": {
        "defaults": {
          "color": {
            "mode": "palette-classic"
          },
          "custom": {
            "axisLabel": "",
            "axisPlacement": "auto",
            "barAlignment": 0,
            "drawStyle": "line",
            "fillOpacity": 0,
            "gradientMode": "none",
            "hideFrom": {
              "legend": false,
              "tooltip": false,
              "viz": false
            },
            "lineInterpolation": "linear",
            "lineWidth": 1,
            "pointSize": 5,
            "scaleDistribution": {
              "type": "linear"
            },
            "showPoints": "auto",
            "spanNulls": false,
            "stacking": {
              "group": "A",
              "mode": "none"
            },
            "thresholdsStyle": {
              "mode": "off"
            }
          },
          "mappings": [],
          "thresholds": {
            "mode": "absolute",
            "steps": [
              {
                "color": "green",
                "value": null
              },
              {
                "color": "red",
                "value": 80
              }
            ]
          }
        },
        "overrides": []
      },
      "gridPos": {
        "h": 5,
        "w": 8,
        "x": 0,
        "y": 14
      },
      "id": 7,
      "maxPerRow": 3,
      "options": {
        "legend": {
          "calcs": [],
          "displayMode": "hidden",
          "placement": "bottom"
        },
        "tooltip": {
          "mode": "multi",
          "sort": "none"
        }
      },
      "repeat": "problem_counter_reason",
      "repeatDirection": "h",
      "targets": [
        {
          "datasource": {
            "type": "prometheus",
            "uid": "${datasource}"
          },
          "exemplar": true,
          "expr": "sum(rate(problem_counter{reason=~\"$problem_counter_reason\"}[5m]))",
          "interval": "",
          "legendFormat": "$problem_counter_reason",
          "refId": "A"
        }
      ],
      "title": "Problem rates - $problem_counter_reason",
      "type": "timeseries"
    }
  ],
  "schemaVersion": 36,
  "style": "dark",
  "tags": [
    "node"
  ],
  "templating": {
    "list": [
      {
        "current": {
          "selected": true,
          "text": [
            "All"
          ],
          "value": [
            "$__all"
          ]
        },
        "datasource": {
          "type": "prometheus",
          "uid": "${datasource}"
        },
        "definition": "label_values(problem_counter,reason)",
        "hide": 0,
        "includeAll": true,
        "multi": true,
        "name": "problem_counter_reason",
        "options": [],
        "query": {
          "query": "label_values(problem_counter,reason)",
          "refId": "StandardVariableQuery"
        },
        "refresh": 2,
        "regex": "",
        "skipUrlSync": false,
        "sort": 1,
        "type": "query"
      },
      {
        "current": {
          "selected": true,
          "text": [
            "All"
          ],
          "value": [
            "$__all"
          ]
        },
        "datasource": {
          "type": "prometheus",
          "uid": "${datasource}"
        },
        "definition": "label_values(problem_counter,node)",
        "hide": 0,
        "includeAll": true,
        "multi": true,
        "name": "node",
        "options": [],
        "query": {
          "query": "label_values(problem_counter,node)",
          "refId": "StandardVariableQuery"
        },
        "refresh": 2,
        "regex": "",
        "skipUrlSync": false,
        "sort": 1,
        "type": "query"
      },
      {
        "current": {
          "selected": true,
          "text": [
            "All"
          ],
          "value": [
            "$__all"
          ]
        },
        "datasource": {
          "type": "prometheus",
          "uid": "${datasource}"
        },
        "definition": "label_values(problem_gauge,type)",
        "hide": 0,
        "includeAll": true,
        "multi": true,
        "name": "problem_type",
        "options": [],
        "query": {
          "query": "label_values(problem_gauge,type)",
          "refId": "StandardVariableQuery"
        },
        "refresh": 2,
        "regex": "",
        "skipUrlSync": false,
        "sort": 1,
        "type": "query"
      },
      {
        "current": {
          "selected": false,
          "text": "VictoriaMetrics",
          "value": "VictoriaMetrics"
        },
        "hide": 0,
        "includeAll": false,
        "multi": false,
        "name": "datasource",
        "options": [],
        "query": "prometheus",
        "refresh": 1,
        "regex": "",
        "skipUrlSync": false,
        "type": "datasource"
      }
    ]
  },
  "time": {
    "from": "now-3h",
    "to": "now"
  },
  "timepicker": {
    "refresh_intervals": [
      "10s",
      "30s",
      "1m",
      "5m",
      "15m",
      "30m",
      "1h",
      "2h",
      "1d"
    ]
  },
  "timezone": "utc",
  "title": "Node Problem Detector",
  "uid": "node-problem-detector",
  "version": 5,
  "weekStart": ""
}