Skip to content

Commit 89797f4

Browse files
authored
[obs] add node variable and update panels in Node PSI dashboard to use it (#18250)
Related to WKS-303
1 parent 260d822 commit 89797f4

File tree

1 file changed

+52
-18
lines changed
  • operations/observability/mixins/workspace/dashboards

1 file changed

+52
-18
lines changed

operations/observability/mixins/workspace/dashboards/node-psi.json

Lines changed: 52 additions & 18 deletions
Original file line numberDiff line numberDiff line change
@@ -24,7 +24,7 @@
2424
"editable": true,
2525
"fiscalYearStartMonth": 0,
2626
"graphTooltip": 1,
27-
"id": 80,
27+
"id": 86,
2828
"links": [],
2929
"liveNow": false,
3030
"panels": [
@@ -60,14 +60,15 @@
6060
"dashLength": 10,
6161
"dashes": false,
6262
"datasource": {
63+
"type": "prometheus",
6364
"uid": "$datasource"
6465
},
6566
"description": "A high normalized load average on a node does not represent a real problem; it only means that pods should probably not be scheduled onto that node.\n\nIf you'd like to see more details about the resource consumption of a particular node, you can do so by clicking on the node name.\n",
6667
"fill": 1,
6768
"fillGradient": 5,
6869
"gridPos": {
6970
"h": 7,
70-
"w": 6,
71+
"w": 12,
7172
"x": 0,
7273
"y": 1
7374
},
@@ -92,7 +93,7 @@
9293
"alertThreshold": true
9394
},
9495
"percentage": false,
95-
"pluginVersion": "9.1.6",
96+
"pluginVersion": "9.5.3",
9697
"pointradius": 5,
9798
"points": false,
9899
"renderer": "flot",
@@ -112,10 +113,12 @@
112113
"datasource": {
113114
"uid": "$datasource"
114115
},
115-
"expr": "topk(5, sum(nodepool:node_load1:normalized{cluster=~\"$cluster\", nodepool=~\".*workspace.*\"}) by (node))\n",
116+
"editorMode": "code",
117+
"expr": "topk(5, sum(nodepool:node_load1:normalized{cluster=~\"$cluster\", nodepool=~\".*workspace.*\", node=~\"$node\"}) by (node))\n",
116118
"format": "time_series",
117119
"intervalFactor": 2,
118120
"legendFormat": "{{node}}",
121+
"range": true,
119122
"refId": "A"
120123
},
121124
{
@@ -169,7 +172,7 @@
169172
"h": 1,
170173
"w": 24,
171174
"x": 0,
172-
"y": 15
175+
"y": 8
173176
},
174177
"id": 86,
175178
"panels": [],
@@ -236,9 +239,9 @@
236239
},
237240
"gridPos": {
238241
"h": 8,
239-
"w": 6,
242+
"w": 12,
240243
"x": 0,
241-
"y": 16
244+
"y": 9
242245
},
243246
"id": 49,
244247
"options": {
@@ -262,7 +265,7 @@
262265
"uid": "${datasource}"
263266
},
264267
"editorMode": "code",
265-
"expr": "topk(5, rate(node_pressure_cpu_waiting_seconds_total{cluster=\"$cluster\"}[30s]))",
268+
"expr": "topk(5, rate(node_pressure_cpu_waiting_seconds_total{cluster=\"$cluster\",node=~\"$node\"}[30s]))",
266269
"legendFormat": "{{node}}",
267270
"range": true,
268271
"refId": "A"
@@ -277,7 +280,7 @@
277280
"h": 1,
278281
"w": 24,
279282
"x": 0,
280-
"y": 32
283+
"y": 17
281284
},
282285
"id": 165,
283286
"panels": [],
@@ -344,9 +347,9 @@
344347
},
345348
"gridPos": {
346349
"h": 8,
347-
"w": 6,
350+
"w": 12,
348351
"x": 0,
349-
"y": 33
352+
"y": 18
350353
},
351354
"id": 133,
352355
"options": {
@@ -370,7 +373,7 @@
370373
"uid": "${datasource}"
371374
},
372375
"editorMode": "code",
373-
"expr": "topk(5, rate(node_pressure_memory_waiting_seconds_total{cluster=\"$cluster\"}[30s]))",
376+
"expr": "topk(5, rate(node_pressure_memory_waiting_seconds_total{cluster=\"$cluster\",node=~\"$node\"}[30s]))",
374377
"legendFormat": "{{node}}",
375378
"range": true,
376379
"refId": "A"
@@ -385,7 +388,7 @@
385388
"h": 1,
386389
"w": 24,
387390
"x": 0,
388-
"y": 49
391+
"y": 26
389392
},
390393
"id": 224,
391394
"panels": [],
@@ -452,9 +455,9 @@
452455
},
453456
"gridPos": {
454457
"h": 8,
455-
"w": 6,
458+
"w": 12,
456459
"x": 0,
457-
"y": 50
460+
"y": 27
458461
},
459462
"id": 197,
460463
"options": {
@@ -478,7 +481,7 @@
478481
"uid": "${datasource}"
479482
},
480483
"editorMode": "code",
481-
"expr": "topk(5, rate(node_pressure_io_waiting_seconds_total{cluster=\"$cluster\"}[30s]))",
484+
"expr": "topk(5, rate(node_pressure_io_waiting_seconds_total{cluster=\"$cluster\",node=~\"$node\"}[30s]))",
482485
"legendFormat": "{{node}}",
483486
"range": true,
484487
"refId": "A"
@@ -489,7 +492,7 @@
489492
}
490493
],
491494
"refresh": "30s",
492-
"schemaVersion": 37,
495+
"schemaVersion": 38,
493496
"style": "dark",
494497
"tags": [],
495498
"templating": {
@@ -506,6 +509,7 @@
506509
"name": "datasource",
507510
"options": [],
508511
"query": "prometheus",
512+
"queryValue": "",
509513
"refresh": 1,
510514
"regex": "",
511515
"skipUrlSync": false,
@@ -542,6 +546,36 @@
542546
"tagsQuery": "",
543547
"type": "query",
544548
"useTags": false
549+
},
550+
{
551+
"current": {
552+
"selected": true,
553+
"text": [
554+
"All"
555+
],
556+
"value": [
557+
"$__all"
558+
]
559+
},
560+
"datasource": {
561+
"type": "prometheus",
562+
"uid": "${datasource}"
563+
},
564+
"definition": "label_values(node_pressure_memory_waiting_seconds_total,node)",
565+
"hide": 0,
566+
"includeAll": true,
567+
"multi": true,
568+
"name": "node",
569+
"options": [],
570+
"query": {
571+
"query": "label_values(node_pressure_memory_waiting_seconds_total,node)",
572+
"refId": "PrometheusVariableQueryEditor-VariableQuery"
573+
},
574+
"refresh": 2,
575+
"regex": "",
576+
"skipUrlSync": false,
577+
"sort": 0,
578+
"type": "query"
545579
}
546580
]
547581
},
@@ -577,6 +611,6 @@
577611
"timezone": "utc",
578612
"title": "Node Pressure Stall Information",
579613
"uid": "T7pAXoVVk",
580-
"version": 2,
614+
"version": 1,
581615
"weekStart": ""
582616
}

0 commit comments

Comments
 (0)