Skip to content

Commit

Permalink
Update generated dashboards
Browse files Browse the repository at this point in the history
Signed-off-by: Jordà Polo <[email protected]>
  • Loading branch information
jordap authored and koomie committed Jan 9, 2025
1 parent 9561520 commit 11c5490
Show file tree
Hide file tree
Showing 5 changed files with 50 additions and 50 deletions.
14 changes: 7 additions & 7 deletions grafana/json-models/rms-global.json
Original file line number Diff line number Diff line change
Expand Up @@ -1598,7 +1598,7 @@
"vbios": 7
},
"renameByName": {
"card": "Card",
"card": "GPU ID",
"driver_ver": "Driver Version",
"instance": "Node",
"instance (count)": "Number of GPUs",
Expand Down Expand Up @@ -3713,7 +3713,7 @@
"id": "renameByRegex",
"options": {
"regex": "(.*):(.*), (.*)",
"renamePattern": "Node: $1 (card $3)"
"renamePattern": "GPU: $1/$3"
}
}
],
Expand Down Expand Up @@ -4061,7 +4061,7 @@
"id": "renameByRegex",
"options": {
"regex": "(.*):(.*), (.*)",
"renamePattern": "Node: $1 (card $3)"
"renamePattern": "GPU: $1/$3"
}
}
],
Expand Down Expand Up @@ -4183,7 +4183,7 @@
"id": "renameByRegex",
"options": {
"regex": "(.*):(.*), (.*)",
"renamePattern": "Node: $1 (card $3)"
"renamePattern": "GPU: $1/$3"
}
}
],
Expand Down Expand Up @@ -4291,7 +4291,7 @@
"id": "renameByRegex",
"options": {
"regex": "(.*):(.*), (.*)",
"renamePattern": "Node: $1 (card $3)"
"renamePattern": "GPU: $1/$3"
}
}
],
Expand Down Expand Up @@ -4629,7 +4629,7 @@
"id": "renameByRegex",
"options": {
"regex": "(.*):(.*), (.*)",
"renamePattern": "Node: $1 (card $3)"
"renamePattern": "GPU: $1/$3"
}
}
],
Expand Down Expand Up @@ -4737,7 +4737,7 @@
"id": "renameByRegex",
"options": {
"regex": "(.*):(.*), (.*)",
"renamePattern": "Node: $1 (card $3)"
"renamePattern": "GPU: $1/$3"
}
}
],
Expand Down
36 changes: 18 additions & 18 deletions grafana/json-models/rms-job.json
Original file line number Diff line number Diff line change
Expand Up @@ -2483,7 +2483,7 @@
"exemplar": false,
"expr": "avg by (card) (rocm_utilization_percentage * on (instance) group_left() rmsjob_info{jobid=\"$jobid\"})",
"instant": false,
"legendFormat": "Card {{card}}",
"legendFormat": "GPU ID {{card}}",
"range": true,
"refId": "A"
}
Expand Down Expand Up @@ -2566,7 +2566,7 @@
"yHistogram": false
},
"yAxis": {
"axisLabel": "Card",
"axisLabel": "GPU ID",
"axisPlacement": "left",
"reverse": false
}
Expand Down Expand Up @@ -2659,7 +2659,7 @@
"exemplar": false,
"expr": "max by (card) (rocm_vram_used_percentage * on (instance) group_left() rmsjob_info{jobid=\"$jobid\"})",
"instant": false,
"legendFormat": "Card {{card}}",
"legendFormat": "GPU ID {{card}}",
"range": true,
"refId": "A"
}
Expand Down Expand Up @@ -2742,7 +2742,7 @@
"yHistogram": false
},
"yAxis": {
"axisLabel": "Card",
"axisLabel": "GPU ID",
"axisPlacement": "left",
"reverse": false
}
Expand Down Expand Up @@ -2860,7 +2860,7 @@
"editorMode": "code",
"expr": "avg by (card) (rocm_utilization_percentage * on (instance) group_left() rmsjob_info{jobid=\"$jobid\"})",
"instant": false,
"legendFormat": "Card {{card}}",
"legendFormat": "GPU ID {{card}}",
"range": true,
"refId": "A"
}
Expand All @@ -2869,7 +2869,7 @@
"type": "timeseries"
}
],
"title": "GPU Usage - Card IDs",
"title": "GPU Usage - GPU IDs",
"type": "row"
},
{
Expand Down Expand Up @@ -3183,7 +3183,7 @@
{
"matcher": {
"id": "byName",
"options": "GPU Card ID"
"options": "GPU ID"
},
"properties": [
{
Expand Down Expand Up @@ -3367,7 +3367,7 @@
"renameByName": {
"Field": "",
"Mean": "GPU Utilization (%)",
"card": "GPU Card ID",
"card": "GPU ID",
"instance": "Node"
}
}
Expand Down Expand Up @@ -3429,7 +3429,7 @@
{
"matcher": {
"id": "byName",
"options": "GPU Card ID"
"options": "GPU ID"
},
"properties": [
{
Expand Down Expand Up @@ -3590,7 +3590,7 @@
"renameByName": {
"Field": "",
"Mean": "GPU Utilization (%)",
"card": "GPU Card ID",
"card": "GPU ID",
"instance": "Node"
}
}
Expand Down Expand Up @@ -3752,7 +3752,7 @@
"renameByName": {
"Field": "",
"Mean": "Utilization",
"card": "Card ID",
"card": "GPU ID",
"instance": "Node"
}
}
Expand Down Expand Up @@ -4346,7 +4346,7 @@
"renameByName": {
"Field": "Node",
"Mean": "Utilization",
"card": "Card ID",
"card": "GPU ID",
"instance": "Node"
}
}
Expand Down Expand Up @@ -4472,7 +4472,7 @@
"editorMode": "code",
"expr": "avg by (card, location) (rocm_temperature_celsius * on (instance) group_left() rmsjob_info{jobid=\"$jobid\"})",
"instant": false,
"legendFormat": "Card {{card}} ({{location}})",
"legendFormat": "GPU ID {{card}} ({{location}})",
"range": true,
"refId": "A"
}
Expand Down Expand Up @@ -4572,7 +4572,7 @@
"editorMode": "code",
"expr": "avg by (card, location) (rocm_temperature_memory_celsius * on (instance) group_left() rmsjob_info{jobid=\"$jobid\"})",
"instant": false,
"legendFormat": "Card {{card}} ({{location}})",
"legendFormat": "GPU ID {{card}} ({{location}})",
"range": true,
"refId": "A"
}
Expand Down Expand Up @@ -4672,7 +4672,7 @@
"editorMode": "code",
"expr": "avg by (card) (rocm_average_socket_power_watts * on (instance) group_left() rmsjob_info{jobid=\"$jobid\"})",
"instant": false,
"legendFormat": "Card {{card}}",
"legendFormat": "GPU ID {{card}}",
"range": true,
"refId": "A"
}
Expand Down Expand Up @@ -4772,7 +4772,7 @@
"editorMode": "code",
"expr": "avg by (card) (rocm_sclk_clock_mhz * on (instance) group_left() rmsjob_info{jobid=\"$jobid\"})",
"instant": false,
"legendFormat": "Card {{card}}",
"legendFormat": "GPU ID {{card}}",
"range": true,
"refId": "A"
}
Expand Down Expand Up @@ -4872,7 +4872,7 @@
"editorMode": "code",
"expr": "avg by (card) (rocm_mclk_clock_mhz * on (instance) group_left() rmsjob_info{jobid=\"$jobid\"})",
"instant": false,
"legendFormat": "Card {{card}}",
"legendFormat": "GPU ID {{card}}",
"range": true,
"refId": "A"
}
Expand All @@ -4881,7 +4881,7 @@
"type": "timeseries"
}
],
"title": "GPU Telemetry: Card IDs",
"title": "GPU Telemetry: GPU IDs",
"type": "row"
},
{
Expand Down
18 changes: 9 additions & 9 deletions grafana/json-models/rms-node.json
Original file line number Diff line number Diff line change
Expand Up @@ -794,7 +794,7 @@
"editorMode": "code",
"expr": "rocm_utilization_percentage{instance=\"$instance\"}",
"instant": false,
"legendFormat": "Card {{card}}",
"legendFormat": "GPU ID {{card}}",
"range": true,
"refId": "A"
}
Expand Down Expand Up @@ -894,7 +894,7 @@
"editorMode": "code",
"expr": "(rocm_utilization_percentage{instance=\"$instance\"})",
"instant": false,
"legendFormat": "Card {{card}}",
"legendFormat": "GPU ID {{card}}",
"range": true,
"refId": "A"
}
Expand Down Expand Up @@ -994,7 +994,7 @@
"editorMode": "code",
"expr": "rocm_vram_used_percentage{instance=\"$instance\"}",
"instant": false,
"legendFormat": "Card {{card}}",
"legendFormat": "GPU ID {{card}}",
"range": true,
"refId": "A"
}
Expand Down Expand Up @@ -1111,7 +1111,7 @@
"editorMode": "code",
"expr": "avg by (card, location) (rocm_temperature_celsius{instance=\"$instance\"}) ",
"instant": false,
"legendFormat": "Card {{card}} ({{location}})",
"legendFormat": "GPU ID {{card}} ({{location}})",
"range": true,
"refId": "A"
}
Expand Down Expand Up @@ -1218,7 +1218,7 @@
"editorMode": "code",
"expr": "avg by (card, location) (rocm_temperature_memory_celsius{instance=\"$instance\"})",
"instant": false,
"legendFormat": "Card {{card}} ({{location}})",
"legendFormat": "GPU ID {{card}} ({{location}})",
"range": true,
"refId": "A"
}
Expand Down Expand Up @@ -1317,7 +1317,7 @@
"editorMode": "code",
"expr": "(rocm_average_socket_power_watts{instance=\"$instance\"}) ",
"instant": false,
"legendFormat": "Card {{card}}",
"legendFormat": "GPU ID {{card}}",
"range": true,
"refId": "A"
}
Expand Down Expand Up @@ -1416,7 +1416,7 @@
"editorMode": "code",
"expr": "rocm_sclk_clock_mhz{instance=\"$instance\"}",
"instant": false,
"legendFormat": "Card {{card}}",
"legendFormat": "GPU ID {{card}}",
"range": true,
"refId": "A"
}
Expand Down Expand Up @@ -1515,7 +1515,7 @@
"editorMode": "code",
"expr": "rocm_mclk_clock_mhz{instance=\"$instance\"}",
"instant": false,
"legendFormat": "Card {{card}}",
"legendFormat": "GPU ID {{card}}",
"range": true,
"refId": "A"
}
Expand Down Expand Up @@ -2270,7 +2270,7 @@
"vbios": 9
},
"renameByName": {
"card": "GPU Card ID",
"card": "GPU ID",
"driver_ver": "Driver Version",
"instance (count)": "Number of GPUs",
"type": "Type",
Expand Down
14 changes: 7 additions & 7 deletions grafana/json-models/standalone-global.json
Original file line number Diff line number Diff line change
Expand Up @@ -1300,7 +1300,7 @@
"vbios": 7
},
"renameByName": {
"card": "Card",
"card": "GPU ID",
"driver_ver": "Driver Version",
"instance": "Node",
"instance (count)": "Number of GPUs",
Expand Down Expand Up @@ -1672,7 +1672,7 @@
"id": "renameByRegex",
"options": {
"regex": "(.*):(.*), (.*)",
"renamePattern": "Node: $1 (card $3)"
"renamePattern": "GPU: $1/$3"
}
}
],
Expand Down Expand Up @@ -1788,7 +1788,7 @@
"id": "renameByRegex",
"options": {
"regex": "(.*):(.*), (.*)",
"renamePattern": "Node: $1 (card $3)"
"renamePattern": "GPU: $1/$3"
}
}
],
Expand Down Expand Up @@ -1910,7 +1910,7 @@
"id": "renameByRegex",
"options": {
"regex": "(.*):(.*), (.*)",
"renamePattern": "Node: $1 (card $3)"
"renamePattern": "GPU: $1/$3"
}
}
],
Expand Down Expand Up @@ -2018,7 +2018,7 @@
"id": "renameByRegex",
"options": {
"regex": "(.*):(.*), (.*)",
"renamePattern": "Node: $1 (card $3)"
"renamePattern": "GPU: $1/$3"
}
}
],
Expand Down Expand Up @@ -2140,7 +2140,7 @@
"id": "renameByRegex",
"options": {
"regex": "(.*):(.*), (.*)",
"renamePattern": "Node: $1 (card $3)"
"renamePattern": "GPU: $1/$3"
}
}
],
Expand Down Expand Up @@ -2248,7 +2248,7 @@
"id": "renameByRegex",
"options": {
"regex": "(.*):(.*), (.*)",
"renamePattern": "Node: $1 (card $3)"
"renamePattern": "GPU: $1/$3"
}
}
],
Expand Down
Loading

0 comments on commit 11c5490

Please sign in to comment.