File tree Expand file tree Collapse file tree 3 files changed +24
-8
lines changed Expand file tree Collapse file tree 3 files changed +24
-8
lines changed Original file line number Diff line number Diff line change 2419
2419
"type" : " prometheus" ,
2420
2420
"uid" : " ${DS_PROMETHEUS}"
2421
2421
},
2422
- "description" : " List of all GPUs used by this job." ,
2422
+ "description" : " List of all GPUs used by this job. Health is the last known status of the GPU during a running job in the selected time range. " ,
2423
2423
"fieldConfig" : {
2424
2424
"defaults" : {
2425
2425
"color" : {
2569
2569
"showHeader" : true ,
2570
2570
"sortBy" : [
2571
2571
{
2572
- "desc" : true ,
2572
+ "desc" : false ,
2573
2573
"displayName" : " HEALTH"
2574
2574
},
2575
2575
{
2589
2589
"type" : " prometheus" ,
2590
2590
"uid" : " ${DS_PROMETHEUS}"
2591
2591
},
2592
- "editorMode" : " builder " ,
2593
- "expr" : " ${g_metrics_prefix}gpu_health{job_id!=\"\" , job_id=\" $g_job_id\" }" ,
2592
+ "editorMode" : " code " ,
2593
+ "expr" : " ${g_metrics_prefix}gpu_health{job_id!=\"\" , job_id=\" $g_job_id\" } or vector(0) " ,
2594
2594
"instant" : false ,
2595
2595
"legendFormat" : " __auto" ,
2596
2596
"range" : true ,
2601
2601
"type" : " prometheus" ,
2602
2602
"uid" : " ${DS_PROMETHEUS}"
2603
2603
},
2604
- "editorMode" : " builder " ,
2605
- "expr" : " ${g_metrics_prefix}gpu_health{pod!=\"\" , pod=\" $g_pod\" }" ,
2604
+ "editorMode" : " code " ,
2605
+ "expr" : " ${g_metrics_prefix}gpu_health{pod!=\"\" , pod=\" $g_pod\" } or vector(0) " ,
2606
2606
"hide" : false ,
2607
2607
"instant" : false ,
2608
2608
"legendFormat" : " __auto" ,
2672
2672
"hostname (last)" : " HOSTNAME"
2673
2673
}
2674
2674
}
2675
+ },
2676
+ {
2677
+ "id" : " filterByValue" ,
2678
+ "options" : {
2679
+ "filters" : [
2680
+ {
2681
+ "config" : {
2682
+ "id" : " isNull" ,
2683
+ "options" : {}
2684
+ },
2685
+ "fieldName" : " GPU UUID"
2686
+ }
2687
+ ],
2688
+ "match" : " any" ,
2689
+ "type" : " exclude"
2690
+ }
2675
2691
}
2676
2692
],
2677
2693
"type" : " table"
Original file line number Diff line number Diff line change 2232
2232
"showHeader" : true ,
2233
2233
"sortBy" : [
2234
2234
{
2235
- "desc" : true ,
2235
+ "desc" : false ,
2236
2236
"displayName" : " HEALTH"
2237
2237
},
2238
2238
{
Original file line number Diff line number Diff line change 2120
2120
"showHeader" : true ,
2121
2121
"sortBy" : [
2122
2122
{
2123
- "desc" : true ,
2123
+ "desc" : false ,
2124
2124
"displayName" : " HEALTH"
2125
2125
},
2126
2126
{
You can’t perform that action at this time.
0 commit comments