2025-09-16 17:02:17 +03:00
{
"annotations" : {
"list" : [
{
"builtIn" : 1 ,
"datasource" : {
"type" : "datasource" ,
"uid" : "grafana"
} ,
"enable" : true ,
"hide" : true ,
"iconColor" : "rgba(0, 211, 255, 1)" ,
"name" : "Annotations & Alerts" ,
"type" : "dashboard"
}
]
} ,
2026-02-02 16:16:37 +03:00
"description" : "NVIDIA GPU metrics based on the Prometheus metrics from github.com/utkuozdemir/nvidia_gpu_exporter" ,
2025-09-16 17:02:17 +03:00
"editable" : true ,
"fiscalYearStartMonth" : 0 ,
"graphTooltip" : 0 ,
2025-09-16 17:43:11 +03:00
"id" : 46 ,
2025-09-16 17:02:17 +03:00
"links" : [ ] ,
"panels" : [
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
2026-02-02 16:16:37 +03:00
"description" : "The official product name of the GPU. This is an alphanumeric string. For all products." ,
2025-09-16 17:02:17 +03:00
"fieldConfig" : {
"defaults" : {
"color" : {
2026-02-02 16:16:37 +03:00
"mode" : "thresholds"
2025-09-16 17:02:17 +03:00
} ,
2026-02-02 16:16:37 +03:00
"decimals" : 2 ,
"mappings" : [ ] ,
2025-09-16 17:02:17 +03:00
"thresholds" : {
"mode" : "absolute" ,
"steps" : [
{
"color" : "green" ,
"value" : 0
}
]
} ,
2026-02-02 16:16:37 +03:00
"unit" : "none"
2025-09-16 17:02:17 +03:00
} ,
"overrides" : [ ]
} ,
"gridPos" : {
"h" : 3 ,
2026-02-02 16:16:37 +03:00
"w" : 4 ,
2025-09-16 17:02:17 +03:00
"x" : 0 ,
"y" : 0
} ,
2026-02-02 16:16:37 +03:00
"id" : 23 ,
2025-09-16 17:02:17 +03:00
"options" : {
2026-02-02 16:16:37 +03:00
"colorMode" : "value" ,
"graphMode" : "none" ,
2025-09-16 17:02:17 +03:00
"justifyMode" : "auto" ,
2026-02-02 16:16:37 +03:00
"orientation" : "auto" ,
2025-09-16 17:02:17 +03:00
"percentChangeColorMode" : "standard" ,
"reduceOptions" : {
"calcs" : [
2026-02-02 16:16:37 +03:00
"last"
2025-09-16 17:02:17 +03:00
] ,
"fields" : "" ,
"values" : false
} ,
"showPercentChange" : false ,
2026-02-02 16:16:37 +03:00
"text" : { } ,
"textMode" : "name" ,
2025-09-16 17:02:17 +03:00
"wideLayout" : true
} ,
"pluginVersion" : "12.1.0" ,
"targets" : [
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
2025-09-16 17:43:11 +03:00
"editorMode" : "code" ,
2026-02-02 16:16:37 +03:00
"exemplar" : true ,
"expr" : "nvidia_smi_gpu_info{uuid=\"$gpu\"}" ,
"instant" : true ,
"interval" : "" ,
"legendFormat" : "{{name}}" ,
"refId" : "A"
2025-09-16 17:02:17 +03:00
}
] ,
2026-02-02 16:16:37 +03:00
"title" : "Name" ,
2025-09-16 17:02:17 +03:00
"type" : "stat"
} ,
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
2026-02-02 16:16:37 +03:00
"description" : "The current performance state for the GPU. States range from P0 (maximum performance) to P12 (minimum performance)." ,
2025-09-16 17:02:17 +03:00
"fieldConfig" : {
"defaults" : {
"color" : {
2026-02-02 16:16:37 +03:00
"mode" : "thresholds"
2025-09-16 17:02:17 +03:00
} ,
2026-02-02 16:16:37 +03:00
"decimals" : 0 ,
2025-09-16 17:02:17 +03:00
"mappings" : [
{
"options" : {
2026-02-02 16:16:37 +03:00
"" : {
"text" : ""
2025-09-16 17:02:17 +03:00
}
} ,
2026-02-02 16:16:37 +03:00
"type" : "value"
2025-09-16 17:02:17 +03:00
}
] ,
"thresholds" : {
"mode" : "absolute" ,
"steps" : [
{
"color" : "green" ,
"value" : 0
}
]
} ,
2026-02-02 16:16:37 +03:00
"unit" : "prefix:P"
2025-09-16 17:02:17 +03:00
} ,
"overrides" : [ ]
} ,
"gridPos" : {
"h" : 3 ,
2026-02-02 16:16:37 +03:00
"w" : 2 ,
"x" : 4 ,
2025-09-16 17:02:17 +03:00
"y" : 0
} ,
2026-02-02 16:16:37 +03:00
"id" : 22 ,
2025-09-16 17:02:17 +03:00
"options" : {
2026-02-02 16:16:37 +03:00
"colorMode" : "value" ,
"graphMode" : "none" ,
2025-09-16 17:02:17 +03:00
"justifyMode" : "auto" ,
2026-02-02 16:16:37 +03:00
"orientation" : "auto" ,
2025-09-16 17:02:17 +03:00
"percentChangeColorMode" : "standard" ,
"reduceOptions" : {
"calcs" : [
2026-02-02 16:16:37 +03:00
"last"
2025-09-16 17:02:17 +03:00
] ,
"fields" : "" ,
"values" : false
} ,
"showPercentChange" : false ,
2026-02-02 16:16:37 +03:00
"text" : { } ,
"textMode" : "value" ,
2025-09-16 17:02:17 +03:00
"wideLayout" : true
} ,
"pluginVersion" : "12.1.0" ,
"targets" : [
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
2026-02-02 16:16:37 +03:00
"exemplar" : true ,
"expr" : "nvidia_smi_pstate{uuid=\"$gpu\"}" ,
"interval" : "" ,
"legendFormat" : "" ,
"refId" : "A"
2025-09-16 17:02:17 +03:00
}
] ,
2026-02-02 16:16:37 +03:00
"title" : "P-State" ,
2025-09-16 17:02:17 +03:00
"type" : "stat"
} ,
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
2026-02-02 16:16:37 +03:00
"description" : "Percent of time over the past sample period during which one or more kernels was executing on the GPU.\nThe sample period may be between 1 second and 1/6 second depending on the product." ,
2025-09-16 17:02:17 +03:00
"fieldConfig" : {
"defaults" : {
"color" : {
2026-02-02 16:16:37 +03:00
"mode" : "thresholds"
2025-09-16 17:02:17 +03:00
} ,
2026-02-02 16:16:37 +03:00
"mappings" : [ ] ,
"max" : 1 ,
"min" : 0 ,
2025-09-16 17:02:17 +03:00
"thresholds" : {
2026-02-02 16:16:37 +03:00
"mode" : "percentage" ,
2025-09-16 17:02:17 +03:00
"steps" : [
{
2026-02-02 16:16:37 +03:00
"color" : "green" ,
2025-09-16 17:02:17 +03:00
"value" : 0
} ,
{
2026-02-02 16:16:37 +03:00
"color" : "#EAB839" ,
"value" : 70
2025-09-16 17:02:17 +03:00
} ,
{
2026-02-02 16:16:37 +03:00
"color" : "red" ,
"value" : 90
2025-09-16 17:02:17 +03:00
}
]
} ,
"unit" : "percentunit"
} ,
"overrides" : [ ]
} ,
"gridPos" : {
2026-02-02 16:16:37 +03:00
"h" : 5 ,
"w" : 3 ,
"x" : 6 ,
2025-09-16 17:02:17 +03:00
"y" : 0
} ,
2026-02-02 16:16:37 +03:00
"id" : 6 ,
2025-09-16 17:02:17 +03:00
"options" : {
2026-02-02 16:16:37 +03:00
"minVizHeight" : 75 ,
"minVizWidth" : 75 ,
"orientation" : "auto" ,
2025-09-16 17:02:17 +03:00
"reduceOptions" : {
"calcs" : [
2026-02-02 16:16:37 +03:00
"last"
2025-09-16 17:02:17 +03:00
] ,
"fields" : "" ,
"values" : false
} ,
2026-02-02 16:16:37 +03:00
"showThresholdLabels" : false ,
"showThresholdMarkers" : true ,
"sizing" : "auto" ,
"text" : { }
2025-09-16 17:02:17 +03:00
} ,
"pluginVersion" : "12.1.0" ,
"targets" : [
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
2026-02-02 16:16:37 +03:00
"exemplar" : true ,
"expr" : "nvidia_smi_utilization_gpu_ratio{uuid=\"$gpu\"}" ,
"interval" : "" ,
"legendFormat" : "{{uuid}}" ,
"refId" : "A"
2025-09-16 17:02:17 +03:00
}
] ,
2026-02-02 16:16:37 +03:00
"title" : "GPU Utilization %" ,
"type" : "gauge"
2025-09-16 17:02:17 +03:00
} ,
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
2026-02-02 16:16:37 +03:00
"description" : "The last measured power draw for the entire board, in watts, divided by the default power limit, in watts. Only available if power management is supported. The power draw reading is accurate to within +/- 5 watts." ,
2025-09-16 17:02:17 +03:00
"fieldConfig" : {
"defaults" : {
"color" : {
2026-02-02 16:16:37 +03:00
"mode" : "thresholds"
2025-09-16 17:02:17 +03:00
} ,
2026-02-02 16:16:37 +03:00
"mappings" : [ ] ,
"max" : 1 ,
"min" : 0 ,
2025-09-16 17:02:17 +03:00
"thresholds" : {
2026-02-02 16:16:37 +03:00
"mode" : "percentage" ,
2025-09-16 17:02:17 +03:00
"steps" : [
{
"color" : "green" ,
"value" : 0
} ,
2026-02-02 16:16:37 +03:00
{
"color" : "#EAB839" ,
"value" : 70
} ,
2025-09-16 17:02:17 +03:00
{
"color" : "red" ,
2026-02-02 16:16:37 +03:00
"value" : 90
2025-09-16 17:02:17 +03:00
}
]
} ,
2026-02-02 16:16:37 +03:00
"unit" : "percentunit"
2025-09-16 17:02:17 +03:00
} ,
"overrides" : [ ]
} ,
"gridPos" : {
2026-02-02 16:16:37 +03:00
"h" : 5 ,
2025-09-16 17:02:17 +03:00
"w" : 3 ,
2026-02-02 16:16:37 +03:00
"x" : 9 ,
2025-09-16 17:02:17 +03:00
"y" : 0
} ,
2026-02-02 16:16:37 +03:00
"id" : 21 ,
2025-09-16 17:02:17 +03:00
"options" : {
2026-02-02 16:16:37 +03:00
"minVizHeight" : 75 ,
"minVizWidth" : 75 ,
"orientation" : "auto" ,
2025-09-16 17:02:17 +03:00
"reduceOptions" : {
"calcs" : [
2026-02-02 16:16:37 +03:00
"last"
2025-09-16 17:02:17 +03:00
] ,
"fields" : "" ,
"values" : false
} ,
2026-02-02 16:16:37 +03:00
"showThresholdLabels" : false ,
"showThresholdMarkers" : true ,
"sizing" : "auto" ,
"text" : { }
2025-09-16 17:02:17 +03:00
} ,
"pluginVersion" : "12.1.0" ,
"targets" : [
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
2026-02-02 16:16:37 +03:00
"exemplar" : true ,
"expr" : "nvidia_smi_power_draw_watts{uuid=\"$gpu\"} / nvidia_smi_power_default_limit_watts{uuid=\"$gpu\"}" ,
"interval" : "" ,
"legendFormat" : "" ,
"refId" : "A"
2025-09-16 17:02:17 +03:00
}
] ,
2026-02-02 16:16:37 +03:00
"title" : "Power Draw %" ,
"type" : "gauge"
2025-09-16 17:02:17 +03:00
} ,
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
2026-02-02 16:16:37 +03:00
"description" : "The fan speed value is the percent of the product's maximum noise tolerance fan speed that the device's fan is currently intended to run at. This value may exceed 100% in certain cases. Note: The reported speed is the intended fan speed. If the fan is physically blocked and unable to spin, this output will not match the actual fan speed. Many parts do not report fan speeds because they rely on cooling via fans in the surrounding enclosure.\n" ,
2025-09-16 17:02:17 +03:00
"fieldConfig" : {
"defaults" : {
"color" : {
2026-02-02 16:16:37 +03:00
"mode" : "thresholds"
2025-09-16 17:02:17 +03:00
} ,
2026-02-02 16:16:37 +03:00
"mappings" : [ ] ,
"max" : 1 ,
"min" : 0 ,
2025-09-16 17:02:17 +03:00
"thresholds" : {
2026-02-02 16:16:37 +03:00
"mode" : "percentage" ,
2025-09-16 17:02:17 +03:00
"steps" : [
{
"color" : "green" ,
"value" : 0
} ,
2026-02-02 16:16:37 +03:00
{
"color" : "#EAB839" ,
"value" : 70
} ,
2025-09-16 17:02:17 +03:00
{
"color" : "red" ,
2026-02-02 16:16:37 +03:00
"value" : 90
2025-09-16 17:02:17 +03:00
}
]
} ,
2026-02-02 16:16:37 +03:00
"unit" : "percentunit"
2025-09-16 17:02:17 +03:00
} ,
"overrides" : [ ]
} ,
"gridPos" : {
2026-02-02 16:16:37 +03:00
"h" : 5 ,
2025-09-16 17:02:17 +03:00
"w" : 3 ,
2026-02-02 16:16:37 +03:00
"x" : 12 ,
2025-09-16 17:02:17 +03:00
"y" : 0
} ,
2026-02-02 16:16:37 +03:00
"id" : 4 ,
2025-09-16 17:02:17 +03:00
"options" : {
2026-02-02 16:16:37 +03:00
"minVizHeight" : 75 ,
"minVizWidth" : 75 ,
"orientation" : "auto" ,
2025-09-16 17:02:17 +03:00
"reduceOptions" : {
"calcs" : [
2026-02-02 16:16:37 +03:00
"last"
2025-09-16 17:02:17 +03:00
] ,
"fields" : "" ,
"values" : false
} ,
2026-02-02 16:16:37 +03:00
"showThresholdLabels" : false ,
"showThresholdMarkers" : true ,
"sizing" : "auto" ,
"text" : { }
2025-09-16 17:02:17 +03:00
} ,
"pluginVersion" : "12.1.0" ,
"targets" : [
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
2026-02-02 16:16:37 +03:00
"exemplar" : true ,
"expr" : "nvidia_smi_fan_speed_ratio{uuid=\"$gpu\"}" ,
"interval" : "" ,
"legendFormat" : "" ,
"refId" : "A"
2025-09-16 17:02:17 +03:00
}
] ,
2026-02-02 16:16:37 +03:00
"title" : "Fan Speed %" ,
"type" : "gauge"
2025-09-16 17:02:17 +03:00
} ,
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
2026-02-02 16:16:37 +03:00
"description" : "Core GPU temperature, in degrees C." ,
2025-09-16 17:02:17 +03:00
"fieldConfig" : {
"defaults" : {
"color" : {
2026-02-02 16:16:37 +03:00
"mode" : "thresholds"
2025-09-16 17:02:17 +03:00
} ,
"mappings" : [ ] ,
2026-02-02 16:16:37 +03:00
"max" : 100 ,
"min" : 0 ,
2025-09-16 17:02:17 +03:00
"thresholds" : {
"mode" : "absolute" ,
"steps" : [
{
"color" : "green" ,
"value" : 0
} ,
2026-02-02 16:16:37 +03:00
{
"color" : "#EAB839" ,
"value" : 70
} ,
2025-09-16 17:02:17 +03:00
{
"color" : "red" ,
"value" : 80
}
]
} ,
2026-02-02 16:16:37 +03:00
"unit" : "celsius"
2025-09-16 17:02:17 +03:00
} ,
2026-02-02 16:16:37 +03:00
"overrides" : [ ]
2025-09-16 17:02:17 +03:00
} ,
"gridPos" : {
2026-02-02 16:16:37 +03:00
"h" : 5 ,
"w" : 3 ,
"x" : 15 ,
"y" : 0
2025-09-16 17:02:17 +03:00
} ,
2026-02-02 16:16:37 +03:00
"id" : 16 ,
2025-09-16 17:02:17 +03:00
"options" : {
2026-02-02 16:16:37 +03:00
"minVizHeight" : 75 ,
"minVizWidth" : 75 ,
"orientation" : "auto" ,
"reduceOptions" : {
2025-09-16 17:02:17 +03:00
"calcs" : [
2026-02-02 16:16:37 +03:00
"last"
2025-09-16 17:02:17 +03:00
] ,
2026-02-02 16:16:37 +03:00
"fields" : "" ,
"values" : false
2025-09-16 17:02:17 +03:00
} ,
2026-02-02 16:16:37 +03:00
"showThresholdLabels" : false ,
"showThresholdMarkers" : true ,
"sizing" : "auto" ,
"text" : { }
2025-09-16 17:02:17 +03:00
} ,
"pluginVersion" : "12.1.0" ,
"targets" : [
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
2026-02-02 16:16:37 +03:00
"exemplar" : true ,
"expr" : "nvidia_smi_temperature_gpu{uuid=\"$gpu\"}" ,
2025-09-16 17:02:17 +03:00
"interval" : "" ,
2026-02-02 16:16:37 +03:00
"legendFormat" : "{{uuid}}" ,
"refId" : "A"
2025-09-16 17:02:17 +03:00
}
] ,
2026-02-02 16:16:37 +03:00
"title" : "Temperature" ,
"type" : "gauge"
2025-09-16 17:02:17 +03:00
} ,
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
2026-02-02 16:16:37 +03:00
"description" : "Percent of time over the past sample period during which global (device) memory was being read or written.\nThe sample period may be between 1 second and 1/6 second depending on the product." ,
2025-09-16 17:02:17 +03:00
"fieldConfig" : {
"defaults" : {
"color" : {
"mode" : "palette-classic"
} ,
"custom" : {
"axisBorderShow" : false ,
"axisCenteredZero" : false ,
"axisColorMode" : "text" ,
"axisLabel" : "" ,
"axisPlacement" : "auto" ,
"barAlignment" : 0 ,
"barWidthFactor" : 0.6 ,
"drawStyle" : "line" ,
2026-02-02 16:16:37 +03:00
"fillOpacity" : 10 ,
2025-09-16 17:02:17 +03:00
"gradientMode" : "none" ,
"hideFrom" : {
"legend" : false ,
"tooltip" : false ,
"viz" : false
} ,
"insertNulls" : false ,
"lineInterpolation" : "linear" ,
2026-02-02 16:16:37 +03:00
"lineWidth" : 1 ,
2025-09-16 17:02:17 +03:00
"pointSize" : 5 ,
"scaleDistribution" : {
"type" : "linear"
} ,
"showPoints" : "never" ,
2026-02-02 16:16:37 +03:00
"spanNulls" : false ,
2025-09-16 17:02:17 +03:00
"stacking" : {
"group" : "A" ,
"mode" : "none"
} ,
"thresholdsStyle" : {
2026-02-02 16:16:37 +03:00
"mode" : "line+area"
2025-09-16 17:02:17 +03:00
}
} ,
"mappings" : [ ] ,
2026-02-02 16:16:37 +03:00
"max" : 1 ,
"min" : 0 ,
2025-09-16 17:02:17 +03:00
"thresholds" : {
"mode" : "absolute" ,
"steps" : [
{
2026-02-02 16:16:37 +03:00
"color" : "transparent" ,
2025-09-16 17:02:17 +03:00
"value" : 0
} ,
2026-02-02 16:16:37 +03:00
{
"color" : "orange" ,
"value" : 0.7
} ,
2025-09-16 17:02:17 +03:00
{
"color" : "red" ,
2026-02-02 16:16:37 +03:00
"value" : 0.9
2025-09-16 17:02:17 +03:00
}
]
} ,
"unit" : "percentunit"
} ,
2026-02-02 16:16:37 +03:00
"overrides" : [ ]
2025-09-16 17:02:17 +03:00
} ,
"gridPos" : {
2026-02-02 16:16:37 +03:00
"h" : 5 ,
"w" : 6 ,
"x" : 18 ,
"y" : 0
2025-09-16 17:02:17 +03:00
} ,
2026-02-02 16:16:37 +03:00
"id" : 11 ,
2025-09-16 17:02:17 +03:00
"options" : {
"legend" : {
2026-02-02 16:16:37 +03:00
"calcs" : [ ] ,
"displayMode" : "list" ,
"placement" : "bottom" ,
"showLegend" : false
2025-09-16 17:02:17 +03:00
} ,
"tooltip" : {
"hideZeros" : false ,
"mode" : "multi" ,
2026-02-02 16:16:37 +03:00
"sort" : "none"
2025-09-16 17:02:17 +03:00
}
} ,
"pluginVersion" : "12.1.0" ,
"targets" : [
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
2026-02-02 16:16:37 +03:00
"exemplar" : true ,
"expr" : "nvidia_smi_utilization_memory_ratio{uuid=\"$gpu\"}" ,
"interval" : "" ,
"legendFormat" : "{{uuid}}" ,
"refId" : "A"
2025-09-16 17:02:17 +03:00
}
] ,
2026-02-02 16:16:37 +03:00
"title" : "Memory Utilization %" ,
2025-09-16 17:02:17 +03:00
"type" : "timeseries"
} ,
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
2026-02-02 16:16:37 +03:00
"description" : "The version of the installed NVIDIA display driver. This is an alphanumeric string." ,
2025-09-16 17:02:17 +03:00
"fieldConfig" : {
"defaults" : {
"color" : {
2026-02-02 16:16:37 +03:00
"mode" : "thresholds"
} ,
"decimals" : 2 ,
"mappings" : [ ] ,
"thresholds" : {
"mode" : "absolute" ,
"steps" : [
{
"color" : "green" ,
"value" : 0
}
]
} ,
"unit" : "none"
} ,
"overrides" : [ ]
} ,
"gridPos" : {
"h" : 2 ,
"w" : 3 ,
"x" : 0 ,
"y" : 3
} ,
"id" : 14 ,
"options" : {
"colorMode" : "value" ,
"graphMode" : "none" ,
"justifyMode" : "auto" ,
"orientation" : "auto" ,
"percentChangeColorMode" : "standard" ,
"reduceOptions" : {
"calcs" : [
"last"
] ,
"fields" : "" ,
"values" : false
} ,
"showPercentChange" : false ,
"text" : { } ,
"textMode" : "name" ,
"wideLayout" : true
} ,
"pluginVersion" : "12.1.0" ,
"targets" : [
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
"exemplar" : true ,
"expr" : "nvidia_smi_gpu_info{uuid=\"$gpu\"}" ,
"instant" : true ,
"interval" : "" ,
"legendFormat" : "{{driver_version}}" ,
"refId" : "A"
}
] ,
"title" : "Driver Version" ,
"type" : "stat"
} ,
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
"description" : "The BIOS of the GPU board." ,
"fieldConfig" : {
"defaults" : {
"color" : {
"mode" : "thresholds"
} ,
"decimals" : 2 ,
"mappings" : [ ] ,
"thresholds" : {
"mode" : "absolute" ,
"steps" : [
{
"color" : "green" ,
"value" : 0
}
]
} ,
"unit" : "none"
} ,
"overrides" : [ ]
} ,
"gridPos" : {
"h" : 2 ,
"w" : 3 ,
"x" : 3 ,
"y" : 3
} ,
"id" : 34 ,
"options" : {
"colorMode" : "value" ,
"graphMode" : "none" ,
"justifyMode" : "auto" ,
"orientation" : "auto" ,
"percentChangeColorMode" : "standard" ,
"reduceOptions" : {
"calcs" : [
"last"
] ,
"fields" : "" ,
"values" : false
} ,
"showPercentChange" : false ,
"text" : { } ,
"textMode" : "name" ,
"wideLayout" : true
} ,
"pluginVersion" : "12.1.0" ,
"targets" : [
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
"exemplar" : true ,
"expr" : "nvidia_smi_gpu_info{uuid=\"$gpu\"}" ,
"instant" : true ,
"interval" : "" ,
"legendFormat" : "{{vbios_version}}" ,
"refId" : "A"
}
] ,
"title" : "Vbios Version" ,
"type" : "stat"
} ,
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
"description" : "Information about factors that are reducing the frequency of clocks. If all throttle reasons are returned as \"Not Active\" it means that clocks are running as high as possible." ,
"fieldConfig" : {
"defaults" : {
"color" : {
"mode" : "thresholds"
} ,
"decimals" : 0 ,
"mappings" : [
{
"options" : {
"0" : {
"text" : "Not Active"
} ,
"1" : {
"text" : "Active"
}
} ,
"type" : "value"
}
] ,
"thresholds" : {
"mode" : "absolute" ,
"steps" : [
{
"color" : "green" ,
"value" : 0
}
]
} ,
"unit" : "none"
} ,
"overrides" : [ ]
} ,
"gridPos" : {
"h" : 5 ,
"w" : 6 ,
"x" : 0 ,
"y" : 5
} ,
"id" : 32 ,
"options" : {
"displayMode" : "gradient" ,
"legend" : {
"calcs" : [ ] ,
"displayMode" : "list" ,
"placement" : "bottom" ,
"showLegend" : false
} ,
"maxVizHeight" : 300 ,
"minVizHeight" : 16 ,
"minVizWidth" : 8 ,
"namePlacement" : "auto" ,
"orientation" : "horizontal" ,
"reduceOptions" : {
"calcs" : [
"last"
] ,
"fields" : "" ,
"values" : false
} ,
"showUnfilled" : true ,
"sizing" : "auto" ,
"text" : { } ,
"valueMode" : "color"
} ,
"pluginVersion" : "12.1.0" ,
"targets" : [
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
"exemplar" : true ,
"expr" : "nvidia_smi_clocks_event_reasons_gpu_idle{uuid=\"$gpu\"} or nvidia_smi_clocks_throttle_reasons_gpu_idle{uuid=\"$gpu\"}" ,
"instant" : false ,
"interval" : "" ,
"legendFormat" : "Idle" ,
"refId" : "A"
} ,
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
"exemplar" : true ,
"expr" : "nvidia_smi_clocks_event_reasons_hw_thermal_slowdown{uuid=\"$gpu\"} or nvidia_smi_clocks_throttle_reasons_hw_thermal_slowdown{uuid=\"$gpu\"}" ,
"hide" : false ,
"interval" : "" ,
"legendFormat" : "HW Thermal Slowdown" ,
"refId" : "B"
} ,
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
"exemplar" : true ,
"expr" : "nvidia_smi_clocks_event_reasons_sw_power_cap{uuid=\"$gpu\"} or nvidia_smi_clocks_throttle_reasons_sw_power_cap{uuid=\"$gpu\"}" ,
"hide" : false ,
"interval" : "" ,
"legendFormat" : "SW Power Cap" ,
"refId" : "C"
} ,
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
"exemplar" : true ,
"expr" : "nvidia_smi_clocks_event_reasons_applications_clocks_setting{uuid=\"$gpu\"} or nvidia_smi_clocks_throttle_reasons_applications_clocks_setting{uuid=\"$gpu\"}" ,
"hide" : false ,
"interval" : "" ,
"legendFormat" : "App Clocks Setting" ,
"refId" : "D"
} ,
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
"exemplar" : true ,
"expr" : "nvidia_smi_clocks_event_reasons_hw_power_brake_slowdown{uuid=\"$gpu\"} or nvidia_smi_clocks_throttle_reasons_hw_power_brake_slowdown{uuid=\"$gpu\"}" ,
"hide" : false ,
"interval" : "" ,
"legendFormat" : "HW Power Brake" ,
"refId" : "E"
} ,
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
"exemplar" : true ,
"expr" : "nvidia_smi_clocks_event_reasons_sw_thermal_slowdown{uuid=\"$gpu\"} or nvidia_smi_clocks_throttle_reasons_sw_thermal_slowdown{uuid=\"$gpu\"}" ,
"hide" : false ,
"interval" : "" ,
"legendFormat" : "SW Thermal Slowdown" ,
"refId" : "F"
} ,
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
"exemplar" : true ,
"expr" : "nvidia_smi_clocks_event_reasons_sync_boost{uuid=\"$gpu\"} or nvidia_smi_clocks_throttle_reasons_sync_boost{uuid=\"$gpu\"}" ,
"hide" : false ,
"interval" : "" ,
"legendFormat" : "Sync Boost" ,
"refId" : "G"
}
] ,
"title" : "Throttle Reasons" ,
"type" : "bargauge"
} ,
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
"description" : "Current frequency of graphics (shader) clock\n/\nMaximum frequency of graphics (shader) clock.\n" ,
"fieldConfig" : {
"defaults" : {
"color" : {
"mode" : "thresholds"
} ,
"mappings" : [ ] ,
"max" : 1 ,
"min" : 0 ,
"thresholds" : {
"mode" : "percentage" ,
"steps" : [
{
"color" : "green" ,
"value" : 0
} ,
{
"color" : "#EAB839" ,
"value" : 70
} ,
{
"color" : "red" ,
"value" : 90
}
]
} ,
"unit" : "percentunit"
} ,
"overrides" : [ ]
} ,
"gridPos" : {
"h" : 5 ,
"w" : 3 ,
"x" : 6 ,
"y" : 5
} ,
"id" : 20 ,
"options" : {
"minVizHeight" : 75 ,
"minVizWidth" : 75 ,
"orientation" : "auto" ,
"reduceOptions" : {
"calcs" : [
"last"
] ,
"fields" : "" ,
"values" : false
} ,
"showThresholdLabels" : false ,
"showThresholdMarkers" : true ,
"sizing" : "auto" ,
"text" : { }
} ,
"pluginVersion" : "12.1.0" ,
"targets" : [
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
"exemplar" : true ,
"expr" : "nvidia_smi_clocks_current_graphics_clock_hz{uuid=\"$gpu\"} / nvidia_smi_clocks_max_graphics_clock_hz{uuid=\"$gpu\"}" ,
"interval" : "" ,
"legendFormat" : "" ,
"refId" : "A"
}
] ,
"title" : "GPU Clock Speed %" ,
"type" : "gauge"
} ,
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
"description" : "Current frequency of memory clock / Maximum frequency of memory clock" ,
"fieldConfig" : {
"defaults" : {
"color" : {
"mode" : "thresholds"
} ,
"mappings" : [ ] ,
"max" : 1 ,
"min" : 0 ,
"thresholds" : {
"mode" : "percentage" ,
"steps" : [
{
"color" : "green" ,
"value" : 0
} ,
{
"color" : "#EAB839" ,
"value" : 70
} ,
{
"color" : "red" ,
"value" : 90
}
]
} ,
"unit" : "percentunit"
} ,
"overrides" : [ ]
} ,
"gridPos" : {
"h" : 5 ,
"w" : 3 ,
"x" : 9 ,
"y" : 5
} ,
"id" : 33 ,
"options" : {
"minVizHeight" : 75 ,
"minVizWidth" : 75 ,
"orientation" : "auto" ,
"reduceOptions" : {
"calcs" : [
"last"
] ,
"fields" : "" ,
"values" : false
} ,
"showThresholdLabels" : false ,
"showThresholdMarkers" : true ,
"sizing" : "auto" ,
"text" : { }
} ,
"pluginVersion" : "12.1.0" ,
"targets" : [
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
"exemplar" : true ,
"expr" : "nvidia_smi_clocks_current_memory_clock_hz{uuid=\"$gpu\"} / nvidia_smi_clocks_max_memory_clock_hz{uuid=\"$gpu\"}" ,
"interval" : "" ,
"legendFormat" : "" ,
"refId" : "A"
}
] ,
"title" : "Memory Clock Speed %" ,
"type" : "gauge"
} ,
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
"description" : "Total memory allocated by active contexts / Total installed GPU memory." ,
"fieldConfig" : {
"defaults" : {
"color" : {
"mode" : "thresholds"
} ,
"mappings" : [ ] ,
"max" : 1 ,
"min" : 0 ,
"thresholds" : {
"mode" : "percentage" ,
"steps" : [
{
"color" : "green" ,
"value" : 0
} ,
{
"color" : "#EAB839" ,
"value" : 70
} ,
{
"color" : "red" ,
"value" : 90
}
]
} ,
"unit" : "percentunit"
} ,
"overrides" : [ ]
} ,
"gridPos" : {
"h" : 5 ,
"w" : 3 ,
"x" : 12 ,
"y" : 5
} ,
"id" : 25 ,
"options" : {
"minVizHeight" : 75 ,
"minVizWidth" : 75 ,
"orientation" : "auto" ,
"reduceOptions" : {
"calcs" : [
"last"
] ,
"fields" : "" ,
"values" : false
} ,
"showThresholdLabels" : false ,
"showThresholdMarkers" : true ,
"sizing" : "auto" ,
"text" : { }
} ,
"pluginVersion" : "12.1.0" ,
"targets" : [
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
"exemplar" : true ,
"expr" : "nvidia_smi_memory_used_bytes{uuid=\"$gpu\"} / nvidia_smi_memory_total_bytes{uuid=\"$gpu\"}" ,
"interval" : "" ,
"legendFormat" : "" ,
"refId" : "A"
}
] ,
"title" : "Memory Allocation %" ,
"type" : "gauge"
} ,
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
"description" : "Percent of time over the past sample period during which global (device) memory was being read or written.\nThe sample period may be between 1 second and 1/6 second depending on the product." ,
"fieldConfig" : {
"defaults" : {
"color" : {
"mode" : "thresholds"
} ,
"mappings" : [ ] ,
"max" : 1 ,
"min" : 0 ,
"thresholds" : {
"mode" : "percentage" ,
"steps" : [
{
"color" : "green" ,
"value" : 0
} ,
{
"color" : "#EAB839" ,
"value" : 70
} ,
{
"color" : "red" ,
"value" : 90
}
]
} ,
"unit" : "percentunit"
} ,
"overrides" : [ ]
} ,
"gridPos" : {
"h" : 5 ,
"w" : 3 ,
"x" : 15 ,
"y" : 5
} ,
"id" : 7 ,
"options" : {
"minVizHeight" : 75 ,
"minVizWidth" : 75 ,
"orientation" : "auto" ,
"reduceOptions" : {
"calcs" : [
"last"
] ,
"fields" : "" ,
"values" : false
} ,
"showThresholdLabels" : false ,
"showThresholdMarkers" : true ,
"sizing" : "auto" ,
"text" : { }
} ,
"pluginVersion" : "12.1.0" ,
"targets" : [
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
"exemplar" : true ,
"expr" : "nvidia_smi_utilization_memory_ratio{uuid=\"$gpu\"}" ,
"interval" : "" ,
"legendFormat" : "" ,
"refId" : "A"
}
] ,
"title" : "Memory Utilization %" ,
"type" : "gauge"
} ,
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
"description" : "Percent of time over the past sample period during which one or more kernels was executing on the GPU.\nThe sample period may be between 1 second and 1/6 second depending on the product." ,
"fieldConfig" : {
"defaults" : {
"color" : {
"mode" : "palette-classic"
} ,
"custom" : {
"axisBorderShow" : false ,
"axisCenteredZero" : false ,
"axisColorMode" : "text" ,
"axisLabel" : "" ,
"axisPlacement" : "auto" ,
"barAlignment" : 0 ,
"barWidthFactor" : 0.6 ,
"drawStyle" : "line" ,
"fillOpacity" : 10 ,
"gradientMode" : "none" ,
"hideFrom" : {
"legend" : false ,
"tooltip" : false ,
"viz" : false
} ,
"insertNulls" : false ,
"lineInterpolation" : "linear" ,
"lineWidth" : 1 ,
"pointSize" : 5 ,
"scaleDistribution" : {
"type" : "linear"
} ,
"showPoints" : "never" ,
"spanNulls" : false ,
"stacking" : {
"group" : "A" ,
"mode" : "none"
} ,
"thresholdsStyle" : {
"mode" : "line+area"
}
} ,
"mappings" : [ ] ,
"max" : 1 ,
"min" : 0 ,
"thresholds" : {
"mode" : "absolute" ,
"steps" : [
{
"color" : "transparent" ,
"value" : 0
} ,
{
"color" : "orange" ,
"value" : 0.7
} ,
{
"color" : "red" ,
"value" : 0.9
}
]
} ,
"unit" : "percentunit"
} ,
"overrides" : [ ]
} ,
"gridPos" : {
"h" : 5 ,
"w" : 6 ,
"x" : 18 ,
"y" : 5
} ,
"id" : 10 ,
"options" : {
"legend" : {
"calcs" : [ ] ,
"displayMode" : "list" ,
"placement" : "bottom" ,
"showLegend" : false
} ,
"tooltip" : {
"hideZeros" : false ,
"mode" : "multi" ,
"sort" : "none"
}
} ,
"pluginVersion" : "12.1.0" ,
"targets" : [
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
"exemplar" : true ,
"expr" : "nvidia_smi_utilization_gpu_ratio{uuid=\"$gpu\"}" ,
"interval" : "" ,
"legendFormat" : "" ,
"refId" : "A"
}
] ,
"title" : "GPU Utilization %" ,
"type" : "timeseries"
} ,
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
"description" : "Total memory allocated by active contexts." ,
"fieldConfig" : {
"defaults" : {
"color" : {
"mode" : "palette-classic"
} ,
"custom" : {
"axisBorderShow" : false ,
"axisCenteredZero" : false ,
"axisColorMode" : "text" ,
"axisLabel" : "" ,
"axisPlacement" : "auto" ,
"barAlignment" : 0 ,
"barWidthFactor" : 0.6 ,
"drawStyle" : "line" ,
"fillOpacity" : 10 ,
"gradientMode" : "none" ,
"hideFrom" : {
"legend" : false ,
"tooltip" : false ,
"viz" : false
} ,
"insertNulls" : false ,
"lineInterpolation" : "linear" ,
"lineWidth" : 1 ,
"pointSize" : 5 ,
"scaleDistribution" : {
"type" : "linear"
} ,
"showPoints" : "never" ,
"spanNulls" : false ,
"stacking" : {
"group" : "A" ,
"mode" : "none"
} ,
"thresholdsStyle" : {
"mode" : "off"
}
} ,
"mappings" : [ ] ,
"min" : 0 ,
"thresholds" : {
"mode" : "absolute" ,
"steps" : [
{
"color" : "green" ,
"value" : 0
} ,
{
"color" : "red" ,
"value" : 80
}
]
} ,
"unit" : "decbytes"
} ,
"overrides" : [ ]
} ,
"gridPos" : {
"h" : 5 ,
"w" : 6 ,
"x" : 0 ,
"y" : 10
} ,
"id" : 17 ,
"options" : {
"legend" : {
"calcs" : [ ] ,
"displayMode" : "list" ,
"placement" : "bottom" ,
"showLegend" : false
} ,
"tooltip" : {
"hideZeros" : false ,
"mode" : "multi" ,
"sort" : "none"
}
} ,
"pluginVersion" : "12.1.0" ,
"targets" : [
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
"exemplar" : true ,
"expr" : "nvidia_smi_memory_used_bytes{uuid=\"$gpu\"}" ,
"interval" : "" ,
"legendFormat" : "{{uuid}}" ,
"refId" : "A"
}
] ,
"title" : "Memory Allocation" ,
"type" : "timeseries"
} ,
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
"description" : "Core GPU temperature, in degrees C." ,
"fieldConfig" : {
"defaults" : {
"color" : {
"mode" : "palette-classic"
2025-09-16 17:02:17 +03:00
} ,
"custom" : {
"axisBorderShow" : false ,
"axisCenteredZero" : false ,
"axisColorMode" : "text" ,
"axisLabel" : "" ,
"axisPlacement" : "auto" ,
"barAlignment" : 0 ,
"barWidthFactor" : 0.6 ,
"drawStyle" : "line" ,
"fillOpacity" : 10 ,
"gradientMode" : "none" ,
"hideFrom" : {
"legend" : false ,
"tooltip" : false ,
"viz" : false
} ,
"insertNulls" : false ,
"lineInterpolation" : "linear" ,
2026-02-02 16:16:37 +03:00
"lineWidth" : 1 ,
2025-09-16 17:02:17 +03:00
"pointSize" : 5 ,
"scaleDistribution" : {
"type" : "linear"
} ,
"showPoints" : "never" ,
2026-02-02 16:16:37 +03:00
"spanNulls" : false ,
2025-09-16 17:02:17 +03:00
"stacking" : {
"group" : "A" ,
"mode" : "none"
} ,
"thresholdsStyle" : {
2026-02-02 16:16:37 +03:00
"mode" : "line+area"
2025-09-16 17:02:17 +03:00
}
} ,
"mappings" : [ ] ,
2026-02-02 16:16:37 +03:00
"max" : 100 ,
"min" : 0 ,
2025-09-16 17:02:17 +03:00
"thresholds" : {
"mode" : "absolute" ,
"steps" : [
{
2026-02-02 16:16:37 +03:00
"color" : "transparent" ,
2025-09-16 17:02:17 +03:00
"value" : 0
} ,
2026-02-02 16:16:37 +03:00
{
"color" : "orange" ,
"value" : 70
} ,
2025-09-16 17:02:17 +03:00
{
"color" : "red" ,
"value" : 80
}
]
} ,
2026-02-02 16:16:37 +03:00
"unit" : "celsius"
2025-09-16 17:02:17 +03:00
} ,
"overrides" : [ ]
} ,
"gridPos" : {
2026-02-02 16:16:37 +03:00
"h" : 5 ,
"w" : 6 ,
"x" : 6 ,
2025-09-16 17:02:17 +03:00
"y" : 10
} ,
2026-02-02 16:16:37 +03:00
"id" : 15 ,
2025-09-16 17:02:17 +03:00
"options" : {
"legend" : {
2026-02-02 16:16:37 +03:00
"calcs" : [ ] ,
2025-09-16 17:02:17 +03:00
"displayMode" : "list" ,
"placement" : "bottom" ,
2026-02-02 16:16:37 +03:00
"showLegend" : false
2025-09-16 17:02:17 +03:00
} ,
"tooltip" : {
"hideZeros" : false ,
"mode" : "multi" ,
"sort" : "none"
}
} ,
"pluginVersion" : "12.1.0" ,
"targets" : [
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
2026-02-02 16:16:37 +03:00
"exemplar" : true ,
"expr" : "nvidia_smi_temperature_gpu{uuid=\"$gpu\"}" ,
"interval" : "" ,
"legendFormat" : "{{uuid}}" ,
"refId" : "A"
2025-09-16 17:02:17 +03:00
}
] ,
2026-02-02 16:16:37 +03:00
"title" : "Temperature" ,
2025-09-16 17:02:17 +03:00
"type" : "timeseries"
} ,
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
2026-02-02 16:16:37 +03:00
"description" : "The last measured power draw for the entire board, in watts. Only available if power management is supported. This reading is accurate to within +/- 5 watts." ,
2025-09-16 17:02:17 +03:00
"fieldConfig" : {
"defaults" : {
"color" : {
"mode" : "palette-classic"
} ,
"custom" : {
"axisBorderShow" : false ,
"axisCenteredZero" : false ,
"axisColorMode" : "text" ,
"axisLabel" : "" ,
"axisPlacement" : "auto" ,
"barAlignment" : 0 ,
"barWidthFactor" : 0.6 ,
"drawStyle" : "line" ,
2026-02-02 16:16:37 +03:00
"fillOpacity" : 10 ,
2025-09-16 17:02:17 +03:00
"gradientMode" : "none" ,
"hideFrom" : {
"legend" : false ,
"tooltip" : false ,
"viz" : false
} ,
"insertNulls" : false ,
"lineInterpolation" : "linear" ,
2026-02-02 16:16:37 +03:00
"lineWidth" : 1 ,
2025-09-16 17:02:17 +03:00
"pointSize" : 5 ,
"scaleDistribution" : {
"type" : "linear"
} ,
"showPoints" : "never" ,
2026-02-02 16:16:37 +03:00
"spanNulls" : false ,
2025-09-16 17:02:17 +03:00
"stacking" : {
"group" : "A" ,
"mode" : "none"
} ,
"thresholdsStyle" : {
"mode" : "off"
}
} ,
"mappings" : [ ] ,
2026-02-02 16:16:37 +03:00
"min" : 0 ,
2025-09-16 17:02:17 +03:00
"thresholds" : {
"mode" : "absolute" ,
"steps" : [
{
"color" : "green" ,
"value" : 0
} ,
{
"color" : "red" ,
"value" : 80
}
]
} ,
2026-02-02 16:16:37 +03:00
"unit" : "watt"
2025-09-16 17:02:17 +03:00
} ,
2026-02-02 16:16:37 +03:00
"overrides" : [ ]
2025-09-16 17:02:17 +03:00
} ,
"gridPos" : {
2026-02-02 16:16:37 +03:00
"h" : 5 ,
"w" : 6 ,
"x" : 12 ,
2025-09-16 17:02:17 +03:00
"y" : 10
} ,
2026-02-02 16:16:37 +03:00
"id" : 8 ,
2025-09-16 17:02:17 +03:00
"options" : {
"legend" : {
2026-02-02 16:16:37 +03:00
"calcs" : [ ] ,
2025-09-16 17:02:17 +03:00
"displayMode" : "list" ,
"placement" : "bottom" ,
2026-02-02 16:16:37 +03:00
"showLegend" : false
2025-09-16 17:02:17 +03:00
} ,
"tooltip" : {
"hideZeros" : false ,
"mode" : "multi" ,
2026-02-02 16:16:37 +03:00
"sort" : "none"
2025-09-16 17:02:17 +03:00
}
} ,
"pluginVersion" : "12.1.0" ,
"targets" : [
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
2026-02-02 16:16:37 +03:00
"exemplar" : true ,
"expr" : "nvidia_smi_power_draw_watts{uuid=\"$gpu\"}" ,
"interval" : "" ,
"legendFormat" : "{{uuid}}" ,
"refId" : "A"
2025-09-16 17:02:17 +03:00
}
] ,
2026-02-02 16:16:37 +03:00
"title" : "Power Draw" ,
2025-09-16 17:02:17 +03:00
"type" : "timeseries"
} ,
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
2026-02-02 16:16:37 +03:00
"description" : "The fan speed value is the percent of the product's maximum noise tolerance fan speed that the device's fan is currently intended to run at. This value may exceed 100% in certain cases. Note: The reported speed is the intended fan speed. If the fan is physically blocked and unable to spin, this output will not match the actual fan speed. Many parts do not report fan speeds because they rely on cooling via fans in the surrounding enclosure." ,
2025-09-16 17:02:17 +03:00
"fieldConfig" : {
"defaults" : {
"color" : {
"mode" : "palette-classic"
} ,
"custom" : {
"axisBorderShow" : false ,
"axisCenteredZero" : false ,
"axisColorMode" : "text" ,
2026-02-02 16:16:37 +03:00
"axisLabel" : "" ,
2025-09-16 17:02:17 +03:00
"axisPlacement" : "auto" ,
"barAlignment" : 0 ,
"barWidthFactor" : 0.6 ,
"drawStyle" : "line" ,
2026-02-02 16:16:37 +03:00
"fillOpacity" : 10 ,
2025-09-16 17:02:17 +03:00
"gradientMode" : "none" ,
"hideFrom" : {
"legend" : false ,
"tooltip" : false ,
"viz" : false
} ,
"insertNulls" : false ,
"lineInterpolation" : "linear" ,
2026-02-02 16:16:37 +03:00
"lineWidth" : 1 ,
2025-09-16 17:02:17 +03:00
"pointSize" : 5 ,
"scaleDistribution" : {
"type" : "linear"
} ,
"showPoints" : "never" ,
2026-02-02 16:16:37 +03:00
"spanNulls" : false ,
2025-09-16 17:02:17 +03:00
"stacking" : {
"group" : "A" ,
"mode" : "none"
} ,
"thresholdsStyle" : {
"mode" : "line+area"
}
} ,
"mappings" : [ ] ,
2026-02-02 16:16:37 +03:00
"max" : 1 ,
"min" : 0 ,
2025-09-16 17:02:17 +03:00
"thresholds" : {
"mode" : "absolute" ,
"steps" : [
{
"color" : "transparent" ,
"value" : 0
2026-02-02 16:16:37 +03:00
} ,
{
"color" : "orange" ,
"value" : 0.7
} ,
{
"color" : "red" ,
"value" : 0.9
2025-09-16 17:02:17 +03:00
}
]
} ,
2026-02-02 16:16:37 +03:00
"unit" : "percentunit"
2025-09-16 17:02:17 +03:00
} ,
"overrides" : [ ]
} ,
"gridPos" : {
2026-02-02 16:16:37 +03:00
"h" : 5 ,
"w" : 6 ,
"x" : 18 ,
2025-09-16 17:02:17 +03:00
"y" : 10
} ,
2026-02-02 16:16:37 +03:00
"id" : 9 ,
2025-09-16 17:02:17 +03:00
"options" : {
"legend" : {
2026-02-02 16:16:37 +03:00
"calcs" : [ ] ,
2025-09-16 17:02:17 +03:00
"displayMode" : "list" ,
"placement" : "bottom" ,
"showLegend" : false
} ,
"tooltip" : {
"hideZeros" : false ,
"mode" : "multi" ,
2026-02-02 16:16:37 +03:00
"sort" : "none"
2025-09-16 17:02:17 +03:00
}
} ,
"pluginVersion" : "12.1.0" ,
"targets" : [
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
2026-02-02 16:16:37 +03:00
"exemplar" : true ,
"expr" : "nvidia_smi_fan_speed_ratio{uuid=\"$gpu\"}" ,
"interval" : "" ,
"legendFormat" : "{{uuid}}" ,
"refId" : "A"
2025-09-16 17:02:17 +03:00
}
] ,
2026-02-02 16:16:37 +03:00
"title" : "Fan Speed %" ,
2025-09-16 17:02:17 +03:00
"type" : "timeseries"
} ,
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
2026-02-02 16:16:37 +03:00
"description" : "Current frequency of graphics (shader) clock." ,
2025-09-16 17:02:17 +03:00
"fieldConfig" : {
"defaults" : {
"color" : {
2026-02-02 16:16:37 +03:00
"mode" : "palette-classic"
2025-09-16 17:02:17 +03:00
} ,
"custom" : {
2026-02-02 16:16:37 +03:00
"axisBorderShow" : false ,
"axisCenteredZero" : false ,
"axisColorMode" : "text" ,
"axisLabel" : "" ,
"axisPlacement" : "auto" ,
"barAlignment" : 0 ,
"barWidthFactor" : 0.6 ,
"drawStyle" : "line" ,
"fillOpacity" : 10 ,
"gradientMode" : "none" ,
"hideFrom" : {
"legend" : false ,
"tooltip" : false ,
"viz" : false
2025-09-16 17:02:17 +03:00
} ,
2026-02-02 16:16:37 +03:00
"insertNulls" : false ,
"lineInterpolation" : "linear" ,
"lineWidth" : 1 ,
"pointSize" : 5 ,
"scaleDistribution" : {
"type" : "linear"
} ,
"showPoints" : "never" ,
"spanNulls" : false ,
"stacking" : {
"group" : "A" ,
"mode" : "none"
} ,
"thresholdsStyle" : {
"mode" : "off"
}
2025-09-16 17:02:17 +03:00
} ,
"mappings" : [ ] ,
2026-02-02 16:16:37 +03:00
"min" : 0 ,
2025-09-16 17:02:17 +03:00
"thresholds" : {
"mode" : "absolute" ,
"steps" : [
{
"color" : "green" ,
"value" : 0
} ,
{
"color" : "red" ,
"value" : 80
}
]
} ,
2026-02-02 16:16:37 +03:00
"unit" : "hertz"
} ,
"overrides" : [ ]
2025-09-16 17:02:17 +03:00
} ,
"gridPos" : {
2026-02-02 16:16:37 +03:00
"h" : 5 ,
"w" : 6 ,
2025-09-16 17:02:17 +03:00
"x" : 0 ,
2026-02-02 16:16:37 +03:00
"y" : 15
2025-09-16 17:02:17 +03:00
} ,
2026-02-02 16:16:37 +03:00
"id" : 12 ,
2025-09-16 17:02:17 +03:00
"options" : {
2026-02-02 16:16:37 +03:00
"legend" : {
"calcs" : [ ] ,
"displayMode" : "list" ,
"placement" : "bottom" ,
"showLegend" : false
2025-09-16 17:02:17 +03:00
} ,
2026-02-02 16:16:37 +03:00
"tooltip" : {
"hideZeros" : false ,
"mode" : "multi" ,
"sort" : "none"
}
} ,
"pluginVersion" : "12.1.0" ,
"targets" : [
2025-09-16 17:02:17 +03:00
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
2026-02-02 16:16:37 +03:00
"exemplar" : true ,
"expr" : "nvidia_smi_clocks_current_graphics_clock_hz{uuid=\"$gpu\"}" ,
"format" : "time_series" ,
2025-09-16 17:02:17 +03:00
"interval" : "" ,
2026-02-02 16:16:37 +03:00
"legendFormat" : "{{uuid}}" ,
"refId" : "A"
2025-09-16 17:02:17 +03:00
}
] ,
2026-02-02 16:16:37 +03:00
"title" : "Graphics Clock Speed" ,
"type" : "timeseries"
2025-09-16 17:02:17 +03:00
} ,
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
2026-02-02 16:16:37 +03:00
"description" : "Current frequency of video encoder/decoder clock." ,
2025-09-16 17:02:17 +03:00
"fieldConfig" : {
"defaults" : {
"color" : {
"mode" : "palette-classic"
} ,
"custom" : {
"axisBorderShow" : false ,
"axisCenteredZero" : false ,
"axisColorMode" : "text" ,
"axisLabel" : "" ,
"axisPlacement" : "auto" ,
"barAlignment" : 0 ,
2025-09-16 17:19:07 +03:00
"barWidthFactor" : 0.6 ,
2025-09-16 17:02:17 +03:00
"drawStyle" : "line" ,
2026-02-02 16:16:37 +03:00
"fillOpacity" : 10 ,
2025-09-16 17:02:17 +03:00
"gradientMode" : "none" ,
"hideFrom" : {
"legend" : false ,
"tooltip" : false ,
"viz" : false
} ,
"insertNulls" : false ,
"lineInterpolation" : "linear" ,
"lineWidth" : 1 ,
"pointSize" : 5 ,
"scaleDistribution" : {
"type" : "linear"
} ,
2026-02-02 16:16:37 +03:00
"showPoints" : "never" ,
2025-09-16 17:02:17 +03:00
"spanNulls" : false ,
"stacking" : {
"group" : "A" ,
"mode" : "none"
} ,
"thresholdsStyle" : {
"mode" : "off"
}
} ,
"mappings" : [ ] ,
2026-02-02 16:16:37 +03:00
"min" : 0 ,
2025-09-16 17:02:17 +03:00
"thresholds" : {
"mode" : "absolute" ,
"steps" : [
{
2025-09-16 17:19:07 +03:00
"color" : "green" ,
"value" : 0
2025-09-16 17:02:17 +03:00
} ,
{
"color" : "red" ,
"value" : 80
}
]
} ,
2026-02-02 16:16:37 +03:00
"unit" : "hertz"
2025-09-16 17:02:17 +03:00
} ,
"overrides" : [ ]
} ,
"gridPos" : {
2026-02-02 16:16:37 +03:00
"h" : 5 ,
"w" : 6 ,
"x" : 6 ,
"y" : 15
2025-09-16 17:02:17 +03:00
} ,
2026-02-02 16:16:37 +03:00
"id" : 19 ,
2025-09-16 17:02:17 +03:00
"options" : {
"legend" : {
"calcs" : [ ] ,
"displayMode" : "list" ,
"placement" : "bottom" ,
2026-02-02 16:16:37 +03:00
"showLegend" : false
2025-09-16 17:02:17 +03:00
} ,
"tooltip" : {
2025-09-16 17:19:07 +03:00
"hideZeros" : false ,
2025-09-16 17:02:17 +03:00
"mode" : "multi" ,
"sort" : "none"
}
} ,
2025-09-16 17:19:07 +03:00
"pluginVersion" : "12.1.0" ,
2025-09-16 17:02:17 +03:00
"targets" : [
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
"exemplar" : true ,
2026-02-02 16:16:37 +03:00
"expr" : "nvidia_smi_clocks_current_video_clock_hz{uuid=\"$gpu\"}" ,
2025-09-16 17:02:17 +03:00
"format" : "time_series" ,
"interval" : "" ,
2026-02-02 16:16:37 +03:00
"legendFormat" : "{{uuid}}" ,
"refId" : "A"
2025-09-16 17:02:17 +03:00
}
] ,
2026-02-02 16:16:37 +03:00
"title" : "Video Clock Speed" ,
2025-09-16 17:02:17 +03:00
"type" : "timeseries"
} ,
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
2026-02-02 16:16:37 +03:00
"description" : "Current frequency of SM (Streaming Multiprocessor) clock." ,
2025-09-16 17:02:17 +03:00
"fieldConfig" : {
"defaults" : {
2026-02-02 16:16:37 +03:00
"color" : {
"mode" : "palette-classic"
} ,
2025-09-16 17:02:17 +03:00
"custom" : {
2026-02-02 16:16:37 +03:00
"axisBorderShow" : false ,
"axisCenteredZero" : false ,
"axisColorMode" : "text" ,
"axisLabel" : "" ,
"axisPlacement" : "auto" ,
"barAlignment" : 0 ,
"barWidthFactor" : 0.6 ,
"drawStyle" : "line" ,
"fillOpacity" : 10 ,
"gradientMode" : "none" ,
2025-09-16 17:02:17 +03:00
"hideFrom" : {
"legend" : false ,
"tooltip" : false ,
"viz" : false
} ,
2026-02-02 16:16:37 +03:00
"insertNulls" : false ,
"lineInterpolation" : "linear" ,
"lineWidth" : 1 ,
"pointSize" : 5 ,
2025-09-16 17:02:17 +03:00
"scaleDistribution" : {
"type" : "linear"
2026-02-02 16:16:37 +03:00
} ,
"showPoints" : "never" ,
"spanNulls" : false ,
"stacking" : {
"group" : "A" ,
"mode" : "none"
} ,
"thresholdsStyle" : {
"mode" : "off"
2025-09-16 17:02:17 +03:00
}
2026-02-02 16:16:37 +03:00
} ,
"mappings" : [ ] ,
"min" : 0 ,
"thresholds" : {
"mode" : "absolute" ,
"steps" : [
{
"color" : "green" ,
"value" : 0
} ,
{
"color" : "red" ,
"value" : 80
}
]
} ,
"unit" : "hertz"
2025-09-16 17:02:17 +03:00
} ,
"overrides" : [ ]
} ,
"gridPos" : {
2026-02-02 16:16:37 +03:00
"h" : 5 ,
"w" : 6 ,
2025-09-16 17:02:17 +03:00
"x" : 12 ,
2026-02-02 16:16:37 +03:00
"y" : 15
2025-09-16 17:02:17 +03:00
} ,
2026-02-02 16:16:37 +03:00
"id" : 24 ,
2025-09-16 17:02:17 +03:00
"options" : {
"legend" : {
2026-02-02 16:16:37 +03:00
"calcs" : [ ] ,
"displayMode" : "list" ,
"placement" : "bottom" ,
"showLegend" : false
2025-09-16 17:02:17 +03:00
} ,
"tooltip" : {
2026-02-02 16:16:37 +03:00
"hideZeros" : false ,
"mode" : "multi" ,
"sort" : "none"
2025-09-16 17:02:17 +03:00
}
} ,
2025-09-16 17:19:07 +03:00
"pluginVersion" : "12.1.0" ,
2025-09-16 17:02:17 +03:00
"targets" : [
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
"exemplar" : true ,
2026-02-02 16:16:37 +03:00
"expr" : "nvidia_smi_clocks_current_sm_clock_hz{uuid=\"$gpu\"}" ,
"format" : "time_series" ,
2025-09-16 17:02:17 +03:00
"interval" : "" ,
2026-02-02 16:16:37 +03:00
"legendFormat" : "{{uuid}}" ,
2025-09-16 17:02:17 +03:00
"refId" : "A"
}
] ,
2026-02-02 16:16:37 +03:00
"title" : "SM Clock Speed" ,
"type" : "timeseries"
2025-09-16 17:02:17 +03:00
} ,
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
2026-02-02 16:16:37 +03:00
"description" : "Current frequency of memory clock." ,
2025-09-16 17:02:17 +03:00
"fieldConfig" : {
"defaults" : {
"color" : {
2026-02-02 16:16:37 +03:00
"mode" : "palette-classic"
2025-09-16 17:02:17 +03:00
} ,
"custom" : {
2026-02-02 16:16:37 +03:00
"axisBorderShow" : false ,
"axisCenteredZero" : false ,
"axisColorMode" : "text" ,
"axisLabel" : "" ,
"axisPlacement" : "auto" ,
"barAlignment" : 0 ,
"barWidthFactor" : 0.6 ,
"drawStyle" : "line" ,
"fillOpacity" : 10 ,
"gradientMode" : "none" ,
"hideFrom" : {
"legend" : false ,
"tooltip" : false ,
"viz" : false
} ,
"insertNulls" : false ,
"lineInterpolation" : "linear" ,
"lineWidth" : 1 ,
"pointSize" : 5 ,
"scaleDistribution" : {
"type" : "linear"
} ,
"showPoints" : "never" ,
"spanNulls" : false ,
"stacking" : {
"group" : "A" ,
"mode" : "none"
2025-09-16 17:02:17 +03:00
} ,
2026-02-02 16:16:37 +03:00
"thresholdsStyle" : {
"mode" : "off"
}
2025-09-16 17:02:17 +03:00
} ,
"mappings" : [ ] ,
2026-02-02 16:16:37 +03:00
"min" : 0 ,
2025-09-16 17:02:17 +03:00
"thresholds" : {
"mode" : "absolute" ,
"steps" : [
{
2025-09-16 17:19:07 +03:00
"color" : "green" ,
"value" : 0
2025-09-16 17:02:17 +03:00
} ,
{
"color" : "red" ,
"value" : 80
}
]
} ,
2026-02-02 16:16:37 +03:00
"unit" : "hertz"
2025-09-16 17:02:17 +03:00
} ,
2026-02-02 16:16:37 +03:00
"overrides" : [ ]
2025-09-16 17:02:17 +03:00
} ,
"gridPos" : {
2026-02-02 16:16:37 +03:00
"h" : 5 ,
"w" : 6 ,
"x" : 18 ,
"y" : 15
2025-09-16 17:02:17 +03:00
} ,
2026-02-02 16:16:37 +03:00
"id" : 18 ,
2025-09-16 17:02:17 +03:00
"options" : {
2026-02-02 16:16:37 +03:00
"legend" : {
"calcs" : [ ] ,
"displayMode" : "list" ,
"placement" : "bottom" ,
"showLegend" : false
2025-09-16 17:02:17 +03:00
} ,
2026-02-02 16:16:37 +03:00
"tooltip" : {
"hideZeros" : false ,
"mode" : "multi" ,
"sort" : "none"
}
2025-09-16 17:02:17 +03:00
} ,
2025-09-16 17:19:07 +03:00
"pluginVersion" : "12.1.0" ,
2025-09-16 17:02:17 +03:00
"targets" : [
{
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
2026-02-02 16:16:37 +03:00
"exemplar" : true ,
"expr" : "nvidia_smi_clocks_current_memory_clock_hz{uuid=\"$gpu\"}" ,
2025-09-16 17:02:17 +03:00
"format" : "time_series" ,
2026-02-02 16:16:37 +03:00
"interval" : "" ,
"legendFormat" : "{{uuid}}" ,
"refId" : "A"
2025-09-16 17:02:17 +03:00
}
] ,
2026-02-02 16:16:37 +03:00
"title" : "Memory Clock Speed" ,
"type" : "timeseries"
2025-09-16 17:02:17 +03:00
}
] ,
"preload" : false ,
2026-02-02 16:16:37 +03:00
"refresh" : "10s" ,
2025-09-16 17:02:17 +03:00
"schemaVersion" : 41 ,
"tags" : [ ] ,
"templating" : {
"list" : [
{
"current" : {
2026-02-02 16:16:37 +03:00
"text" : "yandex-prod" ,
"value" : "yandex-prod"
2025-09-16 17:02:17 +03:00
} ,
"definition" : "label_values(kube_node_info,cluster)" ,
"label" : "Cluster" ,
"name" : "cluster" ,
"options" : [ ] ,
"query" : {
"qryType" : 1 ,
"query" : "label_values(kube_node_info,cluster)" ,
"refId" : "PrometheusVariableQueryEditor-VariableQuery"
} ,
"refresh" : 1 ,
"regex" : "" ,
"type" : "query"
} ,
{
"current" : {
2026-02-02 16:16:37 +03:00
"text" : "cl1h3aok1ph8647rkppb-aryg" ,
"value" : "cl1h3aok1ph8647rkppb-aryg"
2025-09-16 17:02:17 +03:00
} ,
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
2026-02-02 16:16:37 +03:00
"definition" : "label_values(nvidia_smi_index{cluster=~\"$cluster\"},instance)" ,
"includeAll" : false ,
"label" : "Host" ,
"name" : "node" ,
2025-09-16 17:02:17 +03:00
"options" : [ ] ,
2025-09-16 17:43:11 +03:00
"query" : {
"qryType" : 1 ,
2026-02-02 16:16:37 +03:00
"query" : "label_values(nvidia_smi_index{cluster=~\"$cluster\"},instance)" ,
2025-09-16 17:43:11 +03:00
"refId" : "PrometheusVariableQueryEditor-VariableQuery"
} ,
2026-02-02 16:16:37 +03:00
"refresh" : 2 ,
2025-09-16 17:02:17 +03:00
"regex" : "" ,
"type" : "query"
} ,
{
"current" : {
2026-02-02 16:16:37 +03:00
"text" : "1200859e-158e-e077-b06b-0c526fe106ca" ,
"value" : "1200859e-158e-e077-b06b-0c526fe106ca"
2025-09-16 17:02:17 +03:00
} ,
"datasource" : {
"type" : "prometheus" ,
"uid" : "prom"
} ,
2026-02-02 16:16:37 +03:00
"definition" : "label_values(nvidia_smi_index{instance=\"$node\"},uuid)" ,
"includeAll" : false ,
"label" : "GPU" ,
"name" : "gpu" ,
2025-09-16 17:02:17 +03:00
"options" : [ ] ,
2025-09-16 17:43:11 +03:00
"query" : {
2026-02-02 16:16:37 +03:00
"query" : "label_values(nvidia_smi_index{instance=\"$node\"},uuid)" ,
"refId" : "StandardVariableQuery"
2025-09-16 17:43:11 +03:00
} ,
2025-09-16 17:02:17 +03:00
"refresh" : 1 ,
"regex" : "" ,
"sort" : 1 ,
"type" : "query"
}
]
} ,
"time" : {
2026-02-02 16:16:37 +03:00
"from" : "now-30m" ,
2025-09-16 17:02:17 +03:00
"to" : "now"
} ,
2026-02-02 16:16:37 +03:00
"timepicker" : { } ,
"timezone" : "" ,
"title" : "Nvidia GPU Metrics" ,
"uid" : "2e8d5337-fdc5-46e9-96db-fb37d6271fb2" ,
"version" : 4
2025-09-16 17:02:17 +03:00
}