From 05b5ab2a81719fc2b097c982be485eed365bf1a6 Mon Sep 17 00:00:00 2001 From: ctrueblood-epri Date: Wed, 22 Oct 2025 07:47:03 -0400 Subject: [PATCH] Update grafana.json: rename vllm:gpu_cache_usage_perc to vllm:kv_cache_usage_perc Signed-off-by: ctrueblood-epri --- examples/online_serving/prometheus_grafana/grafana.json | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/examples/online_serving/prometheus_grafana/grafana.json b/examples/online_serving/prometheus_grafana/grafana.json index 37abc9de926f..7aa0045a9798 100644 --- a/examples/online_serving/prometheus_grafana/grafana.json +++ b/examples/online_serving/prometheus_grafana/grafana.json @@ -852,9 +852,9 @@ "uid": "${DS_PROMETHEUS}" }, "editorMode": "code", - "expr": "vllm:gpu_cache_usage_perc{model_name=\"$model_name\"}", + "expr": "vllm:kv_cache_usage_perc{model_name=\"$model_name\"}", "instant": false, - "legendFormat": "GPU Cache Usage", + "legendFormat": "KV Cache Usage", "range": true, "refId": "A" }