[UX] Change kv-cache-memory log level to debug (#25479)

Signed-off-by: Michael Goin <mgoin64@gmail.com>
2025-10-20 23:03:52 +08:00 · 2025-09-23 11:01:24 -04:00
parent 4c966e440e
commit 2c58742dff
1 changed file with 1 addition and 1 deletion
--- a/vllm/v1/worker/gpu_worker.py
+++ b/vllm/v1/worker/gpu_worker.py
@@ -389,7 +389,7 @@ class Worker(WorkerBase):
                f"utilize gpu memory. Current kv cache memory in use is "
                f"{int(self.available_kv_cache_memory_bytes)} bytes.")
-            logger.info(msg)
+            logger.debug(msg)
        # Warm up sampler and preallocate memory buffer for logits and other
        # sampling related tensors of max possible shape to avoid memory