[Bugfix] Fix failure to run encoder models when disable_hybrid_kv_cache_manager is true (#24571)

Signed-off-by: lianyibo <lianyibo1@kunlunit.com> Co-authored-by: Chen Zhang <zhangch99@outlook.com>
2025-10-20 14:53:52 +08:00 · 2025-09-17 01:36:58 +08:00
parent 567939953b
commit faa7a5daac
1 changed files with 4 additions and 0 deletions
--- a/vllm/v1/core/kv_cache_utils.py
+++ b/vllm/v1/core/kv_cache_utils.py
@@ -754,6 +754,10 @@ def is_kv_cache_type_uniform(kv_cache_spec: dict[str, KVCacheSpec]) -> bool:
        True if all layers have the same type, False otherwise.
    """

+    if not kv_cache_spec:
+        # Encoder-only models have no KV cache, so an empty spec is
+        # trivially uniform.
+        return True
    try:
        kv_cache_spec_values = list(kv_cache_spec.values())
        _ = kv_cache_spec_values[0].merge(kv_cache_spec_values)