mirror of
https://github.com/vllm-project/vllm.git
synced 2025-10-20 14:53:52 +08:00
@ -174,12 +174,10 @@ class SharedStorageConnector(KVConnectorBase_V1):
|
|||||||
# Only process layers that have kv_cache
|
# Only process layers that have kv_cache
|
||||||
# attribute (attention layers) Skip non-attention
|
# attribute (attention layers) Skip non-attention
|
||||||
# layers like FusedMoE/MLP etc.
|
# layers like FusedMoE/MLP etc.
|
||||||
kv_cache_attr = getattr(layer, "kv_cache", None)
|
kv_cache_layer = getattr(layer, "kv_cache", None)
|
||||||
if kv_cache_attr is None:
|
if kv_cache_layer is None:
|
||||||
continue
|
continue
|
||||||
|
|
||||||
kv_cache_layer = kv_cache_attr[forward_context.virtual_engine]
|
|
||||||
|
|
||||||
filename = self._generate_filename_debug(
|
filename = self._generate_filename_debug(
|
||||||
layer_name, request.token_ids, request.mm_hashes
|
layer_name, request.token_ids, request.mm_hashes
|
||||||
)
|
)
|
||||||
|
Reference in New Issue
Block a user