[V1][Minor] Avoid frequently creating ConstantList (#12653)

A small optimization to avoid creating a new `ConstantList` every time `request.kv_block_hashes` is used.

Signed-off-by: Woosuk Kwon <woosuk.kwon@berkeley.edu>
2025-10-20 14:53:52 +08:00 · 2025-02-01 23:43:20 -08:00
parent e497f33491
commit abfcdcdf27
1 changed file with 2 additions and 5 deletions
--- a/vllm/v1/request.py
+++ b/vllm/v1/request.py
@@ -64,6 +64,7 @@ class Request:
        # Cache the computed kv block hashes of the request to avoid
        # recomputing.
        self._kv_block_hashes: List[BlockHashType] = []
+        self.kv_block_hashes = ConstantList(self._kv_block_hashes)

        # Read-only views
        # Prevent directly appending to the these lists since
@@ -121,13 +122,9 @@ class Request:
        num_tokens = self.mm_positions[input_id]["length"]
        return num_tokens

-    @property
-    def kv_block_hashes(self) -> ConstantList["BlockHashType"]:
-        # Prevent directly appending to the kv_block_hashes.
-        return ConstantList(self._kv_block_hashes)
-
    def set_kv_block_hashes(self, value: List["BlockHashType"]) -> None:
        self._kv_block_hashes = value
+        self.kv_block_hashes = ConstantList(self._kv_block_hashes)

    def append_kv_block_hashes(self, block_hash: "BlockHashType") -> None:
        self._kv_block_hashes.append(block_hash)