mirror of
https://github.com/vllm-project/vllm.git
synced 2025-10-20 23:03:52 +08:00
[Misc][Minor] Fix CPU block num log in CPUExecutor. (#4088)
This commit is contained in:
@ -74,7 +74,10 @@ class CPUExecutor(ExecutorBase):
|
|||||||
# NOTE: We log here to avoid multiple logs when number of workers is
|
# NOTE: We log here to avoid multiple logs when number of workers is
|
||||||
# greater than one. We could log in the engine, but not all executors
|
# greater than one. We could log in the engine, but not all executors
|
||||||
# have GPUs.
|
# have GPUs.
|
||||||
logger.info(f"# CPU blocks: {num_cpu_blocks}")
|
# NOTE: `cpu block` for CPU backend is located on CPU memory but is
|
||||||
|
# referred to as `gpu block`, because we want to reuse the existing block
|
||||||
|
# management procedure.
|
||||||
|
logger.info(f"# CPU blocks: {num_gpu_blocks}")
|
||||||
self.driver_worker.initialize_cache(num_gpu_blocks, num_cpu_blocks)
|
self.driver_worker.initialize_cache(num_gpu_blocks, num_cpu_blocks)
|
||||||
|
|
||||||
def execute_model(self,
|
def execute_model(self,
|
||||||
|
Reference in New Issue
Block a user