Mirror of https://github.com/vllm-project/vllm.git
synced 2025-10-20 14:53:52 +08:00
Don't use cupy when enforce_eager=True (#3037)
This commit is contained in:
@ -284,7 +284,10 @@ class LLMEngine:
|
||||
is_driver_worker=True,
|
||||
)
|
||||
|
||||
self._run_workers("init_model", cupy_port=get_open_port())
|
||||
# don't use cupy for eager mode
|
||||
self._run_workers("init_model",
|
||||
cupy_port=get_open_port()
|
||||
if not model_config.enforce_eager else None)
|
||||
self._run_workers(
|
||||
"load_model",
|
||||
max_concurrent_workers=self.parallel_config.
|
||||
|
Reference in New Issue
Block a user