Don't use cupy when enforce_eager=True (#3037)

This commit is contained in:
Roy
2024-02-27 09:33:38 +08:00
committed by GitHub
parent d9f726c4d0
commit c1c0d00b88

View File

@@ -284,7 +284,10 @@ class LLMEngine:
is_driver_worker=True,
)
self._run_workers("init_model", cupy_port=get_open_port())
# don't use cupy for eager mode
self._run_workers("init_model",
cupy_port=get_open_port()
if not model_config.enforce_eager else None)
self._run_workers(
"load_model",
max_concurrent_workers=self.parallel_config.