mirror of
https://github.com/vllm-project/vllm.git
synced 2025-10-20 14:53:52 +08:00
[core] add wake_up doc and some sanity check (#12361)
Signed-off-by: youkaichao <youkaichao@gmail.com>
This commit is contained in:
@ -1157,6 +1157,9 @@ class LLM:
|
||||
self.llm_engine.sleep(level=level)
|
||||
|
||||
def wake_up(self):
    """Wake up the engine from sleep mode.

    This simply delegates to ``self.llm_engine.wake_up()``. See the
    :meth:`sleep` method for more details.
    """
    self.llm_engine.wake_up()
|
||||
|
||||
# LEGACY
|
||||
|
@ -47,6 +47,7 @@ class ExecutorBase(ABC):
|
||||
self.prompt_adapter_config = vllm_config.prompt_adapter_config
|
||||
self.observability_config = vllm_config.observability_config
|
||||
self._init_executor()
|
||||
self.is_sleeping = False
|
||||
|
||||
@abstractmethod
|
||||
def _init_executor(self) -> None:
|
||||
@ -194,10 +195,18 @@ class ExecutorBase(ABC):
|
||||
self.collective_rpc("stop_profile")
|
||||
|
||||
def sleep(self, level: int = 1):
    """Put the executor to sleep via the ``sleep`` collective RPC.

    Args:
        level: Sleep level, forwarded unchanged as the ``level`` keyword
            argument of the ``sleep`` RPC (defaults to 1).

    If the executor is already marked as sleeping, a warning is logged
    and no RPC is issued.
    """
    # Sanity check: a second sleep() without a wake_up() in between is
    # reported and ignored instead of being forwarded again.
    if self.is_sleeping:
        logger.warning("Executor is already sleeping.")
        return
    self.collective_rpc("sleep", kwargs={"level": level})
    # Only flip the flag once the RPC call has returned.
    self.is_sleeping = True
|
||||
|
||||
def wake_up(self):
    """Wake the executor up via the ``wake_up`` collective RPC.

    If the executor is not currently marked as sleeping, a warning is
    logged and no RPC is issued.
    """
    # Sanity check: waking an executor that never went to sleep is
    # reported and ignored instead of being forwarded.
    if not self.is_sleeping:
        logger.warning("Executor is not sleeping.")
        return
    self.collective_rpc("wake_up")
    # Only clear the flag once the RPC call has returned.
    self.is_sleeping = False
|
||||
|
||||
def save_sharded_state(
|
||||
self,
|
||||
|
Reference in New Issue
Block a user