From 7db4b50a76619ee2ed801126e1d48295b4ffc0c8 Mon Sep 17 00:00:00 2001 From: youkaichao Date: Fri, 24 Jan 2025 02:00:50 +0800 Subject: [PATCH] [core] add wake_up doc and some sanity check (#12361) Signed-off-by: youkaichao --- vllm/entrypoints/llm.py | 3 +++ vllm/executor/executor_base.py | 9 +++++++++ 2 files changed, 12 insertions(+) diff --git a/vllm/entrypoints/llm.py b/vllm/entrypoints/llm.py index 563031cfadc4c..1860ed3d7db5a 100644 --- a/vllm/entrypoints/llm.py +++ b/vllm/entrypoints/llm.py @@ -1157,6 +1157,9 @@ def sleep(self, level: int = 1): self.llm_engine.sleep(level=level) def wake_up(self): + """ + Wake up the engine from sleep mode. See the :meth:`sleep` method + for more details.""" self.llm_engine.wake_up() # LEGACY diff --git a/vllm/executor/executor_base.py b/vllm/executor/executor_base.py index 6be62d4068572..471d1bfac3119 100644 --- a/vllm/executor/executor_base.py +++ b/vllm/executor/executor_base.py @@ -47,6 +47,7 @@ def __init__( self.prompt_adapter_config = vllm_config.prompt_adapter_config self.observability_config = vllm_config.observability_config self._init_executor() + self.is_sleeping = False @abstractmethod def _init_executor(self) -> None: @@ -194,10 +195,18 @@ def stop_profile(self) -> None: self.collective_rpc("stop_profile") def sleep(self, level: int = 1): + if self.is_sleeping: + logger.warning("Executor is already sleeping.") + return self.collective_rpc("sleep", kwargs=dict(level=level)) + self.is_sleeping = True def wake_up(self): + if not self.is_sleeping: + logger.warning("Executor is not sleeping.") + return self.collective_rpc("wake_up") + self.is_sleeping = False def save_sharded_state( self,