Skip to content

Commit 8f10fcd

Browse files
add msg
Signed-off-by: Kacper Pietkun <[email protected]>
1 parent 2314cce commit 8f10fcd

File tree

1 file changed

+3
-2
lines changed

1 file changed

+3
-2
lines changed

vllm_gaudi/v1/worker/hpu_worker.py

Lines changed: 3 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -327,10 +327,11 @@ def sleep(self, level: int = 1) -> None:
327 327
"""Put the worker into sleep mode to reduce memory usage. Unlike GPU workers that use custom
328 328
memory allocators, HPU workers use a simpler approach of moving model to CPU and clearing KV cache.
329 329
Args:
330-
level (int): Sleep level (kept for interface compatibility, performs only level 1 operations)
330+
level (int): Sleep level (kept for interface compatibility, always performs level 1 operations)
331 331
"""
332 332

333-
assert level == 1, f"Currently, HPU supports only sleep mode level 1 (and not: level {level})"
333+
if level == 2:
334+
logger.warning("Currently, HPU does not support level 2 sleep mode. Performing level 1 operations")
334 335
assert not htorch.utils.internal.is_lazy(
335 336
) or self.model_config.enforce_eager, "Sleep mode is supported only for torch.compile mode"
336 337

0 commit comments

Comments
 (0)