Config: check sleep mode support for out-of-tree (OOT) platforms (#16562)
This commit is contained in:
parent
1eb3c2ed48
commit
d2020acac7
@@ -417,8 +417,10 @@ class ModelConfig:
|
||||
|
||||
from vllm.platforms import current_platform
|
||||
|
||||
if self.enable_sleep_mode and not current_platform.is_cuda():
|
||||
raise ValueError("Sleep mode is only supported on CUDA devices.")
|
||||
if (self.enable_sleep_mode
|
||||
and not current_platform.is_sleep_mode_available()):
|
||||
raise ValueError(
|
||||
"Sleep mode is not supported on current platform.")
|
||||
|
||||
hf_config = get_config(self.hf_config_path or self.model,
|
||||
trust_remote_code, revision, code_revision,
|
||||
|
@@ -148,6 +148,9 @@ class Platform:
|
||||
"""Stateless version of :func:`torch.cuda.is_available`."""
|
||||
return self._enum in (PlatformEnum.CUDA, PlatformEnum.ROCM)
|
||||
|
||||
def is_sleep_mode_available(self) -> bool:
    """Tell whether sleep mode is available on this platform.

    Returns:
        True when this platform's ``_enum`` equals ``PlatformEnum.CUDA``,
        False otherwise.
    """
    # Only the CUDA enum value is treated as sleep-mode capable here.
    sleep_capable = PlatformEnum.CUDA
    return self._enum == sleep_capable
|
||||
|
||||
@classmethod
|
||||
def get_attn_backend_cls(cls, selected_backend: _Backend, head_size: int,
|
||||
dtype: torch.dtype, kv_cache_dtype: Optional[str],
|
||||
|
Loading…
x
Reference in New Issue
Block a user