[Bugfix] Fix the fp8 kv_cache check error that occurs when failing to obtain the CUDA version. (#4173)
Signed-off-by: AnyISalIn <anyisalin@gmail.com>
This commit is contained in:
parent
6f1df80436
commit
a88bb9b032
@@ -353,7 +353,8 @@ class CacheConfig:
|
|||||||
elif self.cache_dtype == "fp8":
|
elif self.cache_dtype == "fp8":
|
||||||
if not is_hip():
|
if not is_hip():
|
||||||
nvcc_cuda_version = get_nvcc_cuda_version()
|
nvcc_cuda_version = get_nvcc_cuda_version()
|
||||||
if nvcc_cuda_version < Version("11.8"):
|
if nvcc_cuda_version is not None \
|
||||||
|
and nvcc_cuda_version < Version("11.8"):
|
||||||
raise ValueError(
|
raise ValueError(
|
||||||
"FP8 is not supported when cuda version is"
|
"FP8 is not supported when cuda version is"
|
||||||
"lower than 11.8.")
|
"lower than 11.8.")
|
||||||
|
Loading…
x
Reference in New Issue
Block a user