[Misc] AMD Build Improvements (#12923)
This commit is contained in:
parent
7c4033acd4
commit
f1042e86f0
@ -3,7 +3,7 @@
|
|||||||
#include <c10/cuda/CUDAGuard.h>
|
#include <c10/cuda/CUDAGuard.h>
|
||||||
|
|
||||||
#include <ATen/ATen.h>
|
#include <ATen/ATen.h>
|
||||||
#include <THC/THCAtomics.cuh>
|
#include <ATen/cuda/Atomic.cuh>
|
||||||
|
|
||||||
#include "../cuda_compat.h"
|
#include "../cuda_compat.h"
|
||||||
#include "../dispatch_utils.h"
|
#include "../dispatch_utils.h"
|
||||||
|
@ -1122,4 +1122,4 @@ void paged_attention(
|
|||||||
#undef WARP_SIZE
|
#undef WARP_SIZE
|
||||||
#undef MAX
|
#undef MAX
|
||||||
#undef MIN
|
#undef MIN
|
||||||
#undef DIVIDE_ROUND_UP
|
#undef DIVIDE_ROUND_UP
|
||||||
|
@ -205,6 +205,14 @@ _VLLM_MODELS = {
|
|||||||
**_FALLBACK_MODEL,
|
**_FALLBACK_MODEL,
|
||||||
}
|
}
|
||||||
|
|
||||||
|
# This variable is used as the args for subprocess.run(). We
|
||||||
|
# can modify this variable to alter the args if needed. e.g.
|
||||||
|
# when we use par format to pack things together, sys.executable
|
||||||
|
# might not be the target we want to run.
|
||||||
|
_SUBPROCESS_COMMAND = [
|
||||||
|
sys.executable, "-m", "vllm.model_executor.models.registry"
|
||||||
|
]
|
||||||
|
|
||||||
|
|
||||||
@dataclass(frozen=True)
|
@dataclass(frozen=True)
|
||||||
class _ModelInfo:
|
class _ModelInfo:
|
||||||
@ -502,10 +510,9 @@ def _run_in_subprocess(fn: Callable[[], _T]) -> _T:
|
|||||||
|
|
||||||
# cannot use `sys.executable __file__` here because the script
|
# cannot use `sys.executable __file__` here because the script
|
||||||
# contains relative imports
|
# contains relative imports
|
||||||
returned = subprocess.run(
|
returned = subprocess.run(_SUBPROCESS_COMMAND,
|
||||||
[sys.executable, "-m", "vllm.model_executor.models.registry"],
|
input=input_bytes,
|
||||||
input=input_bytes,
|
capture_output=True)
|
||||||
capture_output=True)
|
|
||||||
|
|
||||||
# check if the subprocess is successful
|
# check if the subprocess is successful
|
||||||
try:
|
try:
|
||||||
|
@ -45,4 +45,4 @@ __all__ = [
|
|||||||
"SolarConfig",
|
"SolarConfig",
|
||||||
"Telechat2Config",
|
"Telechat2Config",
|
||||||
"UltravoxConfig",
|
"UltravoxConfig",
|
||||||
]
|
]
|
||||||
|
Loading…
x
Reference in New Issue
Block a user