Unverified commit f1042e86, authored by Shiyan Deng and committed by GitHub
Browse files

[Misc] AMD Build Improvements (#12923)

parent 7c4033ac
...@@ -3,7 +3,7 @@ ...@@ -3,7 +3,7 @@
#include <c10/cuda/CUDAGuard.h> #include <c10/cuda/CUDAGuard.h>
#include <ATen/ATen.h> #include <ATen/ATen.h>
#include <THC/THCAtomics.cuh> #include <ATen/cuda/Atomic.cuh>
#include "../cuda_compat.h" #include "../cuda_compat.h"
#include "../dispatch_utils.h" #include "../dispatch_utils.h"
......
...@@ -1122,4 +1122,4 @@ void paged_attention( ...@@ -1122,4 +1122,4 @@ void paged_attention(
#undef WARP_SIZE #undef WARP_SIZE
#undef MAX #undef MAX
#undef MIN #undef MIN
#undef DIVIDE_ROUND_UP #undef DIVIDE_ROUND_UP
\ No newline at end of file
...@@ -205,6 +205,14 @@ _VLLM_MODELS = { ...@@ -205,6 +205,14 @@ _VLLM_MODELS = {
**_FALLBACK_MODEL, **_FALLBACK_MODEL,
} }
# This variable holds the args passed to subprocess.run(). It can be
# modified to alter the args if needed, e.g. when everything is packed
# together in par format, in which case sys.executable might not be
# the target we want to run.
_SUBPROCESS_COMMAND = [
sys.executable, "-m", "vllm.model_executor.models.registry"
]
@dataclass(frozen=True) @dataclass(frozen=True)
class _ModelInfo: class _ModelInfo:
...@@ -502,10 +510,9 @@ def _run_in_subprocess(fn: Callable[[], _T]) -> _T: ...@@ -502,10 +510,9 @@ def _run_in_subprocess(fn: Callable[[], _T]) -> _T:
# cannot use `sys.executable __file__` here because the script # cannot use `sys.executable __file__` here because the script
# contains relative imports # contains relative imports
returned = subprocess.run( returned = subprocess.run(_SUBPROCESS_COMMAND,
[sys.executable, "-m", "vllm.model_executor.models.registry"], input=input_bytes,
input=input_bytes, capture_output=True)
capture_output=True)
# check if the subprocess is successful # check if the subprocess is successful
try: try:
......
...@@ -45,4 +45,4 @@ __all__ = [ ...@@ -45,4 +45,4 @@ __all__ = [
"SolarConfig", "SolarConfig",
"Telechat2Config", "Telechat2Config",
"UltravoxConfig", "UltravoxConfig",
] ]
\ No newline at end of file
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment