Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
fd6bc480
Commit
fd6bc480
authored
May 22, 2024
by
zhuwenwen
Browse files
skip fp8
parent
99b471c2
Changes
3
Hide whitespace changes
Inline
Side-by-side
Showing
3 changed files
with
5 additions
and
5 deletions
+5
-5
CMakeLists.txt
CMakeLists.txt
+1
-1
cmake/utils.cmake
cmake/utils.cmake
+1
-1
setup.py
setup.py
+3
-3
No files found.
CMakeLists.txt
View file @
fd6bc480
...
...
@@ -167,7 +167,7 @@ set(VLLM_EXT_SRC
   "csrc/layernorm_kernels.cu"
   "csrc/quantization/squeezellm/quant_cuda_kernel.cu"
   "csrc/quantization/gptq/q_gemm.cu"
-  "csrc/quantization/fp8/fp8_cuda_kernels.cu"
+  # "csrc/quantization/fp8/fp8_cuda_kernels.cu"
   "csrc/cuda_utils_kernels.cu"
   "csrc/moe_align_block_size_kernels.cu"
   "csrc/pybind.cpp")
...
...
cmake/utils.cmake
View file @
fd6bc480
...
...
@@ -119,7 +119,7 @@ function (get_torch_gpu_compiler_flags OUT_GPU_FLAGS GPU_LANG)
   list(APPEND GPU_FLAGS
   "-DUSE_ROCM"
-  "-DENABLE_FP8_E4M3"
+  # "-DENABLE_FP8_E4M3"
   "-U__HIP_NO_HALF_CONVERSIONS__"
   "-U__HIP_NO_HALF_OPERATORS__"
   "-fno-gpu-rdc"
...
...
setup.py
View file @
fd6bc480
...
...
@@ -356,9 +356,9 @@ def get_vllm_version() -> str:
             version += f"+cu{cuda_version_str}"
     elif _is_hip():
         # Get the HIP version
-        hipcc_version = get_hipcc_rocm_version()
-        if hipcc_version != MAIN_CUDA_VERSION:
-            rocm_version_str = hipcc_version.replace(".", "")[:3]
+        # hipcc_version = get_hipcc_rocm_version()
+        # if hipcc_version != MAIN_CUDA_VERSION:
+        #     rocm_version_str = hipcc_version.replace(".", "")[:3]
         # version += f"+rocm{rocm_version_str}"
         version = get_version()
     elif _is_neuron():
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment