Update GPTQ kernel build to use source paths relative to the repository root

2d0a73a3 · zhuwenwen · 0e7df36b · 2d0a73a3 · 2d0a73a3
Commit 2d0a73a3 authored Jul 24, 2024 by zhuwenwen
Hide whitespace changes
Inline Side-by-side

Showing 2 changed files with 4 additions and 7 deletions

README.md +2 -5

csrc/quantization/gptq/setup.py +2 -2

No files found.
--- a/README.md
+++ b/README.md
@@ -59,17 +59,14 @@ git clone http://developer.hpccube.com/codes/OpenDAS/vllm.git # 根据需要的
 ```
 1. 编译whl包并安装
 VLLM_INSTALL_PUNICA_KERNELS=1 python setup.py bdist_wheel 
+python csrc/quantization/gptq/setup.py bdist_wheel
 cd dist
 pip install vllm*
-cd csrc/quantization/gptq
-python setup.py bdist_wheel
-cd dist
 pip install gptq_kernel

 2. 源码编译安装
 VLLM_INSTALL_PUNICA_KERNELS=1 python3 setup.py install 
-cd csrc/quantization/gptq
-python setup.py install 
+python csrc/quantization/gptq/setup.py install 
 ```

 #### 运行基础环境准备

--- a/csrc/quantization/gptq/setup.py
+++ b/csrc/quantization/gptq/setup.py
@@ -24,8 +24,8 @@ setup(
        CUDAExtension(
            name="gptq_kernels",
            sources=[
-                "./torch_bindings.cpp",
-                "./q_gemm.cu",
+                "csrc/quantization/gptq/torch_bindings.cpp",
+                "csrc/quantization/gptq/q_gemm.cu",
            ],
            extra_compile_args=extra_compile_args,
        )