Commit 2d0a73a3 authored by zhuwenwen
Browse files

update gptq relative path

parent 0e7df36b
...@@ -59,17 +59,14 @@ git clone http://developer.hpccube.com/codes/OpenDAS/vllm.git # 根据需要的 ...@@ -59,17 +59,14 @@ git clone http://developer.hpccube.com/codes/OpenDAS/vllm.git # 根据需要的
``` ```
1. 编译whl包并安装 1. 编译whl包并安装
VLLM_INSTALL_PUNICA_KERNELS=1 python setup.py bdist_wheel VLLM_INSTALL_PUNICA_KERNELS=1 python setup.py bdist_wheel
python csrc/quantization/gptq/setup.py bdist_wheel
cd dist cd dist
pip install vllm* pip install vllm*
cd csrc/quantization/gptq
python setup.py bdist_wheel
cd dist
pip install gptq_kernel pip install gptq_kernel
2. 源码编译安装 2. 源码编译安装
VLLM_INSTALL_PUNICA_KERNELS=1 python3 setup.py install VLLM_INSTALL_PUNICA_KERNELS=1 python3 setup.py install
cd csrc/quantization/gptq python csrc/quantization/gptq/setup.py install
python setup.py install
``` ```
#### 运行基础环境准备 #### 运行基础环境准备
......
...@@ -24,8 +24,8 @@ setup( ...@@ -24,8 +24,8 @@ setup(
CUDAExtension( CUDAExtension(
name="gptq_kernels", name="gptq_kernels",
sources=[ sources=[
"./torch_bindings.cpp", "csrc/quantization/gptq/torch_bindings.cpp",
"./q_gemm.cu", "csrc/quantization/gptq/q_gemm.cu",
], ],
extra_compile_args=extra_compile_args, extra_compile_args=extra_compile_args,
) )
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment