from setuptools import find_packages, setup from torch.utils.cpp_extension import BuildExtension, CUDAExtension, CppExtension extra_compile_args = { "cxx": ["-g", "-O3", "-fopenmp", "-lgomp", "-std=c++17"], "nvcc": ["-O3", "-std=c++17"], } setup( name="awq_inference_engine", packages=find_packages(), ext_modules=[ CUDAExtension( name="awq_inference_engine", sources=[ "csrc/pybind.cpp", "csrc/quantization/gemm_cuda_gen.cu", "csrc/layernorm/layernorm.cu", "csrc/position_embedding/pos_encoding_kernels.cu" ], extra_compile_args=extra_compile_args, ), ], cmdclass={"build_ext": BuildExtension}, install_requires=["torch"], )