Unverified Commit d5ca4495 authored by guyueh1, committed by GitHub
Browse files

Make `TORCH_CUDA_ARCH_LIST` configurable via an environment variable (#167)



* Add 10.0 to TORCH_CUDA_ARCH_LIST
Signed-off-by: Guyue Huang <guyueh@nvidia.com>

* Revert csrc/CMakeLists change; in setup.py make TORCH_CUDA_ARCH_LIST configurable
Signed-off-by: Guyue Huang <guyueh@nvidia.com>

---------
Signed-off-by: Guyue Huang <guyueh@nvidia.com>
parent bb393e77
...@@ -10,7 +10,8 @@ if __name__ == '__main__': ...@@ -10,7 +10,8 @@ if __name__ == '__main__':
print(f'NVSHMEM directory: {nvshmem_dir}') print(f'NVSHMEM directory: {nvshmem_dir}')
# TODO: currently, we only support Hopper architecture, we may add Ampere support later # TODO: currently, we only support Hopper architecture, we may add Ampere support later
os.environ['TORCH_CUDA_ARCH_LIST'] = '9.0' if os.getenv('TORCH_CUDA_ARCH_LIST', None) is None:
os.environ['TORCH_CUDA_ARCH_LIST'] = '9.0'
cxx_flags = ['-O3', '-Wno-deprecated-declarations', '-Wno-unused-variable', cxx_flags = ['-O3', '-Wno-deprecated-declarations', '-Wno-unused-variable',
'-Wno-sign-compare', '-Wno-reorder', '-Wno-attributes'] '-Wno-sign-compare', '-Wno-reorder', '-Wno-attributes']
nvcc_flags = ['-O3', '-Xcompiler', '-O3', '-rdc=true', '--ptxas-options=--register-usage-level=10'] nvcc_flags = ['-O3', '-Xcompiler', '-O3', '-rdc=true', '--ptxas-options=--register-usage-level=10']
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment