Fix --cuaev-all-sms (#600)

* Fix --cuaev-all-sms
* expecttest
* fix ci

Fix --cuaev-all-sms (#600)
* Fix --cuaev-all-sms
* expecttest
* fix ci
d1a63639 · Jinze (Richard) Xue · GitHub · bf771af0 · d1a63639 · d1a63639
Unverified commit d1a63639, authored Oct 30, 2021 by Jinze (Richard) Xue; committed by GitHub on Oct 30, 2021.
Hide whitespace changes
Inline Side-by-side

Showing 3 changed files with 6 additions and 6 deletions

ci/install_dependencies.sh (+1 -1)

setup.py (+4 -5)

test_requirements.txt (+1 -0)

No files found.
--- a/ci/install_dependencies.sh
+++ b/ci/install_dependencies.sh
@@ -2,6 +2,6 @@
 pip install --upgrade pip
 pip install twine wheel
-pip install --pre torch -f https://download.pytorch.org/whl/nightly/cu110/torch_nightly.html
+pip install --pre torch -f https://download.pytorch.org/whl/nightly/cu112/torch_nightly.html
 pip install -r test_requirements.txt
 pip install -r docs_requirements.txt
--- a/setup.py
+++ b/setup.py
@@ -53,10 +53,9 @@ def maybe_download_cub():
 def cuda_extension(build_all=False):
    import torch
    from torch.utils.cpp_extension import CUDAExtension
-    SMs = None
+    SMs = []
    print('-' * 75)
    if not build_all:
-        SMs = []
        devices = torch.cuda.device_count()
        print('FAST_BUILD_CUAEV: ON')
        print('This build will only support the following devices or the devices with same cuda capability: ')
@@ -71,13 +70,13 @@ def cuda_extension(build_all=False):
                SMs.append(sm)
    nvcc_args = ["-Xptxas=-v", '--expt-extended-lambda', '-use_fast_math']
-    if SMs:
+    if SMs and not ONLY_BUILD_SM80:
        for sm in SMs:
            nvcc_args.append(f"-gencode=arch=compute_{sm},code=sm_{sm}")
-    elif len(SMs) == 0 and ONLY_BUILD_SM80:  # --cuaev --only-sm80
+    elif ONLY_BUILD_SM80:  # --cuaev --only-sm80
        nvcc_args.append("-gencode=arch=compute_80,code=sm_80")
    else:  # no gpu detected
-        print('NO gpu detected, will build for all SMs')
+        print('Will build for all SMs')
        nvcc_args.append("-gencode=arch=compute_60,code=sm_60")
        nvcc_args.append("-gencode=arch=compute_61,code=sm_61")
        nvcc_args.append("-gencode=arch=compute_70,code=sm_70")

--- a/test_requirements.txt
+++ b/test_requirements.txt
@@ -6,3 +6,4 @@ pillow
 pkbar
 pyyaml
 pytest
+expecttest