push 2.0.9 version

c7c514c2 · yangzhong · cf967b1f · c7c514c2 · c7c514c2 · c7c514c2
Commit c7c514c2 authored Jan 22, 2024 by yangzhong
17 changed files
--- a/setup.py
+++ b/setup.py
@@ -10,16 +10,14 @@ from torch.__config__ import parallel_info
 from torch.utils.cpp_extension import BuildExtension
 from torch.utils.cpp_extension import CppExtension, CUDAExtension, CUDA_HOME

-WITH_HIP = torch.cuda.is_available() and CUDA_HOME is not None
-suffices = ['cpu', 'cuda'] if WITH_HIP else ['cpu']
+WITH_CUDA = torch.cuda.is_available() and CUDA_HOME is not None
+suffices = ['cpu', 'cuda'] if WITH_CUDA else ['cpu']
 if os.getenv('FORCE_CUDA', '0') == '1':
    suffices = ['cuda', 'cpu']
-if os.getenv('FORCE_ONLY_HIP', '0') == '1':
-    suffices = ['hip']
+if os.getenv('FORCE_ONLY_CUDA', '0') == '1':
+    suffices = ['cuda']
 if os.getenv('FORCE_ONLY_CPU', '0') == '1':
    suffices = ['cpu']
-ROCM_PATH = os.getenv('ROCM_PATH')
-HIPLIB = osp.join(ROCM_PATH, 'hipsparse', 'include')

 BUILD_DOCS = os.getenv('BUILD_DOCS', '0') == '1'

@@ -46,12 +44,12 @@ def get_extensions():
        else:
            print('Compiling without OpenMP...')

-        if suffix == 'hip':
-            define_macros += [('WITH_HIP', None)]
-            hipcc_flags = os.getenv('HIPCC_FLAGS', '')
-            hipcc_flags = [] if hipcc_flags == '' else hipcc_flags.split(' ')
-            hipcc_flags += ['--expt-relaxed-constexpr', '-O2']
-            extra_compile_args['hipcc'] = hipcc_flags
+        if suffix == 'cuda':
+            define_macros += [('WITH_CUDA', None)]
+            nvcc_flags = os.getenv('NVCC_FLAGS', '')
+            nvcc_flags = [] if nvcc_flags == '' else nvcc_flags.split(' ')
+            nvcc_flags += ['--expt-relaxed-constexpr', '-O2']
+            extra_compile_args['nvcc'] = nvcc_flags

        name = main.split(os.sep)[-1][:-4]
        sources = [main]
@@ -60,16 +58,15 @@ def get_extensions():
        if osp.exists(path):
            sources += [path]

-        path = osp.join(extensions_dir, 'hip', f'{name}_hip.hip')
-        if suffix == 'hip' and osp.exists(path):
+        path = osp.join(extensions_dir, 'cuda', f'{name}_cuda.cu')
+        if suffix == 'cuda' and osp.exists(path):
            sources += [path]

        Extension = CppExtension if suffix == 'cpu' else CUDAExtension
-        define_macros += [('TORCH_HIP_VERSION', 10000), ('__HIP__', None), ('__HCC__', None)]
        extension = Extension(
            f'torch_scatter._{name}_{suffix}',
            sources,
-            include_dirs=[extensions_dir, HIPLIB],
+            include_dirs=[extensions_dir],
            define_macros=define_macros,
            extra_compile_args=extra_compile_args,
            extra_link_args=extra_link_args,

--- a/test/__init__.py
+++ b/test/__init__.py
--- a/test/composite/test_logsumexp.py
+++ b/test/composite/test_logsumexp.py
+import torch
+from torch_scatter import scatter_logsumexp
+
+
+def test_logsumexp():
+    inputs = torch.tensor([
+        0.5, 0.5, 0.0, -2.1, 3.2, 7.0, -1.0, -100.0,
+        float('-inf'),
+        float('-inf'), 0.0
+    ])
+    inputs.requires_grad_()
+    index = torch.tensor([0, 0, 1, 1, 1, 2, 4, 4, 5, 6, 6])
+    splits = [2, 3, 1, 0, 2, 1, 2]
+
+    outputs = scatter_logsumexp(inputs, index)
+
+    for src, out in zip(inputs.split(splits), outputs.unbind()):
+        assert out.tolist() == torch.logsumexp(src, dim=0).tolist()
+
+    outputs.backward(torch.randn_like(outputs))
+
+    jit = torch.jit.script(scatter_logsumexp)
+    assert jit(inputs, index).tolist() == outputs.tolist()
--- a/test/composite/test_softmax.py
+++ b/test/composite/test_softmax.py
--- a/test/composite/test_std.py
+++ b/test/composite/test_std.py
+import torch
+from torch_scatter import scatter_std
+
+
+def test_std():
+    src = torch.tensor([[2, 0, 1, 4, 3], [0, 2, 1, 3, 4]], dtype=torch.float)
+    src.requires_grad_()
+    index = torch.tensor([[0, 0, 0, 0, 0], [1, 1, 1, 1, 1]], dtype=torch.long)
+
+    out = scatter_std(src, index, dim=-1, unbiased=True)
+    std = src.std(dim=-1, unbiased=True)[0]
+    expected = torch.tensor([[std, 0], [0, std]])
+    assert torch.allclose(out, expected)
+
+    out.backward(torch.randn_like(out))
+
+    jit = torch.jit.script(scatter_std)
+    assert jit(src, index, dim=-1, unbiased=True).tolist() == out.tolist()
--- a/test/test_broadcasting.py
+++ b/test/test_broadcasting.py
--- a/test/test_gather.py
+++ b/test/test_gather.py
--- a/test/test_multi_gpu.py
+++ b/test/test_multi_gpu.py
--- a/test/test_scatter.py
+++ b/test/test_scatter.py
--- a/test/test_segment.py
+++ b/test/test_segment.py
--- a/test/test_zero_tensors.py
+++ b/test/test_zero_tensors.py
--- a/test/utils.py
+++ b/test/utils.py
--- a/torch_scatter.egg-info/PKG-INFO
+++ b/torch_scatter.egg-info/PKG-INFO
--- a/torch_scatter.egg-info/SOURCES.txt
+++ b/torch_scatter.egg-info/SOURCES.txt
--- a/torch_scatter.egg-info/dependency_links.txt
+++ b/torch_scatter.egg-info/dependency_links.txt
-
--- a/torch_scatter.egg-info/top_level.txt
+++ b/torch_scatter.egg-info/top_level.txt
-torch_scatter
--- a/torch_scatter/__init__.py
+++ b/torch_scatter/__init__.py