Unverified Commit fdb4737c authored by xiangyuzhi, committed by GitHub

[Sparse] Add compact operator (#6352)


Co-authored-by: Ubuntu <ubuntu@ip-172-31-24-117.ap-northeast-1.compute.internal>
parent 8edcad2d
@@ -6,7 +6,6 @@
 #ifndef SPARSE_MATRIX_OPS_H_
 #define SPARSE_MATRIX_OPS_H_
-#include <sparse/sparse_format.h>
 #include <sparse/sparse_matrix.h>
 #include <tuple>
@@ -47,7 +46,7 @@ std::tuple<std::shared_ptr<COO>, torch::Tensor, torch::Tensor> COOIntersection(
  */
 std::tuple<c10::intrusive_ptr<SparseMatrix>, torch::Tensor> Compact(
     const c10::intrusive_ptr<SparseMatrix>& mat, int64_t dim,
-    torch::Tensor leading_indices);
+    const torch::optional<torch::Tensor>& leading_indices);
 }  // namespace sparse
 }  // namespace dgl
...
/**
* Copyright (c) 2023 by Contributors
* @file macro.h
* @brief DGL C++ sparse API macros.
*/
#ifndef DGL_SPARSE_MACRO_H_
#define DGL_SPARSE_MACRO_H_
namespace dgl {
namespace sparse {
/**
* Dispatch an operator to a templated implementation function
* according to its device:
*
* DGL_SPARSE_XPU_SWITCH(tensor.device().type(), XPU, {
* // Now XPU is a placeholder for tensor.device().type()
* DeviceSpecificImplementation<XPU>(...);
* });
*/
#define DGL_SPARSE_XPU_SWITCH(device, XPU, op, ...) \
do { \
if ((device) == c10::DeviceType::CPU) { \
constexpr auto XPU = c10::DeviceType::CPU; \
{ __VA_ARGS__ } \
} else { \
LOG(FATAL) << "Operator " << (op) << " does not support " \
<< c10::DeviceTypeName(device) << " device."; \
} \
} while (0)
/**
* Dispatch according to ID type (either int32 or int64):
*
* DGL_SPARSE_ID_TYPE_SWITCH(tensor.dtype(), IdType, {
* // Now IdType is the type corresponding to data type of the tensor.
* // For instance, one can do this for a CPU array:
* IdType *data = static_cast<IdType *>(array.data_ptr());
* });
*/
#define DGL_SPARSE_ID_TYPE_SWITCH(dtype, IdType, op, ...) \
do { \
if ((dtype) == torch::kInt32) { \
typedef int32_t IdType; \
{ __VA_ARGS__ } \
} else if ((dtype) == torch::kInt64) { \
typedef int64_t IdType; \
{ __VA_ARGS__ } \
} else { \
LOG(FATAL) << "Operator " << (op) << " does not support " \
<< (dtype).name() << " as ID dtype."; \
} \
} while (0)
// Macro to dispatch according to device and index type.
#define DGL_SPARSE_COO_SWITCH(coo, XPU, IdType, op, ...) \
DGL_SPARSE_XPU_SWITCH(coo->indices.device().type(), XPU, op, { \
DGL_SPARSE_ID_TYPE_SWITCH( \
(coo)->indices.dtype(), IdType, op, {{__VA_ARGS__}}); \
});
} // namespace sparse
} // namespace dgl
#endif // DGL_SPARSE_MACRO_H_
@@ -6,9 +6,6 @@
 #include <sparse/matrix_ops.h>
 #include <torch/script.h>
-#include "./macro.h"
-#include "./matrix_ops_impl.h"
 namespace dgl {
 namespace sparse {
@@ -58,12 +55,122 @@ std::tuple<std::shared_ptr<COO>, torch::Tensor, torch::Tensor> COOIntersection(
   return {ret_coo, lhs_indices, rhs_indices};
 }
/** @brief Return the inverse mapping of a permutation. */
static torch::Tensor RevertPermutation(const torch::Tensor& perm) {
auto rev_tensor = torch::empty_like(perm);
rev_tensor.index_put_(
{perm}, torch::arange(0, perm.numel(), rev_tensor.options()));
return rev_tensor;
}
/**
 * @brief Compute the compact indices of the row indices and the leading
 * indices. Returns the compacted (relabeled) indices and, for each compact
 * index, the original row index it corresponds to.
 *
 * @param row The row indices.
 * @param leading_indices The optional leading indices.
 *
 * @return A tuple of (compact indices, original indices).
 */
static std::tuple<torch::Tensor, torch::Tensor> CompactIndices(
const torch::Tensor& row,
const torch::optional<torch::Tensor>& leading_indices) {
torch::Tensor sorted, sort_indices, uniqued, unique_reverse_indices, counts;
// 1. Sort leading indices and row indices in ascending order.
int64_t n_leading_indices = 0;
if (leading_indices.has_value()) {
n_leading_indices = leading_indices.value().numel();
std::tie(sorted, sort_indices) =
torch::cat({leading_indices.value(), row}).sort();
} else {
std::tie(sorted, sort_indices) = row.sort();
}
// 2. Reverse sort indices.
auto sort_rev_indices = RevertPermutation(sort_indices);
// 3. Unique the sorted array.
std::tie(uniqued, unique_reverse_indices, counts) =
torch::unique_consecutive(sorted, true);
auto reverse_indices = unique_reverse_indices.index({sort_rev_indices});
auto n_uniqued = uniqued.numel();
// 4. Relabel the indices and map the inverse array to the original array.
auto split_indices = torch::full({n_uniqued}, -1, reverse_indices.options());
split_indices.index_put_(
{reverse_indices.slice(0, 0, n_leading_indices)},
torch::arange(0, n_leading_indices, split_indices.options()));
split_indices.index_put_(
{(split_indices == -1).nonzero().view(-1)},
torch::arange(n_leading_indices, n_uniqued, split_indices.options()));
// 5. Decode the indices to get the compact indices.
auto new_row = split_indices.index({reverse_indices.slice(
0, n_leading_indices, n_leading_indices + row.numel())});
return {new_row, uniqued.index({RevertPermutation(split_indices)})};
}
static std::tuple<c10::intrusive_ptr<SparseMatrix>, torch::Tensor> CompactCOO(
const c10::intrusive_ptr<SparseMatrix>& mat, int64_t dim,
const torch::optional<torch::Tensor>& leading_indices) {
torch::Tensor row, col;
auto coo = mat->COOTensors();
if (dim == 0)
std::tie(row, col) = coo;
else
std::tie(col, row) = coo;
torch::Tensor new_row, uniqued;
std::tie(new_row, uniqued) = CompactIndices(row, leading_indices);
if (dim == 0) {
auto ret = SparseMatrix::FromCOO(
torch::stack({new_row, col}, 0), mat->value(),
std::vector<int64_t>{uniqued.numel(), mat->shape()[1]});
return {ret, uniqued};
} else {
auto ret = SparseMatrix::FromCOO(
torch::stack({col, new_row}, 0), mat->value(),
std::vector<int64_t>{mat->shape()[0], uniqued.numel()});
return {ret, uniqued};
}
}
static std::tuple<c10::intrusive_ptr<SparseMatrix>, torch::Tensor> CompactCSR(
const c10::intrusive_ptr<SparseMatrix>& mat, int64_t dim,
const torch::optional<torch::Tensor>& leading_indices) {
std::shared_ptr<CSR> csr;
if (dim == 0)
csr = mat->CSCPtr();
else
csr = mat->CSRPtr();
torch::Tensor new_indices, uniqued;
std::tie(new_indices, uniqued) =
CompactIndices(csr->indices, leading_indices);
auto ret_value = mat->value();
if (csr->value_indices.has_value())
ret_value = mat->value().index_select(0, csr->value_indices.value());
if (dim == 0) {
auto ret = SparseMatrix::FromCSC(
csr->indptr, new_indices, ret_value,
std::vector<int64_t>{uniqued.numel(), mat->shape()[1]});
return {ret, uniqued};
} else {
auto ret = SparseMatrix::FromCSR(
csr->indptr, new_indices, ret_value,
std::vector<int64_t>{mat->shape()[0], uniqued.numel()});
return {ret, uniqued};
}
}
 std::tuple<c10::intrusive_ptr<SparseMatrix>, torch::Tensor> Compact(
-    const c10::intrusive_ptr<SparseMatrix>& mat, uint64_t dim,
-    torch::Tensor leading_indices) {
-  DGL_SPARSE_COO_SWITCH(mat->COOPtr(), XPU, IdType, "Compact", {
-    return CompactImpl<XPU, IdType>(mat, dim, leading_indices);
-  });
+    const c10::intrusive_ptr<SparseMatrix>& mat, int64_t dim,
+    const torch::optional<torch::Tensor>& leading_indices) {
+  if (mat->HasCOO()) {
+    return CompactCOO(mat, dim, leading_indices);
+  }
+  return CompactCSR(mat, dim, leading_indices);
 }
 }  // namespace sparse
...
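To make the relabeling done by RevertPermutation and CompactIndices above easier to follow, here is a small Python sketch that mirrors the same torch calls on a toy input. The helper names and the example values are illustrative only and are not part of the patch.

import torch

def revert_permutation(perm):
    # Mirror of RevertPermutation: rev[perm[i]] = i.
    rev = torch.empty_like(perm)
    rev[perm] = torch.arange(perm.numel())
    return rev

def compact_indices(row, leading_indices=None):
    n_leading = 0 if leading_indices is None else leading_indices.numel()
    merged = row if leading_indices is None else torch.cat([leading_indices, row])
    # 1. Sort the concatenated leading and row indices in ascending order.
    sorted_vals, sort_idx = merged.sort()
    sort_rev_idx = revert_permutation(sort_idx)
    # 2-3. Deduplicate and map every original position to its unique id.
    uniqued, unique_rev = torch.unique_consecutive(sorted_vals, return_inverse=True)
    reverse_idx = unique_rev[sort_rev_idx]
    n_uniqued = uniqued.numel()
    # 4. Leading indices keep labels 0..n_leading-1 in their given order; the
    #    remaining unique values get the following labels in ascending order.
    split = torch.full((n_uniqued,), -1, dtype=torch.long)
    split[reverse_idx[:n_leading]] = torch.arange(n_leading)
    split[(split == -1).nonzero().view(-1)] = torch.arange(n_leading, n_uniqued)
    # 5. Relabel the row indices and recover, per label, the original index.
    new_row = split[reverse_idx[n_leading:]]
    return new_row, uniqued[revert_permutation(split)]

row = torch.tensor([0, 3, 3, 1])
lead = torch.tensor([3])
print(compact_indices(row, lead))
# (tensor([1, 0, 0, 2]), tensor([3, 0, 1])): the leading index 3 becomes new
# row 0, and the remaining rows 0 and 1 become new rows 1 and 2.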
@@ -7,21 +7,15 @@
 #define DGL_SPARSE_MATRIX_OPS_IMPL_H_
 #include <sparse/sparse_format.h>
-#include <sparse/sparse_matrix.h>
 #include <tuple>
-#include <vector>
+#include "./utils.h"
 namespace dgl {
-namespace sparse {
-template <c10::DeviceType XPU, typename IdType>
-std::tuple<c10::intrusive_ptr<SparseMatrix>, torch::Tensor> CompactImpl(
-    const c10::intrusive_ptr<SparseMatrix>& mat, int64_t dim,
-    torch::Tensor leading_indices) {
-  // Place holder only.
-  return {mat, leading_indices};
-}
-}  // namespace sparse
+namespace sparse {}  // namespace sparse
 }  // namespace dgl
 #endif  // DGL_SPARSE_MATRIX_OPS_IMPL_H_
@@ -8,6 +8,7 @@
 // clang-format on
 #include <sparse/elementwise_op.h>
+#include <sparse/matrix_ops.h>
 #include <sparse/reduction.h>
 #include <sparse/sddmm.h>
 #include <sparse/softmax.h>
@@ -54,7 +55,8 @@ TORCH_LIBRARY(dgl_sparse, m) {
       .def("spmm", &SpMM)
       .def("sddmm", &SDDMM)
       .def("softmax", &Softmax)
-      .def("spspmm", &SpSpMM);
+      .def("spspmm", &SpSpMM)
+      .def("compact", &Compact);
 }
 }  // namespace sparse
...
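Registering Compact in TORCH_LIBRARY(dgl_sparse, m) above is what exposes it to Python as torch.ops.dgl_sparse.compact, which the wrapper in the next hunk calls. A minimal sketch of the lookup, assuming the dgl_sparse extension library has already been loaded (importing dgl.sparse does this):

import torch
import dgl.sparse  # importing the package loads the dgl_sparse C++ extension

# Ops registered through TORCH_LIBRARY(dgl_sparse, m) appear under
# torch.ops.<library_name>.<op_name>.
compact_op = torch.ops.dgl_sparse.compact
print(compact_op)  # an overload packet wrapping dgl_sparse::compact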
@@ -754,7 +754,10 @@ class SparseMatrix:
         >>> print(original_rows)
         torch.Tensor([1, 2, 0])
         """
-        raise NotImplementedError
+        mat, idx = torch.ops.dgl_sparse.compact(
+            self.c_sparse_matrix, dim, leading_indices
+        )
+        return SparseMatrix(mat), idx


 def spmatrix(
...
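A hedged usage sketch for the new SparseMatrix.compact binding. The matrix and the expected outputs below are illustrative, worked out by hand from the relabeling rule implemented in matrix_ops.cc above rather than copied from the DGL documentation.

import torch
import dgl.sparse as dglsp

indices = torch.tensor([[0, 3, 3, 1],   # row indices
                        [2, 0, 1, 2]])  # column indices
A = dglsp.spmatrix(indices, shape=(5, 3))

# Compact along dim=0 and ask for row 3 to be placed first in the result.
A_compact, original_rows = A.compact(dim=0, leading_indices=torch.tensor([3]))

print(A_compact.shape)   # (3, 3): only the non-empty rows {3, 0, 1} are kept
print(original_rows)     # tensor([3, 0, 1]): new row i came from original_rows[i]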
import backend as F
import pytest
import torch
from .utils import (
rand_coo,
rand_csc,
rand_csr,
rand_diag,
sparse_matrix_to_dense,
)
@pytest.mark.parametrize(
"create_func", [rand_diag, rand_csr, rand_csc, rand_coo]
)
@pytest.mark.parametrize("dim", [0, 1])
@pytest.mark.parametrize("index", [None, (1, 3), (4, 0, 2)])
def test_compact(create_func, dim, index):
ctx = F.ctx()
shape = (5, 5)
ans_idx = []
if index is not None:
ans_idx = list(dict.fromkeys(index))
index = torch.tensor(index).to(ctx)
A = create_func(shape, 8, ctx)
A_compact, ret_id = A.compact(dim, index)
A_compact_dense = sparse_matrix_to_dense(A_compact)
A_dense = sparse_matrix_to_dense(A)
for i in range(shape[dim]):
if dim == 0:
row = list(A_dense[i, :].nonzero().reshape(-1))
else:
row = list(A_dense[:, i].nonzero().reshape(-1))
if (i not in list(ans_idx)) and len(row) > 0:
ans_idx.append(i)
if len(ans_idx):
ans_idx = torch.tensor(ans_idx).to(ctx)
A_dense_select = sparse_matrix_to_dense(A.index_select(dim, ans_idx))
assert A_compact_dense.shape == A_dense_select.shape
assert torch.allclose(A_compact_dense, A_dense_select)
assert torch.allclose(ans_idx, ret_id)