Unverified commit 8ac27dad authored by Hongzhi (Steve) Chen, committed by GitHub

[Misc] clang-format auto fix. (#4824)



* [Misc] clang-format auto fix.

* blabla

* ablabla

* blabla
Co-authored-by: Steve <ubuntu@ip-172-31-34-29.ap-northeast-1.compute.internal>
parent bcd37684
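The changes below are purely mechanical: clang-format sorts `#include` directives within each block and rewraps any line that exceeds the column limit. The repository's actual `.clang-format` file is not part of this diff; the following is a minimal hypothetical sketch of settings that would produce edits like these (assumed, not taken from the repo):

```yaml
# Hypothetical .clang-format sketch; not the file used by this commit.
BasedOnStyle: Google  # 2-space indents, 80-column limit
SortIncludes: true    # alphabetize includes, e.g. <numeric> before <vector>
ColumnLimit: 80       # forces long parameter lists onto continuation lines
```

The first expanded file is the CUDA implementation of `CSRGetData`: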
```diff
@@ -4,9 +4,11 @@
  * @brief Retrieve entries of a CSR matrix
  */
 #include <dgl/array.h>
-#include <vector>
-#include <unordered_set>
+
 #include <numeric>
+#include <unordered_set>
+#include <vector>
+
 #include "../../runtime/cuda/cuda_common.h"
 #include "./utils.h"
```
```diff
@@ -19,7 +21,8 @@ namespace impl {
 template <DGLDeviceType XPU, typename IdType, typename DType>
 NDArray CSRGetData(
-    CSRMatrix csr, NDArray rows, NDArray cols, bool return_eids, NDArray weights, DType filler) {
+    CSRMatrix csr, NDArray rows, NDArray cols, bool return_eids,
+    NDArray weights, DType filler) {
   const int64_t rowlen = rows->shape[0];
   const int64_t collen = cols->shape[0];
```
```diff
@@ -31,44 +34,44 @@ NDArray CSRGetData(
   const int64_t rstlen = std::max(rowlen, collen);
   IdArray rst = NDArray::Empty({rstlen}, weights->dtype, rows->ctx);
-  if (rstlen == 0)
-    return rst;
+  if (rstlen == 0) return rst;
   cudaStream_t stream = runtime::getCurrentCUDAStream();
   const int nt = cuda::FindNumThreads(rstlen);
   const int nb = (rstlen + nt - 1) / nt;
   if (return_eids)
-    BUG_IF_FAIL(DGLDataTypeTraits<DType>::dtype == rows->dtype) <<
-      "DType does not match row's dtype.";
+    BUG_IF_FAIL(DGLDataTypeTraits<DType>::dtype == rows->dtype)
+        << "DType does not match row's dtype.";
   const IdType* indptr_data = csr.indptr.Ptr<IdType>();
   const IdType* indices_data = csr.indices.Ptr<IdType>();
   const IdType* data_data = CSRHasData(csr) ? csr.data.Ptr<IdType>() : nullptr;
   if (csr.is_pinned) {
-    CUDA_CALL(cudaHostGetDevicePointer(
-        &indptr_data, csr.indptr.Ptr<IdType>(), 0));
-    CUDA_CALL(cudaHostGetDevicePointer(
-        &indices_data, csr.indices.Ptr<IdType>(), 0));
+    CUDA_CALL(
+        cudaHostGetDevicePointer(&indptr_data, csr.indptr.Ptr<IdType>(), 0));
+    CUDA_CALL(
+        cudaHostGetDevicePointer(&indices_data, csr.indices.Ptr<IdType>(), 0));
     if (CSRHasData(csr)) {
-      CUDA_CALL(cudaHostGetDevicePointer(
-          &data_data, csr.data.Ptr<IdType>(), 0));
+      CUDA_CALL(
+          cudaHostGetDevicePointer(&data_data, csr.data.Ptr<IdType>(), 0));
     }
   }
   // TODO(minjie): use binary search for sorted csr
-  CUDA_KERNEL_CALL(cuda::_LinearSearchKernel,
-      nb, nt, 0, stream,
-      indptr_data, indices_data, data_data,
-      rows.Ptr<IdType>(), cols.Ptr<IdType>(),
-      row_stride, col_stride, rstlen,
-      return_eids ? nullptr : weights.Ptr<DType>(), filler, rst.Ptr<DType>());
+  CUDA_KERNEL_CALL(
+      cuda::_LinearSearchKernel, nb, nt, 0, stream, indptr_data, indices_data,
+      data_data, rows.Ptr<IdType>(), cols.Ptr<IdType>(), row_stride, col_stride,
+      rstlen, return_eids ? nullptr : weights.Ptr<DType>(), filler,
+      rst.Ptr<DType>());
   return rst;
 }
 template NDArray CSRGetData<kDGLCUDA, int32_t, __half>(
-    CSRMatrix csr, NDArray rows, NDArray cols, bool return_eids, NDArray weights, __half filler);
+    CSRMatrix csr, NDArray rows, NDArray cols, bool return_eids,
+    NDArray weights, __half filler);
 template NDArray CSRGetData<kDGLCUDA, int64_t, __half>(
-    CSRMatrix csr, NDArray rows, NDArray cols, bool return_eids, NDArray weights, __half filler);
+    CSRMatrix csr, NDArray rows, NDArray cols, bool return_eids,
+    NDArray weights, __half filler);
 #if BF16_ENABLED
 template NDArray CSRGetData<kDGLCUDA, int32_t, __nv_bfloat16>(
     CSRMatrix csr, NDArray rows, NDArray cols, bool return_eids,
```
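In the `is_pinned` branch above, `cudaHostGetDevicePointer` maps page-locked host arrays into the device address space so the kernel can read them without an explicit copy. A self-contained sketch of that zero-copy pattern (illustrative only, not DGL code):

```cpp
#include <cstdio>

#include <cuda_runtime.h>

// Single-thread kernel that sums a pinned host array through its
// device-side alias. Demo only; real code would parallelize.
__global__ void SumKernel(const int* data, int n, int* out) {
  int s = 0;
  for (int i = 0; i < n; ++i) s += data[i];
  *out = s;
}

int main() {
  const int n = 4;
  int* h_data = nullptr;
  int* h_out = nullptr;
  // cudaHostAllocMapped pins the memory and makes it device-addressable.
  cudaHostAlloc(&h_data, n * sizeof(int), cudaHostAllocMapped);
  cudaHostAlloc(&h_out, sizeof(int), cudaHostAllocMapped);
  for (int i = 0; i < n; ++i) h_data[i] = i + 1;

  // Same call as in the diff: resolve device aliases for pinned host memory.
  int* d_data = nullptr;
  int* d_out = nullptr;
  cudaHostGetDevicePointer(&d_data, h_data, 0);
  cudaHostGetDevicePointer(&d_out, h_out, 0);

  SumKernel<<<1, 1>>>(d_data, n, d_out);
  cudaDeviceSynchronize();       // kernel writes land in h_out via the alias
  printf("sum = %d\n", *h_out);  // expect 10

  cudaFreeHost(h_data);
  cudaFreeHost(h_out);
  return 0;
}
```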
```diff
@@ -78,19 +81,25 @@ template NDArray CSRGetData<kDGLCUDA, int64_t, __nv_bfloat16>(
     NDArray weights, __nv_bfloat16 filler);
 #endif // BF16_ENABLED
 template NDArray CSRGetData<kDGLCUDA, int32_t, float>(
-    CSRMatrix csr, NDArray rows, NDArray cols, bool return_eids, NDArray weights, float filler);
+    CSRMatrix csr, NDArray rows, NDArray cols, bool return_eids,
+    NDArray weights, float filler);
 template NDArray CSRGetData<kDGLCUDA, int64_t, float>(
-    CSRMatrix csr, NDArray rows, NDArray cols, bool return_eids, NDArray weights, float filler);
+    CSRMatrix csr, NDArray rows, NDArray cols, bool return_eids,
+    NDArray weights, float filler);
 template NDArray CSRGetData<kDGLCUDA, int32_t, double>(
-    CSRMatrix csr, NDArray rows, NDArray cols, bool return_eids, NDArray weights, double filler);
+    CSRMatrix csr, NDArray rows, NDArray cols, bool return_eids,
+    NDArray weights, double filler);
 template NDArray CSRGetData<kDGLCUDA, int64_t, double>(
-    CSRMatrix csr, NDArray rows, NDArray cols, bool return_eids, NDArray weights, double filler);
+    CSRMatrix csr, NDArray rows, NDArray cols, bool return_eids,
+    NDArray weights, double filler);
 // For CSRGetData<XPU, IdType>(CSRMatrix, NDArray, NDArray)
 template NDArray CSRGetData<kDGLCUDA, int32_t, int32_t>(
-    CSRMatrix csr, NDArray rows, NDArray cols, bool return_eids, NDArray weights, int32_t filler);
+    CSRMatrix csr, NDArray rows, NDArray cols, bool return_eids,
+    NDArray weights, int32_t filler);
 template NDArray CSRGetData<kDGLCUDA, int64_t, int64_t>(
-    CSRMatrix csr, NDArray rows, NDArray cols, bool return_eids, NDArray weights, int64_t filler);
+    CSRMatrix csr, NDArray rows, NDArray cols, bool return_eids,
+    NDArray weights, int64_t filler);
 }  // namespace impl
 }  // namespace aten
```
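The launch configuration in this file (`nt = cuda::FindNumThreads(rstlen)` threads per block, `nb = (rstlen + nt - 1) / nt` blocks) is the standard one-thread-per-element ceil-division pattern. A minimal sketch using a hypothetical 256-thread cap in place of DGL's `FindNumThreads`:

```cpp
#include <cstdio>

#include <cuda_runtime.h>

// One thread per output element; the bounds check guards the final,
// possibly partial, block.
__global__ void FillKernel(float* out, float value, int64_t n) {
  int64_t tx = blockIdx.x * static_cast<int64_t>(blockDim.x) + threadIdx.x;
  if (tx < n) out[tx] = value;
}

int main() {
  const int64_t n = 1000;
  float* d_out = nullptr;
  cudaMalloc(&d_out, n * sizeof(float));

  // Hypothetical stand-in for cuda::FindNumThreads: cap threads per block.
  const int nt = n < 256 ? static_cast<int>(n) : 256;
  // Ceil division, exactly as in the diff: enough blocks to cover n items.
  const int nb = static_cast<int>((n + nt - 1) / nt);
  FillKernel<<<nb, nt>>>(d_out, 1.0f, n);
  cudaDeviceSynchronize();

  float first = 0.0f;
  cudaMemcpy(&first, d_out, sizeof(float), cudaMemcpyDeviceToHost);
  printf("nb=%d nt=%d first=%.1f\n", nb, nt, first);  // nb=4 nt=256 first=1.0
  cudaFree(d_out);
  return 0;
}
```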
The second expanded file is the cuSPARSE dispatcher header:

```diff
 /**
  * Copyright (c) 2020 by Contributors
  * @file array/cuda/dispatcher.cuh
- * @brief Templates to dispatch into different cuSPARSE routines based on the type
- * argument.
+ * @brief Templates to dispatch into different cuSPARSE routines based on the
+ * type argument.
  */
 #ifndef DGL_ARRAY_CUDA_CUSPARSE_DISPATCHER_CUH_
 #define DGL_ARRAY_CUDA_CUSPARSE_DISPATCHER_CUH_
 #include <cusparse.h>
 #include <dgl/runtime/c_runtime_api.h>
-#include "fp16.cuh"
 #include "bf16.cuh"
+#include "fp16.cuh"
 namespace dgl {
 namespace aten {
```
```diff
@@ -40,8 +41,8 @@ template <>
 struct CSRGEMM<__half> {
   template <typename... Args>
   static inline cusparseStatus_t bufferSizeExt(Args... args) {
-    // TODO(ndickson): There is no cusparseHcsrgemm2_bufferSizeExt, so a different
-    // implementation would be required.
+    // TODO(ndickson): There is no cusparseHcsrgemm2_bufferSizeExt, so a
+    // different implementation would be required.
     LOG(FATAL) << "CSRGEMM::bufferSizeExt does not support dtype half (FP16).";
     return static_cast<cusparseStatus_t>(0);
   }
```
```diff
@@ -65,9 +66,10 @@ template <>
 struct CSRGEMM<__nv_bfloat16> {
   template <typename... Args>
   static inline cusparseStatus_t bufferSizeExt(Args... args) {
-    // TODO(ndickson): There is no cusparseHcsrgemm2_bufferSizeExt, so a different
-    // implementation would be required.
-    LOG(FATAL) << "CSRGEMM::bufferSizeExt does not support dtype bfloat16 (BF16).";
+    // TODO(ndickson): There is no cusparseHcsrgemm2_bufferSizeExt, so a
+    // different implementation would be required.
+    LOG(FATAL)
+        << "CSRGEMM::bufferSizeExt does not support dtype bfloat16 (BF16).";
     return static_cast<cusparseStatus_t>(0);
   }
```
```diff
@@ -147,8 +149,8 @@ template <>
 struct CSRGEAM<__half> {
   template <typename... Args>
   static inline cusparseStatus_t bufferSizeExt(Args... args) {
-    // TODO(ndickson): There is no cusparseHcsrgeam2_bufferSizeExt, so a different
-    // implementation would be required.
+    // TODO(ndickson): There is no cusparseHcsrgeam2_bufferSizeExt, so a
+    // different implementation would be required.
     LOG(FATAL) << "CSRGEAM::bufferSizeExt does not support dtype half (FP16).";
     return static_cast<cusparseStatus_t>(0);
   }
```
```diff
@@ -172,9 +174,10 @@ template <>
 struct CSRGEAM<__nv_bfloat16> {
   template <typename... Args>
   static inline cusparseStatus_t bufferSizeExt(Args... args) {
-    // TODO(ndickson): There is no cusparseHcsrgeam2_bufferSizeExt, so a different
-    // implementation would be required.
-    LOG(FATAL) << "CSRGEAM::bufferSizeExt does not support dtype bfloat16 (BF16).";
+    // TODO(ndickson): There is no cusparseHcsrgeam2_bufferSizeExt, so a
+    // different implementation would be required.
+    LOG(FATAL)
+        << "CSRGEAM::bufferSizeExt does not support dtype bfloat16 (BF16).";
     return static_cast<cusparseStatus_t>(0);
   }
```
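The `CSRGEMM<DType>`/`CSRGEAM<DType>` structs above use template specialization to route a dtype-generic call site to the matching cuSPARSE routine, with unsupported dtypes (FP16/BF16) failing loudly at runtime. A stripped-down sketch of the same dispatch pattern, with illustrative names rather than DGL's actual API:

```cpp
#include <iostream>

// Primary template: left undefined, so instantiating an unsupported dtype
// is a compile-time error rather than a silent fallback.
template <typename DType>
struct GemmDispatch;

// Each specialization forwards to the dtype-specific backend routine
// (stubbed out here with prints; names are hypothetical, not DGL's API).
template <>
struct GemmDispatch<float> {
  template <typename... Args>
  static int run(Args... /*args*/) {
    std::cout << "would call the single-precision csrgemm routine\n";
    return 0;
  }
};

template <>
struct GemmDispatch<double> {
  template <typename... Args>
  static int run(Args... /*args*/) {
    std::cout << "would call the double-precision csrgemm routine\n";
    return 0;
  }
};

int main() {
  // Generic call sites pick the right backend purely from the type argument.
  GemmDispatch<float>::run(1, 2, 3);
  GemmDispatch<double>::run(1, 2, 3);
  return 0;
}
```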