/**
 *  Copyright (c) 2020 by Contributors
 * @file aten/cpu/sddmm.cc
 * @brief SDDMM C APIs and definitions.
 */
#include "./sddmm.h"
#include <dgl/array.h>

namespace dgl {
namespace aten {

/**
 * @brief Turn a runtime rhs target into a compile-time constant.
 *
 * For a target of 0, 1 or 2 the macro declares `constexpr int RhsTarget`
 * with that value and expands the trailing statements with the constant in
 * scope. Any other value is reported through LOG(FATAL) instead of
 * LOG(INFO): with an informational log the statements were silently skipped
 * and the caller carried on as if the work had been done.
 *
 * @param rhs_target Runtime integer selector. It appears several times in the
 *        expansion, so it should be free of side effects.
 * @param RhsTarget Identifier to declare for the compile-time constant.
 * @param ... Statements expanded once inside every valid branch.
 */
#define SWITCH_RHS(rhs_target, RhsTarget, ...)              \
  do {                                                      \
    if ((rhs_target) == 0) {                                \
      constexpr int RhsTarget = 0;                          \
      { __VA_ARGS__ }                                       \
    } else if ((rhs_target) == 1) {                         \
      constexpr int RhsTarget = 1;                          \
      { __VA_ARGS__ }                                       \
    } else if ((rhs_target) == 2) {                         \
      constexpr int RhsTarget = 2;                          \
      { __VA_ARGS__ }                                       \
    } else {                                                \
      LOG(FATAL) << "Invalid rhs target: " << (rhs_target); \
    }                                                       \
  } while (0)

/**
 * @brief Turn a runtime (lhs, rhs) target pair into compile-time constants.
 *
 * For an lhs target of 0, 1 or 2 the macro declares `constexpr int LhsTarget`
 * with that value and hands the rhs target and the trailing statements to
 * SWITCH_RHS. Any other lhs value is reported through LOG(FATAL) instead of
 * LOG(INFO): with an informational log the statements were silently skipped
 * and the caller carried on as if the work had been done.
 *
 * @param lhs_target Runtime integer selector for the left operand. It appears
 *        several times in the expansion, so it should be free of side effects.
 * @param rhs_target Runtime integer selector for the right operand.
 * @param LhsTarget Identifier to declare for the lhs compile-time constant.
 * @param RhsTarget Identifier to declare for the rhs compile-time constant.
 * @param ... Statements expanded with both constants in scope.
 */
#define SWITCH_TARGET(lhs_target, rhs_target, LhsTarget, RhsTarget, ...) \
  do {                                                                   \
    if ((lhs_target) == 0) {                                             \
      constexpr int LhsTarget = 0;                                       \
      SWITCH_RHS(rhs_target, RhsTarget, __VA_ARGS__);                    \
    } else if ((lhs_target) == 1) {                                      \
      constexpr int LhsTarget = 1;                                       \
      SWITCH_RHS(rhs_target, RhsTarget, __VA_ARGS__);                    \
    } else if ((lhs_target) == 2) {                                      \
      constexpr int LhsTarget = 2;                                       \
      SWITCH_RHS(rhs_target, RhsTarget, __VA_ARGS__);                    \
    } else {                                                             \
      LOG(FATAL) << "Invalid lhs target: " << (lhs_target);              \
    }                                                                    \
  } while (0)

45
/** @brief Generalized SDDMM on Csr format. */
46
template <int XPU, typename IdType, typename DType>
47
48
49
void SDDMMCsr(
    const std::string& op, const BcastOff& bcast, const CSRMatrix& csr,
    NDArray lhs, NDArray rhs, NDArray out, int lhs_target, int rhs_target) {
50
51
  SWITCH_OP(op, Op, {
    SWITCH_TARGET(lhs_target, rhs_target, LhsTarget, RhsTarget, {
52
53
      cpu::SDDMMCsr<IdType, DType, Op, LhsTarget, RhsTarget>(
          bcast, csr, lhs, rhs, out);
54
    });
55
56
57
  });
}

58
/** @brief Generalized SDDMM on Csr format with Heterograph support. */
59
template <int XPU, typename IdType, typename DType>
60
61
62
63
64
65
void SDDMMCsrHetero(
    const std::string& op, const BcastOff& bcast,
    const std::vector<CSRMatrix>& vec_csr, const std::vector<NDArray>& vec_lhs,
    const std::vector<NDArray>& vec_rhs, std::vector<NDArray> vec_out,
    int lhs_target, int rhs_target, const std::vector<dgl_type_t>& lhs_nid,
    const std::vector<dgl_type_t>& rhs_nid) {
66
67
68
69
70
71
72
73
  SWITCH_OP(op, Op, {
    SWITCH_TARGET(lhs_target, rhs_target, LhsTarget, RhsTarget, {
      /* Call  SDDMM for each relation type */
      for (dgl_type_t etype = 0; etype < lhs_nid.size(); ++etype) {
        CSRMatrix csr = vec_csr[etype];
        NDArray lhs = vec_lhs[lhs_nid[etype]];
        NDArray rhs = vec_rhs[rhs_nid[etype]];
        NDArray out = vec_out[etype];
74
75
        cpu::SDDMMCsr<IdType, DType, Op, LhsTarget, RhsTarget>(
            bcast, csr, lhs, rhs, out);
76
      }
77
78
79
80
    });
  });
}

// Explicit instantiations of SDDMMCsr for kDGLCPU, grouped by index type.
// Each index type is paired with the BFloat16, float and double value types.

// 32-bit indices.
template void SDDMMCsr<kDGLCPU, int32_t, BFloat16>(
    const std::string& op, const BcastOff& bcast, const CSRMatrix& csr,
    NDArray lhs, NDArray rhs, NDArray out, int lhs_target, int rhs_target);
template void SDDMMCsr<kDGLCPU, int32_t, float>(
    const std::string& op, const BcastOff& bcast, const CSRMatrix& csr,
    NDArray lhs, NDArray rhs, NDArray out, int lhs_target, int rhs_target);
template void SDDMMCsr<kDGLCPU, int32_t, double>(
    const std::string& op, const BcastOff& bcast, const CSRMatrix& csr,
    NDArray lhs, NDArray rhs, NDArray out, int lhs_target, int rhs_target);

// 64-bit indices.
template void SDDMMCsr<kDGLCPU, int64_t, BFloat16>(
    const std::string& op, const BcastOff& bcast, const CSRMatrix& csr,
    NDArray lhs, NDArray rhs, NDArray out, int lhs_target, int rhs_target);
template void SDDMMCsr<kDGLCPU, int64_t, float>(
    const std::string& op, const BcastOff& bcast, const CSRMatrix& csr,
    NDArray lhs, NDArray rhs, NDArray out, int lhs_target, int rhs_target);
template void SDDMMCsr<kDGLCPU, int64_t, double>(
    const std::string& op, const BcastOff& bcast, const CSRMatrix& csr,
    NDArray lhs, NDArray rhs, NDArray out, int lhs_target, int rhs_target);

// Explicit instantiations of SDDMMCsrHetero for kDGLCPU, covering the
// int32_t / int64_t index types with the BFloat16, float and double value
// types. Parameter names mirror the definition of SDDMMCsrHetero.
template void SDDMMCsrHetero<kDGLCPU, int32_t, BFloat16>(
    const std::string& op, const BcastOff& bcast,
    const std::vector<CSRMatrix>& vec_csr, const std::vector<NDArray>& vec_lhs,
    const std::vector<NDArray>& vec_rhs, std::vector<NDArray> vec_out,
    int lhs_target, int rhs_target, const std::vector<dgl_type_t>& lhs_nid,
    const std::vector<dgl_type_t>& rhs_nid);
template void SDDMMCsrHetero<kDGLCPU, int64_t, BFloat16>(
    const std::string& op, const BcastOff& bcast,
    const std::vector<CSRMatrix>& vec_csr, const std::vector<NDArray>& vec_lhs,
    const std::vector<NDArray>& vec_rhs, std::vector<NDArray> vec_out,
    int lhs_target, int rhs_target, const std::vector<dgl_type_t>& lhs_nid,
    const std::vector<dgl_type_t>& rhs_nid);
template void SDDMMCsrHetero<kDGLCPU, int32_t, float>(
    const std::string& op, const BcastOff& bcast,
    const std::vector<CSRMatrix>& vec_csr, const std::vector<NDArray>& vec_lhs,
    const std::vector<NDArray>& vec_rhs, std::vector<NDArray> vec_out,
    int lhs_target, int rhs_target, const std::vector<dgl_type_t>& lhs_nid,
    const std::vector<dgl_type_t>& rhs_nid);
template void SDDMMCsrHetero<kDGLCPU, int64_t, float>(
    const std::string& op, const BcastOff& bcast,
    const std::vector<CSRMatrix>& vec_csr, const std::vector<NDArray>& vec_lhs,
    const std::vector<NDArray>& vec_rhs, std::vector<NDArray> vec_out,
    int lhs_target, int rhs_target, const std::vector<dgl_type_t>& lhs_nid,
    const std::vector<dgl_type_t>& rhs_nid);
template void SDDMMCsrHetero<kDGLCPU, int32_t, double>(
    const std::string& op, const BcastOff& bcast,
    const std::vector<CSRMatrix>& vec_csr, const std::vector<NDArray>& vec_lhs,
    const std::vector<NDArray>& vec_rhs, std::vector<NDArray> vec_out,
    int lhs_target, int rhs_target, const std::vector<dgl_type_t>& lhs_nid,
    const std::vector<dgl_type_t>& rhs_nid);
template void SDDMMCsrHetero<kDGLCPU, int64_t, double>(
    const std::string& op, const BcastOff& bcast,
    const std::vector<CSRMatrix>& vec_csr, const std::vector<NDArray>& vec_lhs,
    const std::vector<NDArray>& vec_rhs, std::vector<NDArray> vec_out,
    int lhs_target, int rhs_target, const std::vector<dgl_type_t>& lhs_nid,
    const std::vector<dgl_type_t>& rhs_nid);

137
/** @brief Generalized SDDMM on Coo format. */
138
template <int XPU, typename IdType, typename DType>
139
140
141
void SDDMMCoo(
    const std::string& op, const BcastOff& bcast, const COOMatrix& coo,
    NDArray lhs, NDArray rhs, NDArray out, int lhs_target, int rhs_target) {
142
143
  SWITCH_OP(op, Op, {
    SWITCH_TARGET(lhs_target, rhs_target, LhsTarget, RhsTarget, {
144
145
      cpu::SDDMMCoo<IdType, DType, Op, LhsTarget, RhsTarget>(
          bcast, coo, lhs, rhs, out);
146
    });
147
148
149
  });
}

150
/** @brief Generalized SDDMM on Coo format with Heterograph support. */
151
template <int XPU, typename IdType, typename DType>
152
153
154
155
156
157
void SDDMMCooHetero(
    const std::string& op, const BcastOff& bcast,
    const std::vector<COOMatrix>& vec_coo, const std::vector<NDArray>& vec_lhs,
    const std::vector<NDArray>& vec_rhs, std::vector<NDArray> vec_out,
    int lhs_target, int rhs_target, const std::vector<dgl_type_t>& lhs_nid,
    const std::vector<dgl_type_t>& rhs_nid) {
158
159
160
161
162
163
164
165
  SWITCH_OP(op, Op, {
    SWITCH_TARGET(lhs_target, rhs_target, LhsTarget, RhsTarget, {
      /* Call  SDDMM for each relation type */
      for (dgl_type_t etype = 0; etype < lhs_nid.size(); ++etype) {
        COOMatrix coo = vec_coo[etype];
        NDArray lhs = vec_lhs[lhs_nid[etype]];
        NDArray rhs = vec_rhs[rhs_nid[etype]];
        NDArray out = vec_out[etype];
166
167
        cpu::SDDMMCoo<IdType, DType, Op, LhsTarget, RhsTarget>(
            bcast, coo, lhs, rhs, out);
168
      }
169
170
171
172
    });
  });
}

// Explicit instantiations of SDDMMCoo for kDGLCPU, grouped by index type.
// Each index type is paired with the BFloat16, float and double value types.

// 32-bit indices.
template void SDDMMCoo<kDGLCPU, int32_t, BFloat16>(
    const std::string& op, const BcastOff& bcast, const COOMatrix& coo,
    NDArray lhs, NDArray rhs, NDArray out, int lhs_target, int rhs_target);
template void SDDMMCoo<kDGLCPU, int32_t, float>(
    const std::string& op, const BcastOff& bcast, const COOMatrix& coo,
    NDArray lhs, NDArray rhs, NDArray out, int lhs_target, int rhs_target);
template void SDDMMCoo<kDGLCPU, int32_t, double>(
    const std::string& op, const BcastOff& bcast, const COOMatrix& coo,
    NDArray lhs, NDArray rhs, NDArray out, int lhs_target, int rhs_target);

// 64-bit indices.
template void SDDMMCoo<kDGLCPU, int64_t, BFloat16>(
    const std::string& op, const BcastOff& bcast, const COOMatrix& coo,
    NDArray lhs, NDArray rhs, NDArray out, int lhs_target, int rhs_target);
template void SDDMMCoo<kDGLCPU, int64_t, float>(
    const std::string& op, const BcastOff& bcast, const COOMatrix& coo,
    NDArray lhs, NDArray rhs, NDArray out, int lhs_target, int rhs_target);
template void SDDMMCoo<kDGLCPU, int64_t, double>(
    const std::string& op, const BcastOff& bcast, const COOMatrix& coo,
    NDArray lhs, NDArray rhs, NDArray out, int lhs_target, int rhs_target);

// Explicit instantiations of SDDMMCooHetero for kDGLCPU, covering the
// int32_t / int64_t index types with the BFloat16, float and double value
// types. Parameter names mirror the definition of SDDMMCooHetero.
template void SDDMMCooHetero<kDGLCPU, int32_t, BFloat16>(
    const std::string& op, const BcastOff& bcast,
    const std::vector<COOMatrix>& vec_coo, const std::vector<NDArray>& vec_lhs,
    const std::vector<NDArray>& vec_rhs, std::vector<NDArray> vec_out,
    int lhs_target, int rhs_target, const std::vector<dgl_type_t>& lhs_nid,
    const std::vector<dgl_type_t>& rhs_nid);
template void SDDMMCooHetero<kDGLCPU, int64_t, BFloat16>(
    const std::string& op, const BcastOff& bcast,
    const std::vector<COOMatrix>& vec_coo, const std::vector<NDArray>& vec_lhs,
    const std::vector<NDArray>& vec_rhs, std::vector<NDArray> vec_out,
    int lhs_target, int rhs_target, const std::vector<dgl_type_t>& lhs_nid,
    const std::vector<dgl_type_t>& rhs_nid);
template void SDDMMCooHetero<kDGLCPU, int32_t, float>(
    const std::string& op, const BcastOff& bcast,
    const std::vector<COOMatrix>& vec_coo, const std::vector<NDArray>& vec_lhs,
    const std::vector<NDArray>& vec_rhs, std::vector<NDArray> vec_out,
    int lhs_target, int rhs_target, const std::vector<dgl_type_t>& lhs_nid,
    const std::vector<dgl_type_t>& rhs_nid);
template void SDDMMCooHetero<kDGLCPU, int64_t, float>(
    const std::string& op, const BcastOff& bcast,
    const std::vector<COOMatrix>& vec_coo, const std::vector<NDArray>& vec_lhs,
    const std::vector<NDArray>& vec_rhs, std::vector<NDArray> vec_out,
    int lhs_target, int rhs_target, const std::vector<dgl_type_t>& lhs_nid,
    const std::vector<dgl_type_t>& rhs_nid);
template void SDDMMCooHetero<kDGLCPU, int32_t, double>(
    const std::string& op, const BcastOff& bcast,
    const std::vector<COOMatrix>& vec_coo, const std::vector<NDArray>& vec_lhs,
    const std::vector<NDArray>& vec_rhs, std::vector<NDArray> vec_out,
    int lhs_target, int rhs_target, const std::vector<dgl_type_t>& lhs_nid,
    const std::vector<dgl_type_t>& rhs_nid);
template void SDDMMCooHetero<kDGLCPU, int64_t, double>(
    const std::string& op, const BcastOff& bcast,
    const std::vector<COOMatrix>& vec_coo, const std::vector<NDArray>& vec_lhs,
    const std::vector<NDArray>& vec_rhs, std::vector<NDArray> vec_out,
    int lhs_target, int rhs_target, const std::vector<dgl_type_t>& lhs_nid,
    const std::vector<dgl_type_t>& rhs_nid);

}  // namespace aten
}  // namespace dgl