unit_graph.cc 57.3 KB
Newer Older
1
/**
2
 *  Copyright (c) 2019 by Contributors
3
4
 * @file graph/unit_graph.cc
 * @brief UnitGraph graph implementation
5
6
 */
#include <dgl/array.h>
7
#include <dgl/base_heterograph.h>
8
9
#include <dgl/immutable_graph.h>
#include <dgl/lazy.h>
10
11

#include "../c_api_common.h"
12
#include "./unit_graph.h"
13
#include "./serialize/dglstream.h"
14
15

namespace dgl {
16

17
namespace {
18
19
20

using namespace dgl::aten;

Minjie Wang's avatar
Minjie Wang committed
21
22
23
24
25
26
27
28
29
30
// create metagraph of one node type
inline GraphPtr CreateUnitGraphMetaGraph1() {
  // a self-loop edge 0->0
  std::vector<int64_t> row_vec(1, 0);
  std::vector<int64_t> col_vec(1, 0);
  IdArray row = aten::VecToIdArray(row_vec);
  IdArray col = aten::VecToIdArray(col_vec);
  GraphPtr g = ImmutableGraph::CreateFromCOO(1, row, col);
  return g;
}
31

Minjie Wang's avatar
Minjie Wang committed
32
33
34
35
36
// create metagraph of two node types
inline GraphPtr CreateUnitGraphMetaGraph2() {
  // an edge 0->1
  std::vector<int64_t> row_vec(1, 0);
  std::vector<int64_t> col_vec(1, 1);
37
38
39
40
41
  IdArray row = aten::VecToIdArray(row_vec);
  IdArray col = aten::VecToIdArray(col_vec);
  GraphPtr g = ImmutableGraph::CreateFromCOO(2, row, col);
  return g;
}
Minjie Wang's avatar
Minjie Wang committed
42
43
44
45
46
47
48
49
50
51
52
53

inline GraphPtr CreateUnitGraphMetaGraph(int num_vtypes) {
  static GraphPtr mg1 = CreateUnitGraphMetaGraph1();
  static GraphPtr mg2 = CreateUnitGraphMetaGraph2();
  if (num_vtypes == 1)
    return mg1;
  else if (num_vtypes == 2)
    return mg2;
  else
    LOG(FATAL) << "Invalid number of vertex types. Must be 1 or 2.";
  return {};
}
54
55

};  // namespace
56
57
58
59
60
61
62

//////////////////////////////////////////////////////////
//
// COO graph implementation
//
//////////////////////////////////////////////////////////

Minjie Wang's avatar
Minjie Wang committed
63
class UnitGraph::COO : public BaseHeteroGraph {
64
 public:
65
66
  COO(GraphPtr metagraph, int64_t num_src, int64_t num_dst, IdArray src,
      IdArray dst, bool row_sorted = false, bool col_sorted = false)
Minjie Wang's avatar
Minjie Wang committed
67
    : BaseHeteroGraph(metagraph) {
68
69
70
    CHECK(aten::IsValidIdArray(src));
    CHECK(aten::IsValidIdArray(dst));
    CHECK_EQ(src->shape[0], dst->shape[0]) << "Input arrays should have the same length.";
71
72
73
    adj_ = aten::COOMatrix{num_src, num_dst, src, dst,
        NullArray(),
        row_sorted, col_sorted};
74
  }
75

76
77
78
79
  COO(GraphPtr metagraph, const aten::COOMatrix& coo)
    : BaseHeteroGraph(metagraph), adj_(coo) {
    // Data index should not be inherited. Edges in COO format are always
    // assigned ids from 0 to num_edges - 1.
80
    CHECK(!COOHasData(coo)) << "[BUG] COO should not contain data.";
81
    adj_.data = aten::NullArray();
82
  }
83

84
85
86
87
88
89
90
91
92
93
94
  COO() {
    // set magic num_rows/num_cols to mark it as undefined
    // adj_.num_rows == 0 and adj_.num_cols == 0 means empty UnitGraph which is supported
    adj_.num_rows = -1;
    adj_.num_cols = -1;
  };

  bool defined() const {
    return (adj_.num_rows >= 0) && (adj_.num_cols >= 0);
  }

Minjie Wang's avatar
Minjie Wang committed
95
96
  inline dgl_type_t SrcType() const {
    return 0;
97
  }
Minjie Wang's avatar
Minjie Wang committed
98
99
100
101
102
103
104

  inline dgl_type_t DstType() const {
    return NumVertexTypes() == 1? 0 : 1;
  }

  inline dgl_type_t EdgeType() const {
    return 0;
105
106
107
  }

  HeteroGraphPtr GetRelationGraph(dgl_type_t etype) const override {
Minjie Wang's avatar
Minjie Wang committed
108
    LOG(FATAL) << "The method shouldn't be called for UnitGraph graph. "
109
110
111
112
113
      << "The relation graph is simply this graph itself.";
    return {};
  }

  void AddVertices(dgl_type_t vtype, uint64_t num_vertices) override {
Minjie Wang's avatar
Minjie Wang committed
114
    LOG(FATAL) << "UnitGraph graph is not mutable.";
115
116
117
  }

  void AddEdge(dgl_type_t etype, dgl_id_t src, dgl_id_t dst) override {
Minjie Wang's avatar
Minjie Wang committed
118
    LOG(FATAL) << "UnitGraph graph is not mutable.";
119
120
121
  }

  void AddEdges(dgl_type_t etype, IdArray src_ids, IdArray dst_ids) override {
Minjie Wang's avatar
Minjie Wang committed
122
    LOG(FATAL) << "UnitGraph graph is not mutable.";
123
124
125
  }

  void Clear() override {
Minjie Wang's avatar
Minjie Wang committed
126
    LOG(FATAL) << "UnitGraph graph is not mutable.";
127
128
  }

129
  DGLDataType DataType() const override {
130
131
132
    return adj_.row->dtype;
  }

133
  DGLContext Context() const override {
134
135
136
    return adj_.row->ctx;
  }

137
  bool IsPinned() const override {
138
    return adj_.is_pinned;
139
140
  }

141
142
143
144
  uint8_t NumBits() const override {
    return adj_.row->dtype.bits;
  }

145
146
147
148
149
150
151
152
153
154
155
156
  COO AsNumBits(uint8_t bits) const {
    if (NumBits() == bits)
      return *this;

    COO ret(
        meta_graph_,
        adj_.num_rows, adj_.num_cols,
        aten::AsNumBits(adj_.row, bits),
        aten::AsNumBits(adj_.col, bits));
    return ret;
  }

157
  COO CopyTo(const DGLContext &ctx) const {
158
159
    if (Context() == ctx)
      return *this;
160
    return COO(meta_graph_, adj_.CopyTo(ctx));
161
162
  }

163

164
  /** @brief Pin the adj_: COOMatrix of the COO graph. */
165
166
167
168
  void PinMemory_() {
    adj_.PinMemory_();
  }

169
  /** @brief Unpin the adj_: COOMatrix of the COO graph. */
170
171
172
173
  void UnpinMemory_() {
    adj_.UnpinMemory_();
  }

174
  /** @brief Record stream for the adj_: COOMatrix of the COO graph. */
175
176
177
178
  void RecordStream(DGLStreamHandle stream) override {
    adj_.RecordStream(stream);
  }

179
  bool IsMultigraph() const override {
180
    return aten::COOHasDuplicate(adj_);
181
182
183
184
185
186
187
  }

  bool IsReadonly() const override {
    return true;
  }

  uint64_t NumVertices(dgl_type_t vtype) const override {
Minjie Wang's avatar
Minjie Wang committed
188
    if (vtype == SrcType()) {
189
      return adj_.num_rows;
Minjie Wang's avatar
Minjie Wang committed
190
    } else if (vtype == DstType()) {
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
      return adj_.num_cols;
    } else {
      LOG(FATAL) << "Invalid vertex type: " << vtype;
      return 0;
    }
  }

  uint64_t NumEdges(dgl_type_t etype) const override {
    return adj_.row->shape[0];
  }

  bool HasVertex(dgl_type_t vtype, dgl_id_t vid) const override {
    return vid < NumVertices(vtype);
  }

  BoolArray HasVertices(dgl_type_t vtype, IdArray vids) const override {
    LOG(FATAL) << "Not enabled for COO graph";
    return {};
  }

  bool HasEdgeBetween(dgl_type_t etype, dgl_id_t src, dgl_id_t dst) const override {
212
213
214
    CHECK(HasVertex(SrcType(), src)) << "Invalid src vertex id: " << src;
    CHECK(HasVertex(DstType(), dst)) << "Invalid dst vertex id: " << dst;
    return aten::COOIsNonZero(adj_, src, dst);
215
216
217
  }

  BoolArray HasEdgesBetween(dgl_type_t etype, IdArray src_ids, IdArray dst_ids) const override {
218
219
220
    CHECK(aten::IsValidIdArray(src_ids)) << "Invalid vertex id array.";
    CHECK(aten::IsValidIdArray(dst_ids)) << "Invalid vertex id array.";
    return aten::COOIsNonZero(adj_, src_ids, dst_ids);
221
222
223
  }

  IdArray Predecessors(dgl_type_t etype, dgl_id_t dst) const override {
224
225
    CHECK(HasVertex(DstType(), dst)) << "Invalid dst vertex id: " << dst;
    return aten::COOGetRowDataAndIndices(aten::COOTranspose(adj_), dst).second;
226
227
228
  }

  IdArray Successors(dgl_type_t etype, dgl_id_t src) const override {
229
230
    CHECK(HasVertex(SrcType(), src)) << "Invalid src vertex id: " << src;
    return aten::COOGetRowDataAndIndices(adj_, src).second;
231
232
233
  }

  IdArray EdgeId(dgl_type_t etype, dgl_id_t src, dgl_id_t dst) const override {
234
235
    CHECK(HasVertex(SrcType(), src)) << "Invalid src vertex id: " << src;
    CHECK(HasVertex(DstType(), dst)) << "Invalid dst vertex id: " << dst;
236
    return aten::COOGetAllData(adj_, src, dst);
237
238
  }

239
  EdgeArray EdgeIdsAll(dgl_type_t etype, IdArray src, IdArray dst) const override {
240
241
242
243
    CHECK(aten::IsValidIdArray(src)) << "Invalid vertex id array.";
    CHECK(aten::IsValidIdArray(dst)) << "Invalid vertex id array.";
    const auto& arrs = aten::COOGetDataAndIndices(adj_, src, dst);
    return EdgeArray{arrs[0], arrs[1], arrs[2]};
244
245
  }

246
247
248
249
  IdArray EdgeIdsOne(dgl_type_t etype, IdArray src, IdArray dst) const override {
    return aten::COOGetData(adj_, src, dst);
  }

250
251
  std::pair<dgl_id_t, dgl_id_t> FindEdge(dgl_type_t etype, dgl_id_t eid) const override {
    CHECK(eid < NumEdges(etype)) << "Invalid edge id: " << eid;
252
253
    const dgl_id_t src = aten::IndexSelect<int64_t>(adj_.row, eid);
    const dgl_id_t dst = aten::IndexSelect<int64_t>(adj_.col, eid);
254
255
256
257
    return std::pair<dgl_id_t, dgl_id_t>(src, dst);
  }

  EdgeArray FindEdges(dgl_type_t etype, IdArray eids) const override {
258
    CHECK(aten::IsValidIdArray(eids)) << "Invalid edge id array";
259
    BUG_IF_FAIL(aten::IsNullArray(adj_.data)) <<
260
      "FindEdges requires the internal COO matrix not having EIDs.";
261
262
263
264
265
266
    return EdgeArray{aten::IndexSelect(adj_.row, eids),
                     aten::IndexSelect(adj_.col, eids),
                     eids};
  }

  EdgeArray InEdges(dgl_type_t etype, dgl_id_t vid) const override {
267
268
269
270
271
    IdArray ret_src, ret_eid;
    std::tie(ret_eid, ret_src) = aten::COOGetRowDataAndIndices(
        aten::COOTranspose(adj_), vid);
    IdArray ret_dst = aten::Full(vid, ret_src->shape[0], NumBits(), ret_src->ctx);
    return EdgeArray{ret_src, ret_dst, ret_eid};
272
273
274
  }

  EdgeArray InEdges(dgl_type_t etype, IdArray vids) const override {
275
276
277
278
    CHECK(aten::IsValidIdArray(vids)) << "Invalid vertex id array.";
    auto coosubmat = aten::COOSliceRows(aten::COOTranspose(adj_), vids);
    auto row = aten::IndexSelect(vids, coosubmat.row);
    return EdgeArray{coosubmat.col, row, coosubmat.data};
279
280
281
  }

  EdgeArray OutEdges(dgl_type_t etype, dgl_id_t vid) const override {
282
283
284
285
    IdArray ret_dst, ret_eid;
    std::tie(ret_eid, ret_dst) = aten::COOGetRowDataAndIndices(adj_, vid);
    IdArray ret_src = aten::Full(vid, ret_dst->shape[0], NumBits(), ret_dst->ctx);
    return EdgeArray{ret_src, ret_dst, ret_eid};
286
287
288
  }

  EdgeArray OutEdges(dgl_type_t etype, IdArray vids) const override {
289
290
291
292
    CHECK(aten::IsValidIdArray(vids)) << "Invalid vertex id array.";
    auto coosubmat = aten::COOSliceRows(adj_, vids);
    auto row = aten::IndexSelect(vids, coosubmat.row);
    return EdgeArray{row, coosubmat.col, coosubmat.data};
293
294
295
296
297
298
299
300
301
302
303
  }

  EdgeArray Edges(dgl_type_t etype, const std::string &order = "") const override {
    CHECK(order.empty() || order == std::string("eid"))
      << "COO only support Edges of order \"eid\", but got \""
      << order << "\".";
    IdArray rst_eid = aten::Range(0, NumEdges(etype), NumBits(), Context());
    return EdgeArray{adj_.row, adj_.col, rst_eid};
  }

  uint64_t InDegree(dgl_type_t etype, dgl_id_t vid) const override {
304
305
    CHECK(HasVertex(DstType(), vid)) << "Invalid dst vertex id: " << vid;
    return aten::COOGetRowNNZ(aten::COOTranspose(adj_), vid);
306
307
308
  }

  DegreeArray InDegrees(dgl_type_t etype, IdArray vids) const override {
309
310
    CHECK(aten::IsValidIdArray(vids)) << "Invalid vertex id array.";
    return aten::COOGetRowNNZ(aten::COOTranspose(adj_), vids);
311
312
313
  }

  uint64_t OutDegree(dgl_type_t etype, dgl_id_t vid) const override {
314
315
    CHECK(HasVertex(SrcType(), vid)) << "Invalid src vertex id: " << vid;
    return aten::COOGetRowNNZ(adj_, vid);
316
317
318
  }

  DegreeArray OutDegrees(dgl_type_t etype, IdArray vids) const override {
319
320
    CHECK(aten::IsValidIdArray(vids)) << "Invalid vertex id array.";
    return aten::COOGetRowNNZ(adj_, vids);
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
  }

  DGLIdIters SuccVec(dgl_type_t etype, dgl_id_t vid) const override {
    LOG(INFO) << "Not enabled for COO graph.";
    return {};
  }

  DGLIdIters OutEdgeVec(dgl_type_t etype, dgl_id_t vid) const override {
    LOG(INFO) << "Not enabled for COO graph.";
    return {};
  }

  DGLIdIters PredVec(dgl_type_t etype, dgl_id_t vid) const override {
    LOG(INFO) << "Not enabled for COO graph.";
    return {};
  }

  DGLIdIters InEdgeVec(dgl_type_t etype, dgl_id_t vid) const override {
    LOG(INFO) << "Not enabled for COO graph.";
    return {};
  }

  std::vector<IdArray> GetAdj(
      dgl_type_t etype, bool transpose, const std::string &fmt) const override {
    CHECK(fmt == "coo") << "Not valid adj format request.";
    if (transpose) {
      return {aten::HStack(adj_.col, adj_.row)};
    } else {
      return {aten::HStack(adj_.row, adj_.col)};
    }
  }

353
354
355
356
357
358
359
360
361
362
363
364
365
366
  aten::COOMatrix GetCOOMatrix(dgl_type_t etype) const override {
    return adj_;
  }

  aten::CSRMatrix GetCSCMatrix(dgl_type_t etype) const override {
    LOG(FATAL) << "Not enabled for COO graph";
    return aten::CSRMatrix();
  }

  aten::CSRMatrix GetCSRMatrix(dgl_type_t etype) const override {
    LOG(FATAL) << "Not enabled for COO graph";
    return aten::CSRMatrix();
  }

367
  SparseFormat SelectFormat(dgl_type_t etype, dgl_format_code_t preferred_formats) const override {
368
    LOG(FATAL) << "Not enabled for COO graph";
369
    return SparseFormat::kCOO;
370
371
  }

372
  dgl_format_code_t GetAllowedFormats() const override {
373
    LOG(FATAL) << "Not enabled for COO graph";
374
    return 0;
375
376
  }

377
  dgl_format_code_t GetCreatedFormats() const override {
378
379
380
381
    LOG(FATAL) << "Not enabled for COO graph";
    return 0;
  }

382
  HeteroSubgraph VertexSubgraph(const std::vector<IdArray>& vids) const override {
383
384
385
386
387
388
    CHECK_EQ(vids.size(), NumVertexTypes()) << "Number of vertex types mismatch";
    auto srcvids = vids[SrcType()], dstvids = vids[DstType()];
    CHECK(aten::IsValidIdArray(srcvids)) << "Invalid vertex id array.";
    CHECK(aten::IsValidIdArray(dstvids)) << "Invalid vertex id array.";
    HeteroSubgraph subg;
    const auto& submat = aten::COOSliceMatrix(adj_, srcvids, dstvids);
389
    DGLContext ctx = aten::GetContextOf(vids);
390
    IdArray sub_eids = aten::Range(0, submat.data->shape[0], NumBits(), ctx);
391
392
393
394
395
    subg.graph = std::make_shared<COO>(meta_graph(), submat.num_rows, submat.num_cols,
        submat.row, submat.col);
    subg.induced_vertices = vids;
    subg.induced_edges.emplace_back(submat.data);
    return subg;
396
397
398
399
400
401
402
403
404
405
406
407
408
409
  }

  HeteroSubgraph EdgeSubgraph(
      const std::vector<IdArray>& eids, bool preserve_nodes = false) const override {
    CHECK_EQ(eids.size(), 1) << "Edge type number mismatch.";
    HeteroSubgraph subg;
    if (!preserve_nodes) {
      IdArray new_src = aten::IndexSelect(adj_.row, eids[0]);
      IdArray new_dst = aten::IndexSelect(adj_.col, eids[0]);
      subg.induced_vertices.emplace_back(aten::Relabel_({new_src}));
      subg.induced_vertices.emplace_back(aten::Relabel_({new_dst}));
      const auto new_nsrc = subg.induced_vertices[0]->shape[0];
      const auto new_ndst = subg.induced_vertices[1]->shape[0];
      subg.graph = std::make_shared<COO>(
Minjie Wang's avatar
Minjie Wang committed
410
          meta_graph(), new_nsrc, new_ndst, new_src, new_dst);
411
412
413
414
      subg.induced_edges = eids;
    } else {
      IdArray new_src = aten::IndexSelect(adj_.row, eids[0]);
      IdArray new_dst = aten::IndexSelect(adj_.col, eids[0]);
Quan (Andy) Gan's avatar
Quan (Andy) Gan committed
415
      subg.induced_vertices.emplace_back(
416
          aten::NullArray(DGLDataType{kDGLInt, NumBits(), 1}, Context()));
Quan (Andy) Gan's avatar
Quan (Andy) Gan committed
417
      subg.induced_vertices.emplace_back(
418
          aten::NullArray(DGLDataType{kDGLInt, NumBits(), 1}, Context()));
419
      subg.graph = std::make_shared<COO>(
Quan (Andy) Gan's avatar
Quan (Andy) Gan committed
420
          meta_graph(), NumVertices(SrcType()), NumVertices(DstType()), new_src, new_dst);
421
422
423
424
425
      subg.induced_edges = eids;
    }
    return subg;
  }

426
  HeteroGraphPtr GetGraphInFormat(dgl_format_code_t formats) const override {
427
428
429
430
    LOG(FATAL) << "Not enabled for COO graph.";
    return nullptr;
  }

431
432
433
434
  aten::COOMatrix adj() const {
    return adj_;
  }

435
  /**
436
   * @brief Determines whether the graph is "hypersparse", i.e. having significantly more
437
438
439
440
441
442
443
   * nodes than edges.
   */
  bool IsHypersparse() const {
    return (NumVertices(SrcType()) / 8 > NumEdges(EdgeType())) &&
           (NumVertices(SrcType()) > 1000000);
  }

444
445
446
447
448
449
450
451
452
453
454
455
456
  bool Load(dmlc::Stream* fs) {
    auto meta_imgraph = Serializer::make_shared<ImmutableGraph>();
    CHECK(fs->Read(&meta_imgraph)) << "Invalid meta graph";
    meta_graph_ = meta_imgraph;
    CHECK(fs->Read(&adj_)) << "Invalid adj matrix";
    return true;
  }
  void Save(dmlc::Stream* fs) const {
    auto meta_graph_ptr = ImmutableGraph::ToImmutable(meta_graph());
    fs->Write(meta_graph_ptr);
    fs->Write(adj_);
  }

457
 private:
458
459
  friend class Serializer;

460
  /** @brief internal adjacency matrix. Data array is empty */
461
462
463
464
465
466
467
468
469
  aten::COOMatrix adj_;
};

//////////////////////////////////////////////////////////
//
// CSR graph implementation
//
//////////////////////////////////////////////////////////

470
/** @brief CSR graph */
Minjie Wang's avatar
Minjie Wang committed
471
class UnitGraph::CSR : public BaseHeteroGraph {
472
 public:
Minjie Wang's avatar
Minjie Wang committed
473
  CSR(GraphPtr metagraph, int64_t num_src, int64_t num_dst,
474
      IdArray indptr, IdArray indices, IdArray edge_ids)
Minjie Wang's avatar
Minjie Wang committed
475
    : BaseHeteroGraph(metagraph) {
476
477
    CHECK(aten::IsValidIdArray(indptr));
    CHECK(aten::IsValidIdArray(indices));
478
479
480
    if (aten::IsValidIdArray(edge_ids))
      CHECK((indices->shape[0] == edge_ids->shape[0]) || aten::IsNullArray(edge_ids))
        << "edge id arrays should have the same length as indices if not empty";
481
482
    CHECK_EQ(num_src, indptr->shape[0] - 1)
      << "number of nodes do not match the length of indptr minus 1.";
483

484
485
486
    adj_ = aten::CSRMatrix{num_src, num_dst, indptr, indices, edge_ids};
  }

487
  CSR(GraphPtr metagraph, const aten::CSRMatrix& csr)
Da Zheng's avatar
Da Zheng committed
488
489
    : BaseHeteroGraph(metagraph), adj_(csr) {
  }
490

491
492
493
494
495
496
497
498
499
500
501
  CSR() {
    // set magic num_rows/num_cols to mark it as undefined
    // adj_.num_rows == 0 and adj_.num_cols == 0 means empty UnitGraph which is supported
    adj_.num_rows = -1;
    adj_.num_cols = -1;
  };

  bool defined() const {
    return (adj_.num_rows >= 0) || (adj_.num_cols >= 0);
  }

Minjie Wang's avatar
Minjie Wang committed
502
503
  inline dgl_type_t SrcType() const {
    return 0;
504
  }
Minjie Wang's avatar
Minjie Wang committed
505
506
507
508
509
510
511

  inline dgl_type_t DstType() const {
    return NumVertexTypes() == 1? 0 : 1;
  }

  inline dgl_type_t EdgeType() const {
    return 0;
512
513
514
  }

  HeteroGraphPtr GetRelationGraph(dgl_type_t etype) const override {
Minjie Wang's avatar
Minjie Wang committed
515
    LOG(FATAL) << "The method shouldn't be called for UnitGraph graph. "
516
517
518
519
520
      << "The relation graph is simply this graph itself.";
    return {};
  }

  void AddVertices(dgl_type_t vtype, uint64_t num_vertices) override {
Minjie Wang's avatar
Minjie Wang committed
521
    LOG(FATAL) << "UnitGraph graph is not mutable.";
522
523
524
  }

  void AddEdge(dgl_type_t etype, dgl_id_t src, dgl_id_t dst) override {
Minjie Wang's avatar
Minjie Wang committed
525
    LOG(FATAL) << "UnitGraph graph is not mutable.";
526
527
528
  }

  void AddEdges(dgl_type_t etype, IdArray src_ids, IdArray dst_ids) override {
Minjie Wang's avatar
Minjie Wang committed
529
    LOG(FATAL) << "UnitGraph graph is not mutable.";
530
531
532
  }

  void Clear() override {
Minjie Wang's avatar
Minjie Wang committed
533
    LOG(FATAL) << "UnitGraph graph is not mutable.";
534
535
  }

536
  DGLDataType DataType() const override {
537
538
539
    return adj_.indices->dtype;
  }

540
  DGLContext Context() const override {
541
542
543
    return adj_.indices->ctx;
  }

544
  bool IsPinned() const override {
545
    return adj_.is_pinned;
546
547
  }

548
549
550
551
  uint8_t NumBits() const override {
    return adj_.indices->dtype.bits;
  }

552
553
554
555
556
  CSR AsNumBits(uint8_t bits) const {
    if (NumBits() == bits) {
      return *this;
    } else {
      CSR ret(
Minjie Wang's avatar
Minjie Wang committed
557
          meta_graph_,
558
559
560
561
562
563
564
565
          adj_.num_rows, adj_.num_cols,
          aten::AsNumBits(adj_.indptr, bits),
          aten::AsNumBits(adj_.indices, bits),
          aten::AsNumBits(adj_.data, bits));
      return ret;
    }
  }

566
  CSR CopyTo(const DGLContext &ctx) const {
567
568
569
    if (Context() == ctx) {
      return *this;
    } else {
570
      return CSR(meta_graph_, adj_.CopyTo(ctx));
571
572
573
    }
  }

574
  /** @brief Pin the adj_: CSRMatrix of the CSR graph. */
575
576
577
578
  void PinMemory_() {
    adj_.PinMemory_();
  }

579
  /** @brief Unpin the adj_: CSRMatrix of the CSR graph. */
580
581
582
583
  void UnpinMemory_() {
    adj_.UnpinMemory_();
  }

584
  /** @brief Record stream for the adj_: CSRMatrix of the CSR graph. */
585
586
587
588
  void RecordStream(DGLStreamHandle stream) override {
    adj_.RecordStream(stream);
  }

589
  bool IsMultigraph() const override {
590
    return aten::CSRHasDuplicate(adj_);
591
592
593
594
595
596
597
  }

  bool IsReadonly() const override {
    return true;
  }

  uint64_t NumVertices(dgl_type_t vtype) const override {
Minjie Wang's avatar
Minjie Wang committed
598
    if (vtype == SrcType()) {
599
      return adj_.num_rows;
Minjie Wang's avatar
Minjie Wang committed
600
    } else if (vtype == DstType()) {
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
      return adj_.num_cols;
    } else {
      LOG(FATAL) << "Invalid vertex type: " << vtype;
      return 0;
    }
  }

  uint64_t NumEdges(dgl_type_t etype) const override {
    return adj_.indices->shape[0];
  }

  bool HasVertex(dgl_type_t vtype, dgl_id_t vid) const override {
    return vid < NumVertices(vtype);
  }

  BoolArray HasVertices(dgl_type_t vtype, IdArray vids) const override {
    LOG(FATAL) << "Not enabled for COO graph";
    return {};
  }

  bool HasEdgeBetween(dgl_type_t etype, dgl_id_t src, dgl_id_t dst) const override {
Minjie Wang's avatar
Minjie Wang committed
622
623
    CHECK(HasVertex(SrcType(), src)) << "Invalid src vertex id: " << src;
    CHECK(HasVertex(DstType(), dst)) << "Invalid dst vertex id: " << dst;
624
625
626
627
    return aten::CSRIsNonZero(adj_, src, dst);
  }

  BoolArray HasEdgesBetween(dgl_type_t etype, IdArray src_ids, IdArray dst_ids) const override {
628
629
    CHECK(aten::IsValidIdArray(src_ids)) << "Invalid vertex id array.";
    CHECK(aten::IsValidIdArray(dst_ids)) << "Invalid vertex id array.";
630
631
632
633
634
635
636
637
638
    return aten::CSRIsNonZero(adj_, src_ids, dst_ids);
  }

  IdArray Predecessors(dgl_type_t etype, dgl_id_t dst) const override {
    LOG(INFO) << "Not enabled for CSR graph.";
    return {};
  }

  IdArray Successors(dgl_type_t etype, dgl_id_t src) const override {
Minjie Wang's avatar
Minjie Wang committed
639
    CHECK(HasVertex(SrcType(), src)) << "Invalid src vertex id: " << src;
640
641
642
643
    return aten::CSRGetRowColumnIndices(adj_, src);
  }

  IdArray EdgeId(dgl_type_t etype, dgl_id_t src, dgl_id_t dst) const override {
Minjie Wang's avatar
Minjie Wang committed
644
645
    CHECK(HasVertex(SrcType(), src)) << "Invalid src vertex id: " << src;
    CHECK(HasVertex(DstType(), dst)) << "Invalid dst vertex id: " << dst;
646
    return aten::CSRGetAllData(adj_, src, dst);
647
648
  }

649
  EdgeArray EdgeIdsAll(dgl_type_t etype, IdArray src, IdArray dst) const override {
650
651
    CHECK(aten::IsValidIdArray(src)) << "Invalid vertex id array.";
    CHECK(aten::IsValidIdArray(dst)) << "Invalid vertex id array.";
652
653
654
655
    const auto& arrs = aten::CSRGetDataAndIndices(adj_, src, dst);
    return EdgeArray{arrs[0], arrs[1], arrs[2]};
  }

656
657
658
659
  IdArray EdgeIdsOne(dgl_type_t etype, IdArray src, IdArray dst) const override {
    return aten::CSRGetData(adj_, src, dst);
  }

660
  std::pair<dgl_id_t, dgl_id_t> FindEdge(dgl_type_t etype, dgl_id_t eid) const override {
661
    LOG(FATAL) << "Not enabled for CSR graph.";
662
663
664
665
    return {};
  }

  EdgeArray FindEdges(dgl_type_t etype, IdArray eids) const override {
666
    LOG(FATAL) << "Not enabled for CSR graph.";
667
668
669
670
    return {};
  }

  EdgeArray InEdges(dgl_type_t etype, dgl_id_t vid) const override {
671
    LOG(FATAL) << "Not enabled for CSR graph.";
672
673
674
675
    return {};
  }

  EdgeArray InEdges(dgl_type_t etype, IdArray vids) const override {
676
    LOG(FATAL) << "Not enabled for CSR graph.";
677
678
679
680
    return {};
  }

  EdgeArray OutEdges(dgl_type_t etype, dgl_id_t vid) const override {
Minjie Wang's avatar
Minjie Wang committed
681
    CHECK(HasVertex(SrcType(), vid)) << "Invalid src vertex id: " << vid;
682
683
684
685
686
687
688
    IdArray ret_dst = aten::CSRGetRowColumnIndices(adj_, vid);
    IdArray ret_eid = aten::CSRGetRowData(adj_, vid);
    IdArray ret_src = aten::Full(vid, ret_dst->shape[0], NumBits(), ret_dst->ctx);
    return EdgeArray{ret_src, ret_dst, ret_eid};
  }

  EdgeArray OutEdges(dgl_type_t etype, IdArray vids) const override {
689
    CHECK(aten::IsValidIdArray(vids)) << "Invalid vertex id array.";
690
691
692
693
694
695
696
697
698
699
700
701
    auto csrsubmat = aten::CSRSliceRows(adj_, vids);
    auto coosubmat = aten::CSRToCOO(csrsubmat, false);
    // Note that the row id in the csr submat is relabled, so
    // we need to recover it using an index select.
    auto row = aten::IndexSelect(vids, coosubmat.row);
    return EdgeArray{row, coosubmat.col, coosubmat.data};
  }

  EdgeArray Edges(dgl_type_t etype, const std::string &order = "") const override {
    CHECK(order.empty() || order == std::string("srcdst"))
      << "CSR only support Edges of order \"srcdst\","
      << " but got \"" << order << "\".";
702
703
704
705
706
    auto coo = aten::CSRToCOO(adj_, false);
    if (order == std::string("srcdst")) {
      // make sure the coo is sorted if an order is requested
      coo = aten::COOSort(coo, true);
    }
707
708
709
710
    return EdgeArray{coo.row, coo.col, coo.data};
  }

  uint64_t InDegree(dgl_type_t etype, dgl_id_t vid) const override {
711
    LOG(FATAL) << "Not enabled for CSR graph.";
712
713
714
715
    return {};
  }

  DegreeArray InDegrees(dgl_type_t etype, IdArray vids) const override {
716
    LOG(FATAL) << "Not enabled for CSR graph.";
717
718
719
720
    return {};
  }

  uint64_t OutDegree(dgl_type_t etype, dgl_id_t vid) const override {
Minjie Wang's avatar
Minjie Wang committed
721
    CHECK(HasVertex(SrcType(), vid)) << "Invalid src vertex id: " << vid;
722
723
724
725
    return aten::CSRGetRowNNZ(adj_, vid);
  }

  DegreeArray OutDegrees(dgl_type_t etype, IdArray vids) const override {
726
    CHECK(aten::IsValidIdArray(vids)) << "Invalid vertex id array.";
727
728
729
730
731
732
    return aten::CSRGetRowNNZ(adj_, vids);
  }

  DGLIdIters SuccVec(dgl_type_t etype, dgl_id_t vid) const override {
    // TODO(minjie): This still assumes the data type and device context
    //   of this graph. Should fix later.
733
    CHECK_EQ(NumBits(), 64);
734
735
736
737
738
739
740
    const dgl_id_t* indptr_data = static_cast<dgl_id_t*>(adj_.indptr->data);
    const dgl_id_t* indices_data = static_cast<dgl_id_t*>(adj_.indices->data);
    const dgl_id_t start = indptr_data[vid];
    const dgl_id_t end = indptr_data[vid + 1];
    return DGLIdIters(indices_data + start, indices_data + end);
  }

741
742
743
744
745
746
747
748
749
750
  DGLIdIters32 SuccVec32(dgl_type_t etype, dgl_id_t vid) {
    // TODO(minjie): This still assumes the data type and device context
    //   of this graph. Should fix later.
    const int32_t* indptr_data = static_cast<int32_t*>(adj_.indptr->data);
    const int32_t* indices_data = static_cast<int32_t*>(adj_.indices->data);
    const int32_t start = indptr_data[vid];
    const int32_t end = indptr_data[vid + 1];
    return DGLIdIters32(indices_data + start, indices_data + end);
  }

751
752
753
  DGLIdIters OutEdgeVec(dgl_type_t etype, dgl_id_t vid) const override {
    // TODO(minjie): This still assumes the data type and device context
    //   of this graph. Should fix later.
754
    CHECK_EQ(NumBits(), 64);
755
756
757
758
759
760
761
762
    const dgl_id_t* indptr_data = static_cast<dgl_id_t*>(adj_.indptr->data);
    const dgl_id_t* eid_data = static_cast<dgl_id_t*>(adj_.data->data);
    const dgl_id_t start = indptr_data[vid];
    const dgl_id_t end = indptr_data[vid + 1];
    return DGLIdIters(eid_data + start, eid_data + end);
  }

  DGLIdIters PredVec(dgl_type_t etype, dgl_id_t vid) const override {
763
    LOG(FATAL) << "Not enabled for CSR graph.";
764
765
766
767
    return {};
  }

  DGLIdIters InEdgeVec(dgl_type_t etype, dgl_id_t vid) const override {
768
    LOG(FATAL) << "Not enabled for CSR graph.";
769
770
771
772
773
774
775
776
777
    return {};
  }

  std::vector<IdArray> GetAdj(
      dgl_type_t etype, bool transpose, const std::string &fmt) const override {
    CHECK(!transpose && fmt == "csr") << "Not valid adj format request.";
    return {adj_.indptr, adj_.indices, adj_.data};
  }

778
779
780
781
782
783
784
785
786
787
788
789
790
791
  aten::COOMatrix GetCOOMatrix(dgl_type_t etype) const override {
    LOG(FATAL) << "Not enabled for CSR graph";
    return aten::COOMatrix();
  }

  aten::CSRMatrix GetCSCMatrix(dgl_type_t etype) const override {
    LOG(FATAL) << "Not enabled for CSR graph";
    return aten::CSRMatrix();
  }

  aten::CSRMatrix GetCSRMatrix(dgl_type_t etype) const override {
    return adj_;
  }

792
  SparseFormat SelectFormat(dgl_type_t etype, dgl_format_code_t preferred_formats) const override {
793
    LOG(FATAL) << "Not enabled for CSR graph";
794
    return SparseFormat::kCSR;
795
796
  }

797
798
799
  dgl_format_code_t GetAllowedFormats() const override {
    LOG(FATAL) << "Not enabled for COO graph";
    return 0;
800
801
  }

802
  dgl_format_code_t GetCreatedFormats() const override {
803
804
805
806
    LOG(FATAL) << "Not enabled for CSR graph";
    return 0;
  }

807
  HeteroSubgraph VertexSubgraph(const std::vector<IdArray>& vids) const override {
Minjie Wang's avatar
Minjie Wang committed
808
809
810
811
    CHECK_EQ(vids.size(), NumVertexTypes()) << "Number of vertex types mismatch";
    auto srcvids = vids[SrcType()], dstvids = vids[DstType()];
    CHECK(aten::IsValidIdArray(srcvids)) << "Invalid vertex id array.";
    CHECK(aten::IsValidIdArray(dstvids)) << "Invalid vertex id array.";
812
    HeteroSubgraph subg;
Minjie Wang's avatar
Minjie Wang committed
813
    const auto& submat = aten::CSRSliceMatrix(adj_, srcvids, dstvids);
814
    DGLContext ctx = aten::GetContextOf(vids);
815
    IdArray sub_eids = aten::Range(0, submat.data->shape[0], NumBits(), ctx);
Minjie Wang's avatar
Minjie Wang committed
816
    subg.graph = std::make_shared<CSR>(meta_graph(), submat.num_rows, submat.num_cols,
817
818
819
820
821
822
823
824
        submat.indptr, submat.indices, sub_eids);
    subg.induced_vertices = vids;
    subg.induced_edges.emplace_back(submat.data);
    return subg;
  }

  HeteroSubgraph EdgeSubgraph(
      const std::vector<IdArray>& eids, bool preserve_nodes = false) const override {
825
    LOG(FATAL) << "Not enabled for CSR graph.";
826
827
828
    return {};
  }

829
  HeteroGraphPtr GetGraphInFormat(dgl_format_code_t formats) const override {
830
831
832
833
    LOG(FATAL) << "Not enabled for CSR graph.";
    return nullptr;
  }

834
835
836
837
  aten::CSRMatrix adj() const {
    return adj_;
  }

838
839
840
841
842
843
844
845
846
847
848
849
850
  bool Load(dmlc::Stream* fs) {
    auto meta_imgraph = Serializer::make_shared<ImmutableGraph>();
    CHECK(fs->Read(&meta_imgraph)) << "Invalid meta graph";
    meta_graph_ = meta_imgraph;
    CHECK(fs->Read(&adj_)) << "Invalid adj matrix";
    return true;
  }
  void Save(dmlc::Stream* fs) const {
    auto meta_graph_ptr = ImmutableGraph::ToImmutable(meta_graph());
    fs->Write(meta_graph_ptr);
    fs->Write(adj_);
  }

851
 private:
852
853
  friend class Serializer;

854
  /** @brief internal adjacency matrix. Data array stores edge ids */
855
856
857
858
859
  aten::CSRMatrix adj_;
};

//////////////////////////////////////////////////////////
//
Minjie Wang's avatar
Minjie Wang committed
860
// unit graph implementation
861
862
863
//
//////////////////////////////////////////////////////////

864
DGLDataType UnitGraph::DataType() const {
865
866
867
  return GetAny()->DataType();
}

868
DGLContext UnitGraph::Context() const {
869
870
871
  return GetAny()->Context();
}

872
873
874
875
bool UnitGraph::IsPinned() const {
  return GetAny()->IsPinned();
}

Minjie Wang's avatar
Minjie Wang committed
876
uint8_t UnitGraph::NumBits() const {
877
878
879
  return GetAny()->NumBits();
}

Minjie Wang's avatar
Minjie Wang committed
880
bool UnitGraph::IsMultigraph() const {
881
  const SparseFormat fmt = SelectFormat(CSC_CODE);
882
883
  const auto ptr = GetFormat(fmt);
  return ptr->IsMultigraph();
884
885
}

Minjie Wang's avatar
Minjie Wang committed
886
uint64_t UnitGraph::NumVertices(dgl_type_t vtype) const {
887
  const SparseFormat fmt = SelectFormat(ALL_CODE);
888
889
890
  const auto ptr = GetFormat(fmt);
  // TODO(BarclayII): we have a lot of special handling for CSC.
  // Need to have a UnitGraph::CSC backend instead.
891
  if (fmt == SparseFormat::kCSC)
Minjie Wang's avatar
Minjie Wang committed
892
    vtype = (vtype == SrcType()) ? DstType() : SrcType();
893
  return ptr->NumVertices(vtype);
894
895
}

Minjie Wang's avatar
Minjie Wang committed
896
uint64_t UnitGraph::NumEdges(dgl_type_t etype) const {
897
898
899
  return GetAny()->NumEdges(etype);
}

Minjie Wang's avatar
Minjie Wang committed
900
bool UnitGraph::HasVertex(dgl_type_t vtype, dgl_id_t vid) const {
901
  const SparseFormat fmt = SelectFormat(ALL_CODE);
902
  const auto ptr = GetFormat(fmt);
903
  if (fmt == SparseFormat::kCSC)
Minjie Wang's avatar
Minjie Wang committed
904
    vtype = (vtype == SrcType()) ? DstType() : SrcType();
905
  return ptr->HasVertex(vtype, vid);
906
907
}

Minjie Wang's avatar
Minjie Wang committed
908
BoolArray UnitGraph::HasVertices(dgl_type_t vtype, IdArray vids) const {
909
  CHECK(aten::IsValidIdArray(vids)) << "Invalid id array input";
910
911
912
  return aten::LT(vids, NumVertices(vtype));
}

Minjie Wang's avatar
Minjie Wang committed
913
bool UnitGraph::HasEdgeBetween(dgl_type_t etype, dgl_id_t src, dgl_id_t dst) const {
914
  const SparseFormat fmt = SelectFormat(CSC_CODE);
915
  const auto ptr = GetFormat(fmt);
916
  if (fmt == SparseFormat::kCSC)
917
918
919
    return ptr->HasEdgeBetween(etype, dst, src);
  else
    return ptr->HasEdgeBetween(etype, src, dst);
920
921
}

Minjie Wang's avatar
Minjie Wang committed
922
BoolArray UnitGraph::HasEdgesBetween(
923
    dgl_type_t etype, IdArray src, IdArray dst) const {
924
  const SparseFormat fmt = SelectFormat(CSC_CODE);
925
  const auto ptr = GetFormat(fmt);
926
  if (fmt == SparseFormat::kCSC)
927
928
929
    return ptr->HasEdgesBetween(etype, dst, src);
  else
    return ptr->HasEdgesBetween(etype, src, dst);
930
931
}

Minjie Wang's avatar
Minjie Wang committed
932
IdArray UnitGraph::Predecessors(dgl_type_t etype, dgl_id_t dst) const {
933
  const SparseFormat fmt = SelectFormat(CSC_CODE);
934
  const auto ptr = GetFormat(fmt);
935
  if (fmt == SparseFormat::kCSC)
936
937
938
    return ptr->Successors(etype, dst);
  else
    return ptr->Predecessors(etype, dst);
939
940
}

Minjie Wang's avatar
Minjie Wang committed
941
IdArray UnitGraph::Successors(dgl_type_t etype, dgl_id_t src) const {
942
  const SparseFormat fmt = SelectFormat(CSR_CODE);
943
944
  const auto ptr = GetFormat(fmt);
  return ptr->Successors(etype, src);
945
946
}

Minjie Wang's avatar
Minjie Wang committed
947
IdArray UnitGraph::EdgeId(dgl_type_t etype, dgl_id_t src, dgl_id_t dst) const {
948
  const SparseFormat fmt = SelectFormat(CSR_CODE);
949
  const auto ptr = GetFormat(fmt);
950
  if (fmt == SparseFormat::kCSC)
951
952
953
    return ptr->EdgeId(etype, dst, src);
  else
    return ptr->EdgeId(etype, src, dst);
954
955
}

956
EdgeArray UnitGraph::EdgeIdsAll(dgl_type_t etype, IdArray src, IdArray dst) const {
957
  const SparseFormat fmt = SelectFormat(CSR_CODE);
958
  const auto ptr = GetFormat(fmt);
959
  if (fmt == SparseFormat::kCSC) {
960
    EdgeArray edges = ptr->EdgeIdsAll(etype, dst, src);
961
962
    return EdgeArray{edges.dst, edges.src, edges.id};
  } else {
963
964
965
966
967
    return ptr->EdgeIdsAll(etype, src, dst);
  }
}

IdArray UnitGraph::EdgeIdsOne(dgl_type_t etype, IdArray src, IdArray dst) const {
968
  const SparseFormat fmt = SelectFormat(CSR_CODE);
969
970
971
972
973
  const auto ptr = GetFormat(fmt);
  if (fmt == SparseFormat::kCSC) {
    return ptr->EdgeIdsOne(etype, dst, src);
  } else {
    return ptr->EdgeIdsOne(etype, src, dst);
974
975
976
  }
}

Minjie Wang's avatar
Minjie Wang committed
977
std::pair<dgl_id_t, dgl_id_t> UnitGraph::FindEdge(dgl_type_t etype, dgl_id_t eid) const {
978
  const SparseFormat fmt = SelectFormat(COO_CODE);
979
980
  const auto ptr = GetFormat(fmt);
  return ptr->FindEdge(etype, eid);
981
982
}

Minjie Wang's avatar
Minjie Wang committed
983
EdgeArray UnitGraph::FindEdges(dgl_type_t etype, IdArray eids) const {
984
  const SparseFormat fmt = SelectFormat(COO_CODE);
985
986
  const auto ptr = GetFormat(fmt);
  return ptr->FindEdges(etype, eids);
987
988
}

Minjie Wang's avatar
Minjie Wang committed
989
EdgeArray UnitGraph::InEdges(dgl_type_t etype, dgl_id_t vid) const {
990
  const SparseFormat fmt = SelectFormat(CSC_CODE);
991
  const auto ptr = GetFormat(fmt);
992
  if (fmt == SparseFormat::kCSC) {
993
994
995
996
997
    const EdgeArray& ret = ptr->OutEdges(etype, vid);
    return {ret.dst, ret.src, ret.id};
  } else {
    return ptr->InEdges(etype, vid);
  }
998
999
}

Minjie Wang's avatar
Minjie Wang committed
1000
EdgeArray UnitGraph::InEdges(dgl_type_t etype, IdArray vids) const {
1001
  const SparseFormat fmt = SelectFormat(CSC_CODE);
1002
  const auto ptr = GetFormat(fmt);
1003
  if (fmt == SparseFormat::kCSC) {
1004
1005
1006
1007
1008
    const EdgeArray& ret = ptr->OutEdges(etype, vids);
    return {ret.dst, ret.src, ret.id};
  } else {
    return ptr->InEdges(etype, vids);
  }
1009
1010
}

Minjie Wang's avatar
Minjie Wang committed
1011
EdgeArray UnitGraph::OutEdges(dgl_type_t etype, dgl_id_t vid) const {
1012
  const SparseFormat fmt = SelectFormat(CSR_CODE);
1013
1014
  const auto ptr = GetFormat(fmt);
  return ptr->OutEdges(etype, vid);
1015
1016
}

Minjie Wang's avatar
Minjie Wang committed
1017
EdgeArray UnitGraph::OutEdges(dgl_type_t etype, IdArray vids) const {
1018
  const SparseFormat fmt = SelectFormat(CSR_CODE);
1019
1020
  const auto ptr = GetFormat(fmt);
  return ptr->OutEdges(etype, vids);
1021
1022
}

Minjie Wang's avatar
Minjie Wang committed
1023
EdgeArray UnitGraph::Edges(dgl_type_t etype, const std::string &order) const {
1024
1025
  SparseFormat fmt;
  if (order == std::string("eid")) {
1026
    fmt = SelectFormat(COO_CODE);
1027
  } else if (order.empty()) {
1028
    // arbitrary order
1029
    fmt = SelectFormat(ALL_CODE);
1030
  } else if (order == std::string("srcdst")) {
1031
    fmt = SelectFormat(CSR_CODE);
1032
1033
  } else {
    LOG(FATAL) << "Unsupported order request: " << order;
1034
    return {};
1035
  }
1036
1037

  const auto& edges = GetFormat(fmt)->Edges(etype, order);
1038
  if (fmt == SparseFormat::kCSC)
1039
1040
1041
    return EdgeArray{edges.dst, edges.src, edges.id};
  else
    return edges;
1042
1043
}

Minjie Wang's avatar
Minjie Wang committed
1044
uint64_t UnitGraph::InDegree(dgl_type_t etype, dgl_id_t vid) const {
1045
  SparseFormat fmt = SelectFormat(CSC_CODE);
1046
  const auto ptr = GetFormat(fmt);
1047
1048
1049
1050
1051
  CHECK(fmt == SparseFormat::kCSC || fmt == SparseFormat::kCOO)
      << "In degree cannot be computed as neither CSC nor COO format is "
         "allowed for this graph. Please enable one of them at least.";
  return fmt == SparseFormat::kCSC ? ptr->OutDegree(etype, vid)
                                   : ptr->InDegree(etype, vid);
1052
1053
}

Minjie Wang's avatar
Minjie Wang committed
1054
DegreeArray UnitGraph::InDegrees(dgl_type_t etype, IdArray vids) const {
1055
  SparseFormat fmt = SelectFormat(CSC_CODE);
1056
  const auto ptr = GetFormat(fmt);
1057
1058
1059
1060
1061
  CHECK(fmt == SparseFormat::kCSC || fmt == SparseFormat::kCOO)
      << "In degree cannot be computed as neither CSC nor COO format is "
         "allowed for this graph. Please enable one of them at least.";
  return fmt == SparseFormat::kCSC ? ptr->OutDegrees(etype, vids)
                                   : ptr->InDegrees(etype, vids);
1062
1063
}

Minjie Wang's avatar
Minjie Wang committed
1064
uint64_t UnitGraph::OutDegree(dgl_type_t etype, dgl_id_t vid) const {
1065
  SparseFormat fmt = SelectFormat(CSR_CODE);
1066
  const auto ptr = GetFormat(fmt);
1067
1068
1069
  CHECK(fmt == SparseFormat::kCSR || fmt == SparseFormat::kCOO)
      << "Out degree cannot be computed as neither CSR nor COO format is "
         "allowed for this graph. Please enable one of them at least.";
1070
  return ptr->OutDegree(etype, vid);
1071
1072
}

Minjie Wang's avatar
Minjie Wang committed
1073
DegreeArray UnitGraph::OutDegrees(dgl_type_t etype, IdArray vids) const {
1074
  SparseFormat fmt = SelectFormat(CSR_CODE);
1075
  const auto ptr = GetFormat(fmt);
1076
1077
1078
  CHECK(fmt == SparseFormat::kCSR || fmt == SparseFormat::kCOO)
      << "Out degree cannot be computed as neither CSR nor COO format is "
         "allowed for this graph. Please enable one of them at least.";
1079
  return ptr->OutDegrees(etype, vids);
1080
1081
}

Minjie Wang's avatar
Minjie Wang committed
1082
DGLIdIters UnitGraph::SuccVec(dgl_type_t etype, dgl_id_t vid) const {
1083
  SparseFormat fmt = SelectFormat(CSR_CODE);
1084
1085
  const auto ptr = GetFormat(fmt);
  return ptr->SuccVec(etype, vid);
1086
1087
}

1088
DGLIdIters32 UnitGraph::SuccVec32(dgl_type_t etype, dgl_id_t vid) const {
1089
  SparseFormat fmt = SelectFormat(CSR_CODE);
1090
1091
1092
1093
1094
  const auto ptr = std::dynamic_pointer_cast<CSR>(GetFormat(fmt));
  CHECK_NOTNULL(ptr);
  return ptr->SuccVec32(etype, vid);
}

Minjie Wang's avatar
Minjie Wang committed
1095
DGLIdIters UnitGraph::OutEdgeVec(dgl_type_t etype, dgl_id_t vid) const {
1096
  SparseFormat fmt = SelectFormat(CSR_CODE);
1097
1098
  const auto ptr = GetFormat(fmt);
  return ptr->OutEdgeVec(etype, vid);
1099
1100
}

Minjie Wang's avatar
Minjie Wang committed
1101
DGLIdIters UnitGraph::PredVec(dgl_type_t etype, dgl_id_t vid) const {
1102
  SparseFormat fmt = SelectFormat(CSC_CODE);
1103
  const auto ptr = GetFormat(fmt);
1104
  if (fmt == SparseFormat::kCSC)
1105
1106
1107
    return ptr->SuccVec(etype, vid);
  else
    return ptr->PredVec(etype, vid);
1108
1109
}

Minjie Wang's avatar
Minjie Wang committed
1110
DGLIdIters UnitGraph::InEdgeVec(dgl_type_t etype, dgl_id_t vid) const {
1111
  SparseFormat fmt = SelectFormat(CSC_CODE);
1112
  const auto ptr = GetFormat(fmt);
1113
  if (fmt == SparseFormat::kCSC)
1114
1115
1116
    return ptr->OutEdgeVec(etype, vid);
  else
    return ptr->InEdgeVec(etype, vid);
1117
1118
}

Minjie Wang's avatar
Minjie Wang committed
1119
std::vector<IdArray> UnitGraph::GetAdj(
1120
1121
1122
1123
1124
1125
1126
1127
1128
    dgl_type_t etype, bool transpose, const std::string &fmt) const {
  // TODO(minjie): Our current semantics of adjacency matrix is row for dst nodes and col for
  //   src nodes. Therefore, we need to flip the transpose flag. For example, transpose=False
  //   is equal to in edge CSR.
  //   We have this behavior because previously we use framework's SPMM and we don't cache
  //   reverse adj. This is not intuitive and also not consistent with networkx's
  //   to_scipy_sparse_matrix. With the upcoming custom kernel change, we should change the
  //   behavior and make row for src and col for dst.
  if (fmt == std::string("csr")) {
1129
    return !transpose ? GetOutCSR()->GetAdj(etype, false, "csr")
1130
1131
      : GetInCSR()->GetAdj(etype, false, "csr");
  } else if (fmt == std::string("coo")) {
1132
    return GetCOO()->GetAdj(etype, transpose, fmt);
1133
1134
1135
1136
1137
1138
  } else {
    LOG(FATAL) << "unsupported adjacency matrix format: " << fmt;
    return {};
  }
}

Minjie Wang's avatar
Minjie Wang committed
1139
HeteroSubgraph UnitGraph::VertexSubgraph(const std::vector<IdArray>& vids) const {
1140
  // We prefer to generate a subgraph from out-csr.
1141
  SparseFormat fmt = SelectFormat(CSR_CODE);
1142
  HeteroSubgraph sg = GetFormat(fmt)->VertexSubgraph(vids);
1143
  HeteroSubgraph ret;
Quan (Andy) Gan's avatar
Quan (Andy) Gan committed
1144
1145
1146
1147
1148
1149
1150
1151
1152
1153
1154
1155
1156
1157
1158
1159
1160
1161
1162
1163

  CSRPtr subcsr = nullptr;
  CSRPtr subcsc = nullptr;
  COOPtr subcoo = nullptr;
  switch (fmt) {
    case SparseFormat::kCSR:
      subcsr = std::dynamic_pointer_cast<CSR>(sg.graph);
      break;
    case SparseFormat::kCSC:
      subcsc = std::dynamic_pointer_cast<CSR>(sg.graph);
      break;
    case SparseFormat::kCOO:
      subcoo = std::dynamic_pointer_cast<COO>(sg.graph);
      break;
    default:
      LOG(FATAL) << "[BUG] unsupported format " << static_cast<int>(fmt);
      return ret;
  }

  ret.graph = HeteroGraphPtr(new UnitGraph(meta_graph(), subcsc, subcsr, subcoo));
1164
1165
1166
1167
1168
  ret.induced_vertices = std::move(sg.induced_vertices);
  ret.induced_edges = std::move(sg.induced_edges);
  return ret;
}

Minjie Wang's avatar
Minjie Wang committed
1169
HeteroSubgraph UnitGraph::EdgeSubgraph(
1170
    const std::vector<IdArray>& eids, bool preserve_nodes) const {
1171
  SparseFormat fmt = SelectFormat(COO_CODE);
1172
  auto sg = GetFormat(fmt)->EdgeSubgraph(eids, preserve_nodes);
1173
  HeteroSubgraph ret;
Quan (Andy) Gan's avatar
Quan (Andy) Gan committed
1174
1175
1176
1177
1178
1179
1180
1181
1182
1183
1184
1185
1186
1187
1188
1189
1190
1191
1192
1193

  CSRPtr subcsr = nullptr;
  CSRPtr subcsc = nullptr;
  COOPtr subcoo = nullptr;
  switch (fmt) {
    case SparseFormat::kCSR:
      subcsr = std::dynamic_pointer_cast<CSR>(sg.graph);
      break;
    case SparseFormat::kCSC:
      subcsc = std::dynamic_pointer_cast<CSR>(sg.graph);
      break;
    case SparseFormat::kCOO:
      subcoo = std::dynamic_pointer_cast<COO>(sg.graph);
      break;
    default:
      LOG(FATAL) << "[BUG] unsupported format " << static_cast<int>(fmt);
      return ret;
  }

  ret.graph = HeteroGraphPtr(new UnitGraph(meta_graph(), subcsc, subcsr, subcoo));
1194
1195
1196
1197
1198
  ret.induced_vertices = std::move(sg.induced_vertices);
  ret.induced_edges = std::move(sg.induced_edges);
  return ret;
}

Minjie Wang's avatar
Minjie Wang committed
1199
HeteroGraphPtr UnitGraph::CreateFromCOO(
1200
1201
    int64_t num_vtypes, int64_t num_src, int64_t num_dst,
    IdArray row, IdArray col,
1202
    bool row_sorted, bool col_sorted,
1203
    dgl_format_code_t formats) {
Minjie Wang's avatar
Minjie Wang committed
1204
1205
1206
1207
  CHECK(num_vtypes == 1 || num_vtypes == 2);
  if (num_vtypes == 1)
    CHECK_EQ(num_src, num_dst);
  auto mg = CreateUnitGraphMetaGraph(num_vtypes);
1208
1209
  COOPtr coo(new COO(mg, num_src, num_dst, row, col,
      row_sorted, col_sorted));
1210
1211

  return HeteroGraphPtr(
1212
      new UnitGraph(mg, nullptr, nullptr, coo, formats));
1213
1214
}

1215
1216
HeteroGraphPtr UnitGraph::CreateFromCOO(
    int64_t num_vtypes, const aten::COOMatrix& mat,
1217
    dgl_format_code_t formats) {
1218
1219
1220
1221
1222
  CHECK(num_vtypes == 1 || num_vtypes == 2);
  if (num_vtypes == 1)
    CHECK_EQ(mat.num_rows, mat.num_cols);
  auto mg = CreateUnitGraphMetaGraph(num_vtypes);
  COOPtr coo(new COO(mg, mat));
1223

1224
  return HeteroGraphPtr(
1225
      new UnitGraph(mg, nullptr, nullptr, coo, formats));
1226
1227
}

Minjie Wang's avatar
Minjie Wang committed
1228
1229
HeteroGraphPtr UnitGraph::CreateFromCSR(
    int64_t num_vtypes, int64_t num_src, int64_t num_dst,
1230
    IdArray indptr, IdArray indices, IdArray edge_ids, dgl_format_code_t formats) {
Minjie Wang's avatar
Minjie Wang committed
1231
1232
1233
1234
1235
  CHECK(num_vtypes == 1 || num_vtypes == 2);
  if (num_vtypes == 1)
    CHECK_EQ(num_src, num_dst);
  auto mg = CreateUnitGraphMetaGraph(num_vtypes);
  CSRPtr csr(new CSR(mg, num_src, num_dst, indptr, indices, edge_ids));
1236
  return HeteroGraphPtr(new UnitGraph(mg, nullptr, csr, nullptr, formats));
1237
1238
}

1239
1240
HeteroGraphPtr UnitGraph::CreateFromCSR(
    int64_t num_vtypes, const aten::CSRMatrix& mat,
1241
    dgl_format_code_t formats) {
1242
1243
1244
1245
1246
  CHECK(num_vtypes == 1 || num_vtypes == 2);
  if (num_vtypes == 1)
    CHECK_EQ(mat.num_rows, mat.num_cols);
  auto mg = CreateUnitGraphMetaGraph(num_vtypes);
  CSRPtr csr(new CSR(mg, mat));
1247
  return HeteroGraphPtr(new UnitGraph(mg, nullptr, csr, nullptr, formats));
1248
1249
}

1250
1251
HeteroGraphPtr UnitGraph::CreateFromCSC(
    int64_t num_vtypes, int64_t num_src, int64_t num_dst,
1252
    IdArray indptr, IdArray indices, IdArray edge_ids, dgl_format_code_t formats) {
1253
1254
1255
1256
  CHECK(num_vtypes == 1 || num_vtypes == 2);
  if (num_vtypes == 1)
    CHECK_EQ(num_src, num_dst);
  auto mg = CreateUnitGraphMetaGraph(num_vtypes);
1257
  CSRPtr csc(new CSR(mg, num_dst, num_src, indptr, indices, edge_ids));
1258
  return HeteroGraphPtr(new UnitGraph(mg, csc, nullptr, nullptr, formats));
1259
1260
1261
1262
}

HeteroGraphPtr UnitGraph::CreateFromCSC(
    int64_t num_vtypes, const aten::CSRMatrix& mat,
1263
    dgl_format_code_t formats) {
1264
1265
1266
1267
1268
  CHECK(num_vtypes == 1 || num_vtypes == 2);
  if (num_vtypes == 1)
    CHECK_EQ(mat.num_rows, mat.num_cols);
  auto mg = CreateUnitGraphMetaGraph(num_vtypes);
  CSRPtr csc(new CSR(mg, mat));
1269
  return HeteroGraphPtr(new UnitGraph(mg, csc, nullptr, nullptr, formats));
1270
1271
}

Minjie Wang's avatar
Minjie Wang committed
1272
HeteroGraphPtr UnitGraph::AsNumBits(HeteroGraphPtr g, uint8_t bits) {
1273
1274
1275
  if (g->NumBits() == bits) {
    return g;
  } else {
Minjie Wang's avatar
Minjie Wang committed
1276
    auto bg = std::dynamic_pointer_cast<UnitGraph>(g);
1277
    CHECK_NOTNULL(bg);
1278
1279
1280
1281
1282
1283
    CSRPtr new_incsr =
      (bg->in_csr_->defined())? CSRPtr(new CSR(bg->in_csr_->AsNumBits(bits))) : nullptr;
    CSRPtr new_outcsr =
      (bg->out_csr_->defined())? CSRPtr(new CSR(bg->out_csr_->AsNumBits(bits))) : nullptr;
    COOPtr new_coo =
      (bg->coo_->defined())? COOPtr(new COO(bg->coo_->AsNumBits(bits))) : nullptr;
1284
    return HeteroGraphPtr(
1285
        new UnitGraph(g->meta_graph(), new_incsr, new_outcsr, new_coo, bg->formats_));
1286
1287
1288
  }
}

1289
HeteroGraphPtr UnitGraph::CopyTo(HeteroGraphPtr g, const DGLContext &ctx) {
1290
1291
  if (ctx == g->Context()) {
    return g;
1292
1293
1294
  } else {
    auto bg = std::dynamic_pointer_cast<UnitGraph>(g);
    CHECK_NOTNULL(bg);
1295
    CSRPtr new_incsr = (bg->in_csr_->defined())
1296
                           ? CSRPtr(new CSR(bg->in_csr_->CopyTo(ctx)))
1297
1298
                           : nullptr;
    CSRPtr new_outcsr = (bg->out_csr_->defined())
1299
                            ? CSRPtr(new CSR(bg->out_csr_->CopyTo(ctx)))
1300
1301
                            : nullptr;
    COOPtr new_coo = (bg->coo_->defined())
1302
                         ? COOPtr(new COO(bg->coo_->CopyTo(ctx)))
1303
                         : nullptr;
1304
    return HeteroGraphPtr(
1305
        new UnitGraph(g->meta_graph(), new_incsr, new_outcsr, new_coo, bg->formats_));
1306
1307
1308
  }
}

1309
1310
1311
1312
1313
1314
1315
1316
1317
1318
1319
1320
1321
1322
1323
1324
1325
1326
void UnitGraph::PinMemory_() {
  if (this->in_csr_->defined())
    this->in_csr_->PinMemory_();
  if (this->out_csr_->defined())
    this->out_csr_->PinMemory_();
  if (this->coo_->defined())
    this->coo_->PinMemory_();
}

void UnitGraph::UnpinMemory_() {
  if (this->in_csr_->defined())
    this->in_csr_->UnpinMemory_();
  if (this->out_csr_->defined())
    this->out_csr_->UnpinMemory_();
  if (this->coo_->defined())
    this->coo_->UnpinMemory_();
}

1327
1328
1329
1330
1331
1332
1333
1334
1335
1336
void UnitGraph::RecordStream(DGLStreamHandle stream) {
  if (this->in_csr_->defined())
    this->in_csr_->RecordStream(stream);
  if (this->out_csr_->defined())
    this->out_csr_->RecordStream(stream);
  if (this->coo_->defined())
    this->coo_->RecordStream(stream);
  this->recorded_streams.push_back(stream);
}

1337
1338
1339
1340
1341
1342
1343
1344
1345
1346
1347
1348
void UnitGraph::InvalidateCSR() {
  this->out_csr_ = CSRPtr(new CSR());
}

void UnitGraph::InvalidateCSC() {
  this->in_csr_ = CSRPtr(new CSR());
}

void UnitGraph::InvalidateCOO() {
  this->coo_ = COOPtr(new COO());
}

1349
UnitGraph::UnitGraph(GraphPtr metagraph, CSRPtr in_csr, CSRPtr out_csr, COOPtr coo,
1350
                     dgl_format_code_t formats)
Minjie Wang's avatar
Minjie Wang committed
1351
  : BaseHeteroGraph(metagraph), in_csr_(in_csr), out_csr_(out_csr), coo_(coo) {
1352
1353
1354
1355
1356
1357
1358
1359
1360
  if (!in_csr_) {
    in_csr_ = CSRPtr(new CSR());
  }
  if (!out_csr_) {
    out_csr_ = CSRPtr(new CSR());
  }
  if (!coo_) {
    coo_ = COOPtr(new COO());
  }
1361
1362
1363
1364
1365
  formats_ = formats;
  dgl_format_code_t created = GetCreatedFormats();
  if ((formats | created) != formats)
    LOG(FATAL) << "Graph created from formats: " << CodeToStr(created) <<
      ", which is not compatible with available formats: " << CodeToStr(formats);
1366
1367
1368
  CHECK(GetAny()) << "At least one graph structure should exist.";
}

1369
1370
HeteroGraphPtr UnitGraph::CreateUnitGraphFrom(
    int num_vtypes,
1371
1372
1373
1374
1375
1376
    const aten::CSRMatrix &in_csr,
    const aten::CSRMatrix &out_csr,
    const aten::COOMatrix &coo,
    bool has_in_csr,
    bool has_out_csr,
    bool has_coo,
1377
    dgl_format_code_t formats) {
1378
  auto mg = CreateUnitGraphMetaGraph(num_vtypes);
1379
1380
1381
1382
1383
1384
1385

  CSRPtr in_csr_ptr = nullptr;
  CSRPtr out_csr_ptr = nullptr;
  COOPtr coo_ptr = nullptr;

  if (has_in_csr)
    in_csr_ptr = CSRPtr(new CSR(mg, in_csr));
1386
1387
  else
    in_csr_ptr = CSRPtr(new CSR());
1388
1389
  if (has_out_csr)
    out_csr_ptr = CSRPtr(new CSR(mg, out_csr));
1390
1391
  else
    out_csr_ptr = CSRPtr(new CSR());
1392
1393
  if (has_coo)
    coo_ptr = COOPtr(new COO(mg, coo));
1394
1395
  else
    coo_ptr = COOPtr(new COO());
1396

1397
  return HeteroGraphPtr(new UnitGraph(mg, in_csr_ptr, out_csr_ptr, coo_ptr, formats));
1398
1399
}

1400
1401
UnitGraph::CSRPtr UnitGraph::GetInCSR(bool inplace) const {
  if (inplace)
1402
    if (!(formats_ & CSC_CODE))
1403
1404
      LOG(FATAL) << "The graph have restricted sparse format " <<
        CodeToStr(formats_) << ", cannot create CSC matrix.";
1405
  CSRPtr ret = in_csr_;
1406
1407
  // Prefers converting from COO since it is parallelized.
  // TODO(BarclayII): need benchmarking.
1408
  if (!in_csr_->defined()) {
1409
1410
1411
    if (coo_->defined()) {
      const auto& newadj = aten::COOToCSR(
            aten::COOTranspose(coo_->adj()));
1412

1413
      if (inplace)
1414
1415
1416
        *(const_cast<UnitGraph*>(this)->in_csr_) = CSR(meta_graph(), newadj);
      else
        ret = std::make_shared<CSR>(meta_graph(), newadj);
1417
    } else {
1418
1419
      CHECK(out_csr_->defined()) << "None of CSR, COO exist";
      const auto& newadj = aten::CSRTranspose(out_csr_->adj());
1420

1421
      if (inplace)
1422
1423
1424
        *(const_cast<UnitGraph*>(this)->in_csr_) = CSR(meta_graph(), newadj);
      else
        ret = std::make_shared<CSR>(meta_graph(), newadj);
1425
    }
1426
1427
1428
1429
1430
1431
    if (inplace) {
      if (IsPinned())
        in_csr_->PinMemory_();
      for (auto stream : recorded_streams)
        in_csr_->RecordStream(stream);
    }
1432
  }
1433
  return ret;
1434
1435
}

1436
/** @brief Return out csr. If not exist, transpose the other one.*/
1437
1438
UnitGraph::CSRPtr UnitGraph::GetOutCSR(bool inplace) const {
  if (inplace)
1439
    if (!(formats_ & CSR_CODE))
1440
1441
      LOG(FATAL) << "The graph have restricted sparse format " <<
        CodeToStr(formats_) << ", cannot create CSR matrix.";
1442
  CSRPtr ret = out_csr_;
1443
1444
  // Prefers converting from COO since it is parallelized.
  // TODO(BarclayII): need benchmarking.
1445
  if (!out_csr_->defined()) {
1446
1447
    if (coo_->defined()) {
      const auto& newadj = aten::COOToCSR(coo_->adj());
1448

1449
      if (inplace)
1450
1451
1452
        *(const_cast<UnitGraph*>(this)->out_csr_) = CSR(meta_graph(), newadj);
      else
        ret = std::make_shared<CSR>(meta_graph(), newadj);
1453
    } else {
1454
1455
      CHECK(in_csr_->defined()) << "None of CSR, COO exist";
      const auto& newadj = aten::CSRTranspose(in_csr_->adj());
1456

1457
      if (inplace)
1458
1459
1460
        *(const_cast<UnitGraph*>(this)->out_csr_) = CSR(meta_graph(), newadj);
      else
        ret = std::make_shared<CSR>(meta_graph(), newadj);
1461
    }
1462
1463
1464
1465
1466
1467
    if (inplace) {
      if (IsPinned())
        out_csr_->PinMemory_();
      for (auto stream : recorded_streams)
        out_csr_->RecordStream(stream);
    }
1468
  }
1469
  return ret;
1470
1471
}

1472
/** @brief Return coo. If not exist, create from csr.*/
1473
1474
UnitGraph::COOPtr UnitGraph::GetCOO(bool inplace) const {
  if (inplace)
1475
    if (!(formats_ & COO_CODE))
1476
1477
      LOG(FATAL) << "The graph have restricted sparse format " <<
        CodeToStr(formats_) << ", cannot create COO matrix.";
1478
  COOPtr ret = coo_;
1479
1480
  if (!coo_->defined()) {
    if (in_csr_->defined()) {
1481
      const auto& newadj = aten::COOTranspose(aten::CSRToCOO(in_csr_->adj(), true));
1482

1483
      if (inplace)
1484
1485
1486
        *(const_cast<UnitGraph*>(this)->coo_) = COO(meta_graph(), newadj);
      else
        ret = std::make_shared<COO>(meta_graph(), newadj);
1487
    } else {
1488
      CHECK(out_csr_->defined()) << "Both CSR are missing.";
1489
      const auto& newadj = aten::CSRToCOO(out_csr_->adj(), true);
1490

1491
      if (inplace)
1492
1493
1494
        *(const_cast<UnitGraph*>(this)->coo_) = COO(meta_graph(), newadj);
      else
        ret = std::make_shared<COO>(meta_graph(), newadj);
1495
    }
1496
1497
1498
1499
1500
1501
    if (inplace) {
      if (IsPinned())
        coo_->PinMemory_();
      for (auto stream : recorded_streams)
        coo_->RecordStream(stream);
    }
1502
  }
1503
  return ret;
1504
1505
}

1506
aten::CSRMatrix UnitGraph::GetCSCMatrix(dgl_type_t etype) const {
1507
1508
1509
  return GetInCSR()->adj();
}

1510
aten::CSRMatrix UnitGraph::GetCSRMatrix(dgl_type_t etype) const {
1511
1512
1513
  return GetOutCSR()->adj();
}

1514
aten::COOMatrix UnitGraph::GetCOOMatrix(dgl_type_t etype) const {
1515
1516
1517
  return GetCOO()->adj();
}

Minjie Wang's avatar
Minjie Wang committed
1518
HeteroGraphPtr UnitGraph::GetAny() const {
1519
  if (in_csr_->defined()) {
1520
    return in_csr_;
1521
  } else if (out_csr_->defined()) {
1522
1523
1524
1525
1526
1527
    return out_csr_;
  } else {
    return coo_;
  }
}

1528
dgl_format_code_t UnitGraph::GetCreatedFormats() const {
1529
  dgl_format_code_t ret = 0;
1530
  if (in_csr_->defined())
1531
    ret |= CSC_CODE;
1532
  if (out_csr_->defined())
1533
    ret |= CSR_CODE;
1534
  if (coo_->defined())
1535
    ret |= COO_CODE;
1536
1537
1538
  return ret;
}

1539
1540
1541
1542
dgl_format_code_t UnitGraph::GetAllowedFormats() const {
  return formats_;
}

1543
1544
HeteroGraphPtr UnitGraph::GetFormat(SparseFormat format) const {
  switch (format) {
1545
1546
1547
1548
  case SparseFormat::kCSR:
    return GetOutCSR();
  case SparseFormat::kCSC:
    return GetInCSR();
1549
  default:
1550
    return GetCOO();
1551
1552
1553
  }
}

1554
HeteroGraphPtr UnitGraph::GetGraphInFormat(dgl_format_code_t formats) const {
1555
  if (formats == ALL_CODE)
1556
    return HeteroGraphPtr(
1557
1558
        // TODO(xiangsx) Make it as graph storage.Clone()
        new UnitGraph(meta_graph_,
1559
1560
1561
1562
1563
1564
1565
1566
1567
1568
1569
                      (in_csr_->defined())
                          ? CSRPtr(new CSR(*in_csr_))
                          : nullptr,
                      (out_csr_->defined())
                          ? CSRPtr(new CSR(*out_csr_))
                          : nullptr,
                      (coo_->defined())
                          ? COOPtr(new COO(*coo_))
                          : nullptr,
                      formats));
  int64_t num_vtypes = NumVertexTypes();
1570
  if (formats & COO_CODE)
1571
    return CreateFromCOO(num_vtypes, GetCOO(false)->adj(), formats);
1572
  if (formats & CSR_CODE)
1573
1574
1575
1576
1577
1578
1579
1580
1581
    return CreateFromCSR(num_vtypes, GetOutCSR(false)->adj(), formats);
  return CreateFromCSC(num_vtypes, GetInCSR(false)->adj(), formats);
}

SparseFormat UnitGraph::SelectFormat(dgl_format_code_t preferred_formats) const {
  dgl_format_code_t common = preferred_formats & formats_;
  dgl_format_code_t created = GetCreatedFormats();
  if (common & created)
    return DecodeFormat(common & created);
1582
1583
1584
1585
1586

  // NOTE(zihao): hypersparse is currently disabled since many CUDA operators on COO have
  // not been implmented yet.
  // if (coo_->defined() && coo_->IsHypersparse())  // only allow coo for hypersparse graph.
  //   return SparseFormat::kCOO;
1587
1588
1589
  if (common)
    return DecodeFormat(common);
  return DecodeFormat(created);
1590
1591
}

1592
1593
1594
1595
GraphPtr UnitGraph::AsImmutableGraph() const {
  CHECK(NumVertexTypes() == 1) << "not a homogeneous graph";
  dgl::CSRPtr in_csr_ptr = nullptr, out_csr_ptr = nullptr;
  dgl::COOPtr coo_ptr = nullptr;
1596
  if (in_csr_->defined()) {
1597
    aten::CSRMatrix csc = GetCSCMatrix(0);
1598
    in_csr_ptr = dgl::CSRPtr(new dgl::CSR(csc.indptr, csc.indices, csc.data));
1599
  }
1600
  if (out_csr_->defined()) {
1601
    aten::CSRMatrix csr = GetCSRMatrix(0);
1602
    out_csr_ptr = dgl::CSRPtr(new dgl::CSR(csr.indptr, csr.indices, csr.data));
1603
  }
1604
  if (coo_->defined()) {
1605
1606
    aten::COOMatrix coo = GetCOOMatrix(0);
    if (!COOHasData(coo)) {
1607
      coo_ptr = dgl::COOPtr(new dgl::COO(NumVertices(0), coo.row, coo.col));
1608
1609
1610
    } else {
      IdArray new_src = Scatter(coo.row, coo.data);
      IdArray new_dst = Scatter(coo.col, coo.data);
1611
      coo_ptr = dgl::COOPtr(new dgl::COO(NumVertices(0), new_src, new_dst));
1612
1613
1614
1615
1616
    }
  }
  return GraphPtr(new dgl::ImmutableGraph(in_csr_ptr, out_csr_ptr, coo_ptr));
}

1617
1618
HeteroGraphPtr UnitGraph::LineGraph(bool backtracking) const {
  // TODO(xiangsx) currently we only support homogeneous graph
1619
  auto fmt = SelectFormat(ALL_CODE);
1620
1621
  switch (fmt) {
    case SparseFormat::kCOO: {
1622
      return CreateFromCOO(1, aten::COOLineGraph(coo_->adj(), backtracking));
1623
1624
1625
1626
    }
    case SparseFormat::kCSR: {
      const aten::CSRMatrix csr = GetCSRMatrix(0);
      const aten::COOMatrix coo = aten::COOLineGraph(aten::CSRToCOO(csr, true), backtracking);
1627
      return CreateFromCOO(1, coo);
1628
1629
1630
1631
1632
    }
    case SparseFormat::kCSC: {
      const aten::CSRMatrix csc = GetCSCMatrix(0);
      const aten::CSRMatrix csr = aten::CSRTranspose(csc);
      const aten::COOMatrix coo = aten::COOLineGraph(aten::CSRToCOO(csr, true), backtracking);
1633
      return CreateFromCOO(1, coo);
1634
1635
1636
1637
1638
1639
1640
1641
    }
    default:
      LOG(FATAL) << "None of CSC, CSR, COO exist";
      break;
  }
  return nullptr;
}

1642
1643
1644
1645
1646
1647
constexpr uint64_t kDGLSerialize_UnitGraphMagic = 0xDD2E60F0F6B4A127;

bool UnitGraph::Load(dmlc::Stream* fs) {
  uint64_t magicNum;
  CHECK(fs->Read(&magicNum)) << "Invalid Magic Number";
  CHECK_EQ(magicNum, kDGLSerialize_UnitGraphMagic) << "Invalid UnitGraph Data";
1648

1649
  int64_t save_format_code, formats_code;
1650
  CHECK(fs->Read(&save_format_code)) << "Invalid format";
1651
  CHECK(fs->Read(&formats_code)) << "Invalid format";
1652
1653
1654
1655
1656
1657
1658
1659
  dgl_format_code_t save_formats = ANY_CODE;
  if (save_format_code >> 32) {
    save_formats =
        static_cast<dgl_format_code_t>(0xffffffff & save_format_code);
  } else {
    save_formats =
        SparseFormatsToCode({static_cast<SparseFormat>(save_format_code)});
  }
1660
1661
1662
1663
1664
1665
  if (formats_code >> 32) {
    formats_ = static_cast<dgl_format_code_t>(0xffffffff & formats_code);
  } else {
    // NOTE(zihao): to be compatible with old formats.
    switch (formats_code & 0xffffffff) {
    case 0:
1666
      formats_ = ALL_CODE;
1667
1668
      break;
    case 1:
1669
      formats_ = COO_CODE;
1670
1671
      break;
    case 2:
1672
      formats_ = CSR_CODE;
1673
1674
      break;
    case 3:
1675
      formats_ = CSC_CODE;
1676
1677
1678
1679
1680
1681
      break;
    default:
      LOG(FATAL) << "Load graph failed, formats code " << formats_code <<
        "not recognized.";
    }
  }
1682

1683
1684
1685
1686
1687
1688
1689
1690
1691
1692
1693
  if (save_formats & COO_CODE) {
    fs->Read(&coo_);
  }
  if (save_formats & CSR_CODE) {
    fs->Read(&out_csr_);
  }
  if (save_formats & CSC_CODE) {
    fs->Read(&in_csr_);
  }
  if (!coo_ && !out_csr_ && !in_csr_) {
    LOG(FATAL) << "unsupported format code";
1694
1695
  }

1696
1697
1698
1699
1700
1701
1702
1703
1704
1705
  if (!in_csr_) {
    in_csr_ = CSRPtr(new CSR());
  }
  if (!out_csr_) {
    out_csr_ = CSRPtr(new CSR());
  }
  if (!coo_) {
    coo_ = COOPtr(new COO());
  }

1706
1707
  meta_graph_ = GetAny()->meta_graph();

1708
1709
1710
  return true;
}

1711

1712
1713
void UnitGraph::Save(dmlc::Stream* fs) const {
  fs->Write(kDGLSerialize_UnitGraphMagic);
1714
1715
  // Didn't write UnitGraph::meta_graph_, since it's included in the underlying
  // sparse matrix
1716
1717
1718
1719
1720
1721
1722
1723
1724
  auto save_formats = SparseFormatsToCode({SelectFormat(ALL_CODE)});
  auto fstream = dynamic_cast<dgl::serialize::DGLStream *>(fs);
  if (fstream) {
    auto formats = fstream->FormatsToSave();
    save_formats = formats == ANY_CODE
                       ? SparseFormatsToCode({SelectFormat(ALL_CODE)})
                       : formats;
  }
  fs->Write(static_cast<int64_t>(save_formats | 0x100000000));
1725
  fs->Write(static_cast<int64_t>(formats_ | 0x100000000));
1726
1727
1728
1729
1730
1731
1732
1733
  if (save_formats & COO_CODE) {
    fs->Write(GetCOO());
  }
  if (save_formats & CSR_CODE) {
    fs->Write(GetOutCSR());
  }
  if (save_formats & CSC_CODE) {
    fs->Write(GetInCSR());
1734
  }
1735
1736
}

1737
1738
1739
1740
1741
1742
1743
1744
1745
1746
UnitGraphPtr UnitGraph::Reverse() const {
  CSRPtr new_incsr = out_csr_, new_outcsr = in_csr_;
  COOPtr new_coo = nullptr;
  if (coo_->defined()) {
    new_coo = COOPtr(new COO(coo_->meta_graph(), aten::COOTranspose(coo_->adj())));
  }

  return UnitGraphPtr(new UnitGraph(meta_graph(), new_incsr, new_outcsr, new_coo));
}

1747
1748
1749
1750
1751
1752
1753
std::tuple<UnitGraphPtr, IdArray, IdArray>
UnitGraph::ToSimple() const {
  CSRPtr new_incsr = nullptr, new_outcsr = nullptr;
  COOPtr new_coo = nullptr;
  IdArray count;
  IdArray edge_map;

1754
  auto avail_fmt = SelectFormat(ALL_CODE);
1755
1756
  switch (avail_fmt) {
    case SparseFormat::kCOO: {
1757
      auto ret = aten::COOToSimple(GetCOO()->adj());
1758
1759
      count = std::get<1>(ret);
      edge_map = std::get<2>(ret);
1760
      new_coo = COOPtr(new COO(meta_graph(), std::get<0>(ret)));
1761
1762
1763
      break;
    }
    case SparseFormat::kCSR: {
1764
      auto ret = aten::CSRToSimple(GetOutCSR()->adj());
1765
1766
      count = std::get<1>(ret);
      edge_map = std::get<2>(ret);
1767
      new_outcsr = CSRPtr(new CSR(meta_graph(), std::get<0>(ret)));
1768
1769
1770
      break;
    }
    case SparseFormat::kCSC: {
1771
      auto ret = aten::CSRToSimple(GetInCSR()->adj());
1772
1773
      count = std::get<1>(ret);
      edge_map = std::get<2>(ret);
1774
      new_incsr = CSRPtr(new CSR(meta_graph(), std::get<0>(ret)));
1775
1776
1777
1778
1779
1780
1781
1782
1783
1784
1785
1786
      break;
    }
    default:
      LOG(FATAL) << "At lease one of COO, CSR or CSC adj should exist.";
      break;
  }

  return std::make_tuple(UnitGraphPtr(new UnitGraph(meta_graph(), new_incsr, new_outcsr, new_coo)),
                         count,
                         edge_map);
}

1787
}  // namespace dgl