unit_graph.cc 58.8 KB
Newer Older
1
2
/*!
 *  Copyright (c) 2019 by Contributors
Minjie Wang's avatar
Minjie Wang committed
3
4
 * \file graph/unit_graph.cc
 * \brief UnitGraph graph implementation
5
6
 */
#include <dgl/array.h>
7
#include <dgl/base_heterograph.h>
8
9
#include <dgl/immutable_graph.h>
#include <dgl/lazy.h>
10
11

#include "../c_api_common.h"
12
#include "./unit_graph.h"
13
14

namespace dgl {
15

16
namespace {
17
18
19

using namespace dgl::aten;

Minjie Wang's avatar
Minjie Wang committed
20
21
22
23
24
25
26
27
28
29
// create metagraph of one node type
inline GraphPtr CreateUnitGraphMetaGraph1() {
  // a self-loop edge 0->0
  std::vector<int64_t> row_vec(1, 0);
  std::vector<int64_t> col_vec(1, 0);
  IdArray row = aten::VecToIdArray(row_vec);
  IdArray col = aten::VecToIdArray(col_vec);
  GraphPtr g = ImmutableGraph::CreateFromCOO(1, row, col);
  return g;
}
30

Minjie Wang's avatar
Minjie Wang committed
31
32
33
34
35
// create metagraph of two node types
inline GraphPtr CreateUnitGraphMetaGraph2() {
  // an edge 0->1
  std::vector<int64_t> row_vec(1, 0);
  std::vector<int64_t> col_vec(1, 1);
36
37
38
39
40
  IdArray row = aten::VecToIdArray(row_vec);
  IdArray col = aten::VecToIdArray(col_vec);
  GraphPtr g = ImmutableGraph::CreateFromCOO(2, row, col);
  return g;
}
Minjie Wang's avatar
Minjie Wang committed
41
42
43
44
45
46
47
48
49
50
51
52

inline GraphPtr CreateUnitGraphMetaGraph(int num_vtypes) {
  static GraphPtr mg1 = CreateUnitGraphMetaGraph1();
  static GraphPtr mg2 = CreateUnitGraphMetaGraph2();
  if (num_vtypes == 1)
    return mg1;
  else if (num_vtypes == 2)
    return mg2;
  else
    LOG(FATAL) << "Invalid number of vertex types. Must be 1 or 2.";
  return {};
}
53
54

};  // namespace
55
56
57
58
59
60
61

//////////////////////////////////////////////////////////
//
// COO graph implementation
//
//////////////////////////////////////////////////////////

Minjie Wang's avatar
Minjie Wang committed
62
class UnitGraph::COO : public BaseHeteroGraph {
63
 public:
64
65
  COO(GraphPtr metagraph, int64_t num_src, int64_t num_dst, IdArray src,
      IdArray dst, bool row_sorted = false, bool col_sorted = false)
Minjie Wang's avatar
Minjie Wang committed
66
    : BaseHeteroGraph(metagraph) {
67
68
69
    CHECK(aten::IsValidIdArray(src));
    CHECK(aten::IsValidIdArray(dst));
    CHECK_EQ(src->shape[0], dst->shape[0]) << "Input arrays should have the same length.";
70
71
72
    adj_ = aten::COOMatrix{num_src, num_dst, src, dst,
        NullArray(),
        row_sorted, col_sorted};
73
  }
74

75
76
77
78
  COO(GraphPtr metagraph, const aten::COOMatrix& coo)
    : BaseHeteroGraph(metagraph), adj_(coo) {
    // Data index should not be inherited. Edges in COO format are always
    // assigned ids from 0 to num_edges - 1.
79
    CHECK(!COOHasData(coo)) << "[BUG] COO should not contain data.";
80
    adj_.data = aten::NullArray();
81
  }
82

83
84
85
86
87
88
89
90
91
92
93
  COO() {
    // set magic num_rows/num_cols to mark it as undefined
    // adj_.num_rows == 0 and adj_.num_cols == 0 means empty UnitGraph which is supported
    adj_.num_rows = -1;
    adj_.num_cols = -1;
  };

  bool defined() const {
    return (adj_.num_rows >= 0) && (adj_.num_cols >= 0);
  }

Minjie Wang's avatar
Minjie Wang committed
94
95
  inline dgl_type_t SrcType() const {
    return 0;
96
  }
Minjie Wang's avatar
Minjie Wang committed
97
98
99
100
101
102
103

  inline dgl_type_t DstType() const {
    return NumVertexTypes() == 1? 0 : 1;
  }

  inline dgl_type_t EdgeType() const {
    return 0;
104
105
106
  }

  HeteroGraphPtr GetRelationGraph(dgl_type_t etype) const override {
Minjie Wang's avatar
Minjie Wang committed
107
    LOG(FATAL) << "The method shouldn't be called for UnitGraph graph. "
108
109
110
111
112
      << "The relation graph is simply this graph itself.";
    return {};
  }

  void AddVertices(dgl_type_t vtype, uint64_t num_vertices) override {
Minjie Wang's avatar
Minjie Wang committed
113
    LOG(FATAL) << "UnitGraph graph is not mutable.";
114
115
116
  }

  void AddEdge(dgl_type_t etype, dgl_id_t src, dgl_id_t dst) override {
Minjie Wang's avatar
Minjie Wang committed
117
    LOG(FATAL) << "UnitGraph graph is not mutable.";
118
119
120
  }

  void AddEdges(dgl_type_t etype, IdArray src_ids, IdArray dst_ids) override {
Minjie Wang's avatar
Minjie Wang committed
121
    LOG(FATAL) << "UnitGraph graph is not mutable.";
122
123
124
  }

  void Clear() override {
Minjie Wang's avatar
Minjie Wang committed
125
    LOG(FATAL) << "UnitGraph graph is not mutable.";
126
127
  }

128
129
130
131
  DLDataType DataType() const override {
    return adj_.row->dtype;
  }

132
133
134
135
  DLContext Context() const override {
    return adj_.row->ctx;
  }

136
137
138
139
  bool IsPinned() const override {
    return adj_.row.IsPinned();
  }

140
141
142
143
  uint8_t NumBits() const override {
    return adj_.row->dtype.bits;
  }

144
145
146
147
148
149
150
151
152
153
154
155
  COO AsNumBits(uint8_t bits) const {
    if (NumBits() == bits)
      return *this;

    COO ret(
        meta_graph_,
        adj_.num_rows, adj_.num_cols,
        aten::AsNumBits(adj_.row, bits),
        aten::AsNumBits(adj_.col, bits));
    return ret;
  }

156
157
  COO CopyTo(const DLContext &ctx,
             const DGLStreamHandle &stream = nullptr) const {
158
159
    if (Context() == ctx)
      return *this;
160
    return COO(meta_graph_, adj_.CopyTo(ctx, stream));
161
162
  }

163
164
165
166
167
168
169
170
171
172
173

  /*! \brief Pin the adj_: COOMatrix of the COO graph. */
  void PinMemory_() {
    adj_.PinMemory_();
  }

  /*! \brief Unpin the adj_: COOMatrix of the COO graph. */
  void UnpinMemory_() {
    adj_.UnpinMemory_();
  }

174
  bool IsMultigraph() const override {
175
    return aten::COOHasDuplicate(adj_);
176
177
178
179
180
181
182
  }

  bool IsReadonly() const override {
    return true;
  }

  uint64_t NumVertices(dgl_type_t vtype) const override {
Minjie Wang's avatar
Minjie Wang committed
183
    if (vtype == SrcType()) {
184
      return adj_.num_rows;
Minjie Wang's avatar
Minjie Wang committed
185
    } else if (vtype == DstType()) {
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
      return adj_.num_cols;
    } else {
      LOG(FATAL) << "Invalid vertex type: " << vtype;
      return 0;
    }
  }

  uint64_t NumEdges(dgl_type_t etype) const override {
    return adj_.row->shape[0];
  }

  bool HasVertex(dgl_type_t vtype, dgl_id_t vid) const override {
    return vid < NumVertices(vtype);
  }

  BoolArray HasVertices(dgl_type_t vtype, IdArray vids) const override {
    LOG(FATAL) << "Not enabled for COO graph";
    return {};
  }

  bool HasEdgeBetween(dgl_type_t etype, dgl_id_t src, dgl_id_t dst) const override {
207
208
209
    CHECK(HasVertex(SrcType(), src)) << "Invalid src vertex id: " << src;
    CHECK(HasVertex(DstType(), dst)) << "Invalid dst vertex id: " << dst;
    return aten::COOIsNonZero(adj_, src, dst);
210
211
212
  }

  BoolArray HasEdgesBetween(dgl_type_t etype, IdArray src_ids, IdArray dst_ids) const override {
213
214
215
    CHECK(aten::IsValidIdArray(src_ids)) << "Invalid vertex id array.";
    CHECK(aten::IsValidIdArray(dst_ids)) << "Invalid vertex id array.";
    return aten::COOIsNonZero(adj_, src_ids, dst_ids);
216
217
218
  }

  IdArray Predecessors(dgl_type_t etype, dgl_id_t dst) const override {
219
220
    CHECK(HasVertex(DstType(), dst)) << "Invalid dst vertex id: " << dst;
    return aten::COOGetRowDataAndIndices(aten::COOTranspose(adj_), dst).second;
221
222
223
  }

  IdArray Successors(dgl_type_t etype, dgl_id_t src) const override {
224
225
    CHECK(HasVertex(SrcType(), src)) << "Invalid src vertex id: " << src;
    return aten::COOGetRowDataAndIndices(adj_, src).second;
226
227
228
  }

  IdArray EdgeId(dgl_type_t etype, dgl_id_t src, dgl_id_t dst) const override {
229
230
    CHECK(HasVertex(SrcType(), src)) << "Invalid src vertex id: " << src;
    CHECK(HasVertex(DstType(), dst)) << "Invalid dst vertex id: " << dst;
231
    return aten::COOGetAllData(adj_, src, dst);
232
233
  }

234
  EdgeArray EdgeIdsAll(dgl_type_t etype, IdArray src, IdArray dst) const override {
235
236
237
238
    CHECK(aten::IsValidIdArray(src)) << "Invalid vertex id array.";
    CHECK(aten::IsValidIdArray(dst)) << "Invalid vertex id array.";
    const auto& arrs = aten::COOGetDataAndIndices(adj_, src, dst);
    return EdgeArray{arrs[0], arrs[1], arrs[2]};
239
240
  }

241
242
243
244
  IdArray EdgeIdsOne(dgl_type_t etype, IdArray src, IdArray dst) const override {
    return aten::COOGetData(adj_, src, dst);
  }

245
246
  std::pair<dgl_id_t, dgl_id_t> FindEdge(dgl_type_t etype, dgl_id_t eid) const override {
    CHECK(eid < NumEdges(etype)) << "Invalid edge id: " << eid;
247
248
    const dgl_id_t src = aten::IndexSelect<int64_t>(adj_.row, eid);
    const dgl_id_t dst = aten::IndexSelect<int64_t>(adj_.col, eid);
249
250
251
252
    return std::pair<dgl_id_t, dgl_id_t>(src, dst);
  }

  EdgeArray FindEdges(dgl_type_t etype, IdArray eids) const override {
253
    CHECK(aten::IsValidIdArray(eids)) << "Invalid edge id array";
254
    BUG_IF_FAIL(aten::IsNullArray(adj_.data)) <<
255
      "FindEdges requires the internal COO matrix not having EIDs.";
256
257
258
259
260
261
    return EdgeArray{aten::IndexSelect(adj_.row, eids),
                     aten::IndexSelect(adj_.col, eids),
                     eids};
  }

  EdgeArray InEdges(dgl_type_t etype, dgl_id_t vid) const override {
262
263
264
265
266
    IdArray ret_src, ret_eid;
    std::tie(ret_eid, ret_src) = aten::COOGetRowDataAndIndices(
        aten::COOTranspose(adj_), vid);
    IdArray ret_dst = aten::Full(vid, ret_src->shape[0], NumBits(), ret_src->ctx);
    return EdgeArray{ret_src, ret_dst, ret_eid};
267
268
269
  }

  EdgeArray InEdges(dgl_type_t etype, IdArray vids) const override {
270
271
272
273
    CHECK(aten::IsValidIdArray(vids)) << "Invalid vertex id array.";
    auto coosubmat = aten::COOSliceRows(aten::COOTranspose(adj_), vids);
    auto row = aten::IndexSelect(vids, coosubmat.row);
    return EdgeArray{coosubmat.col, row, coosubmat.data};
274
275
276
  }

  EdgeArray OutEdges(dgl_type_t etype, dgl_id_t vid) const override {
277
278
279
280
    IdArray ret_dst, ret_eid;
    std::tie(ret_eid, ret_dst) = aten::COOGetRowDataAndIndices(adj_, vid);
    IdArray ret_src = aten::Full(vid, ret_dst->shape[0], NumBits(), ret_dst->ctx);
    return EdgeArray{ret_src, ret_dst, ret_eid};
281
282
283
  }

  EdgeArray OutEdges(dgl_type_t etype, IdArray vids) const override {
284
285
286
287
    CHECK(aten::IsValidIdArray(vids)) << "Invalid vertex id array.";
    auto coosubmat = aten::COOSliceRows(adj_, vids);
    auto row = aten::IndexSelect(vids, coosubmat.row);
    return EdgeArray{row, coosubmat.col, coosubmat.data};
288
289
290
291
292
293
294
295
296
297
298
  }

  EdgeArray Edges(dgl_type_t etype, const std::string &order = "") const override {
    CHECK(order.empty() || order == std::string("eid"))
      << "COO only support Edges of order \"eid\", but got \""
      << order << "\".";
    IdArray rst_eid = aten::Range(0, NumEdges(etype), NumBits(), Context());
    return EdgeArray{adj_.row, adj_.col, rst_eid};
  }

  uint64_t InDegree(dgl_type_t etype, dgl_id_t vid) const override {
299
300
    CHECK(HasVertex(DstType(), vid)) << "Invalid dst vertex id: " << vid;
    return aten::COOGetRowNNZ(aten::COOTranspose(adj_), vid);
301
302
303
  }

  DegreeArray InDegrees(dgl_type_t etype, IdArray vids) const override {
304
305
    CHECK(aten::IsValidIdArray(vids)) << "Invalid vertex id array.";
    return aten::COOGetRowNNZ(aten::COOTranspose(adj_), vids);
306
307
308
  }

  uint64_t OutDegree(dgl_type_t etype, dgl_id_t vid) const override {
309
310
    CHECK(HasVertex(SrcType(), vid)) << "Invalid src vertex id: " << vid;
    return aten::COOGetRowNNZ(adj_, vid);
311
312
313
  }

  DegreeArray OutDegrees(dgl_type_t etype, IdArray vids) const override {
314
315
    CHECK(aten::IsValidIdArray(vids)) << "Invalid vertex id array.";
    return aten::COOGetRowNNZ(adj_, vids);
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
  }

  DGLIdIters SuccVec(dgl_type_t etype, dgl_id_t vid) const override {
    LOG(INFO) << "Not enabled for COO graph.";
    return {};
  }

  DGLIdIters OutEdgeVec(dgl_type_t etype, dgl_id_t vid) const override {
    LOG(INFO) << "Not enabled for COO graph.";
    return {};
  }

  DGLIdIters PredVec(dgl_type_t etype, dgl_id_t vid) const override {
    LOG(INFO) << "Not enabled for COO graph.";
    return {};
  }

  DGLIdIters InEdgeVec(dgl_type_t etype, dgl_id_t vid) const override {
    LOG(INFO) << "Not enabled for COO graph.";
    return {};
  }

  std::vector<IdArray> GetAdj(
      dgl_type_t etype, bool transpose, const std::string &fmt) const override {
    CHECK(fmt == "coo") << "Not valid adj format request.";
    if (transpose) {
      return {aten::HStack(adj_.col, adj_.row)};
    } else {
      return {aten::HStack(adj_.row, adj_.col)};
    }
  }

348
349
350
351
352
353
354
355
356
357
358
359
360
361
  aten::COOMatrix GetCOOMatrix(dgl_type_t etype) const override {
    return adj_;
  }

  aten::CSRMatrix GetCSCMatrix(dgl_type_t etype) const override {
    LOG(FATAL) << "Not enabled for COO graph";
    return aten::CSRMatrix();
  }

  aten::CSRMatrix GetCSRMatrix(dgl_type_t etype) const override {
    LOG(FATAL) << "Not enabled for COO graph";
    return aten::CSRMatrix();
  }

362
363
364
365
366
367
368
369
370
371
372
373
  void SetCOOMatrix(dgl_type_t etype, aten::COOMatrix coo) override {
    adj_ = coo;
  }

  void SetCSRMatrix(dgl_type_t etype, aten::CSRMatrix csr) override {
    LOG(FATAL) << "Not enabled for COO graph";
  }

  void SetCSCMatrix(dgl_type_t etype, aten::CSRMatrix csc) override {
    LOG(FATAL) << "Not enabled for COO graph";
  }

374
  SparseFormat SelectFormat(dgl_type_t etype, dgl_format_code_t preferred_formats) const override {
375
    LOG(FATAL) << "Not enabled for COO graph";
376
    return SparseFormat::kCOO;
377
378
  }

379
  dgl_format_code_t GetAllowedFormats() const override {
380
    LOG(FATAL) << "Not enabled for COO graph";
381
    return 0;
382
383
  }

384
  dgl_format_code_t GetCreatedFormats() const override {
385
386
387
388
    LOG(FATAL) << "Not enabled for COO graph";
    return 0;
  }

389
  HeteroSubgraph VertexSubgraph(const std::vector<IdArray>& vids) const override {
390
391
392
393
394
395
396
397
398
399
400
401
    CHECK_EQ(vids.size(), NumVertexTypes()) << "Number of vertex types mismatch";
    auto srcvids = vids[SrcType()], dstvids = vids[DstType()];
    CHECK(aten::IsValidIdArray(srcvids)) << "Invalid vertex id array.";
    CHECK(aten::IsValidIdArray(dstvids)) << "Invalid vertex id array.";
    HeteroSubgraph subg;
    const auto& submat = aten::COOSliceMatrix(adj_, srcvids, dstvids);
    IdArray sub_eids = aten::Range(0, submat.data->shape[0], NumBits(), Context());
    subg.graph = std::make_shared<COO>(meta_graph(), submat.num_rows, submat.num_cols,
        submat.row, submat.col);
    subg.induced_vertices = vids;
    subg.induced_edges.emplace_back(submat.data);
    return subg;
402
403
404
405
406
407
408
409
410
411
412
413
414
415
  }

  HeteroSubgraph EdgeSubgraph(
      const std::vector<IdArray>& eids, bool preserve_nodes = false) const override {
    CHECK_EQ(eids.size(), 1) << "Edge type number mismatch.";
    HeteroSubgraph subg;
    if (!preserve_nodes) {
      IdArray new_src = aten::IndexSelect(adj_.row, eids[0]);
      IdArray new_dst = aten::IndexSelect(adj_.col, eids[0]);
      subg.induced_vertices.emplace_back(aten::Relabel_({new_src}));
      subg.induced_vertices.emplace_back(aten::Relabel_({new_dst}));
      const auto new_nsrc = subg.induced_vertices[0]->shape[0];
      const auto new_ndst = subg.induced_vertices[1]->shape[0];
      subg.graph = std::make_shared<COO>(
Minjie Wang's avatar
Minjie Wang committed
416
          meta_graph(), new_nsrc, new_ndst, new_src, new_dst);
417
418
419
420
      subg.induced_edges = eids;
    } else {
      IdArray new_src = aten::IndexSelect(adj_.row, eids[0]);
      IdArray new_dst = aten::IndexSelect(adj_.col, eids[0]);
Quan (Andy) Gan's avatar
Quan (Andy) Gan committed
421
422
423
424
      subg.induced_vertices.emplace_back(
          aten::Range(0, NumVertices(SrcType()), NumBits(), Context()));
      subg.induced_vertices.emplace_back(
          aten::Range(0, NumVertices(DstType()), NumBits(), Context()));
425
      subg.graph = std::make_shared<COO>(
Quan (Andy) Gan's avatar
Quan (Andy) Gan committed
426
          meta_graph(), NumVertices(SrcType()), NumVertices(DstType()), new_src, new_dst);
427
428
429
430
431
      subg.induced_edges = eids;
    }
    return subg;
  }

432
  HeteroGraphPtr GetGraphInFormat(dgl_format_code_t formats) const override {
433
434
435
436
    LOG(FATAL) << "Not enabled for COO graph.";
    return nullptr;
  }

437
438
439
440
  aten::COOMatrix adj() const {
    return adj_;
  }

441
442
443
444
445
446
447
448
449
  /*!
   * \brief Determines whether the graph is "hypersparse", i.e. having significantly more
   * nodes than edges.
   */
  bool IsHypersparse() const {
    return (NumVertices(SrcType()) / 8 > NumEdges(EdgeType())) &&
           (NumVertices(SrcType()) > 1000000);
  }

450
451
452
453
454
455
456
457
458
459
460
461
462
  bool Load(dmlc::Stream* fs) {
    auto meta_imgraph = Serializer::make_shared<ImmutableGraph>();
    CHECK(fs->Read(&meta_imgraph)) << "Invalid meta graph";
    meta_graph_ = meta_imgraph;
    CHECK(fs->Read(&adj_)) << "Invalid adj matrix";
    return true;
  }
  void Save(dmlc::Stream* fs) const {
    auto meta_graph_ptr = ImmutableGraph::ToImmutable(meta_graph());
    fs->Write(meta_graph_ptr);
    fs->Write(adj_);
  }

463
 private:
464
465
  friend class Serializer;

466
467
468
469
470
471
472
473
474
475
476
  /*! \brief internal adjacency matrix. Data array is empty */
  aten::COOMatrix adj_;
};

//////////////////////////////////////////////////////////
//
// CSR graph implementation
//
//////////////////////////////////////////////////////////

/*! \brief CSR graph */
Minjie Wang's avatar
Minjie Wang committed
477
class UnitGraph::CSR : public BaseHeteroGraph {
478
 public:
Minjie Wang's avatar
Minjie Wang committed
479
  CSR(GraphPtr metagraph, int64_t num_src, int64_t num_dst,
480
      IdArray indptr, IdArray indices, IdArray edge_ids)
Minjie Wang's avatar
Minjie Wang committed
481
    : BaseHeteroGraph(metagraph) {
482
483
    CHECK(aten::IsValidIdArray(indptr));
    CHECK(aten::IsValidIdArray(indices));
484
485
486
    if (aten::IsValidIdArray(edge_ids))
      CHECK((indices->shape[0] == edge_ids->shape[0]) || aten::IsNullArray(edge_ids))
        << "edge id arrays should have the same length as indices if not empty";
487
488
    CHECK_EQ(num_src, indptr->shape[0] - 1)
      << "number of nodes do not match the length of indptr minus 1.";
489

490
491
492
    adj_ = aten::CSRMatrix{num_src, num_dst, indptr, indices, edge_ids};
  }

493
  CSR(GraphPtr metagraph, const aten::CSRMatrix& csr)
Da Zheng's avatar
Da Zheng committed
494
495
    : BaseHeteroGraph(metagraph), adj_(csr) {
  }
496

497
498
499
500
501
502
503
504
505
506
507
  CSR() {
    // set magic num_rows/num_cols to mark it as undefined
    // adj_.num_rows == 0 and adj_.num_cols == 0 means empty UnitGraph which is supported
    adj_.num_rows = -1;
    adj_.num_cols = -1;
  };

  bool defined() const {
    return (adj_.num_rows >= 0) || (adj_.num_cols >= 0);
  }

Minjie Wang's avatar
Minjie Wang committed
508
509
  inline dgl_type_t SrcType() const {
    return 0;
510
  }
Minjie Wang's avatar
Minjie Wang committed
511
512
513
514
515
516
517

  inline dgl_type_t DstType() const {
    return NumVertexTypes() == 1? 0 : 1;
  }

  inline dgl_type_t EdgeType() const {
    return 0;
518
519
520
  }

  HeteroGraphPtr GetRelationGraph(dgl_type_t etype) const override {
Minjie Wang's avatar
Minjie Wang committed
521
    LOG(FATAL) << "The method shouldn't be called for UnitGraph graph. "
522
523
524
525
526
      << "The relation graph is simply this graph itself.";
    return {};
  }

  void AddVertices(dgl_type_t vtype, uint64_t num_vertices) override {
Minjie Wang's avatar
Minjie Wang committed
527
    LOG(FATAL) << "UnitGraph graph is not mutable.";
528
529
530
  }

  void AddEdge(dgl_type_t etype, dgl_id_t src, dgl_id_t dst) override {
Minjie Wang's avatar
Minjie Wang committed
531
    LOG(FATAL) << "UnitGraph graph is not mutable.";
532
533
534
  }

  void AddEdges(dgl_type_t etype, IdArray src_ids, IdArray dst_ids) override {
Minjie Wang's avatar
Minjie Wang committed
535
    LOG(FATAL) << "UnitGraph graph is not mutable.";
536
537
538
  }

  void Clear() override {
Minjie Wang's avatar
Minjie Wang committed
539
    LOG(FATAL) << "UnitGraph graph is not mutable.";
540
541
  }

542
543
544
545
  DLDataType DataType() const override {
    return adj_.indices->dtype;
  }

546
547
548
549
  DLContext Context() const override {
    return adj_.indices->ctx;
  }

550
551
552
553
  bool IsPinned() const override {
    return adj_.indices.IsPinned();
  }

554
555
556
557
  uint8_t NumBits() const override {
    return adj_.indices->dtype.bits;
  }

558
559
560
561
562
  CSR AsNumBits(uint8_t bits) const {
    if (NumBits() == bits) {
      return *this;
    } else {
      CSR ret(
Minjie Wang's avatar
Minjie Wang committed
563
          meta_graph_,
564
565
566
567
568
569
570
571
          adj_.num_rows, adj_.num_cols,
          aten::AsNumBits(adj_.indptr, bits),
          aten::AsNumBits(adj_.indices, bits),
          aten::AsNumBits(adj_.data, bits));
      return ret;
    }
  }

572
573
  CSR CopyTo(const DLContext &ctx,
             const DGLStreamHandle &stream = nullptr) const {
574
575
576
    if (Context() == ctx) {
      return *this;
    } else {
577
      return CSR(meta_graph_, adj_.CopyTo(ctx, stream));
578
579
580
    }
  }

581
582
583
584
585
586
587
588
589
590
  /*! \brief Pin the adj_: CSRMatrix of the CSR graph. */
  void PinMemory_() {
    adj_.PinMemory_();
  }

  /*! \brief Unpin the adj_: CSRMatrix of the CSR graph. */
  void UnpinMemory_() {
    adj_.UnpinMemory_();
  }

591
  bool IsMultigraph() const override {
592
    return aten::CSRHasDuplicate(adj_);
593
594
595
596
597
598
599
  }

  bool IsReadonly() const override {
    return true;
  }

  uint64_t NumVertices(dgl_type_t vtype) const override {
Minjie Wang's avatar
Minjie Wang committed
600
    if (vtype == SrcType()) {
601
      return adj_.num_rows;
Minjie Wang's avatar
Minjie Wang committed
602
    } else if (vtype == DstType()) {
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
      return adj_.num_cols;
    } else {
      LOG(FATAL) << "Invalid vertex type: " << vtype;
      return 0;
    }
  }

  uint64_t NumEdges(dgl_type_t etype) const override {
    return adj_.indices->shape[0];
  }

  bool HasVertex(dgl_type_t vtype, dgl_id_t vid) const override {
    return vid < NumVertices(vtype);
  }

  BoolArray HasVertices(dgl_type_t vtype, IdArray vids) const override {
    LOG(FATAL) << "Not enabled for COO graph";
    return {};
  }

  bool HasEdgeBetween(dgl_type_t etype, dgl_id_t src, dgl_id_t dst) const override {
Minjie Wang's avatar
Minjie Wang committed
624
625
    CHECK(HasVertex(SrcType(), src)) << "Invalid src vertex id: " << src;
    CHECK(HasVertex(DstType(), dst)) << "Invalid dst vertex id: " << dst;
626
627
628
629
    return aten::CSRIsNonZero(adj_, src, dst);
  }

  BoolArray HasEdgesBetween(dgl_type_t etype, IdArray src_ids, IdArray dst_ids) const override {
630
631
    CHECK(aten::IsValidIdArray(src_ids)) << "Invalid vertex id array.";
    CHECK(aten::IsValidIdArray(dst_ids)) << "Invalid vertex id array.";
632
633
634
635
636
637
638
639
640
    return aten::CSRIsNonZero(adj_, src_ids, dst_ids);
  }

  IdArray Predecessors(dgl_type_t etype, dgl_id_t dst) const override {
    LOG(INFO) << "Not enabled for CSR graph.";
    return {};
  }

  IdArray Successors(dgl_type_t etype, dgl_id_t src) const override {
Minjie Wang's avatar
Minjie Wang committed
641
    CHECK(HasVertex(SrcType(), src)) << "Invalid src vertex id: " << src;
642
643
644
645
    return aten::CSRGetRowColumnIndices(adj_, src);
  }

  IdArray EdgeId(dgl_type_t etype, dgl_id_t src, dgl_id_t dst) const override {
Minjie Wang's avatar
Minjie Wang committed
646
647
    CHECK(HasVertex(SrcType(), src)) << "Invalid src vertex id: " << src;
    CHECK(HasVertex(DstType(), dst)) << "Invalid dst vertex id: " << dst;
648
    return aten::CSRGetAllData(adj_, src, dst);
649
650
  }

651
  EdgeArray EdgeIdsAll(dgl_type_t etype, IdArray src, IdArray dst) const override {
652
653
    CHECK(aten::IsValidIdArray(src)) << "Invalid vertex id array.";
    CHECK(aten::IsValidIdArray(dst)) << "Invalid vertex id array.";
654
655
656
657
    const auto& arrs = aten::CSRGetDataAndIndices(adj_, src, dst);
    return EdgeArray{arrs[0], arrs[1], arrs[2]};
  }

658
659
660
661
  IdArray EdgeIdsOne(dgl_type_t etype, IdArray src, IdArray dst) const override {
    return aten::CSRGetData(adj_, src, dst);
  }

662
  std::pair<dgl_id_t, dgl_id_t> FindEdge(dgl_type_t etype, dgl_id_t eid) const override {
663
    LOG(FATAL) << "Not enabled for CSR graph.";
664
665
666
667
    return {};
  }

  EdgeArray FindEdges(dgl_type_t etype, IdArray eids) const override {
668
    LOG(FATAL) << "Not enabled for CSR graph.";
669
670
671
672
    return {};
  }

  EdgeArray InEdges(dgl_type_t etype, dgl_id_t vid) const override {
673
    LOG(FATAL) << "Not enabled for CSR graph.";
674
675
676
677
    return {};
  }

  EdgeArray InEdges(dgl_type_t etype, IdArray vids) const override {
678
    LOG(FATAL) << "Not enabled for CSR graph.";
679
680
681
682
    return {};
  }

  EdgeArray OutEdges(dgl_type_t etype, dgl_id_t vid) const override {
Minjie Wang's avatar
Minjie Wang committed
683
    CHECK(HasVertex(SrcType(), vid)) << "Invalid src vertex id: " << vid;
684
685
686
687
688
689
690
    IdArray ret_dst = aten::CSRGetRowColumnIndices(adj_, vid);
    IdArray ret_eid = aten::CSRGetRowData(adj_, vid);
    IdArray ret_src = aten::Full(vid, ret_dst->shape[0], NumBits(), ret_dst->ctx);
    return EdgeArray{ret_src, ret_dst, ret_eid};
  }

  EdgeArray OutEdges(dgl_type_t etype, IdArray vids) const override {
691
    CHECK(aten::IsValidIdArray(vids)) << "Invalid vertex id array.";
692
693
694
695
696
697
698
699
700
701
702
703
    auto csrsubmat = aten::CSRSliceRows(adj_, vids);
    auto coosubmat = aten::CSRToCOO(csrsubmat, false);
    // Note that the row id in the csr submat is relabled, so
    // we need to recover it using an index select.
    auto row = aten::IndexSelect(vids, coosubmat.row);
    return EdgeArray{row, coosubmat.col, coosubmat.data};
  }

  EdgeArray Edges(dgl_type_t etype, const std::string &order = "") const override {
    CHECK(order.empty() || order == std::string("srcdst"))
      << "CSR only support Edges of order \"srcdst\","
      << " but got \"" << order << "\".";
704
705
706
707
708
    auto coo = aten::CSRToCOO(adj_, false);
    if (order == std::string("srcdst")) {
      // make sure the coo is sorted if an order is requested
      coo = aten::COOSort(coo, true);
    }
709
710
711
712
    return EdgeArray{coo.row, coo.col, coo.data};
  }

  uint64_t InDegree(dgl_type_t etype, dgl_id_t vid) const override {
713
    LOG(FATAL) << "Not enabled for CSR graph.";
714
715
716
717
    return {};
  }

  DegreeArray InDegrees(dgl_type_t etype, IdArray vids) const override {
718
    LOG(FATAL) << "Not enabled for CSR graph.";
719
720
721
722
    return {};
  }

  uint64_t OutDegree(dgl_type_t etype, dgl_id_t vid) const override {
Minjie Wang's avatar
Minjie Wang committed
723
    CHECK(HasVertex(SrcType(), vid)) << "Invalid src vertex id: " << vid;
724
725
726
727
    return aten::CSRGetRowNNZ(adj_, vid);
  }

  DegreeArray OutDegrees(dgl_type_t etype, IdArray vids) const override {
728
    CHECK(aten::IsValidIdArray(vids)) << "Invalid vertex id array.";
729
730
731
732
733
734
    return aten::CSRGetRowNNZ(adj_, vids);
  }

  DGLIdIters SuccVec(dgl_type_t etype, dgl_id_t vid) const override {
    // TODO(minjie): This still assumes the data type and device context
    //   of this graph. Should fix later.
735
    CHECK_EQ(NumBits(), 64);
736
737
738
739
740
741
742
    const dgl_id_t* indptr_data = static_cast<dgl_id_t*>(adj_.indptr->data);
    const dgl_id_t* indices_data = static_cast<dgl_id_t*>(adj_.indices->data);
    const dgl_id_t start = indptr_data[vid];
    const dgl_id_t end = indptr_data[vid + 1];
    return DGLIdIters(indices_data + start, indices_data + end);
  }

743
744
745
746
747
748
749
750
751
752
  DGLIdIters32 SuccVec32(dgl_type_t etype, dgl_id_t vid) {
    // TODO(minjie): This still assumes the data type and device context
    //   of this graph. Should fix later.
    const int32_t* indptr_data = static_cast<int32_t*>(adj_.indptr->data);
    const int32_t* indices_data = static_cast<int32_t*>(adj_.indices->data);
    const int32_t start = indptr_data[vid];
    const int32_t end = indptr_data[vid + 1];
    return DGLIdIters32(indices_data + start, indices_data + end);
  }

753
754
755
  DGLIdIters OutEdgeVec(dgl_type_t etype, dgl_id_t vid) const override {
    // TODO(minjie): This still assumes the data type and device context
    //   of this graph. Should fix later.
756
    CHECK_EQ(NumBits(), 64);
757
758
759
760
761
762
763
764
    const dgl_id_t* indptr_data = static_cast<dgl_id_t*>(adj_.indptr->data);
    const dgl_id_t* eid_data = static_cast<dgl_id_t*>(adj_.data->data);
    const dgl_id_t start = indptr_data[vid];
    const dgl_id_t end = indptr_data[vid + 1];
    return DGLIdIters(eid_data + start, eid_data + end);
  }

  DGLIdIters PredVec(dgl_type_t etype, dgl_id_t vid) const override {
765
    LOG(FATAL) << "Not enabled for CSR graph.";
766
767
768
769
    return {};
  }

  DGLIdIters InEdgeVec(dgl_type_t etype, dgl_id_t vid) const override {
770
    LOG(FATAL) << "Not enabled for CSR graph.";
771
772
773
774
775
776
777
778
779
    return {};
  }

  std::vector<IdArray> GetAdj(
      dgl_type_t etype, bool transpose, const std::string &fmt) const override {
    CHECK(!transpose && fmt == "csr") << "Not valid adj format request.";
    return {adj_.indptr, adj_.indices, adj_.data};
  }

780
781
782
783
784
785
786
787
788
789
790
791
792
793
  aten::COOMatrix GetCOOMatrix(dgl_type_t etype) const override {
    LOG(FATAL) << "Not enabled for CSR graph";
    return aten::COOMatrix();
  }

  aten::CSRMatrix GetCSCMatrix(dgl_type_t etype) const override {
    LOG(FATAL) << "Not enabled for CSR graph";
    return aten::CSRMatrix();
  }

  aten::CSRMatrix GetCSRMatrix(dgl_type_t etype) const override {
    return adj_;
  }

794
795
796
797
798
799
800
801
802
803
804
805
  void SetCOOMatrix(dgl_type_t etype, aten::COOMatrix coo) override {
    LOG(FATAL) << "Not enabled for CSR graph";
  }

  void SetCSRMatrix(dgl_type_t etype, aten::CSRMatrix csr) override {
    adj_ = csr;
  }

  void SetCSCMatrix(dgl_type_t etype, aten::CSRMatrix csc) override {
    LOG(FATAL) << "Please use in_csr_->SetCSRMatrix(etype, csc) instead.";
  }

806
  SparseFormat SelectFormat(dgl_type_t etype, dgl_format_code_t preferred_formats) const override {
807
    LOG(FATAL) << "Not enabled for CSR graph";
808
    return SparseFormat::kCSR;
809
810
  }

811
812
813
  dgl_format_code_t GetAllowedFormats() const override {
    LOG(FATAL) << "Not enabled for COO graph";
    return 0;
814
815
  }

816
  dgl_format_code_t GetCreatedFormats() const override {
817
818
819
820
    LOG(FATAL) << "Not enabled for CSR graph";
    return 0;
  }

821
  HeteroSubgraph VertexSubgraph(const std::vector<IdArray>& vids) const override {
Minjie Wang's avatar
Minjie Wang committed
822
823
824
825
    CHECK_EQ(vids.size(), NumVertexTypes()) << "Number of vertex types mismatch";
    auto srcvids = vids[SrcType()], dstvids = vids[DstType()];
    CHECK(aten::IsValidIdArray(srcvids)) << "Invalid vertex id array.";
    CHECK(aten::IsValidIdArray(dstvids)) << "Invalid vertex id array.";
826
    HeteroSubgraph subg;
Minjie Wang's avatar
Minjie Wang committed
827
    const auto& submat = aten::CSRSliceMatrix(adj_, srcvids, dstvids);
828
    IdArray sub_eids = aten::Range(0, submat.data->shape[0], NumBits(), Context());
Minjie Wang's avatar
Minjie Wang committed
829
    subg.graph = std::make_shared<CSR>(meta_graph(), submat.num_rows, submat.num_cols,
830
831
832
833
834
835
836
837
        submat.indptr, submat.indices, sub_eids);
    subg.induced_vertices = vids;
    subg.induced_edges.emplace_back(submat.data);
    return subg;
  }

  HeteroSubgraph EdgeSubgraph(
      const std::vector<IdArray>& eids, bool preserve_nodes = false) const override {
838
    LOG(FATAL) << "Not enabled for CSR graph.";
839
840
841
    return {};
  }

842
  HeteroGraphPtr GetGraphInFormat(dgl_format_code_t formats) const override {
843
844
845
846
    LOG(FATAL) << "Not enabled for CSR graph.";
    return nullptr;
  }

847
848
849
850
  aten::CSRMatrix adj() const {
    return adj_;
  }

851
852
853
854
855
856
857
858
859
860
861
862
863
  bool Load(dmlc::Stream* fs) {
    auto meta_imgraph = Serializer::make_shared<ImmutableGraph>();
    CHECK(fs->Read(&meta_imgraph)) << "Invalid meta graph";
    meta_graph_ = meta_imgraph;
    CHECK(fs->Read(&adj_)) << "Invalid adj matrix";
    return true;
  }
  void Save(dmlc::Stream* fs) const {
    auto meta_graph_ptr = ImmutableGraph::ToImmutable(meta_graph());
    fs->Write(meta_graph_ptr);
    fs->Write(adj_);
  }

864
 private:
865
866
  friend class Serializer;

867
868
869
870
871
872
  /*! \brief internal adjacency matrix. Data array stores edge ids */
  aten::CSRMatrix adj_;
};

//////////////////////////////////////////////////////////
//
Minjie Wang's avatar
Minjie Wang committed
873
// unit graph implementation
874
875
876
//
//////////////////////////////////////////////////////////

877
878
879
880
DLDataType UnitGraph::DataType() const {
  return GetAny()->DataType();
}

Minjie Wang's avatar
Minjie Wang committed
881
DLContext UnitGraph::Context() const {
882
883
884
  return GetAny()->Context();
}

885
886
887
888
bool UnitGraph::IsPinned() const {
  return GetAny()->IsPinned();
}

Minjie Wang's avatar
Minjie Wang committed
889
uint8_t UnitGraph::NumBits() const {
890
891
892
  return GetAny()->NumBits();
}

Minjie Wang's avatar
Minjie Wang committed
893
bool UnitGraph::IsMultigraph() const {
894
  const SparseFormat fmt = SelectFormat(CSC_CODE);
895
896
  const auto ptr = GetFormat(fmt);
  return ptr->IsMultigraph();
897
898
}

Minjie Wang's avatar
Minjie Wang committed
899
uint64_t UnitGraph::NumVertices(dgl_type_t vtype) const {
900
  const SparseFormat fmt = SelectFormat(ALL_CODE);
901
902
903
  const auto ptr = GetFormat(fmt);
  // TODO(BarclayII): we have a lot of special handling for CSC.
  // Need to have a UnitGraph::CSC backend instead.
904
  if (fmt == SparseFormat::kCSC)
Minjie Wang's avatar
Minjie Wang committed
905
    vtype = (vtype == SrcType()) ? DstType() : SrcType();
906
  return ptr->NumVertices(vtype);
907
908
}

Minjie Wang's avatar
Minjie Wang committed
909
uint64_t UnitGraph::NumEdges(dgl_type_t etype) const {
910
911
912
  return GetAny()->NumEdges(etype);
}

Minjie Wang's avatar
Minjie Wang committed
913
bool UnitGraph::HasVertex(dgl_type_t vtype, dgl_id_t vid) const {
914
  const SparseFormat fmt = SelectFormat(ALL_CODE);
915
  const auto ptr = GetFormat(fmt);
916
  if (fmt == SparseFormat::kCSC)
Minjie Wang's avatar
Minjie Wang committed
917
    vtype = (vtype == SrcType()) ? DstType() : SrcType();
918
  return ptr->HasVertex(vtype, vid);
919
920
}

Minjie Wang's avatar
Minjie Wang committed
921
BoolArray UnitGraph::HasVertices(dgl_type_t vtype, IdArray vids) const {
922
  CHECK(aten::IsValidIdArray(vids)) << "Invalid id array input";
923
924
925
  return aten::LT(vids, NumVertices(vtype));
}

Minjie Wang's avatar
Minjie Wang committed
926
bool UnitGraph::HasEdgeBetween(dgl_type_t etype, dgl_id_t src, dgl_id_t dst) const {
927
  const SparseFormat fmt = SelectFormat(CSC_CODE);
928
  const auto ptr = GetFormat(fmt);
929
  if (fmt == SparseFormat::kCSC)
930
931
932
    return ptr->HasEdgeBetween(etype, dst, src);
  else
    return ptr->HasEdgeBetween(etype, src, dst);
933
934
}

Minjie Wang's avatar
Minjie Wang committed
935
BoolArray UnitGraph::HasEdgesBetween(
936
    dgl_type_t etype, IdArray src, IdArray dst) const {
937
  const SparseFormat fmt = SelectFormat(CSC_CODE);
938
  const auto ptr = GetFormat(fmt);
939
  if (fmt == SparseFormat::kCSC)
940
941
942
    return ptr->HasEdgesBetween(etype, dst, src);
  else
    return ptr->HasEdgesBetween(etype, src, dst);
943
944
}

Minjie Wang's avatar
Minjie Wang committed
945
IdArray UnitGraph::Predecessors(dgl_type_t etype, dgl_id_t dst) const {
946
  const SparseFormat fmt = SelectFormat(CSC_CODE);
947
  const auto ptr = GetFormat(fmt);
948
  if (fmt == SparseFormat::kCSC)
949
950
951
    return ptr->Successors(etype, dst);
  else
    return ptr->Predecessors(etype, dst);
952
953
}

Minjie Wang's avatar
Minjie Wang committed
954
IdArray UnitGraph::Successors(dgl_type_t etype, dgl_id_t src) const {
955
  const SparseFormat fmt = SelectFormat(CSR_CODE);
956
957
  const auto ptr = GetFormat(fmt);
  return ptr->Successors(etype, src);
958
959
}

Minjie Wang's avatar
Minjie Wang committed
960
IdArray UnitGraph::EdgeId(dgl_type_t etype, dgl_id_t src, dgl_id_t dst) const {
961
  const SparseFormat fmt = SelectFormat(CSR_CODE);
962
  const auto ptr = GetFormat(fmt);
963
  if (fmt == SparseFormat::kCSC)
964
965
966
    return ptr->EdgeId(etype, dst, src);
  else
    return ptr->EdgeId(etype, src, dst);
967
968
}

969
EdgeArray UnitGraph::EdgeIdsAll(dgl_type_t etype, IdArray src, IdArray dst) const {
970
  const SparseFormat fmt = SelectFormat(CSR_CODE);
971
  const auto ptr = GetFormat(fmt);
972
  if (fmt == SparseFormat::kCSC) {
973
    EdgeArray edges = ptr->EdgeIdsAll(etype, dst, src);
974
975
    return EdgeArray{edges.dst, edges.src, edges.id};
  } else {
976
977
978
979
980
    return ptr->EdgeIdsAll(etype, src, dst);
  }
}

IdArray UnitGraph::EdgeIdsOne(dgl_type_t etype, IdArray src, IdArray dst) const {
981
  const SparseFormat fmt = SelectFormat(CSR_CODE);
982
983
984
985
986
  const auto ptr = GetFormat(fmt);
  if (fmt == SparseFormat::kCSC) {
    return ptr->EdgeIdsOne(etype, dst, src);
  } else {
    return ptr->EdgeIdsOne(etype, src, dst);
987
988
989
  }
}

Minjie Wang's avatar
Minjie Wang committed
990
std::pair<dgl_id_t, dgl_id_t> UnitGraph::FindEdge(dgl_type_t etype, dgl_id_t eid) const {
991
  const SparseFormat fmt = SelectFormat(COO_CODE);
992
993
  const auto ptr = GetFormat(fmt);
  return ptr->FindEdge(etype, eid);
994
995
}

Minjie Wang's avatar
Minjie Wang committed
996
EdgeArray UnitGraph::FindEdges(dgl_type_t etype, IdArray eids) const {
997
  const SparseFormat fmt = SelectFormat(COO_CODE);
998
999
  const auto ptr = GetFormat(fmt);
  return ptr->FindEdges(etype, eids);
1000
1001
}

Minjie Wang's avatar
Minjie Wang committed
1002
EdgeArray UnitGraph::InEdges(dgl_type_t etype, dgl_id_t vid) const {
1003
  const SparseFormat fmt = SelectFormat(CSC_CODE);
1004
  const auto ptr = GetFormat(fmt);
1005
  if (fmt == SparseFormat::kCSC) {
1006
1007
1008
1009
1010
    const EdgeArray& ret = ptr->OutEdges(etype, vid);
    return {ret.dst, ret.src, ret.id};
  } else {
    return ptr->InEdges(etype, vid);
  }
1011
1012
}

Minjie Wang's avatar
Minjie Wang committed
1013
EdgeArray UnitGraph::InEdges(dgl_type_t etype, IdArray vids) const {
1014
  const SparseFormat fmt = SelectFormat(CSC_CODE);
1015
  const auto ptr = GetFormat(fmt);
1016
  if (fmt == SparseFormat::kCSC) {
1017
1018
1019
1020
1021
    const EdgeArray& ret = ptr->OutEdges(etype, vids);
    return {ret.dst, ret.src, ret.id};
  } else {
    return ptr->InEdges(etype, vids);
  }
1022
1023
}

Minjie Wang's avatar
Minjie Wang committed
1024
EdgeArray UnitGraph::OutEdges(dgl_type_t etype, dgl_id_t vid) const {
1025
  const SparseFormat fmt = SelectFormat(CSR_CODE);
1026
1027
  const auto ptr = GetFormat(fmt);
  return ptr->OutEdges(etype, vid);
1028
1029
}

Minjie Wang's avatar
Minjie Wang committed
1030
EdgeArray UnitGraph::OutEdges(dgl_type_t etype, IdArray vids) const {
1031
  const SparseFormat fmt = SelectFormat(CSR_CODE);
1032
1033
  const auto ptr = GetFormat(fmt);
  return ptr->OutEdges(etype, vids);
1034
1035
}

Minjie Wang's avatar
Minjie Wang committed
1036
EdgeArray UnitGraph::Edges(dgl_type_t etype, const std::string &order) const {
1037
1038
  SparseFormat fmt;
  if (order == std::string("eid")) {
1039
    fmt = SelectFormat(COO_CODE);
1040
  } else if (order.empty()) {
1041
    // arbitrary order
1042
    fmt = SelectFormat(ALL_CODE);
1043
  } else if (order == std::string("srcdst")) {
1044
    fmt = SelectFormat(CSR_CODE);
1045
1046
  } else {
    LOG(FATAL) << "Unsupported order request: " << order;
1047
    return {};
1048
  }
1049
1050

  const auto& edges = GetFormat(fmt)->Edges(etype, order);
1051
  if (fmt == SparseFormat::kCSC)
1052
1053
1054
    return EdgeArray{edges.dst, edges.src, edges.id};
  else
    return edges;
1055
1056
}

Minjie Wang's avatar
Minjie Wang committed
1057
uint64_t UnitGraph::InDegree(dgl_type_t etype, dgl_id_t vid) const {
1058
  SparseFormat fmt = SelectFormat(CSC_CODE);
1059
  const auto ptr = GetFormat(fmt);
1060
1061
1062
1063
1064
  CHECK(fmt == SparseFormat::kCSC || fmt == SparseFormat::kCOO)
      << "In degree cannot be computed as neither CSC nor COO format is "
         "allowed for this graph. Please enable one of them at least.";
  return fmt == SparseFormat::kCSC ? ptr->OutDegree(etype, vid)
                                   : ptr->InDegree(etype, vid);
1065
1066
}

Minjie Wang's avatar
Minjie Wang committed
1067
DegreeArray UnitGraph::InDegrees(dgl_type_t etype, IdArray vids) const {
1068
  SparseFormat fmt = SelectFormat(CSC_CODE);
1069
  const auto ptr = GetFormat(fmt);
1070
1071
1072
1073
1074
  CHECK(fmt == SparseFormat::kCSC || fmt == SparseFormat::kCOO)
      << "In degree cannot be computed as neither CSC nor COO format is "
         "allowed for this graph. Please enable one of them at least.";
  return fmt == SparseFormat::kCSC ? ptr->OutDegrees(etype, vids)
                                   : ptr->InDegrees(etype, vids);
1075
1076
}

Minjie Wang's avatar
Minjie Wang committed
1077
uint64_t UnitGraph::OutDegree(dgl_type_t etype, dgl_id_t vid) const {
1078
  SparseFormat fmt = SelectFormat(CSR_CODE);
1079
  const auto ptr = GetFormat(fmt);
1080
1081
1082
  CHECK(fmt == SparseFormat::kCSR || fmt == SparseFormat::kCOO)
      << "Out degree cannot be computed as neither CSR nor COO format is "
         "allowed for this graph. Please enable one of them at least.";
1083
  return ptr->OutDegree(etype, vid);
1084
1085
}

Minjie Wang's avatar
Minjie Wang committed
1086
DegreeArray UnitGraph::OutDegrees(dgl_type_t etype, IdArray vids) const {
1087
  SparseFormat fmt = SelectFormat(CSR_CODE);
1088
  const auto ptr = GetFormat(fmt);
1089
1090
1091
  CHECK(fmt == SparseFormat::kCSR || fmt == SparseFormat::kCOO)
      << "Out degree cannot be computed as neither CSR nor COO format is "
         "allowed for this graph. Please enable one of them at least.";
1092
  return ptr->OutDegrees(etype, vids);
1093
1094
}

Minjie Wang's avatar
Minjie Wang committed
1095
DGLIdIters UnitGraph::SuccVec(dgl_type_t etype, dgl_id_t vid) const {
1096
  SparseFormat fmt = SelectFormat(CSR_CODE);
1097
1098
  const auto ptr = GetFormat(fmt);
  return ptr->SuccVec(etype, vid);
1099
1100
}

1101
DGLIdIters32 UnitGraph::SuccVec32(dgl_type_t etype, dgl_id_t vid) const {
1102
  SparseFormat fmt = SelectFormat(CSR_CODE);
1103
1104
1105
1106
1107
  const auto ptr = std::dynamic_pointer_cast<CSR>(GetFormat(fmt));
  CHECK_NOTNULL(ptr);
  return ptr->SuccVec32(etype, vid);
}

Minjie Wang's avatar
Minjie Wang committed
1108
DGLIdIters UnitGraph::OutEdgeVec(dgl_type_t etype, dgl_id_t vid) const {
1109
  SparseFormat fmt = SelectFormat(CSR_CODE);
1110
1111
  const auto ptr = GetFormat(fmt);
  return ptr->OutEdgeVec(etype, vid);
1112
1113
}

Minjie Wang's avatar
Minjie Wang committed
1114
DGLIdIters UnitGraph::PredVec(dgl_type_t etype, dgl_id_t vid) const {
1115
  SparseFormat fmt = SelectFormat(CSC_CODE);
1116
  const auto ptr = GetFormat(fmt);
1117
  if (fmt == SparseFormat::kCSC)
1118
1119
1120
    return ptr->SuccVec(etype, vid);
  else
    return ptr->PredVec(etype, vid);
1121
1122
}

Minjie Wang's avatar
Minjie Wang committed
1123
DGLIdIters UnitGraph::InEdgeVec(dgl_type_t etype, dgl_id_t vid) const {
1124
  SparseFormat fmt = SelectFormat(CSC_CODE);
1125
  const auto ptr = GetFormat(fmt);
1126
  if (fmt == SparseFormat::kCSC)
1127
1128
1129
    return ptr->OutEdgeVec(etype, vid);
  else
    return ptr->InEdgeVec(etype, vid);
1130
1131
}

Minjie Wang's avatar
Minjie Wang committed
1132
std::vector<IdArray> UnitGraph::GetAdj(
1133
1134
1135
1136
1137
1138
1139
1140
1141
    dgl_type_t etype, bool transpose, const std::string &fmt) const {
  // TODO(minjie): Our current semantics of adjacency matrix is row for dst nodes and col for
  //   src nodes. Therefore, we need to flip the transpose flag. For example, transpose=False
  //   is equal to in edge CSR.
  //   We have this behavior because previously we use framework's SPMM and we don't cache
  //   reverse adj. This is not intuitive and also not consistent with networkx's
  //   to_scipy_sparse_matrix. With the upcoming custom kernel change, we should change the
  //   behavior and make row for src and col for dst.
  if (fmt == std::string("csr")) {
1142
    return !transpose ? GetOutCSR()->GetAdj(etype, false, "csr")
1143
1144
      : GetInCSR()->GetAdj(etype, false, "csr");
  } else if (fmt == std::string("coo")) {
1145
    return GetCOO()->GetAdj(etype, transpose, fmt);
1146
1147
1148
1149
1150
1151
  } else {
    LOG(FATAL) << "unsupported adjacency matrix format: " << fmt;
    return {};
  }
}

Minjie Wang's avatar
Minjie Wang committed
1152
HeteroSubgraph UnitGraph::VertexSubgraph(const std::vector<IdArray>& vids) const {
1153
  // We prefer to generate a subgraph from out-csr.
1154
  SparseFormat fmt = SelectFormat(CSR_CODE);
1155
  HeteroSubgraph sg = GetFormat(fmt)->VertexSubgraph(vids);
1156
  HeteroSubgraph ret;
Quan (Andy) Gan's avatar
Quan (Andy) Gan committed
1157
1158
1159
1160
1161
1162
1163
1164
1165
1166
1167
1168
1169
1170
1171
1172
1173
1174
1175
1176

  CSRPtr subcsr = nullptr;
  CSRPtr subcsc = nullptr;
  COOPtr subcoo = nullptr;
  switch (fmt) {
    case SparseFormat::kCSR:
      subcsr = std::dynamic_pointer_cast<CSR>(sg.graph);
      break;
    case SparseFormat::kCSC:
      subcsc = std::dynamic_pointer_cast<CSR>(sg.graph);
      break;
    case SparseFormat::kCOO:
      subcoo = std::dynamic_pointer_cast<COO>(sg.graph);
      break;
    default:
      LOG(FATAL) << "[BUG] unsupported format " << static_cast<int>(fmt);
      return ret;
  }

  ret.graph = HeteroGraphPtr(new UnitGraph(meta_graph(), subcsc, subcsr, subcoo));
1177
1178
1179
1180
1181
  ret.induced_vertices = std::move(sg.induced_vertices);
  ret.induced_edges = std::move(sg.induced_edges);
  return ret;
}

Minjie Wang's avatar
Minjie Wang committed
1182
HeteroSubgraph UnitGraph::EdgeSubgraph(
1183
    const std::vector<IdArray>& eids, bool preserve_nodes) const {
1184
  SparseFormat fmt = SelectFormat(COO_CODE);
1185
  auto sg = GetFormat(fmt)->EdgeSubgraph(eids, preserve_nodes);
1186
  HeteroSubgraph ret;
Quan (Andy) Gan's avatar
Quan (Andy) Gan committed
1187
1188
1189
1190
1191
1192
1193
1194
1195
1196
1197
1198
1199
1200
1201
1202
1203
1204
1205
1206

  CSRPtr subcsr = nullptr;
  CSRPtr subcsc = nullptr;
  COOPtr subcoo = nullptr;
  switch (fmt) {
    case SparseFormat::kCSR:
      subcsr = std::dynamic_pointer_cast<CSR>(sg.graph);
      break;
    case SparseFormat::kCSC:
      subcsc = std::dynamic_pointer_cast<CSR>(sg.graph);
      break;
    case SparseFormat::kCOO:
      subcoo = std::dynamic_pointer_cast<COO>(sg.graph);
      break;
    default:
      LOG(FATAL) << "[BUG] unsupported format " << static_cast<int>(fmt);
      return ret;
  }

  ret.graph = HeteroGraphPtr(new UnitGraph(meta_graph(), subcsc, subcsr, subcoo));
1207
1208
1209
1210
1211
  ret.induced_vertices = std::move(sg.induced_vertices);
  ret.induced_edges = std::move(sg.induced_edges);
  return ret;
}

Minjie Wang's avatar
Minjie Wang committed
1212
HeteroGraphPtr UnitGraph::CreateFromCOO(
1213
1214
    int64_t num_vtypes, int64_t num_src, int64_t num_dst,
    IdArray row, IdArray col,
1215
    bool row_sorted, bool col_sorted,
1216
    dgl_format_code_t formats) {
Minjie Wang's avatar
Minjie Wang committed
1217
1218
1219
1220
  CHECK(num_vtypes == 1 || num_vtypes == 2);
  if (num_vtypes == 1)
    CHECK_EQ(num_src, num_dst);
  auto mg = CreateUnitGraphMetaGraph(num_vtypes);
1221
1222
  COOPtr coo(new COO(mg, num_src, num_dst, row, col,
      row_sorted, col_sorted));
1223
1224

  return HeteroGraphPtr(
1225
      new UnitGraph(mg, nullptr, nullptr, coo, formats));
1226
1227
}

1228
1229
HeteroGraphPtr UnitGraph::CreateFromCOO(
    int64_t num_vtypes, const aten::COOMatrix& mat,
1230
    dgl_format_code_t formats) {
1231
1232
1233
1234
1235
  CHECK(num_vtypes == 1 || num_vtypes == 2);
  if (num_vtypes == 1)
    CHECK_EQ(mat.num_rows, mat.num_cols);
  auto mg = CreateUnitGraphMetaGraph(num_vtypes);
  COOPtr coo(new COO(mg, mat));
1236

1237
  return HeteroGraphPtr(
1238
      new UnitGraph(mg, nullptr, nullptr, coo, formats));
1239
1240
}

Minjie Wang's avatar
Minjie Wang committed
1241
1242
HeteroGraphPtr UnitGraph::CreateFromCSR(
    int64_t num_vtypes, int64_t num_src, int64_t num_dst,
1243
    IdArray indptr, IdArray indices, IdArray edge_ids, dgl_format_code_t formats) {
Minjie Wang's avatar
Minjie Wang committed
1244
1245
1246
1247
1248
  CHECK(num_vtypes == 1 || num_vtypes == 2);
  if (num_vtypes == 1)
    CHECK_EQ(num_src, num_dst);
  auto mg = CreateUnitGraphMetaGraph(num_vtypes);
  CSRPtr csr(new CSR(mg, num_src, num_dst, indptr, indices, edge_ids));
1249
  return HeteroGraphPtr(new UnitGraph(mg, nullptr, csr, nullptr, formats));
1250
1251
}

1252
1253
HeteroGraphPtr UnitGraph::CreateFromCSR(
    int64_t num_vtypes, const aten::CSRMatrix& mat,
1254
    dgl_format_code_t formats) {
1255
1256
1257
1258
1259
  CHECK(num_vtypes == 1 || num_vtypes == 2);
  if (num_vtypes == 1)
    CHECK_EQ(mat.num_rows, mat.num_cols);
  auto mg = CreateUnitGraphMetaGraph(num_vtypes);
  CSRPtr csr(new CSR(mg, mat));
1260
  return HeteroGraphPtr(new UnitGraph(mg, nullptr, csr, nullptr, formats));
1261
1262
}

1263
1264
HeteroGraphPtr UnitGraph::CreateFromCSC(
    int64_t num_vtypes, int64_t num_src, int64_t num_dst,
1265
    IdArray indptr, IdArray indices, IdArray edge_ids, dgl_format_code_t formats) {
1266
1267
1268
1269
  CHECK(num_vtypes == 1 || num_vtypes == 2);
  if (num_vtypes == 1)
    CHECK_EQ(num_src, num_dst);
  auto mg = CreateUnitGraphMetaGraph(num_vtypes);
1270
  CSRPtr csc(new CSR(mg, num_dst, num_src, indptr, indices, edge_ids));
1271
  return HeteroGraphPtr(new UnitGraph(mg, csc, nullptr, nullptr, formats));
1272
1273
1274
1275
}

HeteroGraphPtr UnitGraph::CreateFromCSC(
    int64_t num_vtypes, const aten::CSRMatrix& mat,
1276
    dgl_format_code_t formats) {
1277
1278
1279
1280
1281
  CHECK(num_vtypes == 1 || num_vtypes == 2);
  if (num_vtypes == 1)
    CHECK_EQ(mat.num_rows, mat.num_cols);
  auto mg = CreateUnitGraphMetaGraph(num_vtypes);
  CSRPtr csc(new CSR(mg, mat));
1282
  return HeteroGraphPtr(new UnitGraph(mg, csc, nullptr, nullptr, formats));
1283
1284
}

Minjie Wang's avatar
Minjie Wang committed
1285
HeteroGraphPtr UnitGraph::AsNumBits(HeteroGraphPtr g, uint8_t bits) {
1286
1287
1288
  if (g->NumBits() == bits) {
    return g;
  } else {
Minjie Wang's avatar
Minjie Wang committed
1289
    auto bg = std::dynamic_pointer_cast<UnitGraph>(g);
1290
    CHECK_NOTNULL(bg);
1291
1292
1293
1294
1295
1296
    CSRPtr new_incsr =
      (bg->in_csr_->defined())? CSRPtr(new CSR(bg->in_csr_->AsNumBits(bits))) : nullptr;
    CSRPtr new_outcsr =
      (bg->out_csr_->defined())? CSRPtr(new CSR(bg->out_csr_->AsNumBits(bits))) : nullptr;
    COOPtr new_coo =
      (bg->coo_->defined())? COOPtr(new COO(bg->coo_->AsNumBits(bits))) : nullptr;
1297
    return HeteroGraphPtr(
1298
        new UnitGraph(g->meta_graph(), new_incsr, new_outcsr, new_coo, bg->formats_));
1299
1300
1301
  }
}

1302
1303
HeteroGraphPtr UnitGraph::CopyTo(HeteroGraphPtr g, const DLContext &ctx,
                                 const DGLStreamHandle &stream) {
1304
1305
  if (ctx == g->Context()) {
    return g;
1306
1307
1308
  } else {
    auto bg = std::dynamic_pointer_cast<UnitGraph>(g);
    CHECK_NOTNULL(bg);
1309
1310
1311
1312
1313
1314
1315
1316
1317
    CSRPtr new_incsr = (bg->in_csr_->defined())
                           ? CSRPtr(new CSR(bg->in_csr_->CopyTo(ctx, stream)))
                           : nullptr;
    CSRPtr new_outcsr = (bg->out_csr_->defined())
                            ? CSRPtr(new CSR(bg->out_csr_->CopyTo(ctx, stream)))
                            : nullptr;
    COOPtr new_coo = (bg->coo_->defined())
                         ? COOPtr(new COO(bg->coo_->CopyTo(ctx, stream)))
                         : nullptr;
1318
    return HeteroGraphPtr(
1319
        new UnitGraph(g->meta_graph(), new_incsr, new_outcsr, new_coo, bg->formats_));
1320
1321
1322
  }
}

1323
1324
1325
1326
1327
1328
1329
1330
1331
1332
1333
1334
1335
1336
1337
1338
1339
1340
void UnitGraph::PinMemory_() {
  if (this->in_csr_->defined())
    this->in_csr_->PinMemory_();
  if (this->out_csr_->defined())
    this->out_csr_->PinMemory_();
  if (this->coo_->defined())
    this->coo_->PinMemory_();
}

void UnitGraph::UnpinMemory_() {
  if (this->in_csr_->defined())
    this->in_csr_->UnpinMemory_();
  if (this->out_csr_->defined())
    this->out_csr_->UnpinMemory_();
  if (this->coo_->defined())
    this->coo_->UnpinMemory_();
}

1341
1342
1343
1344
1345
1346
1347
1348
1349
1350
1351
1352
void UnitGraph::InvalidateCSR() {
  this->out_csr_ = CSRPtr(new CSR());
}

void UnitGraph::InvalidateCSC() {
  this->in_csr_ = CSRPtr(new CSR());
}

void UnitGraph::InvalidateCOO() {
  this->coo_ = COOPtr(new COO());
}

1353
UnitGraph::UnitGraph(GraphPtr metagraph, CSRPtr in_csr, CSRPtr out_csr, COOPtr coo,
1354
                     dgl_format_code_t formats)
Minjie Wang's avatar
Minjie Wang committed
1355
  : BaseHeteroGraph(metagraph), in_csr_(in_csr), out_csr_(out_csr), coo_(coo) {
1356
1357
1358
1359
1360
1361
1362
1363
1364
  if (!in_csr_) {
    in_csr_ = CSRPtr(new CSR());
  }
  if (!out_csr_) {
    out_csr_ = CSRPtr(new CSR());
  }
  if (!coo_) {
    coo_ = COOPtr(new COO());
  }
1365
1366
1367
1368
1369
  formats_ = formats;
  dgl_format_code_t created = GetCreatedFormats();
  if ((formats | created) != formats)
    LOG(FATAL) << "Graph created from formats: " << CodeToStr(created) <<
      ", which is not compatible with available formats: " << CodeToStr(formats);
1370
1371
1372
  CHECK(GetAny()) << "At least one graph structure should exist.";
}

1373
1374
1375
1376
1377
1378
1379
HeteroGraphPtr UnitGraph::CreateHomographFrom(
    const aten::CSRMatrix &in_csr,
    const aten::CSRMatrix &out_csr,
    const aten::COOMatrix &coo,
    bool has_in_csr,
    bool has_out_csr,
    bool has_coo,
1380
    dgl_format_code_t formats) {
1381
1382
1383
1384
1385
1386
1387
1388
  auto mg = CreateUnitGraphMetaGraph1();

  CSRPtr in_csr_ptr = nullptr;
  CSRPtr out_csr_ptr = nullptr;
  COOPtr coo_ptr = nullptr;

  if (has_in_csr)
    in_csr_ptr = CSRPtr(new CSR(mg, in_csr));
1389
1390
  else
    in_csr_ptr = CSRPtr(new CSR());
1391
1392
  if (has_out_csr)
    out_csr_ptr = CSRPtr(new CSR(mg, out_csr));
1393
1394
  else
    out_csr_ptr = CSRPtr(new CSR());
1395
1396
  if (has_coo)
    coo_ptr = COOPtr(new COO(mg, coo));
1397
1398
  else
    coo_ptr = COOPtr(new COO());
1399

1400
  return HeteroGraphPtr(new UnitGraph(mg, in_csr_ptr, out_csr_ptr, coo_ptr, formats));
1401
1402
}

1403
1404
UnitGraph::CSRPtr UnitGraph::GetInCSR(bool inplace) const {
  if (inplace)
1405
    if (!(formats_ & CSC_CODE))
1406
1407
      LOG(FATAL) << "The graph have restricted sparse format " <<
        CodeToStr(formats_) << ", cannot create CSC matrix.";
1408
  CSRPtr ret = in_csr_;
1409
1410
  // Prefers converting from COO since it is parallelized.
  // TODO(BarclayII): need benchmarking.
1411
  if (!in_csr_->defined()) {
1412
1413
1414
1415
    // inplace new formats materialization is not allowed for pinned graphs
    if (inplace && IsPinned())
      LOG(FATAL) << "Cannot create new formats for pinned graphs, " <<
        "please create the CSC format before pinning.";
1416
1417
1418
    if (coo_->defined()) {
      const auto& newadj = aten::COOToCSR(
            aten::COOTranspose(coo_->adj()));
1419

1420
      if (inplace)
1421
1422
1423
        *(const_cast<UnitGraph*>(this)->in_csr_) = CSR(meta_graph(), newadj);
      else
        ret = std::make_shared<CSR>(meta_graph(), newadj);
1424
    } else {
1425
1426
      CHECK(out_csr_->defined()) << "None of CSR, COO exist";
      const auto& newadj = aten::CSRTranspose(out_csr_->adj());
1427

1428
      if (inplace)
1429
1430
1431
        *(const_cast<UnitGraph*>(this)->in_csr_) = CSR(meta_graph(), newadj);
      else
        ret = std::make_shared<CSR>(meta_graph(), newadj);
1432
1433
    }
  }
1434
  return ret;
1435
1436
1437
}

/* !\brief Return out csr. If not exist, transpose the other one.*/
1438
1439
UnitGraph::CSRPtr UnitGraph::GetOutCSR(bool inplace) const {
  if (inplace)
1440
    if (!(formats_ & CSR_CODE))
1441
1442
      LOG(FATAL) << "The graph have restricted sparse format " <<
        CodeToStr(formats_) << ", cannot create CSR matrix.";
1443
  CSRPtr ret = out_csr_;
1444
1445
  // Prefers converting from COO since it is parallelized.
  // TODO(BarclayII): need benchmarking.
1446
  if (!out_csr_->defined()) {
1447
1448
1449
1450
    // inplace new formats materialization is not allowed for pinned graphs
    if (inplace && IsPinned())
      LOG(FATAL) << "Cannot create new formats for pinned graphs, " <<
        "please create the CSR format before pinning.";
1451
1452
    if (coo_->defined()) {
      const auto& newadj = aten::COOToCSR(coo_->adj());
1453

1454
      if (inplace)
1455
1456
1457
        *(const_cast<UnitGraph*>(this)->out_csr_) = CSR(meta_graph(), newadj);
      else
        ret = std::make_shared<CSR>(meta_graph(), newadj);
1458
    } else {
1459
1460
      CHECK(in_csr_->defined()) << "None of CSR, COO exist";
      const auto& newadj = aten::CSRTranspose(in_csr_->adj());
1461

1462
      if (inplace)
1463
1464
1465
        *(const_cast<UnitGraph*>(this)->out_csr_) = CSR(meta_graph(), newadj);
      else
        ret = std::make_shared<CSR>(meta_graph(), newadj);
1466
1467
    }
  }
1468
  return ret;
1469
1470
1471
}

/* !\brief Return coo. If not exist, create from csr.*/
1472
1473
UnitGraph::COOPtr UnitGraph::GetCOO(bool inplace) const {
  if (inplace)
1474
    if (!(formats_ & COO_CODE))
1475
1476
      LOG(FATAL) << "The graph have restricted sparse format " <<
        CodeToStr(formats_) << ", cannot create COO matrix.";
1477
  COOPtr ret = coo_;
1478
  if (!coo_->defined()) {
1479
1480
1481
1482
    // inplace new formats materialization is not allowed for pinned graphs
    if (inplace && IsPinned())
      LOG(FATAL) << "Cannot create new formats for pinned graphs, " <<
        "please create the COO format before pinning.";
1483
    if (in_csr_->defined()) {
1484
      const auto& newadj = aten::COOTranspose(aten::CSRToCOO(in_csr_->adj(), true));
1485

1486
      if (inplace)
1487
1488
1489
        *(const_cast<UnitGraph*>(this)->coo_) = COO(meta_graph(), newadj);
      else
        ret = std::make_shared<COO>(meta_graph(), newadj);
1490
    } else {
1491
      CHECK(out_csr_->defined()) << "Both CSR are missing.";
1492
      const auto& newadj = aten::CSRToCOO(out_csr_->adj(), true);
1493

1494
      if (inplace)
1495
1496
1497
        *(const_cast<UnitGraph*>(this)->coo_) = COO(meta_graph(), newadj);
      else
        ret = std::make_shared<COO>(meta_graph(), newadj);
1498
1499
    }
  }
1500
  return ret;
1501
1502
}

1503
aten::CSRMatrix UnitGraph::GetCSCMatrix(dgl_type_t etype) const {
1504
1505
1506
  return GetInCSR()->adj();
}

1507
aten::CSRMatrix UnitGraph::GetCSRMatrix(dgl_type_t etype) const {
1508
1509
1510
  return GetOutCSR()->adj();
}

1511
aten::COOMatrix UnitGraph::GetCOOMatrix(dgl_type_t etype) const {
1512
1513
1514
  return GetCOO()->adj();
}

1515
1516
1517
1518
1519
1520
1521
1522
1523
1524
1525
1526
1527
1528
1529
1530
1531
1532
1533
1534
1535
1536
1537
1538
1539
1540
1541
1542
1543
1544
1545
1546
1547
1548
1549
1550
1551
1552
1553
1554
1555
1556
1557
1558
1559
1560
1561
1562
void UnitGraph::SetCOOMatrix(dgl_type_t etype, COOMatrix coo) {
  if (!(formats_ & COO_CODE)) {
    LOG(FATAL) << "The graph have restricted sparse format " <<
      CodeToStr(formats_) << ", cannot set COO matrix.";
    return;
  }
  if (IsPinned()) {
    LOG(FATAL) << "Cannot set COOMatrix if the graph is pinned, please unpin the graph.";
    return;
  }
  if (!coo_->defined())
    *(const_cast<UnitGraph*>(this)->coo_) = COO(meta_graph(), coo);
  else
    coo_->SetCOOMatrix(0, coo);
}

void UnitGraph::SetCSRMatrix(dgl_type_t etype, CSRMatrix csr) {
  if (!(formats_ & CSR_CODE)) {
    LOG(FATAL) << "The graph have restricted sparse format " <<
      CodeToStr(formats_) << ", cannot set CSR matrix.";
    return;
  }
  if (IsPinned()) {
    LOG(FATAL) << "Cannot set CSRMatrix if the graph is pinned, please unpin the graph.";
    return;
  }
  if (!out_csr_->defined())
    *(const_cast<UnitGraph*>(this)->out_csr_) = CSR(meta_graph(), csr);
  else
    out_csr_->SetCSRMatrix(0, csr);
}

void UnitGraph::SetCSCMatrix(dgl_type_t etype, CSRMatrix csc) {
  if (!(formats_ & CSC_CODE)) {
    LOG(FATAL) << "The graph have restricted sparse format " <<
      CodeToStr(formats_) << ", cannot set CSC matrix.";
    return;
  }
  if (IsPinned()) {
    LOG(FATAL) << "Cannot set CSCMatrix if the graph is pinned, please unpin the graph.";
    return;
  }
  if (!in_csr_->defined())
    *(const_cast<UnitGraph*>(this)->in_csr_) = CSR(meta_graph(), csc);
  else
    in_csr_->SetCSRMatrix(0, csc);
}

Minjie Wang's avatar
Minjie Wang committed
1563
HeteroGraphPtr UnitGraph::GetAny() const {
1564
  if (in_csr_->defined()) {
1565
    return in_csr_;
1566
  } else if (out_csr_->defined()) {
1567
1568
1569
1570
1571
1572
    return out_csr_;
  } else {
    return coo_;
  }
}

1573
dgl_format_code_t UnitGraph::GetCreatedFormats() const {
1574
  dgl_format_code_t ret = 0;
1575
  if (in_csr_->defined())
1576
    ret |= CSC_CODE;
1577
  if (out_csr_->defined())
1578
    ret |= CSR_CODE;
1579
  if (coo_->defined())
1580
    ret |= COO_CODE;
1581
1582
1583
  return ret;
}

1584
1585
1586
1587
dgl_format_code_t UnitGraph::GetAllowedFormats() const {
  return formats_;
}

1588
1589
HeteroGraphPtr UnitGraph::GetFormat(SparseFormat format) const {
  switch (format) {
1590
1591
1592
1593
  case SparseFormat::kCSR:
    return GetOutCSR();
  case SparseFormat::kCSC:
    return GetInCSR();
1594
  default:
1595
    return GetCOO();
1596
1597
1598
  }
}

1599
HeteroGraphPtr UnitGraph::GetGraphInFormat(dgl_format_code_t formats) const {
1600
  if (formats == ALL_CODE)
1601
    return HeteroGraphPtr(
1602
1603
        // TODO(xiangsx) Make it as graph storage.Clone()
        new UnitGraph(meta_graph_,
1604
1605
1606
1607
1608
1609
1610
1611
1612
1613
1614
                      (in_csr_->defined())
                          ? CSRPtr(new CSR(*in_csr_))
                          : nullptr,
                      (out_csr_->defined())
                          ? CSRPtr(new CSR(*out_csr_))
                          : nullptr,
                      (coo_->defined())
                          ? COOPtr(new COO(*coo_))
                          : nullptr,
                      formats));
  int64_t num_vtypes = NumVertexTypes();
1615
  if (formats & COO_CODE)
1616
    return CreateFromCOO(num_vtypes, GetCOO(false)->adj(), formats);
1617
  if (formats & CSR_CODE)
1618
1619
1620
1621
1622
1623
1624
1625
1626
    return CreateFromCSR(num_vtypes, GetOutCSR(false)->adj(), formats);
  return CreateFromCSC(num_vtypes, GetInCSR(false)->adj(), formats);
}

SparseFormat UnitGraph::SelectFormat(dgl_format_code_t preferred_formats) const {
  dgl_format_code_t common = preferred_formats & formats_;
  dgl_format_code_t created = GetCreatedFormats();
  if (common & created)
    return DecodeFormat(common & created);
1627
1628
1629
1630
1631

  // NOTE(zihao): hypersparse is currently disabled since many CUDA operators on COO have
  // not been implmented yet.
  // if (coo_->defined() && coo_->IsHypersparse())  // only allow coo for hypersparse graph.
  //   return SparseFormat::kCOO;
1632
1633
1634
  if (common)
    return DecodeFormat(common);
  return DecodeFormat(created);
1635
1636
}

1637
1638
1639
1640
GraphPtr UnitGraph::AsImmutableGraph() const {
  CHECK(NumVertexTypes() == 1) << "not a homogeneous graph";
  dgl::CSRPtr in_csr_ptr = nullptr, out_csr_ptr = nullptr;
  dgl::COOPtr coo_ptr = nullptr;
1641
  if (in_csr_->defined()) {
1642
    aten::CSRMatrix csc = GetCSCMatrix(0);
1643
    in_csr_ptr = dgl::CSRPtr(new dgl::CSR(csc.indptr, csc.indices, csc.data));
1644
  }
1645
  if (out_csr_->defined()) {
1646
    aten::CSRMatrix csr = GetCSRMatrix(0);
1647
    out_csr_ptr = dgl::CSRPtr(new dgl::CSR(csr.indptr, csr.indices, csr.data));
1648
  }
1649
  if (coo_->defined()) {
1650
1651
    aten::COOMatrix coo = GetCOOMatrix(0);
    if (!COOHasData(coo)) {
1652
      coo_ptr = dgl::COOPtr(new dgl::COO(NumVertices(0), coo.row, coo.col));
1653
1654
1655
    } else {
      IdArray new_src = Scatter(coo.row, coo.data);
      IdArray new_dst = Scatter(coo.col, coo.data);
1656
      coo_ptr = dgl::COOPtr(new dgl::COO(NumVertices(0), new_src, new_dst));
1657
1658
1659
1660
1661
    }
  }
  return GraphPtr(new dgl::ImmutableGraph(in_csr_ptr, out_csr_ptr, coo_ptr));
}

1662
1663
HeteroGraphPtr UnitGraph::LineGraph(bool backtracking) const {
  // TODO(xiangsx) currently we only support homogeneous graph
1664
  auto fmt = SelectFormat(ALL_CODE);
1665
1666
  switch (fmt) {
    case SparseFormat::kCOO: {
1667
      return CreateFromCOO(1, aten::COOLineGraph(coo_->adj(), backtracking));
1668
1669
1670
1671
    }
    case SparseFormat::kCSR: {
      const aten::CSRMatrix csr = GetCSRMatrix(0);
      const aten::COOMatrix coo = aten::COOLineGraph(aten::CSRToCOO(csr, true), backtracking);
1672
      return CreateFromCOO(1, coo);
1673
1674
1675
1676
1677
    }
    case SparseFormat::kCSC: {
      const aten::CSRMatrix csc = GetCSCMatrix(0);
      const aten::CSRMatrix csr = aten::CSRTranspose(csc);
      const aten::COOMatrix coo = aten::COOLineGraph(aten::CSRToCOO(csr, true), backtracking);
1678
      return CreateFromCOO(1, coo);
1679
1680
1681
1682
1683
1684
1685
1686
    }
    default:
      LOG(FATAL) << "None of CSC, CSR, COO exist";
      break;
  }
  return nullptr;
}

1687
1688
1689
1690
1691
1692
constexpr uint64_t kDGLSerialize_UnitGraphMagic = 0xDD2E60F0F6B4A127;

bool UnitGraph::Load(dmlc::Stream* fs) {
  uint64_t magicNum;
  CHECK(fs->Read(&magicNum)) << "Invalid Magic Number";
  CHECK_EQ(magicNum, kDGLSerialize_UnitGraphMagic) << "Invalid UnitGraph Data";
1693

1694
  int64_t save_format_code, formats_code;
1695
  CHECK(fs->Read(&save_format_code)) << "Invalid format";
1696
  CHECK(fs->Read(&formats_code)) << "Invalid format";
1697
  auto save_format = static_cast<SparseFormat>(save_format_code);
1698
1699
1700
1701
1702
1703
  if (formats_code >> 32) {
    formats_ = static_cast<dgl_format_code_t>(0xffffffff & formats_code);
  } else {
    // NOTE(zihao): to be compatible with old formats.
    switch (formats_code & 0xffffffff) {
    case 0:
1704
      formats_ = ALL_CODE;
1705
1706
      break;
    case 1:
1707
      formats_ = COO_CODE;
1708
1709
      break;
    case 2:
1710
      formats_ = CSR_CODE;
1711
1712
      break;
    case 3:
1713
      formats_ = CSC_CODE;
1714
1715
1716
1717
1718
1719
      break;
    default:
      LOG(FATAL) << "Load graph failed, formats code " << formats_code <<
        "not recognized.";
    }
  }
1720

1721
  switch (save_format) {
1722
    case SparseFormat::kCOO:
1723
1724
      fs->Read(&coo_);
      break;
1725
    case SparseFormat::kCSR:
1726
1727
      fs->Read(&out_csr_);
      break;
1728
    case SparseFormat::kCSC:
1729
1730
1731
1732
1733
1734
1735
      fs->Read(&in_csr_);
      break;
    default:
      LOG(FATAL) << "unsupported format code";
      break;
  }

1736
1737
1738
1739
1740
1741
1742
1743
1744
1745
  if (!in_csr_) {
    in_csr_ = CSRPtr(new CSR());
  }
  if (!out_csr_) {
    out_csr_ = CSRPtr(new CSR());
  }
  if (!coo_) {
    coo_ = COOPtr(new COO());
  }

1746
1747
  meta_graph_ = GetAny()->meta_graph();

1748
1749
1750
  return true;
}

1751

1752
1753
void UnitGraph::Save(dmlc::Stream* fs) const {
  fs->Write(kDGLSerialize_UnitGraphMagic);
1754
1755
  // Didn't write UnitGraph::meta_graph_, since it's included in the underlying
  // sparse matrix
1756
  auto avail_fmt = SelectFormat(ALL_CODE);
1757
  fs->Write(static_cast<int64_t>(avail_fmt));
1758
  fs->Write(static_cast<int64_t>(formats_ | 0x100000000));
1759
  switch (avail_fmt) {
1760
    case SparseFormat::kCOO:
1761
1762
      fs->Write(GetCOO());
      break;
1763
    case SparseFormat::kCSR:
1764
1765
      fs->Write(GetOutCSR());
      break;
1766
    case SparseFormat::kCSC:
1767
1768
1769
1770
1771
1772
      fs->Write(GetInCSR());
      break;
    default:
      LOG(FATAL) << "unsupported format code";
      break;
  }
1773
1774
}

1775
1776
1777
1778
1779
1780
1781
1782
1783
1784
UnitGraphPtr UnitGraph::Reverse() const {
  CSRPtr new_incsr = out_csr_, new_outcsr = in_csr_;
  COOPtr new_coo = nullptr;
  if (coo_->defined()) {
    new_coo = COOPtr(new COO(coo_->meta_graph(), aten::COOTranspose(coo_->adj())));
  }

  return UnitGraphPtr(new UnitGraph(meta_graph(), new_incsr, new_outcsr, new_coo));
}

1785
1786
1787
1788
1789
1790
1791
std::tuple<UnitGraphPtr, IdArray, IdArray>
UnitGraph::ToSimple() const {
  CSRPtr new_incsr = nullptr, new_outcsr = nullptr;
  COOPtr new_coo = nullptr;
  IdArray count;
  IdArray edge_map;

1792
  auto avail_fmt = SelectFormat(ALL_CODE);
1793
1794
  switch (avail_fmt) {
    case SparseFormat::kCOO: {
1795
      auto ret = aten::COOToSimple(GetCOO()->adj());
1796
1797
      count = std::get<1>(ret);
      edge_map = std::get<2>(ret);
1798
      new_coo = COOPtr(new COO(meta_graph(), std::get<0>(ret)));
1799
1800
1801
      break;
    }
    case SparseFormat::kCSR: {
1802
      auto ret = aten::CSRToSimple(GetOutCSR()->adj());
1803
1804
      count = std::get<1>(ret);
      edge_map = std::get<2>(ret);
1805
      new_outcsr = CSRPtr(new CSR(meta_graph(), std::get<0>(ret)));
1806
1807
1808
      break;
    }
    case SparseFormat::kCSC: {
1809
      auto ret = aten::CSRToSimple(GetInCSR()->adj());
1810
1811
      count = std::get<1>(ret);
      edge_map = std::get<2>(ret);
1812
      new_incsr = CSRPtr(new CSR(meta_graph(), std::get<0>(ret)));
1813
1814
1815
1816
1817
1818
1819
1820
1821
1822
1823
1824
      break;
    }
    default:
      LOG(FATAL) << "At lease one of COO, CSR or CSC adj should exist.";
      break;
  }

  return std::make_tuple(UnitGraphPtr(new UnitGraph(meta_graph(), new_incsr, new_outcsr, new_coo)),
                         count,
                         edge_map);
}

1825
}  // namespace dgl