Unverified Commit fa1478a4 authored by Da Zheng, committed by GitHub

[BUGFIX] fix a bug in partition book. (#1698)

* Fix ID handling in GraphPartitionBook and RangePartitionBook.

* Add messages to the new asserts.
parent b6c4deb4
@@ -98,12 +98,16 @@ class GraphPartitionBook:
     def __init__(self, part_id, num_parts, node_map, edge_map, part_graph):
         assert part_id >= 0, 'part_id cannot be a negative number.'
         assert num_parts > 0, 'num_parts must be greater than zero.'
-        self._part_id = part_id
-        self._num_partitions = num_parts
+        self._part_id = int(part_id)
+        self._num_partitions = int(num_parts)
         node_map = utils.toindex(node_map)
         self._nid2partid = node_map.tousertensor()
+        assert F.dtype(self._nid2partid) in (F.int32, F.int64), \
+            'the node map must be stored in an integer array'
         edge_map = utils.toindex(edge_map)
         self._eid2partid = edge_map.tousertensor()
+        assert F.dtype(self._eid2partid) in (F.int32, F.int64), \
+            'the edge map must be stored in an integer array'
         # Get meta data of the partition book.
         self._partition_meta_data = []
         _, nid_count = np.unique(F.asnumpy(self._nid2partid), return_counts=True)
@@ -147,8 +151,8 @@ class GraphPartitionBook:
         g2l = F.scatter_row(g2l, global_id, F.arange(0, len(global_id)))
         self._eidg2l[self._part_id] = g2l
         # node size and edge size
-        self._edge_size = len(self.partid2eids(part_id))
-        self._node_size = len(self.partid2nids(part_id))
+        self._edge_size = len(self.partid2eids(self._part_id))
+        self._node_size = len(self.partid2nids(self._part_id))

     def shared_memory(self, graph_name):
         """Move data to shared memory.
@@ -538,8 +542,10 @@ class RangePartitionBook:
             raise RuntimeError('Now RangePartitionBook does not support \
                                getting remote tensor of nid2localnid.')
+        nids = utils.toindex(nids)
+        nids = nids.tousertensor()
         start = self._node_map[partid - 1] if partid > 0 else 0
-        return nids - start
+        return nids - int(start)

     def eid2localeid(self, eids, partid):
@@ -561,8 +567,10 @@ class RangePartitionBook:
             raise RuntimeError('Now RangePartitionBook does not support \
                                getting remote tensor of eid2localeid.')
+        eids = utils.toindex(eids)
+        eids = eids.tousertensor()
         start = self._edge_map[partid - 1] if partid > 0 else 0
-        return eids - start
+        return eids - int(start)
def get_partition(self, partid): def get_partition(self, partid):
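The nid2localnid/eid2localeid fixes convert the incoming IDs to a tensor and subtract the partition's start offset as a plain int, so the result keeps the IDs' integer dtype. Conceptually, a range partition book stores cumulative ID counts per partition and maps global IDs to local ones by offset arithmetic. The following is a minimal numpy sketch of that arithmetic only; it is not DGL's implementation, and the array values are made up.

import numpy as np

# Cumulative node counts: partitions 0, 1, 2 own 4, 3 and 5 nodes.
node_map = np.array([4, 7, 12])

def nid2partid(nids):
    # A global ID belongs to the first range that ends beyond it.
    return np.searchsorted(node_map, nids, side='right')

def nid2localnid(nids, partid):
    # Partition `partid` owns the global IDs [start, node_map[partid]).
    start = node_map[partid - 1] if partid > 0 else 0
    # Subtracting int(start) keeps the result in the IDs' integer dtype.
    return np.asarray(nids) - int(start)

assert list(nid2partid([0, 3, 4, 11])) == [0, 0, 1, 2]
assert list(nid2localnid([7, 8, 11], 2)) == [0, 1, 4]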
...
@@ -45,19 +45,23 @@ def check_partition(reshuffle):
         part_sizes.append((gpb_meta[i]['num_nodes'], gpb_meta[i]['num_edges']))
         local_nid = gpb.nid2localnid(F.boolean_mask(part_g.ndata[dgl.NID], part_g.ndata['inner_node']), i)
+        assert F.dtype(local_nid) in (F.int64, F.int32)
         assert np.all(F.asnumpy(local_nid) == np.arange(0, len(local_nid)))
         local_eid = gpb.eid2localeid(F.boolean_mask(part_g.edata[dgl.EID], part_g.edata['inner_edge']), i)
+        assert F.dtype(local_eid) in (F.int64, F.int32)
         assert np.all(F.asnumpy(local_eid) == np.arange(0, len(local_eid)))
         # Check the node map.
         local_nodes = F.boolean_mask(part_g.ndata[dgl.NID], part_g.ndata['inner_node'])
         llocal_nodes = F.nonzero_1d(part_g.ndata['inner_node'])
         local_nodes1 = gpb.partid2nids(i)
+        assert F.dtype(local_nodes1) in (F.int32, F.int64)
         assert np.all(np.sort(F.asnumpy(local_nodes)) == np.sort(F.asnumpy(local_nodes1)))
         # Check the edge map.
         local_edges = F.boolean_mask(part_g.edata[dgl.EID], part_g.edata['inner_edge'])
         local_edges1 = gpb.partid2eids(i)
+        assert F.dtype(local_edges1) in (F.int32, F.int64)
         assert np.all(np.sort(F.asnumpy(local_edges)) == np.sort(F.asnumpy(local_edges1)))
         if reshuffle:
@@ -93,8 +97,12 @@ def check_partition(reshuffle):
         edge_map.append(np.ones(num_edges) * i)
     node_map = np.concatenate(node_map)
     edge_map = np.concatenate(edge_map)
-    assert np.all(F.asnumpy(gpb.nid2partid(F.arange(0, len(node_map)))) == node_map)
-    assert np.all(F.asnumpy(gpb.eid2partid(F.arange(0, len(edge_map)))) == edge_map)
+    nid2pid = gpb.nid2partid(F.arange(0, len(node_map)))
+    assert F.dtype(nid2pid) in (F.int32, F.int64)
+    assert np.all(F.asnumpy(nid2pid) == node_map)
+    eid2pid = gpb.eid2partid(F.arange(0, len(edge_map)))
+    assert F.dtype(eid2pid) in (F.int32, F.int64)
+    assert np.all(F.asnumpy(eid2pid) == edge_map)

 def test_partition():
     check_partition(True)
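The extra asserts in the test pin down the property the fix restores: IDs coming back from the partition book stay integer-typed, and each partition's own nodes map onto the contiguous local range 0..n-1. A standalone numpy check of that property, using the same made-up cumulative counts as the sketch above (illustrative only, not the real test):

import numpy as np

# Toy range partition: cumulative node counts per partition (made-up values).
node_map = np.array([4, 7, 12])

for i in range(len(node_map)):
    start = int(node_map[i - 1]) if i > 0 else 0
    owned = np.arange(start, int(node_map[i]))        # global IDs owned by partition i
    local = owned - start                             # what nid2localnid should return
    assert np.issubdtype(local.dtype, np.integer)     # the dtype check added to the test
    assert np.all(local == np.arange(0, len(local)))  # contiguous 0..n-1 range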
...