Unverified Commit b576e617 authored by Quan (Andy) Gan, committed by GitHub
Browse files

[Feature] Add left normalizer for GCN (#3114)

* add left normalizer for gcn

* fix

* fixes and some bug stuff
parent fac75e16
...@@ -12,6 +12,8 @@ Requirements ...@@ -12,6 +12,8 @@ Requirements
pip install -r requirements.txt pip install -r requirements.txt
``` ```
Also requires PyTorch 1.7.0+.
Datasets Datasets
-------- --------
......
...@@ -14,7 +14,10 @@ from ... import backend as F ...@@ -14,7 +14,10 @@ from ... import backend as F
from ...base import DGLError from ...base import DGLError
from ...utils import to_dgl_context from ...utils import to_dgl_context
__all__ = ['NodeDataLoader', 'EdgeDataLoader', 'GraphDataLoader'] __all__ = ['NodeDataLoader', 'EdgeDataLoader', 'GraphDataLoader',
# Temporary exposure.
'_pop_subgraph_storage', '_pop_blocks_storage',
'_restore_subgraph_storage', '_restore_blocks_storage']
PYTORCH_VER = LooseVersion(th.__version__) PYTORCH_VER = LooseVersion(th.__version__)
PYTORCH_16 = PYTORCH_VER >= LooseVersion("1.6.0") PYTORCH_16 = PYTORCH_VER >= LooseVersion("1.6.0")
......
...@@ -32,10 +32,18 @@ class GraphConv(gluon.Block): ...@@ -32,10 +32,18 @@ class GraphConv(gluon.Block):
out_feats : int out_feats : int
Output feature size; i.e., the number of dimensions of :math:`h_i^{(l+1)}`. Output feature size; i.e., the number of dimensions of :math:`h_i^{(l+1)}`.
norm : str, optional norm : str, optional
How to apply the normalizer. If is `'right'`, divide the aggregated messages How to apply the normalizer. Can be one of the following values:
by each node's in-degrees, which is equivalent to averaging the received messages.
If is `'none'`, no normalization is applied. Default is `'both'`, * ``right``, to divide the aggregated messages by each node's in-degrees,
where the :math:`c_{ij}` in the paper is applied. which is equivalent to averaging the received messages.
* ``none``, where no normalization is applied.
* ``both`` (default), where the messages are scaled with :math:`1/c_{ji}` above, equivalent
to symmetric normalization.
* ``left``, to divide the messages sent out from each node by its out-degrees,
equivalent to random walk normalization.
weight : bool, optional weight : bool, optional
If True, apply a linear layer. Otherwise, aggregating the messages If True, apply a linear layer. Otherwise, aggregating the messages
without a weight matrix. without a weight matrix.
...@@ -136,8 +144,8 @@ class GraphConv(gluon.Block): ...@@ -136,8 +144,8 @@ class GraphConv(gluon.Block):
activation=None, activation=None,
allow_zero_in_degree=False): allow_zero_in_degree=False):
super(GraphConv, self).__init__() super(GraphConv, self).__init__()
if norm not in ('none', 'both', 'right'): if norm not in ('none', 'both', 'right', 'left'):
raise DGLError('Invalid norm value. Must be either "none", "both" or "right".' raise DGLError('Invalid norm value. Must be either "none", "both", "right" or "left".'
' But got "{}".'.format(norm)) ' But got "{}".'.format(norm))
self._in_feats = in_feats self._in_feats = in_feats
self._out_feats = out_feats self._out_feats = out_feats
...@@ -230,15 +238,18 @@ class GraphConv(gluon.Block): ...@@ -230,15 +238,18 @@ class GraphConv(gluon.Block):
'suppress the check and let the code run.') 'suppress the check and let the code run.')
feat_src, feat_dst = expand_as_pair(feat, graph) feat_src, feat_dst = expand_as_pair(feat, graph)
if self._norm in ['both', 'left']:
if self._norm == 'both': degs = graph.out_degrees().as_in_context(feat_dst.context).astype('float32')
degs = graph.out_degrees().as_in_context(feat_src.context).astype('float32')
degs = mx.nd.clip(degs, a_min=1, a_max=float("inf")) degs = mx.nd.clip(degs, a_min=1, a_max=float("inf"))
norm = mx.nd.power(degs, -0.5) if self._norm == 'both':
norm = mx.nd.power(degs, -0.5)
else:
norm = 1.0 / degs
shp = norm.shape + (1,) * (feat_src.ndim - 1) shp = norm.shape + (1,) * (feat_src.ndim - 1)
norm = norm.reshape(shp) norm = norm.reshape(shp)
feat_src = feat_src * norm feat_src = feat_src * norm
if weight is not None: if weight is not None:
if self.weight is not None: if self.weight is not None:
raise DGLError('External weight is provided while at the same time the' raise DGLError('External weight is provided while at the same time the'
...@@ -264,7 +275,7 @@ class GraphConv(gluon.Block): ...@@ -264,7 +275,7 @@ class GraphConv(gluon.Block):
if weight is not None: if weight is not None:
rst = mx.nd.dot(rst, weight) rst = mx.nd.dot(rst, weight)
if self._norm != 'none': if self._norm in ['both', 'right']:
degs = graph.in_degrees().as_in_context(feat_dst.context).astype('float32') degs = graph.in_degrees().as_in_context(feat_dst.context).astype('float32')
degs = mx.nd.clip(degs, a_min=1, a_max=float("inf")) degs = mx.nd.clip(degs, a_min=1, a_max=float("inf"))
if self._norm == 'both': if self._norm == 'both':
......
...@@ -173,10 +173,18 @@ class GraphConv(nn.Module): ...@@ -173,10 +173,18 @@ class GraphConv(nn.Module):
out_feats : int out_feats : int
Output feature size; i.e., the number of dimensions of :math:`h_i^{(l+1)}`. Output feature size; i.e., the number of dimensions of :math:`h_i^{(l+1)}`.
norm : str, optional norm : str, optional
How to apply the normalizer. If is `'right'`, divide the aggregated messages How to apply the normalizer. Can be one of the following values:
by each node's in-degrees, which is equivalent to averaging the received messages.
If is `'none'`, no normalization is applied. Default is `'both'`, * ``right``, to divide the aggregated messages by each node's in-degrees,
where the :math:`c_{ji}` in the paper is applied. which is equivalent to averaging the received messages.
* ``none``, where no normalization is applied.
* ``both`` (default), where the messages are scaled with :math:`1/c_{ji}` above, equivalent
to symmetric normalization.
* ``left``, to divide the messages sent out from each node by its out-degrees,
equivalent to random walk normalization.
weight : bool, optional weight : bool, optional
If True, apply a linear layer. Otherwise, aggregating the messages If True, apply a linear layer. Otherwise, aggregating the messages
without a weight matrix. without a weight matrix.
...@@ -270,8 +278,8 @@ class GraphConv(nn.Module): ...@@ -270,8 +278,8 @@ class GraphConv(nn.Module):
activation=None, activation=None,
allow_zero_in_degree=False): allow_zero_in_degree=False):
super(GraphConv, self).__init__() super(GraphConv, self).__init__()
if norm not in ('none', 'both', 'right'): if norm not in ('none', 'both', 'right', 'left'):
raise DGLError('Invalid norm value. Must be either "none", "both" or "right".' raise DGLError('Invalid norm value. Must be either "none", "both", "right" or "left".'
' But got "{}".'.format(norm)) ' But got "{}".'.format(norm))
self._in_feats = in_feats self._in_feats = in_feats
self._out_feats = out_feats self._out_feats = out_feats
...@@ -395,9 +403,12 @@ class GraphConv(nn.Module): ...@@ -395,9 +403,12 @@ class GraphConv(nn.Module):
# (BarclayII) For RGCN on heterogeneous graphs we need to support GCN on bipartite. # (BarclayII) For RGCN on heterogeneous graphs we need to support GCN on bipartite.
feat_src, feat_dst = expand_as_pair(feat, graph) feat_src, feat_dst = expand_as_pair(feat, graph)
if self._norm == 'both': if self._norm in ['left', 'both']:
degs = graph.out_degrees().float().clamp(min=1) degs = graph.out_degrees().float().clamp(min=1)
norm = th.pow(degs, -0.5) if self._norm == 'both':
norm = th.pow(degs, -0.5)
else:
norm = 1.0 / degs
shp = norm.shape + (1,) * (feat_src.dim() - 1) shp = norm.shape + (1,) * (feat_src.dim() - 1)
norm = th.reshape(norm, shp) norm = th.reshape(norm, shp)
feat_src = feat_src * norm feat_src = feat_src * norm
...@@ -425,7 +436,7 @@ class GraphConv(nn.Module): ...@@ -425,7 +436,7 @@ class GraphConv(nn.Module):
if weight is not None: if weight is not None:
rst = th.matmul(rst, weight) rst = th.matmul(rst, weight)
if self._norm != 'none': if self._norm in ['right', 'both']:
degs = graph.in_degrees().float().clamp(min=1) degs = graph.in_degrees().float().clamp(min=1)
if self._norm == 'both': if self._norm == 'both':
norm = th.pow(degs, -0.5) norm = th.pow(degs, -0.5)
......
...@@ -34,10 +34,18 @@ class GraphConv(layers.Layer): ...@@ -34,10 +34,18 @@ class GraphConv(layers.Layer):
out_feats : int out_feats : int
Output feature size; i.e., the number of dimensions of :math:`h_i^{(l+1)}`. Output feature size; i.e., the number of dimensions of :math:`h_i^{(l+1)}`.
norm : str, optional norm : str, optional
How to apply the normalizer. If is `'right'`, divide the aggregated messages How to apply the normalizer. Can be one of the following values:
by each node's in-degrees, which is equivalent to averaging the received messages.
If is `'none'`, no normalization is applied. Default is `'both'`, * ``right``, to divide the aggregated messages by each node's in-degrees,
where the :math:`c_{ij}` in the paper is applied. which is equivalent to averaging the received messages.
* ``none``, where no normalization is applied.
* ``both`` (default), where the messages are scaled with :math:`1/c_{ji}` above, equivalent
to symmetric normalization.
* ``left``, to divide the messages sent out from each node by its out-degrees,
equivalent to random walk normalization.
weight : bool, optional weight : bool, optional
If True, apply a linear layer. Otherwise, aggregating the messages If True, apply a linear layer. Otherwise, aggregating the messages
without a weight matrix. without a weight matrix.
...@@ -137,8 +145,8 @@ class GraphConv(layers.Layer): ...@@ -137,8 +145,8 @@ class GraphConv(layers.Layer):
activation=None, activation=None,
allow_zero_in_degree=False): allow_zero_in_degree=False):
super(GraphConv, self).__init__() super(GraphConv, self).__init__()
if norm not in ('none', 'both', 'right'): if norm not in ('none', 'both', 'right', 'left'):
raise DGLError('Invalid norm value. Must be either "none", "both" or "right".' raise DGLError('Invalid norm value. Must be either "none", "both", "right" or "left".'
' But got "{}".'.format(norm)) ' But got "{}".'.format(norm))
self._in_feats = in_feats self._in_feats = in_feats
self._out_feats = out_feats self._out_feats = out_feats
...@@ -230,13 +238,15 @@ class GraphConv(layers.Layer): ...@@ -230,13 +238,15 @@ class GraphConv(layers.Layer):
'suppress the check and let the code run.') 'suppress the check and let the code run.')
feat_src, feat_dst = expand_as_pair(feat, graph) feat_src, feat_dst = expand_as_pair(feat, graph)
if self._norm in ['both', 'left']:
if self._norm == 'both':
degs = tf.clip_by_value(tf.cast(graph.out_degrees(), tf.float32), degs = tf.clip_by_value(tf.cast(graph.out_degrees(), tf.float32),
clip_value_min=1, clip_value_min=1,
clip_value_max=np.inf) clip_value_max=np.inf)
norm = tf.pow(degs, -0.5) if self._norm == 'both':
shp = norm.shape + (1,) * (feat_src.ndim - 1) norm = tf.pow(degs, -0.5)
else:
norm = 1.0 / degs
shp = norm.shape + (1,) * (feat_dst.ndim - 1)
norm = tf.reshape(norm, shp) norm = tf.reshape(norm, shp)
feat_src = feat_src * norm feat_src = feat_src * norm
...@@ -265,7 +275,7 @@ class GraphConv(layers.Layer): ...@@ -265,7 +275,7 @@ class GraphConv(layers.Layer):
if weight is not None: if weight is not None:
rst = tf.matmul(rst, weight) rst = tf.matmul(rst, weight)
if self._norm != 'none': if self._norm in ['both', 'right']:
degs = tf.clip_by_value(tf.cast(graph.in_degrees(), tf.float32), degs = tf.clip_by_value(tf.cast(graph.in_degrees(), tf.float32),
clip_value_min=1, clip_value_min=1,
clip_value_max=np.inf) clip_value_max=np.inf)
......
...@@ -81,7 +81,7 @@ def test_graph_conv(idtype, out_dim): ...@@ -81,7 +81,7 @@ def test_graph_conv(idtype, out_dim):
@parametrize_dtype @parametrize_dtype
@pytest.mark.parametrize('g', get_cases(['homo', 'block-bipartite'], exclude=['zero-degree', 'dglgraph'])) @pytest.mark.parametrize('g', get_cases(['homo', 'block-bipartite'], exclude=['zero-degree', 'dglgraph']))
@pytest.mark.parametrize('norm', ['none', 'both', 'right']) @pytest.mark.parametrize('norm', ['none', 'both', 'right', 'left'])
@pytest.mark.parametrize('weight', [True, False]) @pytest.mark.parametrize('weight', [True, False])
@pytest.mark.parametrize('bias', [False]) @pytest.mark.parametrize('bias', [False])
@pytest.mark.parametrize('out_dim', [1, 2]) @pytest.mark.parametrize('out_dim', [1, 2])
......
...@@ -81,7 +81,7 @@ def test_graph_conv0(out_dim): ...@@ -81,7 +81,7 @@ def test_graph_conv0(out_dim):
@parametrize_dtype @parametrize_dtype
@pytest.mark.parametrize('g', get_cases(['homo', 'bipartite'], exclude=['zero-degree', 'dglgraph'])) @pytest.mark.parametrize('g', get_cases(['homo', 'bipartite'], exclude=['zero-degree', 'dglgraph']))
@pytest.mark.parametrize('norm', ['none', 'both', 'right']) @pytest.mark.parametrize('norm', ['none', 'both', 'right', 'left'])
@pytest.mark.parametrize('weight', [True, False]) @pytest.mark.parametrize('weight', [True, False])
@pytest.mark.parametrize('bias', [True, False]) @pytest.mark.parametrize('bias', [True, False])
@pytest.mark.parametrize('out_dim', [1, 2]) @pytest.mark.parametrize('out_dim', [1, 2])
......
...@@ -74,7 +74,7 @@ def test_graph_conv(out_dim): ...@@ -74,7 +74,7 @@ def test_graph_conv(out_dim):
@parametrize_dtype @parametrize_dtype
@pytest.mark.parametrize('g', get_cases(['homo', 'block-bipartite'], exclude=['zero-degree', 'dglgraph'])) @pytest.mark.parametrize('g', get_cases(['homo', 'block-bipartite'], exclude=['zero-degree', 'dglgraph']))
@pytest.mark.parametrize('norm', ['none', 'both', 'right']) @pytest.mark.parametrize('norm', ['none', 'both', 'right', 'left'])
@pytest.mark.parametrize('weight', [True, False]) @pytest.mark.parametrize('weight', [True, False])
@pytest.mark.parametrize('bias', [True, False]) @pytest.mark.parametrize('bias', [True, False])
@pytest.mark.parametrize('out_dim', [1, 2]) @pytest.mark.parametrize('out_dim', [1, 2])
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment