[Performance] Only copy and slice indices in subcolumn when data is used. (#2930)

* Make column double indices lazy
* Copy indices to proper contexts
* Fix initialization
* Add unit test
* Fix unit test for tensorflow
* Remove unused member

Co-authored-by: Quan (Andy) Gan <coin2028@hotmail.com>

[Performance] Only copy and slice indices in subcolumn when data is used. (#2930)
* Make column double indices lazy
* Copy indices to proper contexts
* Fix initialization
* Add unit test
* Fix unit test for tensorflow
* Remove unused member

Co-authored-by: Quan (Andy) Gan <coin2028@hotmail.com>
a53783c8 · nv-dlasalle · GitHub · 6476b829 · a53783c8 · a53783c8
Unverified Commit a53783c8 authored Aug 30, 2021 by nv-dlasalle Committed by GitHub Aug 30, 2021
Hide whitespace changes
Inline Side-by-side

Showing with 80 additions and 10 deletions

python/dgl/frame.py python/dgl/frame.py +41 -10

tests/compute/test_frame.py tests/compute/test_frame.py +39 -0

No files found.
--- a/python/dgl/frame.py
+++ b/python/dgl/frame.py
@@ -8,6 +8,36 @@ from . import backend as F
 from .base import DGLError, dgl_warning
 from .init import zero_initializer
+class _LazyIndex(object):
+    def __init__(self, index):
+        if isinstance(index, list):
+            self._indices = index
+        else:
+            self._indices = [index]
+    def __len__(self):
+        return len(self._indices[-1])
+    def slice(self, index):
+        """ Create a new _LazyIndex object sliced by the given index tensor.
+        """
+        # if our indices are in the same context, lets just slice now and free
+        # memory, otherwise do nothing until we have to
+        if F.context(self._indices[-1]) == F.context(index):
+            return _LazyIndex(self._indices[:-1] + [F.gather_row(self._indices[-1], index)])
+        return _LazyIndex(self._indices + [index])
+    def flatten(self):
+        """ Evaluate the chain of indices, and return a single index tensor.
+        """
+        flat_index = self._indices[0]
+        # here we actually need to resolve it
+        for index in self._indices[1:]:
+            if F.context(index) != F.context(flat_index):
+                index = F.copy_to(index, F.context(flat_index))
+            flat_index = F.gather_row(flat_index, index)
+        return flat_index
 class Scheme(namedtuple('Scheme', ['shape', 'dtype'])):
    """The column scheme.
@@ -111,6 +141,8 @@ class Column(object):
    def data(self):
        """Return the feature data. Perform index selecting if needed."""
        if self.index is not None:
+            if isinstance(self.index, _LazyIndex):
+                self.index = self.index.flatten()
            # If index and storage is not in the same context,
            # copy index to the same context of storage.
            # Copy index is usually cheaper than copy data
@@ -237,9 +269,10 @@ class Column(object):
        """Return a subcolumn.
        The resulting column will share the same storage as this column so this operation
-        is quite efficient. If the current column is also a sub-column (i.e., the
+        is quite efficient. If the current column is also a sub-column (i.e.,
-        index tensor is not None), it slices the index tensor with the given
+        the index tensor is not None), the current index tensor will be sliced
-        rowids as the index tensor of the resulting column.
+        by 'rowids', if they are on the same context. Otherwise, both index
+        tensors are saved, and only applied when the data is accessed.
        Parameters
        ----------
@@ -254,13 +287,11 @@ class Column(object):
        if self.index is None:
            return Column(self.storage, self.scheme, rowids, self.device)
        else:
-            if F.context(self.index) != F.context(rowids):
+            index = self.index
-                # make sure index and row ids are on the same context
+            if not isinstance(index, _LazyIndex):
-                kwargs = {}
+                index = _LazyIndex(self.index)
-                if self.device is not None:
+            index = index.slice(rowids)
-                    kwargs = self.device[1]
+            return Column(self.storage, self.scheme, index, self.device)
-                rowids = F.copy_to(rowids, F.context(self.index), **kwargs)
-            return Column(self.storage, self.scheme, F.gather_row(self.index, rowids), self.device)
    @staticmethod
    def create(data):

--- a/tests/compute/test_frame.py
+++ b/tests/compute/test_frame.py
+import dgl
+import dgl.ndarray as nd
+from dgl.frame import Column
+import numpy as np
+import backend as F
+import unittest
+from test_utils import parametrize_dtype
+def test_column_subcolumn():
+    """Check nested ``Column.subcolumn`` calls against explicit row gathers.
+    Three subcolumns are derived one from another. After each step the test
+    checks the subcolumn length and compares its ``.data`` with
+    ``F.gather_row`` applied to the full data using a hand-composed index.
+    NOTE(review): the ``.data`` reads are interleaved with the ``subcolumn``
+    calls, and reading ``.data`` may replace a column's stored index, so the
+    statement order looks significant -- confirm before reordering.
+    """
+    # 5 rows x 4 features, placed on the context under test
+    data = F.copy_to(F.tensor([[1., 1., 1., 1.],
+                               [0., 2., 9., 0.],
+                               [3., 2., 1., 0.],
+                               [1., 1., 1., 1.],
+                               [0., 2., 4., 0.]]), F.ctx())
+    original = Column(data)
+    # subcolumn from cpu context (i1 is not copied to F.ctx())
+    i1 = F.tensor([0, 2, 1, 3], dtype=F.int64)
+    l1 = original.subcolumn(i1)
+    assert len(l1) == i1.shape[0]
+    assert F.array_equal(l1.data, F.gather_row(data, i1))
+    # next subcolumn from target context
+    i2 = F.copy_to(F.tensor([0, 2], dtype=F.int64), F.ctx())
+    l2 = l1.subcolumn(i2)
+    assert len(l2) == i2.shape[0]
+    # expected index: i2 applied to i1 on i1's context, then moved to F.ctx()
+    i1i2 = F.copy_to(F.gather_row(i1, F.copy_to(i2, F.context(i1))), F.ctx())
+    assert F.array_equal(l2.data, F.gather_row(data,i1i2))
+    # next subcolumn also from target context
+    i3 = F.copy_to(F.tensor([1], dtype=F.int64), F.ctx())
+    l3 = l2.subcolumn(i3)
+    assert len(l3) == i3.shape[0]
+    # expected index: i3 applied to the composed i1i2 index
+    i1i2i3 = F.copy_to(F.gather_row(i1i2, F.copy_to(i3, F.context(i1i2))), F.ctx())
+    assert F.array_equal(l3.data, F.gather_row(data, i1i2i3))