import numpy as np
from dgl.frame import Frame, FrameRef
from dgl.utils import Index, toindex
import backend as F

# Row count shared by the tests: first dimension of the tensors built in
# create_test_data and the preset ``num_rows`` used by test_create.
N = 10
# Second dimension of the tensors built in create_test_data.
D = 5
def check_fail(fn):
    """Report whether calling ``fn`` raises an exception.

    Parameters
    ----------
    fn : callable
        Zero-argument callable to invoke.

    Returns
    -------
    bool
        True if ``fn()`` raised an ``Exception``; False if it returned
        normally.
    """
    try:
        fn()
    except Exception:
        # Only ordinary errors count as the expected failure. KeyboardInterrupt
        # and SystemExit derive from BaseException and keep propagating
        # instead of being reported as a passing "failure".
        return True
    return False

def create_test_data(grad=False):
    """Build three random (N, D) tensors keyed 'a1', 'a2' and 'a3'.

    When ``grad`` is true, each tensor is passed through ``F.attach_grad``
    before being returned.
    """
    names = ('a1', 'a2', 'a3')
    # Draw all tensors first, then attach gradients, as the original did.
    tensors = [F.randn((N, D)) for _ in names]
    if grad:
        tensors = [F.attach_grad(t) for t in tensors]
    return dict(zip(names, tensors))

def test_create():
    """Create frames column-by-column and from a dict, then clear one."""
    columns = create_test_data()
    expected_keys = set(columns.keys())

    # Frame with a preset row count, filled one column at a time.
    incremental = Frame(num_rows=N)
    for name in columns:
        incremental.update_column(name, columns[name])
    print(incremental.schemes)
    assert incremental.keys() == expected_keys
    assert incremental.num_columns == 3
    assert incremental.num_rows == N

    # Frame built directly from the dict of columns.
    from_dict = Frame(columns)
    assert from_dict.keys() == expected_keys
    assert from_dict.num_columns == 3
    assert from_dict.num_rows == N

    # Clearing drops both the schemes and the row count.
    incremental.clear()
    assert len(incremental.schemes) == 0
    assert incremental.num_rows == 0

def test_column1():
    """Exercise the column getter, setter and deleter of ``Frame``."""
    data = create_test_data()
    f = Frame(data)
    assert f.num_rows == N
    assert len(f) == 3
    assert F.allclose(f['a1'].data, data['a1'])

    f['a1'] = data['a2']
    # The overwritten column must now hold the newly assigned values. The
    # original only re-checked 'a2', which never exercised the setter.
    assert F.allclose(f['a1'].data, data['a2'])
    # The column that was not assigned to must be unchanged.
    assert F.allclose(f['a2'].data, data['a2'])

    # add a different length column should fail
    def failed_add_col():
        f['a4'] = F.zeros([N+1, D])
    assert check_fail(failed_add_col)

    # delete all the columns
    del f['a1']
    del f['a2']
    assert len(f) == 1
    del f['a3']
    assert len(f) == 0

def test_column2():
    """Exercise the column getter and setter of ``FrameRef``."""
    data = Frame(create_test_data())
    f = FrameRef(data, toindex([3, 4, 5, 6, 7]))
    assert f.num_rows == 5
    assert len(f) == 3
    assert F.allclose(f['a1'], F.narrow_row(data['a1'].data, 3, 8))

    # set column should reflect on the referenced data
    f['a1'] = F.zeros([5, D])
    assert F.allclose(F.narrow_row(data['a1'].data, 3, 8), F.zeros([5, D]))

    # add new partial column should fail with error initializer
    def error_initializer(shape, dtype):
        # Raise explicitly. The original lambda called ``assert_``, which is
        # not defined in this module, so it only failed via a NameError.
        raise RuntimeError('column initializer should not be invoked')
    f.set_initializer(error_initializer)

    def failed_add_col():
        f['a4'] = F.ones([5, D])
    assert check_fail(failed_add_col)
def test_append1():
    """Exercise ``Frame.append`` with a dict and with another frame."""
    columns = create_test_data()
    target = Frame()
    other = Frame(columns)

    # Appending a dict to an empty frame yields N rows.
    target.append(columns)
    assert target.num_rows == N

    # Appending a frame with the same columns doubles the row count.
    target.append(other)
    assert target.num_rows == 2 * N

    col_a1 = target['a1']
    assert tuple(F.shape(col_a1.data)) == (2 * N, D)
    expected = F.cat([columns['a1'], columns['a1']], 0)
    assert F.allclose(expected, col_a1.data)

    # append dict of different length columns should fail
    ragged = {
        'a1': F.zeros((3, D)),
        'a2': F.zeros((3, D)),
        'a3': F.zeros((2, D)),
    }
    assert check_fail(lambda: target.append(ragged))

def test_append2():
    """Exercise ``append`` through a ``FrameRef`` and on its backing frame."""
    storage = Frame(create_test_data())
    ref = FrameRef(storage)
    assert ref.is_contiguous()
    assert ref.is_span_whole_column()
    assert ref.num_rows == N

    # append on the underlying frame should not reflect on the ref
    storage.append(storage)
    assert ref.is_contiguous()
    assert not ref.is_span_whole_column()
    assert ref.num_rows == N

    # append on the FrameRef should work
    ref.append(storage)
    assert not ref.is_contiguous()
    assert not ref.is_span_whole_column()
    assert ref.num_rows == 3 * N

    # Expected index: rows [0, N) followed by rows [2N, 4N).
    expected_rows = [i for i in range(4 * N) if not N <= i < 2 * N]
    expected_index = F.tensor(expected_rows, dtype=F.int64)
    assert F.array_equal(ref._index.tousertensor(), expected_index)
    assert storage.num_rows == 4 * N

def test_append3():
    """Append to a frame that has preset rows but no columns yet."""
    frame = Frame(num_rows=5)

    # First append introduces column 'h'; the 5 preset rows are expected
    # to compare equal to zeros.
    frame.append({'h': F.ones((3, 2))})
    assert frame.num_rows == 8
    expected_h = F.cat([F.zeros((5, 2)), F.ones((3, 2))], 0)
    assert F.allclose(frame['h'].data, expected_h)

    # test append with new column
    frame.append({'h': 2 * F.ones((3, 2)), 'w': 2 * F.ones((3, 2))})
    assert frame.num_rows == 11
    expected_h_after = F.cat([expected_h, 2 * F.ones((3, 2))], 0)
    expected_w_after = F.cat([F.zeros((8, 2)), 2 * F.ones((3, 2))], 0)
    assert F.allclose(frame['h'].data, expected_h_after)
    assert F.allclose(frame['w'].data, expected_w_after)
def test_row1():
    """Exercise the row getter and setter of ``FrameRef``."""
    data = create_test_data()
    f = FrameRef(Frame(data))

    # getter: first with non-duplicate keys, then with duplicate keys
    for ids in ([0, 2], [8, 2, 2, 1]):
        rowid = Index(F.tensor(ids))
        rows = f[rowid]
        for k, v in rows.items():
            assert tuple(F.shape(v)) == (len(rowid), D)
            assert F.allclose(v, F.gather_row(data[k], rowid.tousertensor()))

    # setter
    rowid = Index(F.tensor([0, 2, 4]))
    vals = {'a1' : F.zeros((len(rowid), D)),
            'a2' : F.zeros((len(rowid), D)),
            'a3' : F.zeros((len(rowid), D)),
            }
    f[rowid] = vals
    for k, v in f[rowid].items():
        assert F.allclose(v, F.zeros((len(rowid), D)))

    # setting rows with new column should raise error with error initializer
    def error_initializer(shape, dtype):
        # Raise explicitly. The original lambda called ``assert_``, which is
        # not defined in this module, so it only failed via a NameError.
        raise RuntimeError('column initializer should not be invoked')
    f.set_initializer(error_initializer)

    def failed_update_rows():
        vals['a4'] = F.ones((len(rowid), D))
        f[rowid] = vals
    assert check_fail(failed_update_rows)
def test_row2():
    """Check that the row getter and setter cooperate with autograd."""
    columns = create_test_data(grad=True)
    ref = FrameRef(Frame(columns))

    # getter, non-duplicate keys: each selected row receives gradient 1
    with F.record_grad():
        col = ref['a1']
        rowid = Index(F.tensor([0, 2]))
        picked = ref[rowid]
        out = picked['a1']
    F.backward(out, F.ones((len(rowid), D)))
    expected = F.tensor([1., 0., 1., 0., 0., 0., 0., 0., 0., 0.])
    assert F.allclose(F.grad(col)[:,0], expected)

    # getter, duplicate keys: row 2 is selected twice and accumulates 2
    ref['a1'] = F.attach_grad(ref['a1'])
    with F.record_grad():
        col = ref['a1']
        rowid = Index(F.tensor([8, 2, 2, 1]))
        picked = ref[rowid]
        out = picked['a1']
    F.backward(out, F.ones((len(rowid), D)))
    expected = F.tensor([0., 1., 2., 0., 0., 0., 0., 0., 1., 0.])
    assert F.allclose(F.grad(col)[:,0], expected)

    # setter: overwritten rows get no gradient, the written values do
    ref['a1'] = F.attach_grad(ref['a1'])
    with F.record_grad():
        col = ref['a1']
        rowid = Index(F.tensor([0, 2, 4]))
        vals = {
            'a1': F.attach_grad(F.zeros((len(rowid), D))),
            'a2': F.attach_grad(F.zeros((len(rowid), D))),
            'a3': F.attach_grad(F.zeros((len(rowid), D))),
        }
        ref[rowid] = vals
        col_after = ref['a1']
    F.backward(col_after, F.ones((N, D)))
    expected = F.tensor([0., 1., 0., 1., 0., 1., 1., 1., 1., 1.])
    assert F.allclose(F.grad(col)[:,0], expected)
    assert F.allclose(F.grad(vals['a1']), F.ones((len(rowid), D)))
    assert F.is_no_grad(vals['a2'])
def test_row3():
    """Delete rows through a ``FrameRef`` and check the backing frame."""
    storage = Frame(create_test_data())
    ref = FrameRef(storage)
    assert ref.is_contiguous()
    assert ref.is_span_whole_column()
    assert ref.num_rows == N

    del ref[toindex(F.tensor([2, 3]))]
    assert not ref.is_contiguous()
    assert not ref.is_span_whole_column()
    # delete is lazy: only reflect on the ref while the
    # underlying storage should not be touched
    assert ref.num_rows == N - 2
    assert storage.num_rows == N

    # Every row except the two deleted ones, in order.
    kept = toindex([i for i in range(N) if i not in (2, 3)])
    for name, value in ref.items():
        assert F.allclose(value, storage[name][kept])
def test_row4():
    """Set rows on a column-less frame that has a preset ``num_rows``."""
    ref = FrameRef(Frame(num_rows=5))
    target_rows = Index(F.tensor([0, 2, 4]))
    ref[target_rows] = {'h': F.ones((3, 2))}

    # Expected column: zeros everywhere except the three written rows.
    expected = F.zeros((5, 2))
    expected[F.tensor([0, 2, 4])] = F.ones((3, 2))
    assert F.allclose(ref['h'], expected)
def test_sharing():
    """Two list-indexed ``FrameRef`` objects over one frame share storage."""
    storage = Frame(create_test_data())
    names = ('a1', 'a2', 'a3')
    first = FrameRef(storage, index=toindex([0, 1, 2, 3]))
    second = FrameRef(storage, index=toindex([2, 3, 4, 5, 6]))

    # test read
    for name, value in first.items():
        assert F.allclose(F.narrow_row(storage[name].data, 0, 4), value)
    for name, value in second.items():
        assert F.allclose(F.narrow_row(storage[name].data, 2, 7), value)
    second_a1 = second['a1']

    # test write
    # update own ref should not been seen by the other.
    zeros = {name: F.zeros([2, D]) for name in names}
    first[Index(F.tensor([0, 1]))] = zeros
    assert F.allclose(second['a1'], second_a1)

    # update shared space should been seen by the other.
    ones = {name: F.ones([2, D]) for name in names}
    first[Index(F.tensor([2, 3]))] = ones
    # Mirror the write on the saved snapshot before comparing.
    F.narrow_row_set(second_a1, 0, 2, F.ones([2, D]))
    assert F.allclose(second['a1'], second_a1)
def test_slicing():
    """Two slice-indexed ``FrameRef`` objects over one frame share storage."""
    storage = Frame(create_test_data(grad=True))
    names = ('a1', 'a2', 'a3')
    first = FrameRef(storage, index=toindex(slice(1, 5)))
    second = FrameRef(storage, index=toindex(slice(3, 8)))

    # test read
    for name, value in first.items():
        assert F.allclose(F.narrow_row(storage[name].data, 1, 5), value)
    second_a1 = second['a1']    # is a tensor

    # test write
    # Rows 0-1 of the first ref lie outside the second ref's slice.
    zeros = {name: F.zeros([2, D]) for name in names}
    first[Index(F.tensor([0, 1]))] = zeros
    assert F.allclose(second['a1'], second_a1)

    # Rows 2-3 of the first ref are rows 0-1 of the second ref.
    ones = {name: F.ones([2, D]) for name in names}
    first[Index(F.tensor([2, 3]))] = ones
    F.narrow_row_set(second_a1, 0, 2, 1)
    assert F.allclose(second['a1'], second_a1)

    # Same overlapping rows, this time addressed with a slice index.
    zeros = {name: F.zeros([2, D]) for name in names}
    first[toindex(slice(2, 4))] = zeros
    F.narrow_row_set(second_a1, 0, 2, 0)
    assert F.allclose(second['a1'], second_a1)
def test_add_rows():
    """Grow an empty frame with ``add_rows`` and write into the new rows."""
    ref = FrameRef(Frame())
    ref.add_rows(4)

    # Writing one row creates column 'x'; the other three rows are expected
    # to compare equal to zeros.
    first_row = F.randn((1, 4))
    ref[Index(F.tensor([0]))] = {'x': first_row}
    expected_x = F.cat([first_row, F.zeros((3, 4))], 0)
    assert F.allclose(ref['x'], expected_x)

    # Add four more rows and fill them, introducing column 'y' as well.
    ref.add_rows(4)
    ref[toindex(slice(4, 8))] = {'x': F.ones((4, 4)), 'y': F.ones((4, 5))}
    expected_x = F.cat([expected_x, F.ones((4, 4))], 0)
    assert F.allclose(ref['x'], expected_x)
    expected_y = F.cat([F.zeros((4, 5)), F.ones((4, 5))], 0)
    assert F.allclose(ref['y'], expected_y)
def test_inplace():
    """Check which ``FrameRef`` updates replace the object the getter returns.

    Identity is compared through ``id`` of the value returned by the column
    getter before and after each update.
    """
    f = FrameRef(Frame(create_test_data()))
    print(f.schemes)
    addr_a1 = id(f['a1'])
    addr_a2 = id(f['a2'])
    addr_a3 = id(f['a3'])

    # column updates are always out-of-place
    f['a1'] = F.ones((N, D))
    latest_a1 = id(f['a1'])
    assert addr_a1 != latest_a1
    addr_a1 = latest_a1

    # full row update that becomes column update
    f[toindex(slice(0, N))] = {'a1': F.ones((N, D))}
    assert id(f['a1']) != addr_a1

    # row update (outplace) w/ slice
    f[toindex(slice(1, 4))] = {'a2': F.ones((3, D))}
    latest_a2 = id(f['a2'])
    assert addr_a2 != latest_a2
    addr_a2 = latest_a2

    # row update (outplace) w/ list
    f[toindex([1, 3, 5])] = {'a2': F.ones((3, D))}
    latest_a2 = id(f['a2'])
    assert addr_a2 != latest_a2
    addr_a2 = latest_a2

    # row update (inplace) w/ slice
    f.update_data(toindex(slice(1, 4)), {'a2': F.ones((3, D))}, True)
    latest_a2 = id(f['a2'])
    assert addr_a2 == latest_a2

    # row update (inplace) w/ list
    f.update_data(toindex([1, 3, 5]), {'a2': F.ones((3, D))}, True)
    latest_a2 = id(f['a2'])
    assert addr_a2 == latest_a2

if __name__ == '__main__':
    # Run every test in declaration order when executed as a script.
    for run_test in (
            test_create,
            test_column1,
            test_column2,
            test_append1,
            test_append2,
            test_append3,
            test_row1,
            test_row2,
            test_row3,
            test_row4,
            test_sharing,
            test_slicing,
            test_add_rows,
            test_inplace,
    ):
        run_test()