test_occupancy.py 3.34 KB
Newer Older
dugupeiwen's avatar
dugupeiwen committed
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
from numba.roc.gcn_occupancy import get_limiting_factors
import unittest


class TestOccupancy(unittest.TestCase):
    """Compare ``get_limiting_factors`` results against fixed expectations."""

    def check_limits(self, inputs, expected_outputs):
        """Call ``get_limiting_factors(**inputs)`` and verify its attributes.

        Every key of *expected_outputs* is looked up as an attribute on the
        returned object.  The ``occupancy`` attribute is compared with
        ``assertAlmostEqual``; all other attributes must be exactly equal.
        The attribute name is used as the failure message.
        """
        result = get_limiting_factors(**inputs)
        for field, wanted in expected_outputs.items():
            actual = getattr(result, field)
            if field != 'occupancy':
                self.assertEqual(actual, wanted, field)
                continue
            # occupancy may be a float, so compare it approximately.
            self.assertAlmostEqual(actual, wanted, msg=field)

    def test_limits_1(self):
        # Expected: zero occupancy, with the VGPR wave limit, the overall
        # wave limit and group_size all reported as reasons.
        self.check_limits(
            inputs={
                'group_size': 400,
                'vgpr_per_workitem': 139,
                'sgpr_per_wave': 49,
            },
            expected_outputs={
                'allowed_wave_due_to_sgpr': 10,
                'allowed_wave_due_to_vgpr': 1,
                'allowed_wave': 1,
                'allowed_vgpr_per_workitem': 128,
                'occupancy': 0,
                'reasons': {
                    'allowed_wave_due_to_vgpr',
                    'allowed_wave',
                    'group_size',
                },
            },
        )

    def test_limits_2(self):
        # Same register usage as test_limits_1 but group_size=256; expected
        # occupancy is 0.10 and no reasons are reported.
        self.check_limits(
            inputs={
                'group_size': 256,
                'vgpr_per_workitem': 139,
                'sgpr_per_wave': 49,
            },
            expected_outputs={
                'allowed_wave_due_to_sgpr': 10,
                'allowed_wave_due_to_vgpr': 1,
                'allowed_wave': 1,
                'allowed_vgpr_per_workitem': 256,
                'occupancy': 0.10,
                'reasons': set(),
            },
        )

    def test_limits_3(self):
        # Expected: zero occupancy, with the SGPR wave limit, the overall
        # wave limit and group_size all reported as reasons.
        self.check_limits(
            inputs={
                'group_size': 2048,
                'vgpr_per_workitem': 16,
                'sgpr_per_wave': 70,
            },
            expected_outputs={
                'allowed_wave_due_to_sgpr': 7,
                'allowed_wave_due_to_vgpr': 16,
                'allowed_wave': 7,
                'allowed_vgpr_per_workitem': 32,
                'occupancy': 0,
                'reasons': {
                    'allowed_wave_due_to_sgpr',
                    'allowed_wave',
                    'group_size',
                },
            },
        )

    def test_limits_4(self):
        # Expected: zero occupancy with group_size as the only reason.
        self.check_limits(
            inputs={
                'group_size': 2048,
                'vgpr_per_workitem': 32,
                'sgpr_per_wave': 50,
            },
            expected_outputs={
                'allowed_wave_due_to_sgpr': 10,
                'allowed_wave_due_to_vgpr': 8,
                'allowed_wave': 8,
                'allowed_vgpr_per_workitem': 32,
                'occupancy': 0,
                'reasons': {'group_size'},
            },
        )

    def test_limits_5(self):
        # Small group (group_size=4); expected occupancy is 0.1 and no
        # reasons are reported.
        self.check_limits(
            inputs={
                'group_size': 4,
                'vgpr_per_workitem': 128,
                'sgpr_per_wave': 10,
            },
            expected_outputs={
                'allowed_wave_due_to_sgpr': 51,
                'allowed_wave_due_to_vgpr': 2,
                'allowed_wave': 2,
                'allowed_vgpr_per_workitem': 256,
                'occupancy': 0.1,
                'reasons': set(),
            },
        )

    def test_limits_6(self):
        # vgpr_per_workitem=257 exceeds the expected allowed value of 256;
        # expected result is zero allowed waves and zero occupancy.
        self.check_limits(
            inputs={
                'group_size': 4,
                'vgpr_per_workitem': 257,
                'sgpr_per_wave': 3,
            },
            expected_outputs={
                'allowed_wave_due_to_sgpr': 170,
                'allowed_wave_due_to_vgpr': 0,
                'allowed_wave': 0,
                'allowed_vgpr_per_workitem': 256,
                'occupancy': 0,
                'reasons': {
                    'allowed_wave_due_to_vgpr',
                    'allowed_wave',
                },
            },
        )


# Run this module's tests when the file is executed as a script.
if __name__ == '__main__':
    unittest.main()