# test_tilelang_language_reshape.py
from tilelang import tvm as tvm
import tilelang.testing
import tilelang as tl


def reshape_test(N, M, dtype):
    """Build a TileLang prim_func that reshapes ``A`` and copies it into ``B``.

    Args:
        N: Length of the 1-D input tensor ``A``.
        M: Size of the second dimension of the reshaped tensor; the first
            dimension is ``N // M``.
        dtype: Element type used for both ``A`` and ``B``.

    Returns:
        The ``T.prim_func``-decorated ``main`` function.
    """
    import tilelang.language as T

    @T.prim_func
    def main(
            A: T.Tensor((N,), dtype),
            B: T.Tensor((N // M, M), dtype),
    ):
        with T.Kernel(1) as _:
            # View the flat input as (N // M, M), then copy that view to B.
            A_reshaped = T.reshape(A, [N // M, M])
            T.copy(A_reshaped, B)

    return main


def run_reshape(N, M, dtype):
    """Compile the ``reshape_test`` kernel and check it against a reference.

    The reference simply calls ``.reshape(N // M, M)`` on the input tensor;
    results are compared with ``atol=1e-2`` and ``rtol=1e-2``.

    Args:
        N: Length of the 1-D input.
        M: Second dimension of the reshaped output.
        dtype: Element type passed through to ``reshape_test``.
    """

    def ref_program(A):
        # Expected output: the same data viewed as (N // M, M).
        return A.reshape(N // M, M)

    # out_idx=-1 is forwarded to tl.compile unchanged
    # (presumably marks the last parameter, B, as the output -- TODO confirm).
    kernel = tl.compile(reshape_test(N, M, dtype), out_idx=-1)
    kernel.get_profiler().assert_allclose(ref_program, atol=1e-2, rtol=1e-2)


def test_reshape_smem():
    """Run the plain reshape check for a float32 and a float16 configuration.

    NOTE(review): despite the ``smem`` suffix, this test calls ``run_reshape``;
    the variant that stages data through ``T.alloc_shared`` is exercised by
    ``test_reshape_smem_shared``.
    """
    # Test reshape
    cases = (
        (1024, 32, "float32"),
        (2048, 64, "float16"),
    )
    for length, cols, dtype in cases:
        run_reshape(length, cols, dtype)


def reshape_test_smem(N, M, dtype):
    """Build a TileLang prim_func that reshapes a shared-buffer copy of ``A``.

    The kernel copies ``A`` element by element into a buffer obtained from
    ``T.alloc_shared``, reshapes that buffer to ``(N // M, M)`` and writes
    every element of the reshaped buffer into ``B``.

    Args:
        N: Length of the 1-D input tensor ``A``.
        M: Size of the second dimension of the reshaped buffer; the first
            dimension is ``N // M``.
        dtype: Element type used for ``A``, ``B`` and the shared buffer.

    Returns:
        The ``T.prim_func``-decorated ``main`` function.
    """
    import tilelang.language as T

    @T.prim_func
    def main(
            A: T.Tensor((N,), dtype),
            B: T.Tensor((N // M, M), dtype),
    ):
        with T.Kernel(1) as _:
            # Stage the flat input in a buffer from T.alloc_shared.
            A_shared = T.alloc_shared((N,), dtype)
            for i in range(N):
                A_shared[i] = A[i]

            # Reshape the staged buffer and write it out with 2-D indexing.
            A_smem_reshaped = T.reshape(A_shared, [N // M, M])
            for i in range(N // M):
                for j in range(M):
                    B[i, j] = A_smem_reshaped[i, j]

    return main


def run_reshape_smem(N, M, dtype):
    """Compile the ``reshape_test_smem`` kernel and check it against a reference.

    The reference calls ``.reshape(N // M, M)`` on the input tensor; results
    are compared with ``atol=1e-2`` and ``rtol=1e-2``.

    Args:
        N: Length of the 1-D input.
        M: Second dimension of the reshaped output.
        dtype: Element type passed through to ``reshape_test_smem``.
    """

    def ref_program(A):
        # Expected output: the same data viewed as (N // M, M).
        return A.reshape(N // M, M)

    # out_idx=-1 is forwarded to tl.compile unchanged
    # (presumably marks the last parameter, B, as the output -- TODO confirm).
    kernel = tl.compile(reshape_test_smem(N, M, dtype), out_idx=-1)
    kernel.get_profiler().assert_allclose(ref_program, atol=1e-2, rtol=1e-2)


def test_reshape_smem_shared():
    """Run the shared-buffer reshape check for float32 and float16 inputs."""
    cases = (
        (1024, 32, "float32"),
        (2048, 64, "float16"),
    )
    for length, cols, dtype in cases:
        run_reshape_smem(length, cols, dtype)


if __name__ == "__main__":
    # When executed as a script, hand off to tilelang's test entry point.
    tilelang.testing.main()