CMakeLists.txt 8.97 KB
Newer Older
1
# Header search paths for the targets configured in this directory and in the
# subdirectories added further down. BEFORE places them ahead of include
# directories that were added earlier.
include_directories(BEFORE
    ${PROJECT_SOURCE_DIR}/
    ${PROJECT_SOURCE_DIR}/profiler/include
)

# Project-provided module. NOTE(review): presumably this is what makes the
# gtest_main target linked by add_gtest_executable() available -- confirm
# against the module itself.
include(gtest)

# Umbrella target: every executable created by the helper functions in this
# file is attached to it through add_dependencies(tests ...).
add_custom_target(tests)

Chao Liu's avatar
Chao Liu committed
10
11
# add_test_executable(<TEST_NAME> <source>...)
#
# Creates a HIP executable named <TEST_NAME> from the given sources and
# registers it with CTest. Before the target is created, sources that the
# current configuration excludes are dropped from the list:
#   * DTYPES defined: a source whose name carries a data-type tag
#     (e.g. "_fp16" or "_f16") for a type that is not listed in DTYPES;
#   * DPP_KERNELS not defined: a source matching "_dpp";
#   * DL_KERNELS not defined: a source matching "_dl";
#   * no "gfx9" in SUPPORTED_GPU_TARGETS: a source matching "xdl";
#   * neither "gfx11" nor "gfx12" in SUPPORTED_GPU_TARGETS: a source
#     matching "wmma".
# All matches are regex (substring) matches on the source string as passed in.
#
# Output: sets `result` in the caller's scope to 0 when the target was
# created, or to 1 when every source was filtered out (no target is created
# in that case, so callers must check `result` before touching <TEST_NAME>).
function(add_test_executable TEST_NAME)
    message("adding test ${TEST_NAME}")

    # Local, named copy of the source list; the filters below prune it.
    set(test_sources "${ARGN}")

    if(DEFINED DTYPES)
        # Parallel lists: the DTYPES entry and the short tag that may appear
        # in a file name instead of the long one ("_fp16" vs. "_f16").
        set(dtype_names fp16 fp32 fp64 fp8 bf8 bf16 int8)
        set(dtype_tags  f16  f32  f64  f8  bf8 b16  i8)
        foreach(src IN LISTS test_sources)
            set(dtype_disabled FALSE)
            foreach(dtype tag IN ZIP_LISTS dtype_names dtype_tags)
                if(src MATCHES "_${dtype}|_${tag}" AND NOT "${dtype}" IN_LIST DTYPES)
                    set(dtype_disabled TRUE)
                    break()
                endif()
            endforeach()
            if(dtype_disabled)
                message("removing test ${src} ")
                list(REMOVE_ITEM test_sources "${src}")
            endif()
        endforeach()
    endif()

    set(TEST_TARGETS ${SUPPORTED_GPU_TARGETS})

    # The guards below do not depend on the individual source, so each one is
    # checked once around its loop. foreach() iterates over a snapshot of the
    # list, which makes removing items from inside the loop safe.
    if(NOT DEFINED DPP_KERNELS)
        foreach(src IN LISTS test_sources)
            if(src MATCHES "_dpp")
                message("removing dpp test ${src} ")
                list(REMOVE_ITEM test_sources "${src}")
            endif()
        endforeach()
    endif()

    if(NOT DEFINED DL_KERNELS)
        foreach(src IN LISTS test_sources)
            if(src MATCHES "_dl")
                message("removing dl test ${src} ")
                list(REMOVE_ITEM test_sources "${src}")
            endif()
        endforeach()
    endif()

    if(NOT TEST_TARGETS MATCHES "gfx9")
        foreach(src IN LISTS test_sources)
            if(src MATCHES "xdl")
                message("removing xdl test ${src} ")
                list(REMOVE_ITEM test_sources "${src}")
            endif()
        endforeach()
    endif()

    if(NOT TEST_TARGETS MATCHES "gfx11" AND NOT TEST_TARGETS MATCHES "gfx12")
        foreach(src IN LISTS test_sources)
            if(src MATCHES "wmma")
                message("removing wmma test ${src} ")
                list(REMOVE_ITEM test_sources "${src}")
            endif()
        endforeach()
    endif()

    # Nothing left to build: report failure to the caller and stop.
    if(NOT test_sources)
        set(result 1 PARENT_SCOPE)
        return()
    endif()

    # Narrow the architecture list according to the kernel family named in the
    # remaining sources. Only the first matching family is applied.
    # NOTE(review): the removed entries are presumably the architectures that
    # cannot run that kernel family -- confirm when adding new targets.
    if(test_sources MATCHES "_xdl")
        list(REMOVE_ITEM TEST_TARGETS
            gfx900 gfx906 gfx906:xnack-
            gfx1030 gfx1100 gfx1101 gfx1102 gfx1103 gfx1200 gfx1201
            gfx10.3-generic gfx11-generic gfx12-generic)
    elseif(test_sources MATCHES "_wmma")
        list(REMOVE_ITEM TEST_TARGETS
            gfx900 gfx906 gfx906:xnack-
            gfx908:xnack+ gfx908:xnack- gfx90a:xnack+ gfx90a:xnack-
            gfx908 gfx90a gfx940 gfx941 gfx942
            gfx1030)
    elseif(test_sources MATCHES "_smfmac")
        list(REMOVE_ITEM TEST_TARGETS
            gfx900 gfx906 gfx906:xnack-
            gfx1030 gfx1100 gfx1101 gfx1102 gfx1103
            gfx908 gfx90a
            gfx1200 gfx1201
            gfx10.3-generic gfx11-generic gfx12-generic)
    endif()

    # Compile the sources as HIP and build them for the remaining targets.
    set_source_files_properties(${test_sources} PROPERTIES LANGUAGE HIP)
    add_executable(${TEST_NAME} ${test_sources})
    set_property(TARGET ${TEST_NAME} PROPERTY HIP_ARCHITECTURES ${TEST_TARGETS})
    target_link_libraries(${TEST_NAME} PRIVATE getopt::getopt)

    # Register with CTest, hook into the aggregate targets and install.
    add_test(NAME ${TEST_NAME} COMMAND $<TARGET_FILE:${TEST_NAME}>)
    add_dependencies(tests ${TEST_NAME})
    add_dependencies(check ${TEST_NAME})
    rocm_install(TARGETS ${TEST_NAME} COMPONENT tests)

    set(result 0 PARENT_SCOPE)
endfunction()
92
93
94

# add_gtest_executable(<TEST_NAME> <source>...)
#
# GoogleTest flavour of the test helper: creates a HIP executable named
# <TEST_NAME> from the given sources, links it against gtest_main and
# registers it with CTest. Before the target is created, sources that the
# current configuration excludes are dropped from the list:
#   * DTYPES defined: a source whose name carries a data-type tag
#     (e.g. "_fp16" or "_f16") for a type that is not listed in DTYPES;
#   * DL_KERNELS not defined: a source matching "_dl";
#   * no "gfx9" in SUPPORTED_GPU_TARGETS: a source matching "xdl";
#   * neither "gfx11" nor "gfx12" in SUPPORTED_GPU_TARGETS: a source
#     matching "wmma".
# All matches are regex (substring) matches on the source string as passed in.
# Sources matching "_dpp" are not filtered by this function.
#
# Output: sets `result` in the caller's scope to 0 when the target was
# created, or to 1 when every source was filtered out (no target is created
# in that case, so callers must check `result` before touching <TEST_NAME>).
function(add_gtest_executable TEST_NAME)
    message("adding gtest ${TEST_NAME}")

    # Local, named copy of the source list; the filters below prune it.
    set(test_sources "${ARGN}")

    if(DEFINED DTYPES)
        # Parallel lists: the DTYPES entry and the short tag that may appear
        # in a file name instead of the long one ("_fp16" vs. "_f16").
        set(dtype_names fp16 fp32 fp64 fp8 bf8 bf16 int8)
        set(dtype_tags  f16  f32  f64  f8  bf8 b16  i8)
        foreach(src IN LISTS test_sources)
            set(dtype_disabled FALSE)
            foreach(dtype tag IN ZIP_LISTS dtype_names dtype_tags)
                if(src MATCHES "_${dtype}|_${tag}" AND NOT "${dtype}" IN_LIST DTYPES)
                    set(dtype_disabled TRUE)
                    break()
                endif()
            endforeach()
            if(dtype_disabled)
                message("removing gtest ${src} ")
                list(REMOVE_ITEM test_sources "${src}")
            endif()
        endforeach()
    endif()

    set(TEST_TARGETS ${SUPPORTED_GPU_TARGETS})

    # The guards below do not depend on the individual source, so each one is
    # checked once around its loop. foreach() iterates over a snapshot of the
    # list, which makes removing items from inside the loop safe.
    if(NOT DEFINED DL_KERNELS)
        foreach(src IN LISTS test_sources)
            if(src MATCHES "_dl")
                message("removing dl test ${src} ")
                list(REMOVE_ITEM test_sources "${src}")
            endif()
        endforeach()
    endif()

    if(NOT TEST_TARGETS MATCHES "gfx9")
        foreach(src IN LISTS test_sources)
            if(src MATCHES "xdl")
                message("removing xdl test ${src} ")
                list(REMOVE_ITEM test_sources "${src}")
            endif()
        endforeach()
    endif()

    if(NOT TEST_TARGETS MATCHES "gfx11" AND NOT TEST_TARGETS MATCHES "gfx12")
        foreach(src IN LISTS test_sources)
            if(src MATCHES "wmma")
                message("removing wmma test ${src} ")
                list(REMOVE_ITEM test_sources "${src}")
            endif()
        endforeach()
    endif()

    # Nothing left to build: report failure to the caller and stop.
    if(NOT test_sources)
        set(result 1 PARENT_SCOPE)
        return()
    endif()

    # Narrow the architecture list according to the kernel family named in the
    # remaining sources. Only the first matching family is applied.
    # NOTE(review): the removed entries are presumably the architectures that
    # cannot run that kernel family -- confirm when adding new targets.
    if(test_sources MATCHES "_xdl")
        list(REMOVE_ITEM TEST_TARGETS
            gfx900 gfx906 gfx906:xnack-
            gfx1030 gfx1100 gfx1101 gfx1102 gfx1103 gfx1200 gfx1201
            gfx10.3-generic gfx11-generic gfx12-generic)
    elseif(test_sources MATCHES "_wmma")
        list(REMOVE_ITEM TEST_TARGETS
            gfx900 gfx906 gfx906:xnack-
            gfx908:xnack+ gfx908:xnack- gfx90a:xnack+ gfx90a:xnack-
            gfx908 gfx90a gfx940 gfx941 gfx942
            gfx1030)
    elseif(test_sources MATCHES "_smfmac")
        list(REMOVE_ITEM TEST_TARGETS
            gfx900 gfx906 gfx906:xnack-
            gfx1030 gfx1100 gfx1101 gfx1102 gfx1103
            gfx908 gfx90a
            gfx1200 gfx1201
            gfx10.3-generic gfx11-generic gfx12-generic)
    endif()

    # Compile the sources as HIP and build them for the remaining targets.
    set_source_files_properties(${test_sources} PROPERTIES LANGUAGE HIP)
    add_executable(${TEST_NAME} ${test_sources})
    set_property(TARGET ${TEST_NAME} PROPERTY HIP_ARCHITECTURES ${TEST_TARGETS})

    add_dependencies(tests ${TEST_NAME})
    add_dependencies(check ${TEST_NAME})

    # suppress gtest warnings
    target_compile_options(${TEST_NAME} PRIVATE -Wno-global-constructors -Wno-undef)
    target_link_libraries(${TEST_NAME} PRIVATE gtest_main getopt::getopt)

    # Register with CTest and install.
    add_test(NAME ${TEST_NAME} COMMAND $<TARGET_FILE:${TEST_NAME}>)
    rocm_install(TARGETS ${TEST_NAME} COMPONENT tests)

    set(result 0 PARENT_SCOPE)
endfunction()
172

173
# Directory-scoped option: it affects the targets created in the
# subdirectories added after this line, so it must stay ahead of them.
add_compile_options(-Wno-c++20-extensions)

# Test suites that are configured for every build. The order is kept as is.
add_subdirectory(ck_tile)
add_subdirectory(magic_number_division)
add_subdirectory(space_filling_curve)
add_subdirectory(conv_util)
add_subdirectory(reference_conv_fwd)
add_subdirectory(gemm)
add_subdirectory(gemm_add)
add_subdirectory(gemm_layernorm)
add_subdirectory(gemm_split_k)
add_subdirectory(gemm_universal)
add_subdirectory(gemm_reduce)
add_subdirectory(batched_gemm)
add_subdirectory(batched_gemm_reduce)
add_subdirectory(batched_gemm_gemm)
add_subdirectory(batched_gemm_softmax_gemm)
add_subdirectory(batched_gemm_softmax_gemm_permute)
add_subdirectory(grouped_gemm)
add_subdirectory(reduce)
add_subdirectory(convnd_fwd)
add_subdirectory(convnd_bwd_data)
add_subdirectory(grouped_convnd_fwd)
add_subdirectory(grouped_convnd_bwd_weight)
add_subdirectory(block_to_ctile_map)
add_subdirectory(softmax)
add_subdirectory(normalization_fwd)
add_subdirectory(normalization_bwd_data)
add_subdirectory(normalization_bwd_gamma_beta)
add_subdirectory(data_type)
add_subdirectory(elementwise_normalization)
add_subdirectory(batchnorm)
add_subdirectory(contraction)
add_subdirectory(pool)
add_subdirectory(batched_gemm_multi_d)
add_subdirectory(grouped_convnd_bwd_data)
add_subdirectory(conv_tensor_rearrange)
add_subdirectory(transpose)
add_subdirectory(permute_scale)
add_subdirectory(wrapper)
212
# wmma_op is only configured when a gfx11 target is requested.
if(SUPPORTED_GPU_TARGETS MATCHES "gfx11")
    add_subdirectory(wmma_op)
endif()

# smfmac needs ROCm 6.2 or newer. Compare major.minor as one version so that
# later major releases with a small minor number (e.g. 7.0) are accepted;
# testing "major >= 6 AND minor >= 2" separately would reject them. When the
# version variables are not set the comparison is false, as before.
if(SUPPORTED_GPU_TARGETS MATCHES "gfx942"
   AND "${CK_HIP_VERSION_MAJOR}.${CK_HIP_VERSION_MINOR}" VERSION_GREATER_EQUAL "6.2")
    add_subdirectory(smfmac_op)
endif()

add_subdirectory(position_embedding)
add_subdirectory(scatter_gather)