Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
composable_kernel_ROCM
Commits
7f65ac05
Commit
7f65ac05
authored
Apr 04, 2024
by
Jun Liu
Browse files
Merge branch 'develop' into amd-develop
parents
687d2b7e
7e5c81fe
Changes
234
Hide whitespace changes
Inline
Side-by-side
Showing
20 changed files
with
55 additions
and
84 deletions
+55
-84
test/contraction/test_contraction_xdl.cpp
test/contraction/test_contraction_xdl.cpp
+0
-0
test/convnd_bwd_data/CMakeLists.txt
test/convnd_bwd_data/CMakeLists.txt
+3
-8
test/convnd_bwd_data/convnd_bwd_data_xdl.cpp
test/convnd_bwd_data/convnd_bwd_data_xdl.cpp
+0
-0
test/convnd_fwd/CMakeLists.txt
test/convnd_fwd/CMakeLists.txt
+3
-8
test/convnd_fwd/convnd_fwd_xdl.cpp
test/convnd_fwd/convnd_fwd_xdl.cpp
+0
-0
test/gemm_add/CMakeLists.txt
test/gemm_add/CMakeLists.txt
+16
-8
test/gemm_add/test_gemm_add_fastgelu_xdl.cpp
test/gemm_add/test_gemm_add_fastgelu_xdl.cpp
+1
-1
test/gemm_add/test_gemm_add_relu_xdl.cpp
test/gemm_add/test_gemm_add_relu_xdl.cpp
+1
-1
test/gemm_add/test_gemm_add_silu_xdl.cpp
test/gemm_add/test_gemm_add_silu_xdl.cpp
+1
-1
test/gemm_add/test_gemm_add_xdl.hpp
test/gemm_add/test_gemm_add_xdl.hpp
+0
-0
test/gemm_layernorm/CMakeLists.txt
test/gemm_layernorm/CMakeLists.txt
+6
-13
test/gemm_layernorm/test_gemm_add_relu_add_layernorm_fp16_xdl.cpp
...m_layernorm/test_gemm_add_relu_add_layernorm_fp16_xdl.cpp
+0
-0
test/gemm_reduce/CMakeLists.txt
test/gemm_reduce/CMakeLists.txt
+1
-1
test/gemm_reduce/gemm_reduce_fp16_xdl.cpp
test/gemm_reduce/gemm_reduce_fp16_xdl.cpp
+0
-0
test/gemm_split_k/CMakeLists.txt
test/gemm_split_k/CMakeLists.txt
+2
-7
test/gemm_split_k/test_gemm_splitk_xdl.cpp
test/gemm_split_k/test_gemm_splitk_xdl.cpp
+0
-0
test/grouped_convnd_bwd_data/CMakeLists.txt
test/grouped_convnd_bwd_data/CMakeLists.txt
+12
-19
test/grouped_convnd_bwd_data/test_grouped_convnd_bwd_data_xdl_wmma.cpp
...convnd_bwd_data/test_grouped_convnd_bwd_data_xdl_wmma.cpp
+0
-0
test/grouped_convnd_bwd_weight/CMakeLists.txt
test/grouped_convnd_bwd_weight/CMakeLists.txt
+9
-17
test/grouped_convnd_bwd_weight/test_grouped_convnd_bwd_weight_xdl_wmma.cpp
...nd_bwd_weight/test_grouped_convnd_bwd_weight_xdl_wmma.cpp
+0
-0
No files found.
test/contraction/test_contraction.cpp
→
test/contraction/test_contraction
_xdl
.cpp
View file @
7f65ac05
File moved
test/convnd_bwd_data/CMakeLists.txt
View file @
7f65ac05
list
(
APPEND gpu_list gfx908 gfx90a gfx940 gfx941 gfx942
)
add_gtest_executable
(
test_convnd_bwd_data convnd_bwd_data_xdl.cpp
)
set
(
target 0
)
if
(
result EQUAL 0
)
foreach
(
gpu IN LISTS GPU_TARGETS
)
if
(
gpu IN_LIST gpu_list AND target EQUAL 0
)
add_gtest_executable
(
test_convnd_bwd_data convnd_bwd_data.cpp
)
target_link_libraries
(
test_convnd_bwd_data PRIVATE utility device_conv1d_bwd_data_instance device_conv2d_bwd_data_instance device_conv3d_bwd_data_instance
)
target_link_libraries
(
test_convnd_bwd_data PRIVATE utility device_conv1d_bwd_data_instance device_conv2d_bwd_data_instance device_conv3d_bwd_data_instance
)
set
(
target 1
)
endif
()
endif
()
endforeach
()
\ No newline at end of file
test/convnd_bwd_data/convnd_bwd_data.cpp
→
test/convnd_bwd_data/convnd_bwd_data
_xdl
.cpp
View file @
7f65ac05
File moved
test/convnd_fwd/CMakeLists.txt
View file @
7f65ac05
list
(
APPEND gpu_list gfx908 gfx90a gfx940 gfx941 gfx942
)
add_gtest_executable
(
test_convnd_fwd convnd_fwd_xdl.cpp
)
set
(
target 0
)
if
(
result EQUAL 0
)
foreach
(
gpu IN LISTS GPU_TARGETS
)
if
(
gpu IN_LIST gpu_list AND target EQUAL 0
)
add_gtest_executable
(
test_convnd_fwd convnd_fwd.cpp
)
target_link_libraries
(
test_convnd_fwd PRIVATE utility device_conv2d_fwd_instance
)
target_link_libraries
(
test_convnd_fwd PRIVATE utility device_conv2d_fwd_instance
)
set
(
target 1
)
endif
()
endif
()
endforeach
()
test/convnd_fwd/convnd_fwd.cpp
→
test/convnd_fwd/convnd_fwd
_xdl
.cpp
View file @
7f65ac05
File moved
test/gemm_add/CMakeLists.txt
View file @
7f65ac05
add_gtest_executable
(
test_gemm_add test_gemm_add.hpp
)
add_gtest_executable
(
test_gemm_add test_gemm_add_xdl.hpp
)
target_link_libraries
(
test_gemm_add PRIVATE utility device_gemm_add_instance
)
if
(
result EQUAL 0
)
target_link_libraries
(
test_gemm_add PRIVATE utility device_gemm_add_instance
)
endif
()
add_gtest_executable
(
test_gemm_add_relu test_gemm_add_relu.cpp
)
add_gtest_executable
(
test_gemm_add_relu test_gemm_add_relu_xdl.cpp
)
target_link_libraries
(
test_gemm_add_relu PRIVATE utility device_gemm_add_instance device_gemm_add_relu_instance
)
if
(
result EQUAL 0
)
target_link_libraries
(
test_gemm_add_relu PRIVATE utility device_gemm_add_instance device_gemm_add_relu_instance
)
endif
()
add_gtest_executable
(
test_gemm_add_silu test_gemm_add_silu.cpp
)
add_gtest_executable
(
test_gemm_add_silu test_gemm_add_silu_xdl.cpp
)
target_link_libraries
(
test_gemm_add_silu PRIVATE utility device_gemm_add_instance device_gemm_add_silu_instance
)
if
(
result EQUAL 0
)
target_link_libraries
(
test_gemm_add_silu PRIVATE utility device_gemm_add_instance device_gemm_add_silu_instance
)
endif
()
add_gtest_executable
(
test_gemm_add_fastgelu test_gemm_add_fastgelu.cpp
)
add_gtest_executable
(
test_gemm_add_fastgelu test_gemm_add_fastgelu_xdl.cpp
)
target_link_libraries
(
test_gemm_add_fastgelu PRIVATE utility device_gemm_add_instance device_gemm_add_fastgelu_instance
)
if
(
result EQUAL 0
)
target_link_libraries
(
test_gemm_add_fastgelu PRIVATE utility device_gemm_add_instance device_gemm_add_fastgelu_instance
)
endif
()
test/gemm_add/test_gemm_add_fastgelu.cpp
→
test/gemm_add/test_gemm_add_fastgelu
_xdl
.cpp
View file @
7f65ac05
...
@@ -4,7 +4,7 @@
...
@@ -4,7 +4,7 @@
#include "gtest/gtest.h"
#include "gtest/gtest.h"
#include "ck/ck.hpp"
#include "ck/ck.hpp"
#include "profiler/profile_gemm_add_fastgelu_impl.hpp"
#include "profiler/profile_gemm_add_fastgelu_impl.hpp"
#include "test_gemm_add.hpp"
#include "test_gemm_add
_xdl
.hpp"
template
<
typename
Tuple
>
template
<
typename
Tuple
>
class
TestGemmAddFastgelu
:
public
TestGemmAdd
<
Tuple
>
class
TestGemmAddFastgelu
:
public
TestGemmAdd
<
Tuple
>
...
...
test/gemm_add/test_gemm_add_relu.cpp
→
test/gemm_add/test_gemm_add_relu
_xdl
.cpp
View file @
7f65ac05
...
@@ -4,7 +4,7 @@
...
@@ -4,7 +4,7 @@
#include "gtest/gtest.h"
#include "gtest/gtest.h"
#include "ck/ck.hpp"
#include "ck/ck.hpp"
#include "profiler/profile_gemm_add_relu_impl.hpp"
#include "profiler/profile_gemm_add_relu_impl.hpp"
#include "test_gemm_add.hpp"
#include "test_gemm_add
_xdl
.hpp"
template
<
typename
Tuple
>
template
<
typename
Tuple
>
class
TestGemmAddRelu
:
public
TestGemmAdd
<
Tuple
>
class
TestGemmAddRelu
:
public
TestGemmAdd
<
Tuple
>
...
...
test/gemm_add/test_gemm_add_silu.cpp
→
test/gemm_add/test_gemm_add_silu
_xdl
.cpp
View file @
7f65ac05
...
@@ -4,7 +4,7 @@
...
@@ -4,7 +4,7 @@
#include "gtest/gtest.h"
#include "gtest/gtest.h"
#include "ck/ck.hpp"
#include "ck/ck.hpp"
#include "profiler/profile_gemm_add_silu_impl.hpp"
#include "profiler/profile_gemm_add_silu_impl.hpp"
#include "test_gemm_add.hpp"
#include "test_gemm_add
_xdl
.hpp"
template
<
typename
Tuple
>
template
<
typename
Tuple
>
class
TestGemmAddSilu
:
public
TestGemmAdd
<
Tuple
>
class
TestGemmAddSilu
:
public
TestGemmAdd
<
Tuple
>
...
...
test/gemm_add/test_gemm_add.hpp
→
test/gemm_add/test_gemm_add
_xdl
.hpp
View file @
7f65ac05
File moved
test/gemm_layernorm/CMakeLists.txt
View file @
7f65ac05
list
(
APPEND gpu_list gfx908 gfx90a gfx940 gfx941 gfx942
)
add_gtest_executable
(
test_gemm_add_relu_add_layernorm_fp16 test_gemm_add_relu_add_layernorm_fp16_xdl.cpp
)
set
(
target 0
)
if
(
result EQUAL 0
)
foreach
(
gpu IN LISTS GPU_TARGETS
)
add_custom_target
(
test_gemm_layernorm
)
if
(
gpu IN_LIST gpu_list AND target EQUAL 0
)
target_link_libraries
(
test_gemm_add_relu_add_layernorm_fp16 PRIVATE utility device_gemm_add_relu_add_layernorm_instance
)
add_custom_target
(
test_gemm_layernorm
)
add_dependencies
(
test_gemm_layernorm test_gemm_add_relu_add_layernorm_fp16
)
add_gtest_executable
(
test_gemm_add_relu_add_layernorm_fp16 test_gemm_add_relu_add_layernorm_fp16.cpp
)
endif
()
if
(
result EQUAL 0
)
target_link_libraries
(
test_gemm_add_relu_add_layernorm_fp16 PRIVATE utility device_gemm_add_relu_add_layernorm_instance
)
add_dependencies
(
test_gemm_layernorm test_gemm_add_relu_add_layernorm_fp16
)
set
(
target 1
)
endif
()
endif
()
endforeach
()
test/gemm_layernorm/test_gemm_add_relu_add_layernorm_fp16.cpp
→
test/gemm_layernorm/test_gemm_add_relu_add_layernorm_fp16
_xdl
.cpp
View file @
7f65ac05
File moved
test/gemm_reduce/CMakeLists.txt
View file @
7f65ac05
add_test_executable
(
test_gemm_reduce_fp16 gemm_reduce_fp16.cpp
)
add_test_executable
(
test_gemm_reduce_fp16 gemm_reduce_fp16
_xdl
.cpp
)
if
(
result EQUAL 0
)
if
(
result EQUAL 0
)
target_link_libraries
(
test_gemm_reduce_fp16 PRIVATE utility device_gemm_reduce_instance
)
target_link_libraries
(
test_gemm_reduce_fp16 PRIVATE utility device_gemm_reduce_instance
)
endif
()
endif
()
\ No newline at end of file
test/gemm_reduce/gemm_reduce_fp16.cpp
→
test/gemm_reduce/gemm_reduce_fp16
_xdl
.cpp
View file @
7f65ac05
File moved
test/gemm_split_k/CMakeLists.txt
View file @
7f65ac05
list
(
APPEND gpu_list gfx908 gfx90a gfx940 gfx941 gfx942
)
add_gtest_executable
(
test_gemm_splitk test_gemm_splitk_xdl.cpp
)
set
(
target 0
)
if
(
result EQUAL 0
)
foreach
(
gpu IN LISTS GPU_TARGETS
)
if
(
gpu IN_LIST gpu_list AND target EQUAL 0
)
add_gtest_executable
(
test_gemm_splitk test_gemm_splitk.cpp
)
target_link_libraries
(
test_gemm_splitk PRIVATE utility device_gemm_splitk_instance
)
target_link_libraries
(
test_gemm_splitk PRIVATE utility device_gemm_splitk_instance
)
set
(
target 1
)
endif
()
endif
()
endforeach
()
test/gemm_split_k/test_gemm_splitk.cpp
→
test/gemm_split_k/test_gemm_splitk
_xdl
.cpp
View file @
7f65ac05
File moved
test/grouped_convnd_bwd_data/CMakeLists.txt
View file @
7f65ac05
list
(
APPEND gpu_list_xdl gfx908 gfx90a gfx940
)
add_gtest_executable
(
test_grouped_convnd_bwd_data test_grouped_convnd_bwd_data_xdl_wmma.cpp
)
list
(
APPEND gpu_list_wmma gfx1100 gfx1101 gfx1102 gfx1103
)
if
(
result EQUAL 0
)
set
(
target 0
)
target_link_libraries
(
test_grouped_convnd_bwd_data PRIVATE utility device_grouped_conv2d_bwd_data_instance device_grouped_conv3d_bwd_data_instance
)
foreach
(
gpu IN LISTS GPU_TARGETS
)
endif
()
if
(
gpu IN_LIST gpu_list_xdl AND target EQUAL 0
)
add_gtest_executable
(
test_grouped_convnd_bwd_data_interface test_grouped_convnd_bwd_data_interface_xdl.cpp
)
add_gtest_executable
(
test_grouped_convnd_bwd_data test_grouped_convnd_bwd_data.cpp
)
if
(
result EQUAL 0
)
target_link_libraries
(
test_grouped_convnd_bwd_data PRIVATE utility device_grouped_conv2d_bwd_data_instance device_grouped_conv3d_bwd_data_instance
)
target_link_libraries
(
test_grouped_convnd_bwd_data_interface PRIVATE utility device_grouped_conv2d_bwd_data_instance
)
add_gtest_executable
(
test_grouped_convnd_bwd_data_interface test_grouped_convnd_bwd_data_interface_xdl.cpp
)
endif
()
target_link_libraries
(
test_grouped_convnd_bwd_data_interface PRIVATE utility device_grouped_conv2d_bwd_data_instance
)
add_gtest_executable
(
test_grouped_convnd_bwd_data_interface test_grouped_convnd_bwd_data_interface_wmma.cpp
)
set
(
target 1
)
if
(
result EQUAL 0
)
endif
()
target_link_libraries
(
test_grouped_convnd_bwd_data_interface PRIVATE utility device_grouped_conv2d_bwd_data_instance
)
if
(
gpu IN_LIST gpu_list_wmma AND target EQUAL 0
)
endif
()
add_gtest_executable
(
test_grouped_convnd_bwd_data test_grouped_convnd_bwd_data.cpp
)
target_link_libraries
(
test_grouped_convnd_bwd_data PRIVATE utility device_grouped_conv2d_bwd_data_instance device_grouped_conv3d_bwd_data_instance
)
add_gtest_executable
(
test_grouped_convnd_bwd_data_interface test_grouped_convnd_bwd_data_interface_wmma.cpp
)
target_link_libraries
(
test_grouped_convnd_bwd_data_interface PRIVATE utility device_grouped_conv2d_bwd_data_instance
)
set
(
target 1
)
endif
()
endforeach
()
\ No newline at end of file
test/grouped_convnd_bwd_data/test_grouped_convnd_bwd_data.cpp
→
test/grouped_convnd_bwd_data/test_grouped_convnd_bwd_data
_xdl_wmma
.cpp
View file @
7f65ac05
File moved
test/grouped_convnd_bwd_weight/CMakeLists.txt
View file @
7f65ac05
list
(
APPEND gpu_list_xdl gfx908 gfx90a gfx940 gfx941 gfx942
)
add_gtest_executable
(
test_grouped_convnd_bwd_weight test_grouped_convnd_bwd_weight_xdl_wmma.cpp
)
list
(
APPEND gpu_list_wmma gfx1100 gfx1101 gfx1102 gfx1103
)
if
(
result EQUAL 0
)
set
(
target 0
)
foreach
(
gpu IN LISTS GPU_TARGETS
)
if
(
gpu IN_LIST gpu_list_xdl AND target EQUAL 0
)
add_gtest_executable
(
test_grouped_convnd_bwd_weight test_grouped_convnd_bwd_weight.cpp
)
target_link_libraries
(
test_grouped_convnd_bwd_weight PRIVATE utility device_grouped_conv1d_bwd_weight_instance device_grouped_conv2d_bwd_weight_instance device_grouped_conv3d_bwd_weight_instance
)
target_link_libraries
(
test_grouped_convnd_bwd_weight PRIVATE utility device_grouped_conv1d_bwd_weight_instance device_grouped_conv2d_bwd_weight_instance device_grouped_conv3d_bwd_weight_instance
)
add_gtest_executable
(
test_grouped_convnd_bwd_weight_interface test_grouped_convnd_bwd_weight_interface_xdl.cpp
)
endif
()
add_gtest_executable
(
test_grouped_convnd_bwd_weight_interface test_grouped_convnd_bwd_weight_interface_xdl.cpp
)
if
(
result EQUAL 0
)
target_link_libraries
(
test_grouped_convnd_bwd_weight_interface PRIVATE utility
)
target_link_libraries
(
test_grouped_convnd_bwd_weight_interface PRIVATE utility
)
set
(
target 1
)
endif
()
endif
()
add_gtest_executable
(
test_grouped_convnd_bwd_weight_interface test_grouped_convnd_bwd_weight_interface_wmma.cpp
)
if
(
gpu IN_LIST gpu_list_wmma AND target EQUAL 0
)
if
(
result EQUAL 0
)
add_gtest_executable
(
test_grouped_convnd_bwd_weight test_grouped_convnd_bwd_weight.cpp
)
target_link_libraries
(
test_grouped_convnd_bwd_weight PRIVATE utility device_grouped_conv1d_bwd_weight_instance device_grouped_conv2d_bwd_weight_instance device_grouped_conv3d_bwd_weight_instance
)
add_gtest_executable
(
test_grouped_convnd_bwd_weight_interface test_grouped_convnd_bwd_weight_interface_wmma.cpp
)
target_link_libraries
(
test_grouped_convnd_bwd_weight_interface PRIVATE utility
)
target_link_libraries
(
test_grouped_convnd_bwd_weight_interface PRIVATE utility
)
set
(
target 1
)
endif
()
endif
()
endforeach
()
\ No newline at end of file
test/grouped_convnd_bwd_weight/test_grouped_convnd_bwd_weight.cpp
→
test/grouped_convnd_bwd_weight/test_grouped_convnd_bwd_weight
_xdl_wmma
.cpp
View file @
7f65ac05
File moved
Prev
1
…
7
8
9
10
11
12
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment