Commit 7f65ac05 authored by Jun Liu's avatar Jun Liu
Browse files

Merge branch 'develop' into amd-develop

parents 687d2b7e 7e5c81fe
list(APPEND gpu_list gfx908 gfx90a gfx940 gfx941 gfx942) add_gtest_executable(test_convnd_bwd_data convnd_bwd_data_xdl.cpp)
set(target 0) if(result EQUAL 0)
foreach(gpu IN LISTS GPU_TARGETS)
if(gpu IN_LIST gpu_list AND target EQUAL 0)
add_gtest_executable(test_convnd_bwd_data convnd_bwd_data.cpp)
target_link_libraries(test_convnd_bwd_data PRIVATE utility device_conv1d_bwd_data_instance device_conv2d_bwd_data_instance device_conv3d_bwd_data_instance) target_link_libraries(test_convnd_bwd_data PRIVATE utility device_conv1d_bwd_data_instance device_conv2d_bwd_data_instance device_conv3d_bwd_data_instance)
set(target 1) endif()
endif()
endforeach()
\ No newline at end of file
list(APPEND gpu_list gfx908 gfx90a gfx940 gfx941 gfx942) add_gtest_executable(test_convnd_fwd convnd_fwd_xdl.cpp)
set(target 0) if(result EQUAL 0)
foreach(gpu IN LISTS GPU_TARGETS)
if(gpu IN_LIST gpu_list AND target EQUAL 0)
add_gtest_executable(test_convnd_fwd convnd_fwd.cpp)
target_link_libraries(test_convnd_fwd PRIVATE utility device_conv2d_fwd_instance) target_link_libraries(test_convnd_fwd PRIVATE utility device_conv2d_fwd_instance)
set(target 1) endif()
endif()
endforeach()
add_gtest_executable(test_gemm_add test_gemm_add.hpp) add_gtest_executable(test_gemm_add test_gemm_add_xdl.hpp)
target_link_libraries(test_gemm_add PRIVATE utility device_gemm_add_instance) if(result EQUAL 0)
target_link_libraries(test_gemm_add PRIVATE utility device_gemm_add_instance)
endif()
add_gtest_executable(test_gemm_add_relu test_gemm_add_relu.cpp) add_gtest_executable(test_gemm_add_relu test_gemm_add_relu_xdl.cpp)
target_link_libraries(test_gemm_add_relu PRIVATE utility device_gemm_add_instance device_gemm_add_relu_instance) if(result EQUAL 0)
target_link_libraries(test_gemm_add_relu PRIVATE utility device_gemm_add_instance device_gemm_add_relu_instance)
endif()
add_gtest_executable(test_gemm_add_silu test_gemm_add_silu.cpp) add_gtest_executable(test_gemm_add_silu test_gemm_add_silu_xdl.cpp)
target_link_libraries(test_gemm_add_silu PRIVATE utility device_gemm_add_instance device_gemm_add_silu_instance) if(result EQUAL 0)
target_link_libraries(test_gemm_add_silu PRIVATE utility device_gemm_add_instance device_gemm_add_silu_instance)
endif()
add_gtest_executable(test_gemm_add_fastgelu test_gemm_add_fastgelu.cpp) add_gtest_executable(test_gemm_add_fastgelu test_gemm_add_fastgelu_xdl.cpp)
target_link_libraries(test_gemm_add_fastgelu PRIVATE utility device_gemm_add_instance device_gemm_add_fastgelu_instance) if(result EQUAL 0)
target_link_libraries(test_gemm_add_fastgelu PRIVATE utility device_gemm_add_instance device_gemm_add_fastgelu_instance)
endif()
...@@ -4,7 +4,7 @@ ...@@ -4,7 +4,7 @@
#include "gtest/gtest.h" #include "gtest/gtest.h"
#include "ck/ck.hpp" #include "ck/ck.hpp"
#include "profiler/profile_gemm_add_fastgelu_impl.hpp" #include "profiler/profile_gemm_add_fastgelu_impl.hpp"
#include "test_gemm_add.hpp" #include "test_gemm_add_xdl.hpp"
template <typename Tuple> template <typename Tuple>
class TestGemmAddFastgelu : public TestGemmAdd<Tuple> class TestGemmAddFastgelu : public TestGemmAdd<Tuple>
......
...@@ -4,7 +4,7 @@ ...@@ -4,7 +4,7 @@
#include "gtest/gtest.h" #include "gtest/gtest.h"
#include "ck/ck.hpp" #include "ck/ck.hpp"
#include "profiler/profile_gemm_add_relu_impl.hpp" #include "profiler/profile_gemm_add_relu_impl.hpp"
#include "test_gemm_add.hpp" #include "test_gemm_add_xdl.hpp"
template <typename Tuple> template <typename Tuple>
class TestGemmAddRelu : public TestGemmAdd<Tuple> class TestGemmAddRelu : public TestGemmAdd<Tuple>
......
...@@ -4,7 +4,7 @@ ...@@ -4,7 +4,7 @@
#include "gtest/gtest.h" #include "gtest/gtest.h"
#include "ck/ck.hpp" #include "ck/ck.hpp"
#include "profiler/profile_gemm_add_silu_impl.hpp" #include "profiler/profile_gemm_add_silu_impl.hpp"
#include "test_gemm_add.hpp" #include "test_gemm_add_xdl.hpp"
template <typename Tuple> template <typename Tuple>
class TestGemmAddSilu : public TestGemmAdd<Tuple> class TestGemmAddSilu : public TestGemmAdd<Tuple>
......
list(APPEND gpu_list gfx908 gfx90a gfx940 gfx941 gfx942) add_gtest_executable(test_gemm_add_relu_add_layernorm_fp16 test_gemm_add_relu_add_layernorm_fp16_xdl.cpp)
set(target 0) if(result EQUAL 0)
foreach(gpu IN LISTS GPU_TARGETS) add_custom_target(test_gemm_layernorm)
if(gpu IN_LIST gpu_list AND target EQUAL 0) target_link_libraries(test_gemm_add_relu_add_layernorm_fp16 PRIVATE utility device_gemm_add_relu_add_layernorm_instance)
add_custom_target(test_gemm_layernorm) add_dependencies(test_gemm_layernorm test_gemm_add_relu_add_layernorm_fp16)
add_gtest_executable(test_gemm_add_relu_add_layernorm_fp16 test_gemm_add_relu_add_layernorm_fp16.cpp) endif()
if(result EQUAL 0)
target_link_libraries(test_gemm_add_relu_add_layernorm_fp16 PRIVATE utility device_gemm_add_relu_add_layernorm_instance)
add_dependencies(test_gemm_layernorm test_gemm_add_relu_add_layernorm_fp16)
set(target 1)
endif()
endif()
endforeach()
add_test_executable(test_gemm_reduce_fp16 gemm_reduce_fp16.cpp) add_test_executable(test_gemm_reduce_fp16 gemm_reduce_fp16_xdl.cpp)
if(result EQUAL 0) if(result EQUAL 0)
target_link_libraries(test_gemm_reduce_fp16 PRIVATE utility device_gemm_reduce_instance) target_link_libraries(test_gemm_reduce_fp16 PRIVATE utility device_gemm_reduce_instance)
endif() endif()
\ No newline at end of file
list(APPEND gpu_list gfx908 gfx90a gfx940 gfx941 gfx942) add_gtest_executable(test_gemm_splitk test_gemm_splitk_xdl.cpp)
set(target 0) if(result EQUAL 0)
foreach(gpu IN LISTS GPU_TARGETS)
if(gpu IN_LIST gpu_list AND target EQUAL 0)
add_gtest_executable(test_gemm_splitk test_gemm_splitk.cpp)
target_link_libraries(test_gemm_splitk PRIVATE utility device_gemm_splitk_instance) target_link_libraries(test_gemm_splitk PRIVATE utility device_gemm_splitk_instance)
set(target 1)
endif() endif()
endforeach()
list(APPEND gpu_list_xdl gfx908 gfx90a gfx940) add_gtest_executable(test_grouped_convnd_bwd_data test_grouped_convnd_bwd_data_xdl_wmma.cpp)
list(APPEND gpu_list_wmma gfx1100 gfx1101 gfx1102 gfx1103) if(result EQUAL 0)
set(target 0) target_link_libraries(test_grouped_convnd_bwd_data PRIVATE utility device_grouped_conv2d_bwd_data_instance device_grouped_conv3d_bwd_data_instance)
foreach(gpu IN LISTS GPU_TARGETS) endif()
if(gpu IN_LIST gpu_list_xdl AND target EQUAL 0) add_gtest_executable(test_grouped_convnd_bwd_data_interface test_grouped_convnd_bwd_data_interface_xdl.cpp)
add_gtest_executable(test_grouped_convnd_bwd_data test_grouped_convnd_bwd_data.cpp) if(result EQUAL 0)
target_link_libraries(test_grouped_convnd_bwd_data PRIVATE utility device_grouped_conv2d_bwd_data_instance device_grouped_conv3d_bwd_data_instance) target_link_libraries(test_grouped_convnd_bwd_data_interface PRIVATE utility device_grouped_conv2d_bwd_data_instance)
add_gtest_executable(test_grouped_convnd_bwd_data_interface test_grouped_convnd_bwd_data_interface_xdl.cpp) endif()
target_link_libraries(test_grouped_convnd_bwd_data_interface PRIVATE utility device_grouped_conv2d_bwd_data_instance) add_gtest_executable(test_grouped_convnd_bwd_data_interface test_grouped_convnd_bwd_data_interface_wmma.cpp)
set(target 1) if(result EQUAL 0)
endif() target_link_libraries(test_grouped_convnd_bwd_data_interface PRIVATE utility device_grouped_conv2d_bwd_data_instance)
if(gpu IN_LIST gpu_list_wmma AND target EQUAL 0) endif()
add_gtest_executable(test_grouped_convnd_bwd_data test_grouped_convnd_bwd_data.cpp)
target_link_libraries(test_grouped_convnd_bwd_data PRIVATE utility device_grouped_conv2d_bwd_data_instance device_grouped_conv3d_bwd_data_instance)
add_gtest_executable(test_grouped_convnd_bwd_data_interface test_grouped_convnd_bwd_data_interface_wmma.cpp)
target_link_libraries(test_grouped_convnd_bwd_data_interface PRIVATE utility device_grouped_conv2d_bwd_data_instance)
set(target 1)
endif()
endforeach()
\ No newline at end of file
list(APPEND gpu_list_xdl gfx908 gfx90a gfx940 gfx941 gfx942) add_gtest_executable(test_grouped_convnd_bwd_weight test_grouped_convnd_bwd_weight_xdl_wmma.cpp)
list(APPEND gpu_list_wmma gfx1100 gfx1101 gfx1102 gfx1103) if(result EQUAL 0)
set(target 0)
foreach(gpu IN LISTS GPU_TARGETS)
if(gpu IN_LIST gpu_list_xdl AND target EQUAL 0)
add_gtest_executable(test_grouped_convnd_bwd_weight test_grouped_convnd_bwd_weight.cpp)
target_link_libraries(test_grouped_convnd_bwd_weight PRIVATE utility device_grouped_conv1d_bwd_weight_instance device_grouped_conv2d_bwd_weight_instance device_grouped_conv3d_bwd_weight_instance) target_link_libraries(test_grouped_convnd_bwd_weight PRIVATE utility device_grouped_conv1d_bwd_weight_instance device_grouped_conv2d_bwd_weight_instance device_grouped_conv3d_bwd_weight_instance)
add_gtest_executable(test_grouped_convnd_bwd_weight_interface test_grouped_convnd_bwd_weight_interface_xdl.cpp) endif()
add_gtest_executable(test_grouped_convnd_bwd_weight_interface test_grouped_convnd_bwd_weight_interface_xdl.cpp)
if(result EQUAL 0)
target_link_libraries(test_grouped_convnd_bwd_weight_interface PRIVATE utility) target_link_libraries(test_grouped_convnd_bwd_weight_interface PRIVATE utility)
set(target 1) endif()
endif() add_gtest_executable(test_grouped_convnd_bwd_weight_interface test_grouped_convnd_bwd_weight_interface_wmma.cpp)
if(gpu IN_LIST gpu_list_wmma AND target EQUAL 0) if(result EQUAL 0)
add_gtest_executable(test_grouped_convnd_bwd_weight test_grouped_convnd_bwd_weight.cpp)
target_link_libraries(test_grouped_convnd_bwd_weight PRIVATE utility device_grouped_conv1d_bwd_weight_instance device_grouped_conv2d_bwd_weight_instance device_grouped_conv3d_bwd_weight_instance)
add_gtest_executable(test_grouped_convnd_bwd_weight_interface test_grouped_convnd_bwd_weight_interface_wmma.cpp)
target_link_libraries(test_grouped_convnd_bwd_weight_interface PRIVATE utility) target_link_libraries(test_grouped_convnd_bwd_weight_interface PRIVATE utility)
set(target 1) endif()
endif()
endforeach()
\ No newline at end of file
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment