Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
composable_kernel
Commits
8116d2b3
Commit
8116d2b3
authored
Nov 17, 2022
by
Po-Yen, Chen
Browse files
Modularize ckProfiler operations
parent
df021e9d
Changes
24
Hide whitespace changes
Inline
Side-by-side
Showing
20 changed files
with
92 additions
and
32 deletions
+92
-32
profiler/src/CMakeLists.txt
profiler/src/CMakeLists.txt
+35
-32
profiler/src/profile_batched_gemm.cpp
profiler/src/profile_batched_gemm.cpp
+3
-0
profiler/src/profile_batched_gemm_add_relu_gemm_add.cpp
profiler/src/profile_batched_gemm_add_relu_gemm_add.cpp
+3
-0
profiler/src/profile_batched_gemm_gemm.cpp
profiler/src/profile_batched_gemm_gemm.cpp
+3
-0
profiler/src/profile_batched_gemm_reduce.cpp
profiler/src/profile_batched_gemm_reduce.cpp
+3
-0
profiler/src/profile_conv_bwd_data.cpp
profiler/src/profile_conv_bwd_data.cpp
+3
-0
profiler/src/profile_conv_fwd.cpp
profiler/src/profile_conv_fwd.cpp
+3
-0
profiler/src/profile_conv_fwd_bias_relu.cpp
profiler/src/profile_conv_fwd_bias_relu.cpp
+3
-0
profiler/src/profile_conv_fwd_bias_relu_add.cpp
profiler/src/profile_conv_fwd_bias_relu_add.cpp
+3
-0
profiler/src/profile_gemm.cpp
profiler/src/profile_gemm.cpp
+3
-0
profiler/src/profile_gemm_add_add_fastgelu.cpp
profiler/src/profile_gemm_add_add_fastgelu.cpp
+3
-0
profiler/src/profile_gemm_bias_add_reduce.cpp
profiler/src/profile_gemm_bias_add_reduce.cpp
+3
-0
profiler/src/profile_gemm_bilinear.cpp
profiler/src/profile_gemm_bilinear.cpp
+3
-0
profiler/src/profile_gemm_reduce.cpp
profiler/src/profile_gemm_reduce.cpp
+3
-0
profiler/src/profile_gemm_splitk.cpp
profiler/src/profile_gemm_splitk.cpp
+3
-0
profiler/src/profile_grouped_conv_bwd_weight.cpp
profiler/src/profile_grouped_conv_bwd_weight.cpp
+3
-0
profiler/src/profile_grouped_conv_fwd.cpp
profiler/src/profile_grouped_conv_fwd.cpp
+3
-0
profiler/src/profile_grouped_gemm.cpp
profiler/src/profile_grouped_gemm.cpp
+3
-0
profiler/src/profile_groupnorm.cpp
profiler/src/profile_groupnorm.cpp
+3
-0
profiler/src/profile_layernorm.cpp
profiler/src/profile_layernorm.cpp
+3
-0
No files found.
profiler/src/CMakeLists.txt
View file @
8116d2b3
# ck
_p
rofiler
set
(
PROFILER_SOURCE
main
.cpp
# ck
P
rofiler
set
(
PROFILER_SOURCE
S
profiler
.cpp
profile_gemm.cpp
profile_gemm_splitk.cpp
profile_gemm_bilinear.cpp
...
...
@@ -24,34 +24,37 @@ set(PROFILER_SOURCE
profile_softmax.cpp
)
add_executable
(
ckProfiler
${
PROFILER_SOURCE
}
)
set
(
PROFILER_EXECUTABLE ckProfiler
)
target_link_libraries
(
ckProfiler PRIVATE utility
)
target_link_libraries
(
ckProfiler PRIVATE device_gemm_instance
)
target_link_libraries
(
ckProfiler PRIVATE device_gemm_splitk_instance
)
target_link_libraries
(
ckProfiler PRIVATE device_gemm_bilinear_instance
)
target_link_libraries
(
ckProfiler PRIVATE device_gemm_add_add_fastgelu_instance
)
target_link_libraries
(
ckProfiler PRIVATE device_gemm_reduce_instance
)
target_link_libraries
(
ckProfiler PRIVATE device_gemm_bias_add_reduce_instance
)
target_link_libraries
(
ckProfiler PRIVATE device_batched_gemm_instance
)
target_link_libraries
(
ckProfiler PRIVATE device_batched_gemm_gemm_instance
)
target_link_libraries
(
ckProfiler PRIVATE device_batched_gemm_add_relu_gemm_add_instance
)
target_link_libraries
(
ckProfiler PRIVATE device_batched_gemm_reduce_instance
)
target_link_libraries
(
ckProfiler PRIVATE device_grouped_gemm_instance
)
target_link_libraries
(
ckProfiler PRIVATE device_conv2d_fwd_instance
)
target_link_libraries
(
ckProfiler PRIVATE device_grouped_conv1d_fwd_instance
)
target_link_libraries
(
ckProfiler PRIVATE device_grouped_conv2d_fwd_instance
)
target_link_libraries
(
ckProfiler PRIVATE device_grouped_conv3d_fwd_instance
)
target_link_libraries
(
ckProfiler PRIVATE device_conv1d_bwd_data_instance
)
target_link_libraries
(
ckProfiler PRIVATE device_conv2d_bwd_data_instance
)
target_link_libraries
(
ckProfiler PRIVATE device_conv3d_bwd_data_instance
)
target_link_libraries
(
ckProfiler PRIVATE device_grouped_conv1d_bwd_weight_instance
)
target_link_libraries
(
ckProfiler PRIVATE device_grouped_conv2d_bwd_weight_instance
)
target_link_libraries
(
ckProfiler PRIVATE device_grouped_conv3d_bwd_weight_instance
)
target_link_libraries
(
ckProfiler PRIVATE device_conv2d_fwd_bias_relu_instance
)
target_link_libraries
(
ckProfiler PRIVATE device_conv2d_fwd_bias_relu_add_instance
)
target_link_libraries
(
ckProfiler PRIVATE device_normalization_instance
)
target_link_libraries
(
ckProfiler PRIVATE device_softmax_instance
)
target_link_libraries
(
ckProfiler PRIVATE device_reduce_instance
)
add_executable
(
${
PROFILER_EXECUTABLE
}
${
PROFILER_SOURCES
}
)
target_compile_options
(
${
PROFILER_EXECUTABLE
}
PRIVATE -Wno-global-constructors
)
rocm_install
(
TARGETS ckProfiler COMPONENT profiler
)
target_link_libraries
(
${
PROFILER_EXECUTABLE
}
PRIVATE utility
)
target_link_libraries
(
${
PROFILER_EXECUTABLE
}
PRIVATE device_gemm_instance
)
target_link_libraries
(
${
PROFILER_EXECUTABLE
}
PRIVATE device_gemm_splitk_instance
)
target_link_libraries
(
${
PROFILER_EXECUTABLE
}
PRIVATE device_gemm_bilinear_instance
)
target_link_libraries
(
${
PROFILER_EXECUTABLE
}
PRIVATE device_gemm_add_add_fastgelu_instance
)
target_link_libraries
(
${
PROFILER_EXECUTABLE
}
PRIVATE device_gemm_reduce_instance
)
target_link_libraries
(
${
PROFILER_EXECUTABLE
}
PRIVATE device_gemm_bias_add_reduce_instance
)
target_link_libraries
(
${
PROFILER_EXECUTABLE
}
PRIVATE device_batched_gemm_instance
)
target_link_libraries
(
${
PROFILER_EXECUTABLE
}
PRIVATE device_batched_gemm_gemm_instance
)
target_link_libraries
(
${
PROFILER_EXECUTABLE
}
PRIVATE device_batched_gemm_add_relu_gemm_add_instance
)
target_link_libraries
(
${
PROFILER_EXECUTABLE
}
PRIVATE device_batched_gemm_reduce_instance
)
target_link_libraries
(
${
PROFILER_EXECUTABLE
}
PRIVATE device_grouped_gemm_instance
)
target_link_libraries
(
${
PROFILER_EXECUTABLE
}
PRIVATE device_conv2d_fwd_instance
)
target_link_libraries
(
${
PROFILER_EXECUTABLE
}
PRIVATE device_grouped_conv1d_fwd_instance
)
target_link_libraries
(
${
PROFILER_EXECUTABLE
}
PRIVATE device_grouped_conv2d_fwd_instance
)
target_link_libraries
(
${
PROFILER_EXECUTABLE
}
PRIVATE device_grouped_conv3d_fwd_instance
)
target_link_libraries
(
${
PROFILER_EXECUTABLE
}
PRIVATE device_conv1d_bwd_data_instance
)
target_link_libraries
(
${
PROFILER_EXECUTABLE
}
PRIVATE device_conv2d_bwd_data_instance
)
target_link_libraries
(
${
PROFILER_EXECUTABLE
}
PRIVATE device_conv3d_bwd_data_instance
)
target_link_libraries
(
${
PROFILER_EXECUTABLE
}
PRIVATE device_grouped_conv1d_bwd_weight_instance
)
target_link_libraries
(
${
PROFILER_EXECUTABLE
}
PRIVATE device_grouped_conv2d_bwd_weight_instance
)
target_link_libraries
(
${
PROFILER_EXECUTABLE
}
PRIVATE device_grouped_conv3d_bwd_weight_instance
)
target_link_libraries
(
${
PROFILER_EXECUTABLE
}
PRIVATE device_conv2d_fwd_bias_relu_instance
)
target_link_libraries
(
${
PROFILER_EXECUTABLE
}
PRIVATE device_conv2d_fwd_bias_relu_add_instance
)
target_link_libraries
(
${
PROFILER_EXECUTABLE
}
PRIVATE device_normalization_instance
)
target_link_libraries
(
${
PROFILER_EXECUTABLE
}
PRIVATE device_softmax_instance
)
target_link_libraries
(
${
PROFILER_EXECUTABLE
}
PRIVATE device_reduce_instance
)
rocm_install
(
TARGETS
${
PROFILER_EXECUTABLE
}
COMPONENT profiler
)
profiler/src/profile_batched_gemm.cpp
View file @
8116d2b3
...
...
@@ -8,6 +8,7 @@
#include <cstdlib>
#include "profiler/profile_batched_gemm_impl.hpp"
#include "profiler_operation_registry.hpp"
enum
struct
GemmMatrixLayout
{
...
...
@@ -195,3 +196,5 @@ int profile_batched_gemm(int argc, char* argv[])
return
1
;
}
}
REGISTER_PROFILER_OPERATION
(
"batched_gemm"
,
profile_batched_gemm
)
profiler/src/profile_batched_gemm_add_relu_gemm_add.cpp
View file @
8116d2b3
...
...
@@ -7,6 +7,7 @@
#include <cstdlib>
#include "profiler/profile_batched_gemm_add_relu_gemm_add_impl.hpp"
#include "profiler_operation_registry.hpp"
using
F16
=
ck
::
half_t
;
using
F32
=
float
;
...
...
@@ -207,3 +208,5 @@ int profile_batched_gemm_add_relu_gemm_add(int argc, char* argv[])
return
0
;
}
REGISTER_PROFILER_OPERATION
(
"batched_gemm_add_relu_gemm_add"
,
profile_batched_gemm_add_relu_gemm_add
)
profiler/src/profile_batched_gemm_gemm.cpp
View file @
8116d2b3
...
...
@@ -7,6 +7,7 @@
#include <cstdlib>
#include "profiler/profile_batched_gemm_gemm_impl.hpp"
#include "profiler_operation_registry.hpp"
using
F16
=
ck
::
half_t
;
using
F32
=
float
;
...
...
@@ -179,3 +180,5 @@ int profile_batched_gemm_gemm(int argc, char* argv[])
return
0
;
}
REGISTER_PROFILER_OPERATION
(
"batched_gemm_gemm"
,
profile_batched_gemm_gemm
)
profiler/src/profile_batched_gemm_reduce.cpp
View file @
8116d2b3
...
...
@@ -7,6 +7,7 @@
#include <cstdlib>
#include "profiler/profile_batched_gemm_reduce_impl.hpp"
#include "profiler_operation_registry.hpp"
int
profile_batched_gemm_reduce
(
int
argc
,
char
*
argv
[])
{
...
...
@@ -151,3 +152,5 @@ int profile_batched_gemm_reduce(int argc, char* argv[])
return
0
;
}
REGISTER_PROFILER_OPERATION
(
"batched_gemm_reduce"
,
profile_batched_gemm_reduce
)
profiler/src/profile_conv_bwd_data.cpp
View file @
8116d2b3
...
...
@@ -7,6 +7,7 @@
#include <cstdlib>
#include "profiler/profile_conv_bwd_data_impl.hpp"
#include "profiler_operation_registry.hpp"
namespace
{
...
...
@@ -182,3 +183,5 @@ int profile_conv_bwd_data(int argc, char* argv[])
return
1
;
}
REGISTER_PROFILER_OPERATION
(
"conv_bwd_data"
,
profile_conv_bwd_data
)
profiler/src/profile_conv_fwd.cpp
View file @
8116d2b3
...
...
@@ -7,6 +7,7 @@
#include <cstdlib>
#include "profiler/profile_conv_fwd_impl.hpp"
#include "profiler_operation_registry.hpp"
namespace
{
...
...
@@ -184,3 +185,5 @@ int profile_conv_fwd(int argc, char* argv[])
return
1
;
}
REGISTER_PROFILER_OPERATION
(
"conv_fwd"
,
profile_conv_fwd
)
profiler/src/profile_conv_fwd_bias_relu.cpp
View file @
8116d2b3
...
...
@@ -7,6 +7,7 @@
#include <cstdlib>
#include "profiler/profile_conv_fwd_bias_relu_impl.hpp"
#include "profiler_operation_registry.hpp"
enum
struct
ConvDataType
{
...
...
@@ -114,3 +115,5 @@ int profile_conv_fwd_bias_relu(int argc, char* argv[])
return
0
;
}
REGISTER_PROFILER_OPERATION
(
"conv_fwd_bias_relu"
,
profile_conv_fwd_bias_relu
)
profiler/src/profile_conv_fwd_bias_relu_add.cpp
View file @
8116d2b3
...
...
@@ -7,6 +7,7 @@
#include <cstdlib>
#include "profiler/profile_conv_fwd_bias_relu_add_impl.hpp"
#include "profiler_operation_registry.hpp"
enum
struct
ConvDataType
{
...
...
@@ -115,3 +116,5 @@ int profile_conv_fwd_bias_relu_add(int argc, char* argv[])
return
0
;
}
REGISTER_PROFILER_OPERATION
(
"conv_fwd_bias_relu_add"
,
profile_conv_fwd_bias_relu_add
)
profiler/src/profile_gemm.cpp
View file @
8116d2b3
...
...
@@ -7,6 +7,7 @@
#include <cstdlib>
#include "profiler/profile_gemm_impl.hpp"
#include "profiler_operation_registry.hpp"
enum
struct
GemmMatrixLayout
{
...
...
@@ -184,3 +185,5 @@ int profile_gemm(int argc, char* argv[])
return
1
;
}
}
REGISTER_PROFILER_OPERATION
(
"gemm"
,
profile_gemm
)
profiler/src/profile_gemm_add_add_fastgelu.cpp
View file @
8116d2b3
...
...
@@ -7,6 +7,7 @@
#include <cstdlib>
#include "profiler/profile_gemm_add_add_fastgelu_impl.hpp"
#include "profiler_operation_registry.hpp"
int
profile_gemm_add_add_fastgelu
(
int
argc
,
char
*
argv
[])
{
...
...
@@ -150,3 +151,5 @@ int profile_gemm_add_add_fastgelu(int argc, char* argv[])
return
1
;
}
}
REGISTER_PROFILER_OPERATION
(
"gemm_add_add_fastgelu"
,
profile_gemm_add_add_fastgelu
)
profiler/src/profile_gemm_bias_add_reduce.cpp
View file @
8116d2b3
...
...
@@ -7,6 +7,7 @@
#include <cstdlib>
#include "profiler/profile_gemm_bias_add_reduce_impl.hpp"
#include "profiler_operation_registry.hpp"
int
profile_gemm_bias_add_reduce
(
int
argc
,
char
*
argv
[])
{
...
...
@@ -159,3 +160,5 @@ int profile_gemm_bias_add_reduce(int argc, char* argv[])
return
0
;
}
REGISTER_PROFILER_OPERATION
(
"gemm_bias_add_reduce"
,
profile_gemm_bias_add_reduce
)
profiler/src/profile_gemm_bilinear.cpp
View file @
8116d2b3
...
...
@@ -7,6 +7,7 @@
#include <cstdlib>
#include "profiler/profile_gemm_bilinear_impl.hpp"
#include "profiler_operation_registry.hpp"
int
profile_gemm_bilinear
(
int
argc
,
char
*
argv
[])
{
...
...
@@ -144,3 +145,5 @@ int profile_gemm_bilinear(int argc, char* argv[])
return
1
;
}
}
REGISTER_PROFILER_OPERATION
(
"gemm_bilinear"
,
profile_gemm_bilinear
)
profiler/src/profile_gemm_reduce.cpp
View file @
8116d2b3
...
...
@@ -7,6 +7,7 @@
#include <cstdlib>
#include "profiler/profile_gemm_reduce_impl.hpp"
#include "profiler_operation_registry.hpp"
int
profile_gemm_reduce
(
int
argc
,
char
*
argv
[])
{
...
...
@@ -146,3 +147,5 @@ int profile_gemm_reduce(int argc, char* argv[])
return
0
;
}
REGISTER_PROFILER_OPERATION
(
"gemm_reduce"
,
profile_gemm_reduce
)
profiler/src/profile_gemm_splitk.cpp
View file @
8116d2b3
...
...
@@ -7,6 +7,7 @@
#include <cstdlib>
#include "profiler/profile_gemm_splitk_impl.hpp"
#include "profiler_operation_registry.hpp"
enum
struct
GemmMatrixLayout
{
...
...
@@ -146,3 +147,5 @@ int profile_gemm_splitk(int argc, char* argv[])
return
1
;
}
}
REGISTER_PROFILER_OPERATION
(
"gemm_splitk"
,
profile_gemm_splitk
)
profiler/src/profile_grouped_conv_bwd_weight.cpp
View file @
8116d2b3
...
...
@@ -7,6 +7,7 @@
#include <numeric>
#include "profiler/profile_grouped_conv_bwd_weight_impl.hpp"
#include "profiler_operation_registry.hpp"
namespace
{
...
...
@@ -174,3 +175,5 @@ int profile_grouped_conv_bwd_weight(int argc, char* argv[])
return
1
;
}
REGISTER_PROFILER_OPERATION
(
"grouped_conv_bwd_weight"
,
profile_grouped_conv_bwd_weight
)
profiler/src/profile_grouped_conv_fwd.cpp
View file @
8116d2b3
...
...
@@ -7,6 +7,7 @@
#include <cstdlib>
#include "profiler/profile_grouped_conv_fwd_impl.hpp"
#include "profiler_operation_registry.hpp"
namespace
{
...
...
@@ -252,3 +253,5 @@ int profile_grouped_conv_fwd(int argc, char* argv[])
return
1
;
}
REGISTER_PROFILER_OPERATION
(
"grouped_conv_fwd"
,
profile_grouped_conv_fwd
)
profiler/src/profile_grouped_gemm.cpp
View file @
8116d2b3
...
...
@@ -7,6 +7,7 @@
#include <cstdlib>
#include "profiler/profile_grouped_gemm_impl.hpp"
#include "profiler_operation_registry.hpp"
enum
struct
GemmMatrixLayout
{
...
...
@@ -161,3 +162,5 @@ int profile_grouped_gemm(int argc, char* argv[])
return
0
;
}
REGISTER_PROFILER_OPERATION
(
"grouped_gemm"
,
profile_grouped_gemm
)
profiler/src/profile_groupnorm.cpp
View file @
8116d2b3
...
...
@@ -7,6 +7,7 @@
#include "profiler/data_type_enum.hpp"
#include "profiler/profile_groupnorm_impl.hpp"
#include "profiler_operation_registry.hpp"
using
ck
::
index_t
;
...
...
@@ -104,3 +105,5 @@ int profile_groupnorm(int argc, char* argv[])
return
0
;
}
REGISTER_PROFILER_OPERATION
(
"groupnorm"
,
profile_groupnorm
)
profiler/src/profile_layernorm.cpp
View file @
8116d2b3
...
...
@@ -7,6 +7,7 @@
#include "profiler/data_type_enum.hpp"
#include "profiler/profile_layernorm_impl.hpp"
#include "profiler_operation_registry.hpp"
using
ck
::
index_t
;
...
...
@@ -96,3 +97,5 @@ int profile_layernorm(int argc, char* argv[])
return
0
;
}
REGISTER_PROFILER_OPERATION
(
"layernorm"
,
profile_layernorm
)
Prev
1
2
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment