Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
composable_kernel_ROCM
Commits
468b8227
Commit
468b8227
authored
Mar 19, 2024
by
Adam Osewski
Browse files
Merge remote-tracking branch 'origin/develop' into aosewski/ggemm_multi_d2
parents
af469e6b
9e011bcd
Changes
163
Hide whitespace changes
Inline
Side-by-side
Showing
3 changed files
with
10 additions
and
20 deletions
+10
-20
script/run_full_performance_tests.sh
script/run_full_performance_tests.sh
+8
-18
test/grouped_convnd_bwd_data/CMakeLists.txt
test/grouped_convnd_bwd_data/CMakeLists.txt
+1
-1
test/grouped_convnd_bwd_weight/CMakeLists.txt
test/grouped_convnd_bwd_weight/CMakeLists.txt
+1
-1
No files found.
script/run_full_performance_tests.sh
View file @
468b8227
...
@@ -121,26 +121,16 @@ print_log_header $reduction_log $env_type $branch $host_name
...
@@ -121,26 +121,16 @@ print_log_header $reduction_log $env_type $branch $host_name
./profile_reduce_no_index.sh
$verify
2 10
--half
2>&1 |
tee
-a
$reduction_log
./profile_reduce_no_index.sh
$verify
2 10
--half
2>&1 |
tee
-a
$reduction_log
#run splitK_gemm tests, first correctness verification, then performance
#run splitK_gemm tests, first correctness verification, then performance
export
splitK_gemm_ver_log
=
"perf_splitK_gemm_verify.log"
print_log_header
$splitK_gemm_ver_log
$env_type
$branch
$host_name
./profile_splitK_gemm.sh gemm_splitk 0 0
$verify
1 0 0 4 2>&1 |
tee
-a
$splitK_gemm_ver_log
./profile_splitK_gemm.sh gemm_splitk 0 1
$verify
1 0 0 4 2>&1 |
tee
-a
$splitK_gemm_ver_log
./profile_splitK_gemm.sh gemm_splitk 0 2
$verify
1 0 0 4 2>&1 |
tee
-a
$splitK_gemm_ver_log
./profile_splitK_gemm.sh gemm_splitk 0 3
$verify
1 0 0 4 2>&1 |
tee
-a
$splitK_gemm_ver_log
./profile_splitK_gemm.sh gemm_splitk 1 0
$verify
1 0 0 4 2>&1 |
tee
-a
$splitK_gemm_ver_log
./profile_splitK_gemm.sh gemm_splitk 1 1
$verify
1 0 0 4 2>&1 |
tee
-a
$splitK_gemm_ver_log
./profile_splitK_gemm.sh gemm_splitk 1 2
$verify
1 0 0 4 2>&1 |
tee
-a
$splitK_gemm_ver_log
./profile_splitK_gemm.sh gemm_splitk 1 3
$verify
1 0 0 4 2>&1 |
tee
-a
$splitK_gemm_ver_log
export
splitK_gemm_log
=
"perf_splitK_gemm.log"
export
splitK_gemm_log
=
"perf_splitK_gemm.log"
print_log_header
$splitK_gemm_log
$env_type
$branch
$host_name
print_log_header
$splitK_gemm_log
$env_type
$branch
$host_name
./profile_splitK_gemm.sh gemm_splitk 0 0
0
1 0 1 4 2>&1 |
tee
-a
$splitK_gemm_log
./profile_splitK_gemm.sh gemm_splitk 0 0
$verify
1 0 1 4 2>&1 |
tee
-a
$splitK_gemm_log
./profile_splitK_gemm.sh gemm_splitk 0 1
0
1 0 1 4 2>&1 |
tee
-a
$splitK_gemm_log
./profile_splitK_gemm.sh gemm_splitk 0 1
$verify
1 0 1 4 2>&1 |
tee
-a
$splitK_gemm_log
./profile_splitK_gemm.sh gemm_splitk 0 2
0
1 0 1 4 2>&1 |
tee
-a
$splitK_gemm_log
./profile_splitK_gemm.sh gemm_splitk 0 2
$verify
1 0 1 4 2>&1 |
tee
-a
$splitK_gemm_log
./profile_splitK_gemm.sh gemm_splitk 0 3
0
1 0 1 4 2>&1 |
tee
-a
$splitK_gemm_log
./profile_splitK_gemm.sh gemm_splitk 0 3
$verify
1 0 1 4 2>&1 |
tee
-a
$splitK_gemm_log
./profile_splitK_gemm.sh gemm_splitk 1 0
0
1 0 1 4 2>&1 |
tee
-a
$splitK_gemm_log
./profile_splitK_gemm.sh gemm_splitk 1 0
$verify
1 0 1 4 2>&1 |
tee
-a
$splitK_gemm_log
./profile_splitK_gemm.sh gemm_splitk 1 1
0
1 0 1 4 2>&1 |
tee
-a
$splitK_gemm_log
./profile_splitK_gemm.sh gemm_splitk 1 1
$verify
1 0 1 4 2>&1 |
tee
-a
$splitK_gemm_log
./profile_splitK_gemm.sh gemm_splitk 1 2
0
1 0 1 4 2>&1 |
tee
-a
$splitK_gemm_log
./profile_splitK_gemm.sh gemm_splitk 1 2
$verify
1 0 1 4 2>&1 |
tee
-a
$splitK_gemm_log
./profile_splitK_gemm.sh gemm_splitk 1 3
0
1 0 1 4 2>&1 |
tee
-a
$splitK_gemm_log
./profile_splitK_gemm.sh gemm_splitk 1 3
$verify
1 0 1 4 2>&1 |
tee
-a
$splitK_gemm_log
#run ONNX gemm tests
#run ONNX gemm tests
export
onnx_log
=
"perf_onnx_gemm.log"
export
onnx_log
=
"perf_onnx_gemm.log"
...
...
test/grouped_convnd_bwd_data/CMakeLists.txt
View file @
468b8227
list
(
APPEND gpu_list_xdl gfx908 gfx90a gfx940
)
list
(
APPEND gpu_list_xdl gfx908 gfx90a gfx940
)
list
(
APPEND gpu_list_wmma gfx1100 gfx1101 gfx1102
)
list
(
APPEND gpu_list_wmma gfx1100 gfx1101 gfx1102
gfx1103
)
set
(
target 0
)
set
(
target 0
)
foreach
(
gpu IN LISTS GPU_TARGETS
)
foreach
(
gpu IN LISTS GPU_TARGETS
)
if
(
gpu IN_LIST gpu_list_xdl AND target EQUAL 0
)
if
(
gpu IN_LIST gpu_list_xdl AND target EQUAL 0
)
...
...
test/grouped_convnd_bwd_weight/CMakeLists.txt
View file @
468b8227
list
(
APPEND gpu_list_xdl gfx908 gfx90a gfx940 gfx941 gfx942
)
list
(
APPEND gpu_list_xdl gfx908 gfx90a gfx940 gfx941 gfx942
)
list
(
APPEND gpu_list_wmma gfx1100 gfx1101 gfx1102
)
list
(
APPEND gpu_list_wmma gfx1100 gfx1101 gfx1102
gfx1103
)
set
(
target 0
)
set
(
target 0
)
foreach
(
gpu IN LISTS GPU_TARGETS
)
foreach
(
gpu IN LISTS GPU_TARGETS
)
...
...
Prev
1
…
5
6
7
8
9
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment