Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
composable_kernel_ROCM
Commits
924639f9
Commit
924639f9
authored
Feb 27, 2024
by
aska-0096
Browse files
remove unnecessary changes
parent
4c102fcc
Changes
7
Hide whitespace changes
Inline
Side-by-side
Showing
7 changed files
with
7 additions
and
59 deletions
+7
-59
CMakeLists.txt
CMakeLists.txt
+1
-0
example/13_pool2d_fwd/pool2d_fwd_common.hpp
example/13_pool2d_fwd/pool2d_fwd_common.hpp
+3
-3
example/13_pool2d_fwd/pool2d_fwd_fp16.cpp
example/13_pool2d_fwd/pool2d_fwd_fp16.cpp
+1
-1
example/32_batched_gemm_scale_softmax_gemm/run_batched_gemm_scale_softmax_gemm_permute.inc
...tmax_gemm/run_batched_gemm_scale_softmax_gemm_permute.inc
+1
-1
include/ck/ck.hpp
include/ck/ck.hpp
+0
-1
script/cmake-ck-dev.sh
script/cmake-ck-dev.sh
+1
-1
script/unet_mha.sh
script/unet_mha.sh
+0
-52
No files found.
CMakeLists.txt
View file @
924639f9
...
...
@@ -410,6 +410,7 @@ include_directories(BEFORE
SET
(
BUILD_DEV ON CACHE BOOL
"BUILD_DEV"
)
if
(
BUILD_DEV
)
add_compile_options
(
-Werror
)
add_compile_options
(
-Weverything
)
endif
()
message
(
"CMAKE_CXX_FLAGS:
${
CMAKE_CXX_FLAGS
}
"
)
...
...
example/13_pool2d_fwd/pool2d_fwd_common.hpp
View file @
924639f9
...
...
@@ -123,9 +123,9 @@ bool pool_test(bool do_verification,
{
N
,
C
,
Hi
,
Wi
},
{
Y
,
X
},
{
N
,
C
,
Ho
,
Wo
},
{},
{},
{},
{
C
*
Hi
*
Wi
,
1
,
Wi
*
C
,
C
},
{
C
*
Ho
*
Wo
,
1
,
Wo
*
C
,
C
},
{
C
*
Ho
*
Wo
,
1
,
Wo
*
C
,
C
},
window_strides
,
window_dilations
,
input_left_pads
,
...
...
example/13_pool2d_fwd/pool2d_fwd_fp16.cpp
View file @
924639f9
...
...
@@ -18,7 +18,7 @@ using IndexDataType = int32_t;
using
InLayout
=
ck
::
tensor_layout
::
convolution
::
NHWC
;
using
OutLayout
=
ck
::
tensor_layout
::
convolution
::
NHWC
;
#if
0
#if
1
static
constexpr
auto
ReduceOpId
=
ck
::
ReduceTensorOp
::
MAX
;
#else
static
constexpr
auto
ReduceOpId
=
ck
::
ReduceTensorOp
::
AVG
;
...
...
example/32_batched_gemm_scale_softmax_gemm/run_batched_gemm_scale_softmax_gemm_permute.inc
View file @
924639f9
// SPDX-License-Identifier: MIT
// Copyright (c) 2018-202
2
, Advanced Micro Devices, Inc. All rights reserved.
// Copyright (c) 2018-202
3
, Advanced Micro Devices, Inc. All rights reserved.
int
run
(
int
argc
,
char
*
argv
[])
{
...
...
include/ck/ck.hpp
View file @
924639f9
...
...
@@ -108,7 +108,6 @@
#define CK_USE_AMD_WMMA
#endif
// TODO: enable buffer load when found correct 3rd dword
// buffer load
#define CK_USE_AMD_BUFFER_LOAD 1
...
...
script/cmake-ck-dev.sh
View file @
924639f9
...
...
@@ -11,7 +11,7 @@ cmake
-D
CMAKE_CXX_FLAGS
=
"-std=c++17 -O3 -ftemplate-backtrace-limit=0 -fPIE -Wno-gnu-line-marker"
\
-D
CMAKE_BUILD_TYPE
=
Release
\
-D
BUILD_DEV
=
ON
\
-D
GPU_TARGETS
=
"gfx
110
0"
\
-D
GPU_TARGETS
=
"gfx
908;gfx90a;gfx94
0"
\
-D
CMAKE_VERBOSE_MAKEFILE:BOOL
=
ON
\
-D
USE_BITINT_EXTENSION_INT4
=
OFF
\
${
MY_PROJECT_SOURCE
}
script/unet_mha.sh
deleted
100644 → 0
View file @
4c102fcc
#!/bin/bash
while
getopts
e: flag
do
case
"
${
flag
}
"
in
e
)
executable
=
${
OPTARG
}
;;
esac
done
echo
"CK-NAVI31 Performance Test: MHA for AITemplate"
VERIFICATION
=
0
INITIALIZE
=
1
TIMING
=
1
ALL_TEST_CASE
=
0
SELF_ATTENTION
=
1
CROSS_ATTENTION
=
0
CAUSAL_MASK
=
0
# self attention with causal mask
if
[
$ALL_TEST_CASE
-eq
1
]
||
{
[
$SELF_ATTENTION
-eq
1
]
&&
[
$CAUSAL_MASK
-eq
1
]
;
}
;
then
echo
"Test launched: self attention with causal mask"
./bin/example_batched_gemm_lower_triangle_scale_softmax_gemm_permute_wmma_fp16
$VERIFICATION
1
$TIMING
4096 4096 40 40 2 8 0.158113881945610 1 1
./bin/example_batched_gemm_lower_triangle_scale_softmax_gemm_permute_wmma_fp16
$VERIFICATION
1
$TIMING
1024 1024 80 80 2 8 0.111803397536277 1 1
./bin/example_batched_gemm_lower_triangle_scale_softmax_gemm_permute_wmma_fp16
$VERIFICATION
1
$TIMING
256 256 160 160 2 8 0.079056940972805 1 1
./bin/example_batched_gemm_lower_triangle_scale_softmax_gemm_permute_wmma_fp16
$VERIFICATION
1
$TIMING
64 64 160 160 2 8 0.079056940972805 1 1
fi
# cross attention with causal mask
if
[
$ALL_TEST_CASE
-eq
1
]
||
{
[
$CROSS_ATTENTION
-eq
1
]
&&
[
$CAUSAL_MASK
-eq
1
]
;
}
;
then
echo
"Test launched: cross attention with causal mask"
./bin/example_batched_gemm_lower_triangle_scale_softmax_gemm_permute_wmma_fp16
$VERIFICATION
1
$TIMING
4096 64 40 40 2 8 0.158113881945610 1 1
./bin/example_batched_gemm_lower_triangle_scale_softmax_gemm_permute_wmma_fp16
$VERIFICATION
1
$TIMING
1024 64 80 80 2 8 0.111803397536277 1 1
./bin/example_batched_gemm_lower_triangle_scale_softmax_gemm_permute_wmma_fp16
$VERIFICATION
1
$TIMING
256 64 160 160 2 8 0.079056940972805 1 1
./bin/example_batched_gemm_lower_triangle_scale_softmax_gemm_permute_wmma_fp16
$VERIFICATION
1
$TIMING
64 64 160 160 2 8 0.079056940972805 1 1
fi
# self attention without causal mask
if
[
$ALL_TEST_CASE
-eq
1
]
||
{
[
$SELF_ATTENTION
-eq
1
]
&&
[
$CAUSAL_MASK
-eq
0
]
;
}
;
then
echo
"Test launched: self attention without causal mask"
$executable
$VERIFICATION
$INITIALIZE
$TIMING
4096 4096 64 64 2 5 0.125 1 1
$executable
$VERIFICATION
$INITIALIZE
$TIMING
1024 1024 64 64 2 10 0.125 1 1
$executable
$VERIFICATION
$INITIALIZE
$TIMING
256 256 64 64 2 20 0.125 1 1
$executable
$VERIFICATION
$INITIALIZE
$TIMING
64 64 64 64 2 20 0.125 1 1
fi
# cross attention without causal mask
if
[
$ALL_TEST_CASE
-eq
1
]
||
{
[
$CROSS_ATTENTION
-eq
1
]
&&
[
$CAUSAL_MASK
-eq
0
]
;
}
;
then
echo
"Test launched: cross attention without causal mask"
$executable
$VERIFICATION
1
$TIMING
4096 64 40 40 2 8 0.158113881945610 1 1
$executable
$VERIFICATION
1
$TIMING
1024 64 80 80 2 8 0.111803397536277 1 1
$executable
$VERIFICATION
1
$TIMING
256 64 160 160 2 8 0.079056940972805 1 1
$executable
$VERIFICATION
1
$TIMING
64 64 160 160 2 8 0.079056940972805 1 1
fi
\ No newline at end of file
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment