Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
composable_kernel
Commits
a71a3f65
Commit
a71a3f65
authored
Jul 05, 2023
by
ltqin
Browse files
add group
parent
5938d555
Changes
5
Expand all
Show whitespace changes
Inline
Side-by-side
Showing
5 changed files
with
3584 additions
and
4 deletions
+3584
-4
example/32_batched_gemm_scale_softmax_gemm/CMakeLists.txt
example/32_batched_gemm_scale_softmax_gemm/CMakeLists.txt
+2
-1
example/32_batched_gemm_scale_softmax_gemm/grouped_multihead_attention_backward_v3.cpp
..._softmax_gemm/grouped_multihead_attention_backward_v3.cpp
+849
-0
include/ck/tensor_operation/gpu/device/impl/device_grouped_mha_bwd_xdl_cshuffle_qloop_light_v1.hpp
...pl/device_grouped_mha_bwd_xdl_cshuffle_qloop_light_v1.hpp
+1363
-0
include/ck/tensor_operation/gpu/device/impl/device_grouped_mha_bwd_xdl_cshuffle_qloop_light_v2.hpp
...pl/device_grouped_mha_bwd_xdl_cshuffle_qloop_light_v2.hpp
+1369
-0
include/ck/tensor_operation/gpu/grid/gridwise_batched_multihead_attention_bacckward_ydotygrad.hpp
...dwise_batched_multihead_attention_bacckward_ydotygrad.hpp
+1
-3
No files found.
example/32_batched_gemm_scale_softmax_gemm/CMakeLists.txt
View file @
a71a3f65
...
...
@@ -15,10 +15,11 @@ add_example_executable(example_grouped_multihead_attention_forward_v2 grouped_mu
add_example_executable
(
example_batched_multihead_attention_forward_v2 batched_multihead_attention_forward_v2.cpp
)
add_example_executable
(
example_grouped_multihead_attention_backward_v2 grouped_multihead_attention_backward_v2.cpp
)
add_example_executable
(
example_batched_multihead_attention_backward_v2 batched_multihead_attention_backward_v2.cpp
)
add_example_executable
(
example_batched_multihead_attention_backward_v3 batched_multihead_attention_backward_v3.cpp
)
add_example_executable
(
example_batched_multihead_attention_backward_v2_phased batched_multihead_attention_backward_v2_phased.cpp
)
add_example_executable
(
example_grouped_multihead_attention_train_v2 grouped_multihead_attention_train_v2.cpp
)
add_example_executable
(
example_batched_multihead_attention_train_v2 batched_multihead_attention_train_v2.cpp
)
add_example_executable
(
example_batched_multihead_attention_backward_v3 batched_multihead_attention_backward_v3.cpp
)
add_example_executable
(
example_grouped_multihead_attention_backward_v3 grouped_multihead_attention_backward_v3.cpp
)
add_custom_target
(
example_gemm_scale_softmax_gemm
)
add_dependencies
(
example_gemm_scale_softmax_gemm example_batched_gemm_scale_softmax_gemm_xdl_fp16
)
...
...
example/32_batched_gemm_scale_softmax_gemm/grouped_multihead_attention_backward_v3.cpp
0 → 100644
View file @
a71a3f65
This diff is collapsed.
Click to expand it.
include/ck/tensor_operation/gpu/device/impl/device_grouped_mha_bwd_xdl_cshuffle_qloop_light_v1.hpp
0 → 100644
View file @
a71a3f65
This diff is collapsed.
Click to expand it.
include/ck/tensor_operation/gpu/device/impl/device_grouped_mha_bwd_xdl_cshuffle_qloop_light_v2.hpp
0 → 100644
View file @
a71a3f65
This diff is collapsed.
Click to expand it.
include/ck/tensor_operation/gpu/grid/gridwise_batched_multihead_attention_bacckward_ydotygrad.hpp
View file @
a71a3f65
...
...
@@ -135,8 +135,6 @@ struct GridwiseBatchedMultiheadAttentionBackward_YDotYGrad
return
MPerBlock
*
sizeof
(
FloatD
);
}
__device__
static
void
test
()
{}
template
<
typename
Block2CTileMap
>
__device__
static
void
Run
(
const
InputDataType
*
__restrict__
p_y_grid
,
const
InputDataType
*
__restrict__
p_ygrad_grid
,
FloatD
*
__restrict__
p_d_grid
,
...
...
@@ -144,7 +142,7 @@ struct GridwiseBatchedMultiheadAttentionBackward_YDotYGrad
const
YGridDescriptor_MBlock_MPerBlock_OBlock_OPerBlock
&
y_grid_desc_mblock_mperblock_oblock_operblock
,
const
DGridDesc_M
&
d_grid_desc_m
,
const
Block2CTileMap
&
block_2_ctile_map
)
const
Default
Block2CTileMap
&
block_2_ctile_map
)
{
const
auto
y_grid_buf
=
make_dynamic_buffer
<
AddressSpaceEnum
::
Global
>
(
p_y_grid
,
y_grid_desc_mblock_mperblock_oblock_operblock
.
GetElementSpaceSize
());
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment