Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
composable_kernel
Commits
c6a03cde
Commit
c6a03cde
authored
Nov 29, 2023
by
aska-0096
Browse files
add restrict qualifier for dynamic buffer (LDS) pointer
parent
8cc53111
Changes
2
Show whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
4 additions
and
6 deletions
+4
-6
include/ck/tensor_operation/gpu/grid/gridwise_gemm_xdl_cshuffle_v1_doublelds.hpp
...tion/gpu/grid/gridwise_gemm_xdl_cshuffle_v1_doublelds.hpp
+2
-4
include/ck/utility/dynamic_buffer.hpp
include/ck/utility/dynamic_buffer.hpp
+2
-2
No files found.
include/ck/tensor_operation/gpu/grid/gridwise_gemm_xdl_cshuffle_v1_doublelds.hpp
View file @
c6a03cde
...
@@ -784,8 +784,7 @@ struct GridwiseGemm_k0mk1_k0nk1_mn_xdl_cshuffle_v1
...
@@ -784,8 +784,7 @@ struct GridwiseGemm_k0mk1_k0nk1_mn_xdl_cshuffle_v1
1
,
1
,
1
,
1
,
AThreadTransferSrcResetCoordinateAfterRun
,
AThreadTransferSrcResetCoordinateAfterRun
,
true
,
true
>
(
NumGemmKPrefetchStage
>
(
a_grid_desc_ak0_m_ak1
,
a_grid_desc_ak0_m_ak1
,
make_multi_index
(
0
,
m_block_data_idx_on_grid
,
0
),
make_multi_index
(
0
,
m_block_data_idx_on_grid
,
0
),
a_element_op
,
a_element_op
,
...
@@ -815,8 +814,7 @@ struct GridwiseGemm_k0mk1_k0nk1_mn_xdl_cshuffle_v1
...
@@ -815,8 +814,7 @@ struct GridwiseGemm_k0mk1_k0nk1_mn_xdl_cshuffle_v1
1
,
1
,
1
,
1
,
BThreadTransferSrcResetCoordinateAfterRun
,
BThreadTransferSrcResetCoordinateAfterRun
,
true
,
true
>
(
NumGemmKPrefetchStage
>
(
b_grid_desc_bk0_n_bk1
,
b_grid_desc_bk0_n_bk1
,
make_multi_index
(
0
,
n_block_data_idx_on_grid
,
0
),
make_multi_index
(
0
,
n_block_data_idx_on_grid
,
0
),
b_element_op
,
b_element_op
,
...
...
include/ck/utility/dynamic_buffer.hpp
View file @
c6a03cde
...
@@ -25,7 +25,7 @@ struct DynamicBuffer
...
@@ -25,7 +25,7 @@ struct DynamicBuffer
{
{
using
type
=
T
;
using
type
=
T
;
T
*
p_data_
;
T
*
__restrict__
p_data_
;
ElementSpaceSize
element_space_size_
;
ElementSpaceSize
element_space_size_
;
T
invalid_element_value_
=
T
{
0
};
T
invalid_element_value_
=
T
{
0
};
...
@@ -410,7 +410,7 @@ template <AddressSpaceEnum BufferAddressSpace,
...
@@ -410,7 +410,7 @@ template <AddressSpaceEnum BufferAddressSpace,
AmdBufferCoherenceEnum
coherence
=
AmdBufferCoherenceEnum
::
DefaultCoherence
,
AmdBufferCoherenceEnum
coherence
=
AmdBufferCoherenceEnum
::
DefaultCoherence
,
typename
T
,
typename
T
,
typename
ElementSpaceSize
>
typename
ElementSpaceSize
>
__host__
__device__
constexpr
auto
make_dynamic_buffer
(
T
*
p
,
ElementSpaceSize
element_space_size
)
__host__
__device__
constexpr
auto
make_dynamic_buffer
(
T
*
__restrict__
p
,
ElementSpaceSize
element_space_size
)
{
{
return
DynamicBuffer
<
BufferAddressSpace
,
T
,
ElementSpaceSize
,
true
,
coherence
>
{
return
DynamicBuffer
<
BufferAddressSpace
,
T
,
ElementSpaceSize
,
true
,
coherence
>
{
p
,
element_space_size
};
p
,
element_space_size
};
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment