Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
composable_kernel_ROCM
Commits
e3e38fe3
Commit
e3e38fe3
authored
Jun 23, 2023
by
Adam Osewski
Browse files
Debug messages.
parent
8986060e
Changes
1
Show whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
22 additions
and
0 deletions
+22
-0
include/ck/tensor_operation/gpu/thread/threadwise_tensor_slice_transfer.hpp
...operation/gpu/thread/threadwise_tensor_slice_transfer.hpp
+22
-0
No files found.
include/ck/tensor_operation/gpu/thread/threadwise_tensor_slice_transfer.hpp
View file @
e3e38fe3
...
@@ -72,6 +72,13 @@ struct ThreadwiseTensorSliceTransfer_v1r3
...
@@ -72,6 +72,13 @@ struct ThreadwiseTensorSliceTransfer_v1r3
using
DstCoordStep
=
decltype
(
make_tensor_coordinate_step
(
DstDesc
{},
Index
{}));
using
DstCoordStep
=
decltype
(
make_tensor_coordinate_step
(
DstDesc
{},
Index
{}));
/// Debug helper: checks the calling thread's local 1-D id against a
/// compile-time list of ids.
///
/// @tparam Ids  Thread ids to compare against the value returned by
///              get_thread_local_1d_id().
/// @return true when the id returned by get_thread_local_1d_id() equals at
///         least one entry of Ids; false otherwise (including when Ids is
///         empty, since a fold over `||` of an empty pack yields false).
template <index_t... Ids>
__device__ static bool is_thread_local_1d_id_idx()
{
    // Query the id once so every comparison sees the same value.
    const auto this_thread_id = get_thread_local_1d_id();

    // Short-circuiting fold: stops at the first matching id.
    const bool matches_any = (... || (this_thread_id == Ids));
    return matches_any;
}
__device__
constexpr
ThreadwiseTensorSliceTransfer_v1r3
(
const
DstDesc
&
dst_desc
,
__device__
constexpr
ThreadwiseTensorSliceTransfer_v1r3
(
const
DstDesc
&
dst_desc
,
const
Index
&
dst_slice_origin_idx
,
const
Index
&
dst_slice_origin_idx
,
const
ElementwiseOperation
&
element_op
)
const
ElementwiseOperation
&
element_op
)
...
@@ -155,6 +162,21 @@ struct ThreadwiseTensorSliceTransfer_v1r3
...
@@ -155,6 +162,21 @@ struct ThreadwiseTensorSliceTransfer_v1r3
is_dst_valid
,
is_dst_valid
,
dst_vector
.
template
AsType
<
dst_vector_t
>()[
Number
<
0
>
{}]);
dst_vector
.
template
AsType
<
dst_vector_t
>()[
Number
<
0
>
{}]);
// if (get_block_1d_id() == 0 && is_thread_local_1d_id_idx<3,69>())
// {
// printf("tid: %d, dst_coord_: [%d, %d, %d, %d, %d, %d, %d, %d]\n",
// get_thread_local_1d_id(),
// dst_coord_.GetIndex()[Number<0>{}],
// dst_coord_.GetIndex()[Number<1>{}],
// dst_coord_.GetIndex()[Number<2>{}],
// dst_coord_.GetIndex()[Number<3>{}],
// dst_coord_.GetIndex()[Number<4>{}],
// dst_coord_.GetIndex()[Number<5>{}],
// dst_coord_.GetIndex()[Number<6>{}],
// dst_coord_.GetIndex()[Number<7>{}]
// );
// }
if
constexpr
(
idx_1d
.
value
!=
num_access
-
1
)
if
constexpr
(
idx_1d
.
value
!=
num_access
-
1
)
{
{
constexpr
auto
forward_step
=
SpaceFillingCurve
::
GetForwardStep
(
idx_1d
);
constexpr
auto
forward_step
=
SpaceFillingCurve
::
GetForwardStep
(
idx_1d
);
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment