Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
composable_kernel
Commits
ca0f9579
"driver/driver.cpp" did not exist on "8bd6ea1a9756c9e6f84df7c794ea3d23389aacd5"
Commit
ca0f9579
authored
Sep 18, 2023
by
Jing Zhang
Browse files
minor fix
parent
9a30e154
Changes
2
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
4 additions
and
3 deletions
+4
-3
example/60_gemm_multiABD/gemm_multiABD_xdl_fp16.cpp
example/60_gemm_multiABD/gemm_multiABD_xdl_fp16.cpp
+1
-1
include/ck/tensor_operation/gpu/thread/threadwise_tensor_slice_transfer_v7r2.hpp
...tion/gpu/thread/threadwise_tensor_slice_transfer_v7r2.hpp
+3
-2
No files found.
example/60_gemm_multiABD/gemm_multiABD_xdl_fp16.cpp
View file @
ca0f9579
...
@@ -55,7 +55,7 @@ struct Add
...
@@ -55,7 +55,7 @@ struct Add
a
=
a0
+
a1
;
a
=
a0
+
a1
;
}
}
static
constexpr
ck
::
index_t
vec_len
=
2
;
static
constexpr
ck
::
index_t
vec_len
=
4
;
};
};
struct
AlphaBetaAdd
struct
AlphaBetaAdd
...
...
include/ck/tensor_operation/gpu/thread/threadwise_tensor_slice_transfer_v7r2.hpp
View file @
ca0f9579
...
@@ -166,8 +166,9 @@ struct ThreadwiseTensorSliceTransfer_v7r2
...
@@ -166,8 +166,9 @@ struct ThreadwiseTensorSliceTransfer_v7r2
static_assert
(
is_same
<
remove_cvref_t
<
decltype
(
elem_op_vec_len
)
>
,
index_t
>::
value
,
static_assert
(
is_same
<
remove_cvref_t
<
decltype
(
elem_op_vec_len
)
>
,
index_t
>::
value
,
"vec_len in element_op_ type is not index_t"
);
"vec_len in element_op_ type is not index_t"
);
static_assert
(
elem_op_vec_len
==
2
||
elem_op_vec_len
==
4
||
elem_op_vec_len
==
8
,
static_assert
(
elem_op_vec_len
==
1
||
elem_op_vec_len
==
2
||
"vec_len in element_op_ must be 2, 4, 8"
);
elem_op_vec_len
==
4
||
elem_op_vec_len
==
8
,
"vec_len in element_op_ must be 1, 2, 4, 8"
);
static_assert
(
SrcScalarPerVector
%
elem_op_vec_len
==
0
,
static_assert
(
SrcScalarPerVector
%
elem_op_vec_len
==
0
,
"vec_len in element_op_ cannot be divided by SrcScalarPerVector!"
);
"vec_len in element_op_ cannot be divided by SrcScalarPerVector!"
);
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment