Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
composable_kernel_ROCM
Commits
bdf6cddb
"vscode:/vscode.git/clone" did not exist on "1066fe4cbc24ba21f9d0dec7886f35bb91afa281"
Commit
bdf6cddb
authored
Apr 21, 2024
by
root
Browse files
clean up
parent
1bc44df2
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
2 additions
and
4 deletions
+2
-4
example/04_gemm_add_add_fastgelu/gemm_add_add_fastgelu_xdl_bf16_int8.cpp
..._add_add_fastgelu/gemm_add_add_fastgelu_xdl_bf16_int8.cpp
+2
-4
No files found.
example/04_gemm_add_add_fastgelu/gemm_add_add_fastgelu_xdl_bf16_int8.cpp
View file @
bdf6cddb
...
@@ -79,7 +79,7 @@ struct PassThroughPack2
...
@@ -79,7 +79,7 @@ struct PassThroughPack2
__host__
__device__
constexpr
void
operator
()(
ck
::
bhalf2_t
&
y
,
const
ck
::
int8x2_t
&
x
)
const
__host__
__device__
constexpr
void
operator
()(
ck
::
bhalf2_t
&
y
,
const
ck
::
int8x2_t
&
x
)
const
{
{
y
=
ck
::
bit_cast
<
ck
::
bhalf2_t
>
(
static_cast
<
int32_t
>
(
ck
::
bit_cast
<
int16_t
>
(
x
)));
y
=
ck
::
bit_cast
<
ck
::
bhalf2_t
>
(
static_cast
<
int32_t
>
(
ck
::
bit_cast
<
int16_t
>
(
x
)));
}
}
template
<
>
template
<
>
...
@@ -91,12 +91,10 @@ struct PassThroughPack2
...
@@ -91,12 +91,10 @@ struct PassThroughPack2
constexpr
const
static
bool
is_pack2_invocable
=
true
;
constexpr
const
static
bool
is_pack2_invocable
=
true
;
};
};
using
PassThrough
=
ck
::
tensor_operation
::
element_wise
::
PassThrough
;
using
PassThrough
=
ck
::
tensor_operation
::
element_wise
::
PassThrough
;
using
AddFastGelu
=
ck
::
tensor_operation
::
element_wise
::
AddFastGelu
;
using
AElementOp
=
PassThrough
;
using
AElementOp
=
PassThrough
;
using
BElementOp
=
PassThrough
Pack2
;
using
BElementOp
=
PassThrough
;
using
CDEElementOp
=
MultiplyAddFastGelu
;
using
CDEElementOp
=
MultiplyAddFastGelu
;
static
constexpr
auto
GemmSpec
=
ck
::
tensor_operation
::
device
::
GemmSpecialization
::
Default
;
static
constexpr
auto
GemmSpec
=
ck
::
tensor_operation
::
device
::
GemmSpecialization
::
Default
;
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment