Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
composable_kernel_ROCM
Commits
3b290001
Commit
3b290001
authored
Oct 17, 2024
by
rocking
Browse files
Refine variable name
parent
d5efa5e5
Changes
5
Hide whitespace changes
Inline
Side-by-side
Showing
5 changed files
with
21 additions
and
21 deletions
+21
-21
example/ck_tile/02_layernorm2d/instances/layernorm2d_fwd_bf16_instance.cpp
...2_layernorm2d/instances/layernorm2d_fwd_bf16_instance.cpp
+4
-4
example/ck_tile/02_layernorm2d/instances/layernorm2d_fwd_bf16_pad_instance.cpp
...yernorm2d/instances/layernorm2d_fwd_bf16_pad_instance.cpp
+4
-4
example/ck_tile/02_layernorm2d/instances/layernorm2d_fwd_fp16_instance.cpp
...2_layernorm2d/instances/layernorm2d_fwd_fp16_instance.cpp
+4
-4
example/ck_tile/02_layernorm2d/instances/layernorm2d_fwd_fp16_pad_instance.cpp
...yernorm2d/instances/layernorm2d_fwd_fp16_pad_instance.cpp
+4
-4
example/ck_tile/02_layernorm2d/layernorm2d_fwd.hpp
example/ck_tile/02_layernorm2d/layernorm2d_fwd.hpp
+5
-5
No files found.
example/ck_tile/02_layernorm2d/instances/layernorm2d_fwd_bf16_instance.cpp
View file @
3b290001
...
@@ -4,16 +4,16 @@
...
@@ -4,16 +4,16 @@
#include "layernorm2d_fwd_instance_common.hpp"
#include "layernorm2d_fwd_instance_common.hpp"
template
<
ck_tile
::
index_t
NRepeat
,
template
<
ck_tile
::
index_t
k
NRepeat
,
ck_tile
::
index_t
kMThreadPerBlock
,
ck_tile
::
index_t
kMThreadPerBlock
,
ck_tile
::
index_t
kNThreadPerBlock
,
ck_tile
::
index_t
kNThreadPerBlock
,
ck_tile
::
index_t
VectorAccessSize
,
ck_tile
::
index_t
kk
VectorAccessSize
,
bool
kTwoPass
>
bool
kTwoPass
>
using
t
=
layernorm2d_fwd_traits_
<
ck_tile
::
bf16_t
,
using
t
=
layernorm2d_fwd_traits_
<
ck_tile
::
bf16_t
,
NRepeat
,
k
NRepeat
,
kMThreadPerBlock
,
kMThreadPerBlock
,
kNThreadPerBlock
,
kNThreadPerBlock
,
VectorAccessSize
,
kk
VectorAccessSize
,
false
,
false
,
false
,
false
,
kTwoPass
>
;
kTwoPass
>
;
...
...
example/ck_tile/02_layernorm2d/instances/layernorm2d_fwd_bf16_pad_instance.cpp
View file @
3b290001
...
@@ -4,16 +4,16 @@
...
@@ -4,16 +4,16 @@
#include "layernorm2d_fwd_instance_common.hpp"
#include "layernorm2d_fwd_instance_common.hpp"
template
<
ck_tile
::
index_t
NRepeat
,
template
<
ck_tile
::
index_t
k
NRepeat
,
ck_tile
::
index_t
kMThreadPerBlock
,
ck_tile
::
index_t
kMThreadPerBlock
,
ck_tile
::
index_t
kNThreadPerBlock
,
ck_tile
::
index_t
kNThreadPerBlock
,
ck_tile
::
index_t
VectorAccessSize
,
ck_tile
::
index_t
k
VectorAccessSize
,
bool
kTwoPass
>
bool
kTwoPass
>
using
t
=
layernorm2d_fwd_traits_
<
ck_tile
::
bf16_t
,
using
t
=
layernorm2d_fwd_traits_
<
ck_tile
::
bf16_t
,
NRepeat
,
k
NRepeat
,
kMThreadPerBlock
,
kMThreadPerBlock
,
kNThreadPerBlock
,
kNThreadPerBlock
,
VectorAccessSize
,
k
VectorAccessSize
,
true
,
true
,
false
,
false
,
kTwoPass
>
;
kTwoPass
>
;
...
...
example/ck_tile/02_layernorm2d/instances/layernorm2d_fwd_fp16_instance.cpp
View file @
3b290001
...
@@ -4,16 +4,16 @@
...
@@ -4,16 +4,16 @@
#include "layernorm2d_fwd_instance_common.hpp"
#include "layernorm2d_fwd_instance_common.hpp"
template
<
ck_tile
::
index_t
NRepeat
,
template
<
ck_tile
::
index_t
k
NRepeat
,
ck_tile
::
index_t
kMThreadPerBlock
,
ck_tile
::
index_t
kMThreadPerBlock
,
ck_tile
::
index_t
kNThreadPerBlock
,
ck_tile
::
index_t
kNThreadPerBlock
,
ck_tile
::
index_t
VectorAccessSize
,
ck_tile
::
index_t
k
VectorAccessSize
,
bool
kTwoPass
>
bool
kTwoPass
>
using
t
=
layernorm2d_fwd_traits_
<
ck_tile
::
fp16_t
,
using
t
=
layernorm2d_fwd_traits_
<
ck_tile
::
fp16_t
,
NRepeat
,
k
NRepeat
,
kMThreadPerBlock
,
kMThreadPerBlock
,
kNThreadPerBlock
,
kNThreadPerBlock
,
VectorAccessSize
,
k
VectorAccessSize
,
false
,
false
,
false
,
false
,
kTwoPass
>
;
kTwoPass
>
;
...
...
example/ck_tile/02_layernorm2d/instances/layernorm2d_fwd_fp16_pad_instance.cpp
View file @
3b290001
...
@@ -4,16 +4,16 @@
...
@@ -4,16 +4,16 @@
#include "layernorm2d_fwd_instance_common.hpp"
#include "layernorm2d_fwd_instance_common.hpp"
template
<
ck_tile
::
index_t
NRepeat
,
template
<
ck_tile
::
index_t
k
NRepeat
,
ck_tile
::
index_t
kMThreadPerBlock
,
ck_tile
::
index_t
kMThreadPerBlock
,
ck_tile
::
index_t
kNThreadPerBlock
,
ck_tile
::
index_t
kNThreadPerBlock
,
ck_tile
::
index_t
VectorAccessSize
,
ck_tile
::
index_t
k
VectorAccessSize
,
bool
kTwoPass
>
bool
kTwoPass
>
using
t
=
layernorm2d_fwd_traits_
<
ck_tile
::
fp16_t
,
using
t
=
layernorm2d_fwd_traits_
<
ck_tile
::
fp16_t
,
NRepeat
,
k
NRepeat
,
kMThreadPerBlock
,
kMThreadPerBlock
,
kNThreadPerBlock
,
kNThreadPerBlock
,
VectorAccessSize
,
k
VectorAccessSize
,
true
,
true
,
false
,
false
,
kTwoPass
>
;
kTwoPass
>
;
...
...
example/ck_tile/02_layernorm2d/layernorm2d_fwd.hpp
View file @
3b290001
...
@@ -51,10 +51,10 @@ struct layernorm2d_fwd_args
...
@@ -51,10 +51,10 @@ struct layernorm2d_fwd_args
// this is used to pattern-match internal kernel implementation, not to instantiate kernel
// this is used to pattern-match internal kernel implementation, not to instantiate kernel
template
<
typename
DataType_
,
template
<
typename
DataType_
,
ck_tile
::
index_t
NRepeat
,
ck_tile
::
index_t
k
NRepeat
,
ck_tile
::
index_t
kMThreadPerBlock
,
ck_tile
::
index_t
kMThreadPerBlock
,
ck_tile
::
index_t
kNThreadPerBlock
,
ck_tile
::
index_t
kNThreadPerBlock
,
ck_tile
::
index_t
VectorAccessSize
,
ck_tile
::
index_t
k
VectorAccessSize
,
bool
kPadN_
,
bool
kPadN_
,
bool
kSaveMeanInvStd_
,
bool
kSaveMeanInvStd_
,
bool
kTwoPass_
>
bool
kTwoPass_
>
...
@@ -69,11 +69,11 @@ struct layernorm2d_fwd_traits_
...
@@ -69,11 +69,11 @@ struct layernorm2d_fwd_traits_
kMThreadPerBlock
*
kNThreadPerBlock
/
warpSize
;
kMThreadPerBlock
*
kNThreadPerBlock
/
warpSize
;
// kNThreadPerBlock / 16;
// kNThreadPerBlock / 16;
using
thread_tile
=
ck_tile
::
sequence
<
MRepeat
,
NRepeat
,
VectorAccessSize
>
;
using
thread_tile
=
ck_tile
::
sequence
<
MRepeat
,
k
NRepeat
,
k
VectorAccessSize
>
;
using
warp_tile
=
ck_tile
::
sequence
<
MRepeat
*
warpSize
/
kNThreadPerBlock
,
using
warp_tile
=
ck_tile
::
sequence
<
MRepeat
*
warpSize
/
kNThreadPerBlock
,
NRepeat
*
kNThreadPerBlock
*
VectorAccessSize
>
;
k
NRepeat
*
kNThreadPerBlock
*
k
VectorAccessSize
>
;
using
block_tile
=
ck_tile
::
sequence
<
kMWarpPerBlock
*
MRepeat
*
warpSize
/
kNThreadPerBlock
,
using
block_tile
=
ck_tile
::
sequence
<
kMWarpPerBlock
*
MRepeat
*
warpSize
/
kNThreadPerBlock
,
NRepeat
*
kNThreadPerBlock
*
VectorAccessSize
>
;
k
NRepeat
*
kNThreadPerBlock
*
k
VectorAccessSize
>
;
using
Shape
=
ck_tile
::
TileLayernorm2dShape
<
thread_tile
,
warp_tile
,
block_tile
>
;
using
Shape
=
ck_tile
::
TileLayernorm2dShape
<
thread_tile
,
warp_tile
,
block_tile
>
;
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment