Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
composable_kernel_ROCM
Commits
69ad91b2
Commit
69ad91b2
authored
Feb 16, 2024
by
illsilin
Browse files
fix the gfx12 assembly syntax
parent
bfdda4fe
Changes
2
Show whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
8 additions
and
9 deletions
+8
-9
include/ck/tensor_operation/gpu/block/blockwise_gemm_xdlops.hpp
...e/ck/tensor_operation/gpu/block/blockwise_gemm_xdlops.hpp
+2
-2
include/ck/utility/synchronization.hpp
include/ck/utility/synchronization.hpp
+6
-7
No files found.
include/ck/tensor_operation/gpu/block/blockwise_gemm_xdlops.hpp
View file @
69ad91b2
...
...
@@ -481,8 +481,8 @@ struct BlockwiseGemmXdlopsInterwave_k0mk1_k0nk1_m0n0m1n1m2m3m4n2_v1
         {
 #ifdef __gfx12__
             asm volatile("\
-            s_barrier_signal \n \
-            s_barrier_wait \
+            s_barrier_signal -1 \n \
+            s_barrier_wait -1 \
             " ::);
 #else
             asm volatile("s_barrier" ::);
...
...
include/ck/utility/synchronization.hpp
View file @
69ad91b2
...
...
@@ -12,9 +12,9 @@ __device__ void block_sync_lds()
 #if CK_EXPERIMENTAL_BLOCK_SYNC_LDS_WITHOUT_SYNC_VMEM
 #ifdef __gfx12__
     asm volatile("\
-    s_wait_idle lgkmcnt(0) \n \
-    s_barrier_signal \n \
-    s_barrier_wait \
+    s_wait_idle \n \
+    s_barrier_signal -1 \n \
+    s_barrier_wait -1 \
     " ::);
 #else
     asm volatile("\
...
...
@@ -31,10 +31,9 @@ __device__ void block_sync_lds_direct_load()
 {
 #ifdef __gfx12__
     asm volatile("\
-    s_wait_idle vmcnt(0) \n \
-    s_wait_idle lgkmcnt(0) \n \
-    s_barrier_signal \n \
-    s_barrier_wait \
+    s_wait_idle \n \
+    s_barrier_signal -1 \n \
+    s_barrier_wait -1 \
     " ::);
 #else
     asm volatile("\
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment