Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
fengzch-das
nunchaku
Commits
a43eabbc
"torchvision/csrc/io/decoder/audio_sampler.cpp" did not exist on "32e16805a17401f5ef5ec825c808d645f5c26509"
Commit
a43eabbc
authored
Nov 24, 2025
by
fengzch
Browse files
fix: asm movmatrix.sync.aligned.m8n8.trans.b16 is not supported
parent
0343f43e
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
4 additions
and
3 deletions
+4
-3
src/kernels/zgemm/gemm_utils.cuh
src/kernels/zgemm/gemm_utils.cuh
+4
-3
No files found.
src/kernels/zgemm/gemm_utils.cuh
View file @
a43eabbc
...
...
@@ -199,9 +199,10 @@ __device__ __forceinline__ static void ldmatrix(const void *ptr, uint4 &out) {
/**
 * Warp-collective transpose of an 8x8 matrix of 16-bit elements held in
 * registers: one 32-bit word (two packed b16 values) per lane.
 *
 * Fragment layout (per the PTX `movmatrix` / `ldmatrix` m8n8 description):
 * lane L holds row L/4, columns 2*(L%4) and 2*(L%4)+1, with the lower column
 * in the low 16 bits. After the call every lane holds the same positions of
 * the transposed matrix.
 *
 * @tparam T  Register-sized payload type. Only the first 32 bits of `x` are
 *            read and rewritten, exactly as in the original PTX-only version.
 *            NOTE(review): assumes sizeof(T) == 4 -- confirm against callers.
 * @param  x  This lane's fragment of the source matrix.
 * @return    This lane's fragment of the transposed matrix.
 *
 * All 32 lanes of the (logical) warp must call this function together.
 */
template<typename T>
__device__ __forceinline__ static T movmatrix(T x) {
    uint32_t &bits = *reinterpret_cast<uint32_t *>(&x);

#if defined(__HIP_PLATFORM_AMD__) || defined(__HIP_PLATFORM_HCC__)
    // HIP has no equivalent of `movmatrix.sync.aligned.m8n8.trans.b16`, so the
    // transpose is emulated with two shuffles instead of printing a warning
    // and returning the input untransposed (which silently corrupts results).
    //
    // NOTE(review): a shuffle width of 32 is used so that, on 64-wide
    // wavefronts, each 32-lane half transposes its own matrix. This presumes
    // the surrounding kernels treat 32 lanes as one warp -- confirm.
    const unsigned lane = __lane_id() & 31u;
    const unsigned row  = lane >> 2; // destination row == source column
    const unsigned quad = lane & 3u; // destination columns 2*quad, 2*quad + 1

    // D[row][c] = A[c][row]; A[c][row] lives in lane 4*c + row/2, half row%2.
    const int src_lo = static_cast<int>(8u * quad + (row >> 1)); // c = 2*quad
    const int src_hi = src_lo + 4;                               // c = 2*quad + 1

    const uint32_t word_lo = __shfl(bits, src_lo, 32);
    const uint32_t word_hi = __shfl(bits, src_hi, 32);

    const unsigned shift = (row & 1u) * 16u; // select which b16 half to take
    bits = ((word_lo >> shift) & 0xFFFFu) | (((word_hi >> shift) & 0xFFFFu) << 16);
#else
    asm volatile("movmatrix.sync.aligned.m8n8.trans.b16 %0, %1;" : "=r"(bits) : "r"(bits));
#endif

    return x;
}
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment