Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
OpenDAS
tilelang
Commits
3a6a31c5
Commit
3a6a31c5
authored
Nov 26, 2025
by
guchaoyang
Browse files
[Bugfix] Pass pre commit check
parent
bbbf4207
Changes
2
Show whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
6 additions
and
7 deletions
+6
-7
src/op/gemm.cc
src/op/gemm.cc
+4
-4
tilelang/contrib/rocm.py
tilelang/contrib/rocm.py
+2
-3
No files found.
src/op/gemm.cc
View file @
3a6a31c5
...
@@ -865,12 +865,12 @@ LayoutMap GemmNode::InferLayout(const LayoutInferArgs &T,
...
@@ -865,12 +865,12 @@ LayoutMap GemmNode::InferLayout(const LayoutInferArgs &T,
<<
"CDNA gemm (FMMA) only supports C in local.fragment scope, got "
<<
"CDNA gemm (FMMA) only supports C in local.fragment scope, got "
<<
c_
.
scope
();
<<
c_
.
scope
();
if
(
TargetIsDCU
(
T
.
target
))
{
if
(
TargetIsDCU
(
T
.
target
))
{
auto
fragment
=
auto
fragment
=
makeGemmFragmentCDCU
(
m_
,
n_
,
m_
/
warp_m
,
n_
/
warp_n
,
makeGemmFragmentCDCU
(
m_
,
n_
,
m_
/
warp_m
,
n_
/
warp_n
,
c_
->
dtype
.
bits
());
c_
->
dtype
.
bits
());
results
.
Set
(
c_
,
fragment
->
BindThreadRange
(
thread_range
));
results
.
Set
(
c_
,
fragment
->
BindThreadRange
(
thread_range
));
}
else
{
}
else
{
auto
fragment
=
auto
fragment
=
makeGemmFragmentCCDNA
(
m_
,
n_
,
m_
/
warp_m
,
n_
/
warp_n
,
makeGemmFragmentCCDNA
(
m_
,
n_
,
m_
/
warp_m
,
n_
/
warp_n
,
c_
->
dtype
.
bits
());
c_
->
dtype
.
bits
());
results
.
Set
(
c_
,
fragment
->
BindThreadRange
(
thread_range
));
results
.
Set
(
c_
,
fragment
->
BindThreadRange
(
thread_range
));
}
}
if
(
a_
.
scope
()
==
"shared"
||
a_
.
scope
()
==
"shared.dyn"
)
{
if
(
a_
.
scope
()
==
"shared"
||
a_
.
scope
()
==
"shared.dyn"
)
{
...
...
tilelang/contrib/rocm.py
View file @
3a6a31c5
...
@@ -226,11 +226,10 @@ def have_matrixcore(compute_version=None):
...
@@ -226,11 +226,10 @@ def have_matrixcore(compute_version=None):
return
False
return
False
@
tvm_ffi
.
register_global_func
(
"tvm_callback_rocm_get_arch"
,
override
=
True
)
@
tvm_ffi
.
register_global_func
(
"tvm_callback_rocm_get_arch"
,
override
=
True
)
def
get_rocm_arch
(
rocm_path
=
"/opt/rocm"
):
def
get_rocm_arch
(
rocm_path
=
"/opt/rocm"
):
# @tvm.ffi.register_func("tvm_callback_rocm_get_arch", override=True)
# @tvm.ffi.register_func("tvm_callback_rocm_get_arch", override=True)
# def get_rocm_arch(rocm_path="/opt/dtk"):
# def get_rocm_arch(rocm_path="/opt/dtk"):
"""Utility function to get the AMD GPU architecture
"""Utility function to get the AMD GPU architecture
Parameters
Parameters
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment