Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
composable_kernel_ROCM
Commits
c6a3bd9f
Commit
c6a3bd9f
authored
Jan 15, 2025
by
ozturkosu
Browse files
Comment other instance in Profiler CMAKE
parent
bffb335b
Changes
2
Expand all
Show whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
168 additions
and
169 deletions
+168
-169
include/ck/tensor_operation/gpu/grid/gridwise_gemm_xdl_cshuffle_streamk_v3.hpp
...ration/gpu/grid/gridwise_gemm_xdl_cshuffle_streamk_v3.hpp
+11
-10
profiler/src/CMakeLists.txt
profiler/src/CMakeLists.txt
+157
-159
No files found.
include/ck/tensor_operation/gpu/grid/gridwise_gemm_xdl_cshuffle_streamk_v3.hpp
View file @
c6a3bd9f
...
...
@@ -946,7 +946,7 @@ struct GridwiseGemm_xdl_cshuffle_streamk_v3
if
constexpr
(
!
(
GemmSpec
==
tensor_operation
::
device
::
GemmSpecialization
::
MPadding
||
GemmSpec
==
tensor_operation
::
device
::
GemmSpecialization
::
MNPadding
||
GemmSpec
==
tensor_operation
::
device
::
GemmSpecialization
::
MKPadding
||
GemmSpec
==
tensor_operation
::
device
::
GemmSpecialization
::
MNKPadding
)
)
&&
GemmSpec
==
tensor_operation
::
device
::
GemmSpecialization
::
MNKPadding
)
&&
!
(
is_same
<
tensor_layout
::
gemm
::
RowMajor
,
ALayout
>::
value
))
{
if
(
!
(
karg
.
M
%
MPerBlock
==
0
))
...
...
@@ -964,7 +964,7 @@ struct GridwiseGemm_xdl_cshuffle_streamk_v3
if
constexpr
(
!
(
GemmSpec
==
tensor_operation
::
device
::
GemmSpecialization
::
NPadding
||
GemmSpec
==
tensor_operation
::
device
::
GemmSpecialization
::
MNPadding
||
GemmSpec
==
tensor_operation
::
device
::
GemmSpecialization
::
NKPadding
||
GemmSpec
==
tensor_operation
::
device
::
GemmSpecialization
::
MNKPadding
)
)
&&
GemmSpec
==
tensor_operation
::
device
::
GemmSpecialization
::
MNKPadding
)
&&
(
is_same
<
tensor_layout
::
gemm
::
RowMajor
,
BLayout
>::
value
))
{
if
(
!
(
karg
.
N
%
NPerBlock
==
0
))
...
...
@@ -986,6 +986,7 @@ struct GridwiseGemm_xdl_cshuffle_streamk_v3
{
auto
K_t
=
KPerBlock
;
// auto K_t = karg.KBatch * KPerBlock;
if
(
!
(
karg
.
K
%
K_t
==
0
))
{
if
(
ck
::
EnvIsEnabled
(
CK_ENV
(
CK_LOGGING
)))
...
...
@@ -1000,17 +1001,17 @@ struct GridwiseGemm_xdl_cshuffle_streamk_v3
else
{
// if(karg.K <= 0)
// {
// return false;
// }
constexpr
auto
KReadVec
=
math
::
lcm
(
AK1Number
,
BK1Number
);
auto
K_t
=
karg
.
KBatch
*
KReadVec
;
auto
KReadPadSplited
=
math
::
integer_divide_ceil
(
karg
.
K
,
K_t
)
*
KReadVec
;
if
((
KReadPadSplited
*
(
karg
.
KBatch
-
1
))
>=
karg
.
K
)
if
(
karg
.
K
<=
0
)
{
return
false
;
}
// constexpr auto KReadVec = math::lcm(AK1Number, BK1Number);
// auto K_t = karg.KBatch * KReadVec;
// auto KReadPadSplited = math::integer_divide_ceil(karg.K, K_t) * KReadVec;
// if((KReadPadSplited * (karg.KBatch - 1)) >= karg.K)
// {
// return false;
// }
}
if
constexpr
(
is_same
<
tensor_layout
::
gemm
::
RowMajor
,
ALayout
>::
value
)
...
...
profiler/src/CMakeLists.txt
View file @
c6a3bd9f
This diff is collapsed.
Click to expand it.
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment