Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
composable_kernel_ROCM
Commits
92d5ca70
"...composable_kernel.git" did not exist on "ad00dd1ff4da70dbb7beb0c7c37026e468224cb2"
Commit
92d5ca70
authored
Dec 06, 2024
by
Jing Zhang
Browse files
fix
parent
041ac4c9
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
3 additions
and
3 deletions
+3
-3
example/01_gemm/gemm_xdl_fp16_pk_i4_v3.cpp
example/01_gemm/gemm_xdl_fp16_pk_i4_v3.cpp
+3
-3
No files found.
example/01_gemm/gemm_xdl_fp16_pk_i4_v3.cpp
View file @
92d5ca70
...
@@ -21,7 +21,7 @@ using CElementOp = PassThrough;
...
@@ -21,7 +21,7 @@ using CElementOp = PassThrough;
static
constexpr
auto
GemmDefault
=
ck
::
tensor_operation
::
device
::
GemmSpecialization
::
Default
;
static
constexpr
auto
GemmDefault
=
ck
::
tensor_operation
::
device
::
GemmSpecialization
::
Default
;
static constexpr bool PermuteB = false;
static constexpr bool PermuteB = true;
static
constexpr
ck
::
index_t
KPerBlock
=
128
;
static
constexpr
ck
::
index_t
KPerBlock
=
128
;
...
@@ -179,7 +179,7 @@ bool run_gemm(const ProblemType& problem_size, const ExecutionConfig& config)
...
@@ -179,7 +179,7 @@ bool run_gemm(const ProblemType& problem_size, const ExecutionConfig& config)
}
}
}
}
#if 0
#if 1
// vector pk_i4x4 permute
// vector pk_i4x4 permute
for
(
int
i
=
0
;
i
<
N
;
i
++
)
for
(
int
i
=
0
;
i
<
N
;
i
++
)
{
{
...
@@ -189,7 +189,7 @@ bool run_gemm(const ProblemType& problem_size, const ExecutionConfig& config)
...
@@ -189,7 +189,7 @@ bool run_gemm(const ProblemType& problem_size, const ExecutionConfig& config)
for
(
int
k
=
0
;
k
<
4
;
k
++
)
for
(
int
k
=
0
;
k
<
4
;
k
++
)
{
{
int i4x2 = b_k_n_permute(j + k * 2, i);
int i4x2 = b_k_n_permute(j + k * 2, i).data;
input
[
k
*
2
+
0
]
=
(
i4x2
>>
4
)
&
0xf
;
input
[
k
*
2
+
0
]
=
(
i4x2
>>
4
)
&
0xf
;
input
[
k
*
2
+
1
]
=
(
i4x2
>>
0
)
&
0xf
;
input
[
k
*
2
+
1
]
=
(
i4x2
>>
0
)
&
0xf
;
}
}
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment