Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
MIGraphX
Commits
c34561b3
Commit
c34561b3
authored
Mar 17, 2023
by
Alan Turner
Browse files
Use new interface
parent
3ec069ec
Changes
2
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
8 additions
and
7 deletions
+8
-7
src/targets/gpu/jit/ck_gemm.cpp
src/targets/gpu/jit/ck_gemm.cpp
+6
-5
src/targets/gpu/kernels/include/migraphx/kernels/ck_gemm.hpp
src/targets/gpu/kernels/include/migraphx/kernels/ck_gemm.hpp
+2
-2
No files found.
src/targets/gpu/jit/ck_gemm.cpp
View file @
c34561b3
...
...
@@ -328,7 +328,6 @@ struct ck_gemm_compiler : compiler<ck_gemm_compiler>
static_cast
<
ck
::
index_t
>
(
n
),
static_cast
<
ck
::
index_t
>
(
k
),
static_cast
<
ck
::
index_t
>
(
numDTensors
),
static_cast
<
ck
::
index_t
>
(
tuning_value
),
transA
,
transB
,
transCDE
,
...
...
@@ -339,9 +338,11 @@ struct ck_gemm_compiler : compiler<ck_gemm_compiler>
ck_passthrough
,
cde_op
,
cde_layout
};
const
auto
solution
=
problem
.
GetSolution
();
auto
blocks_per_batch
=
problem
.
GetGridSize
();
auto
block_size
=
problem
.
GetBlockSize
();
const
auto
solutions
=
problem
.
GetSolutions
();
const
auto
solution
=
solutions
.
at
(
tuning_value
);
const
auto
template_str
=
solution
.
GetStr
();
const
auto
blocks_per_batch
=
solution
.
GetGridSize
();
const
auto
block_size
=
solution
.
GetBlockSize
();
hip_compile_options
options
;
auto
grid_size
=
can_fold_batch
?
blocks_per_batch
:
batch_count
*
blocks_per_batch
;
...
...
@@ -363,7 +364,7 @@ struct ck_gemm_compiler : compiler<ck_gemm_compiler>
options
.
params
+=
" -DMIGRAPHX_CK_CHECK=1"
;
auto
src
=
interpolate_string
(
ck_gemm_kernel
,
{{
"solution"
,
solution
},
{{
"solution"
,
template_str
},
{
"params"
,
enum_params
(
inputs
.
size
(),
"void * private_p"
)},
{
"args"
,
enum_params
(
inputs
.
size
(),
"private_p"
)},
{
"blocks_per_batch"
,
to_string
(
blocks_per_batch
)},
...
...
src/targets/gpu/kernels/include/migraphx/kernels/ck_gemm.hpp
View file @
c34561b3
...
...
@@ -49,7 +49,7 @@ template <class G, class E, class A, class B, class... Ds>
__device__
void
ck_gemm_matrix
(
E
e
,
A
a
,
B
b
,
Ds
...
ds
)
{
constexpr
auto
desc
=
G
::
make_descriptor
(
to_ck_tensor
<
A
>
(),
to_ck_tensor
<
B
>
(),
to_ck_tensor
<
ck_transposeb
<
B
>
>
(),
ck
::
make_tuple
(
to_ck_tensor
<
Ds
>
()...),
to_ck_tensor
<
E
>
());
G
::
Run
(
desc
,
...
...
@@ -67,4 +67,4 @@ __device__ void ck_gemm(Ts... xs)
}
}
// namespace migraphx
#endif
\ No newline at end of file
#endif
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment