Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
MIGraphX
Commits
b1d86d7c
"src/include/gridwise_implicit_gemm_convolution.cuh" did not exist on "059711633041b73ac3ed3c3b287eee8667092f3f"
Commit
b1d86d7c
authored
Jul 02, 2022
by
Paul
Browse files
Merge branch 'dot-add' into bert-opt2
parents
3b8ae098
9cb9bc09
Changes
1
Show whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
10 additions
and
2 deletions
+10
-2
src/targets/gpu/fuse_ops.cpp
src/targets/gpu/fuse_ops.cpp
+10
-2
No files found.
src/targets/gpu/fuse_ops.cpp
View file @
b1d86d7c
...
@@ -50,6 +50,7 @@
...
@@ -50,6 +50,7 @@
#include <migraphx/array.hpp>
#include <migraphx/array.hpp>
#include <migraphx/make_op.hpp>
#include <migraphx/make_op.hpp>
#include <migraphx/op/clip.hpp>
#include <migraphx/op/clip.hpp>
#include <migraphx/op/contiguous.hpp>
#include <cmath>
#include <cmath>
#include <set>
#include <set>
...
@@ -975,9 +976,8 @@ struct find_gemm_pointwise
...
@@ -975,9 +976,8 @@ struct find_gemm_pointwise
{
{
return
precompile_name
(
"pointwise"
)(
return
precompile_name
(
"pointwise"
)(
match
::
nargs
(
3
),
match
::
nargs
(
3
),
match
::
all_of
[
match
::
inputs
()](
match
::
standard_shape
()),
match
::
either_arg
(
0
,
1
)(
match
::
either_arg
(
0
,
1
)(
match
::
any
(
).
bind
(
"c"
),
match
::
any
_of
(
match
::
standard_shape
(),
match
::
is_constant
()
).
bind
(
"c"
),
match
::
name
(
"gpu::gemm"
)(
match
::
nargs
(
3
),
match
::
used_once
()).
bind
(
"gemm"
)));
match
::
name
(
"gpu::gemm"
)(
match
::
nargs
(
3
),
match
::
used_once
()).
bind
(
"gemm"
)));
}
}
...
@@ -1053,6 +1053,14 @@ struct find_gemm_pointwise
...
@@ -1053,6 +1053,14 @@ struct find_gemm_pointwise
gemm
,
ins
->
module_inputs
().
front
(),
ins
->
inputs
().
front
()
==
gemm_ins
?
0
:
1
))
gemm
,
ins
->
module_inputs
().
front
(),
ins
->
inputs
().
front
()
==
gemm_ins
?
0
:
1
))
return
;
return
;
// const-fold input if not standard shape since rocblas can't handle it
if
(
not
c_ins
->
get_shape
().
standard
())
{
auto
c
=
op
::
contiguous
{};
auto
l
=
c
.
compute
(
c
.
compute_shape
({
c_ins
->
get_shape
()}),
{
c_ins
->
eval
()});
c_ins
=
m
.
add_literal
(
l
.
get_shape
(),
l
.
data
());
}
auto
inputs
=
gemm_ins
->
inputs
();
auto
inputs
=
gemm_ins
->
inputs
();
inputs
.
pop_back
();
inputs
.
pop_back
();
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment