Commit 7e4baf2a authored by Shucai Xiao
Browse files

Fix the GEMM bug related to the AlexNet test.

parent dc945bf8
#include <migraphx/gpu/gemm.hpp>
#include <migraphx/gpu/context.hpp>
#include <migraphx/gpu/device/add.hpp>
namespace migraphx {
inline namespace MIGRAPHX_INLINE_NS {
......@@ -186,10 +187,11 @@ argument miopen_gemm::compute(context& ctx,
{
output_shape.visit_type([&](auto as) {
auto to_pointer = [&](auto&& arg) { return to_rocblas_type(as.from(arg.data())); };
hipMemcpy(to_pointer(args[3]),
hipMemcpyAsync(to_pointer(args[3]),
to_pointer(args[2]),
output_shape.bytes(),
hipMemcpyDeviceToDevice);
hipMemcpyDeviceToDevice,
ctx.get_stream().get());
});
output_shape.visit_type([&](auto as) {
......@@ -233,6 +235,7 @@ argument miopen_gemm::compute(context& ctx,
m * n,
num_matrices);
});
//device::add(ctx.get_stream().get(), args[3], args[2], args[3]);
return args[3];
}
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment