Commit e29a9111 authored by Qianfeng Zhang
Browse files

Use hipMemcpyAsync() to replace hipMemcpy() in grouped fwd device operator

parent 299ac0a3
...@@ -912,10 +912,11 @@ struct DeviceGroupedMultiheadAttentionForward_Xdl_CShuffle_V2 ...@@ -912,10 +912,11 @@ struct DeviceGroupedMultiheadAttentionForward_Xdl_CShuffle_V2
some_has_main_k_block_loop |= y; some_has_main_k_block_loop |= y;
} }
hipGetErrorString(hipMemcpy(arg.p_workspace_, HIP_CHECK_ERROR(hipMemcpyAsync(arg.p_workspace_,
arg.group_kernel_args_.data(), arg.group_kernel_args_.data(),
arg.group_kernel_args_.size() * sizeof(GroupKernelArg), arg.group_kernel_args_.size() * sizeof(GroupKernelArg),
hipMemcpyHostToDevice)); hipMemcpyHostToDevice,
stream_config.stream_id_));
float ave_time = 0; float ave_time = 0;
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment