"vscode:/vscode.git/clone" did not exist on "2f0e1c92712416eae04c19a923a219624c86091b"
Unverified Commit 58a80570 authored by Chao Liu's avatar Chao Liu Committed by GitHub
Browse files

default iterator hack for blockwise copy (#47)

parent 1c1b56fe
......@@ -89,6 +89,16 @@ struct BlockwiseDynamicTensorSliceTransfer_v4
}
}
// Block-level read step: forwards to threadwise_transfer_.RunRead(src_desc, src_buf)
// for every thread that is allowed to take part in the copy.
//
// A thread takes part when either
//   * BlockSize equals thread_cluster_desc_.GetElementSize(), or
//   * its get_thread_local_1d_id() is smaller than that element size.
// Any other thread returns without touching src_buf.
//
// src_desc : descriptor passed through unchanged to the threadwise transfer
// src_buf  : source buffer passed through unchanged to the threadwise transfer
template <typename SrcBuffer>
__device__ void RunRead(const SrcDesc& src_desc, const SrcBuffer& src_buf)
{
    // Guard clause: skip threads outside the cluster, but only when the cluster
    // size differs from BlockSize (same short-circuit order as the enabling test).
    if(BlockSize != thread_cluster_desc_.GetElementSize() and
       get_thread_local_1d_id() >= thread_cluster_desc_.GetElementSize())
    {
        return;
    }

    threadwise_transfer_.RunRead(src_desc, src_buf);
}
template <typename DstBuffer>
__device__ void RunWrite(const DstDesc& dst_desc, DstBuffer& dst_buf)
{
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment