Commit 633356c9 authored by Shucai Xiao
Browse files

Merge branch 'reduce' into opt_log_softmax

parents ca23bc79 30b15ebc
...@@ -80,7 +80,7 @@ __device__ auto block_reduce(index idx, Op op, T init, std::size_t n, F f) ...@@ -80,7 +80,7 @@ __device__ auto block_reduce(index idx, Op op, T init, std::size_t n, F f)
const std::size_t index = 2 * s * idx.local; const std::size_t index = 2 * s * idx.local;
if(index + s < idx.nlocal()) if(index + s < idx.nlocal())
{ {
buffer[index + s] = op(buffer[index], buffer[index + s]); buffer[index] = op(buffer[index], buffer[index + s]);
} }
__syncthreads(); __syncthreads();
} }
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment