Commit c1051d51 authored by Ted Themistokleous
Browse files

Fix error in nonzero

parent 7433c2d3
...@@ -46,7 +46,7 @@ argument nonzero(hipStream_t stream, const argument& result, const argument& arg ...@@ -46,7 +46,7 @@ argument nonzero(hipStream_t stream, const argument& result, const argument& arg
auto* ptr = result.cast<int64_t>(); auto* ptr = result.cast<int64_t>();
gs_launch(stream, block_size, block_size)([=](auto, auto idx) __device__ { gs_launch(stream, block_size, block_size)([=](auto, auto idx) __device__ {
// fill all output to 0 first // fill all output to 0 first
idx.local_stride(out_elem_num, [&](auto j) { ptr[j] = 0; }); idx.local_stride(out_elem_num-1, [&](auto j) { ptr[j] = 0; });
block_scan<block_size>( block_scan<block_size>(
idx, idx,
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment