Commit 02a33875 (unverified), authored by schetlur, committed by GitHub
Browse files

Merge pull request #883 from NVIDIA/schetlur/stream_bug_fix

Update softmax.h
parents 058addbe 060bd5cd
......@@ -465,7 +465,7 @@ bool dispatch_additive_masked_softmax(output_t *dst, const input_t *src, const i
dim3 threads(warp_size, warps_per_block, 1);
// launch
-kernel<<<blocks, threads>>>(dst, src, pad_mask, batch_count, softmax_elements_stride, softmax_elements, pad_batch_stride);
+kernel<<<blocks, threads, 0, at::cuda::getCurrentCUDAStream()>>>(dst, src, pad_mask, batch_count, softmax_elements_stride, softmax_elements, pad_batch_stride);
return true;
}
return false;
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment