Unverified Commit 513a8502 authored by thatPepe's avatar thatPepe Committed by GitHub
Browse files

Merge pull request #1010 from InfiniTensor/issue/899

issue/899 - fix: fix causal_softmax and rearrange bug 
parents c312f175 e4bce369
......@@ -28,7 +28,7 @@ __device__ void causalSoftmaxKernel(
// 1 | * * * ... * * |
// 2 | * * * ... * * * |
// height: 3 col_id->
-    if (width + blockIdx.x >= threadIdx.x + height) {
+    if (width + blockIdx.x >= col + height) {
if constexpr (std::is_same_v<Tdata, half> || std::is_same_v<Tdata, cuda_bfloat16>) {
/*
* MUSA does not support CUDA's native `hexp` function.
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment