// Precondition: the KV-cache row stride must equal BYTES_PER_TOKEN.
// As the message states, each page block must be contiguous for this path.
// The comparison has no side effects, so a single check is sufficient.
KU_ASSERT(params.stride_kv_row == BYTES_PER_TOKEN,
          "Each page block in KV cache must be contiguous for head64 sparse fp8 decoding attention in MODEL1");