// flash_fwd_mla_bf16_sm90.cu
// Last committed by Jiashi Li.
#include "flash_fwd_mla_kernel.h"

// Explicit instantiation definition of run_mha_fwd_splitkv_mla for
// element type cutlass::bfloat16_t with the integer template argument 576.
// Instantiating here forces this translation unit to emit the code for that
// one specialization of the template declared via flash_fwd_mla_kernel.h.
// NOTE(review): 576 is presumably the head dimension, and the "sm90" in the
// file name suggests a Hopper-only build target — confirm against the header.
template void
run_mha_fwd_splitkv_mla<cutlass::bfloat16_t, 576>(
    Flash_fwd_mla_params &,
    cudaStream_t);