#include "flash_fwd_mla_kernel.h"

// Explicit instantiation definition of run_mha_fwd_splitkv_mla, so that the
// instantiated code is emitted in this translation unit. The template itself
// is presumably declared/defined in flash_fwd_mla_kernel.h (not visible here).
//
// Parameters, as spelled in the signature:
//   params          - launch parameters, passed by non-const reference.
//   kv_cache_dtype  - string naming the KV-cache data type.
//   stream          - CUDA stream handle forwarded to the launcher.
//   is_q_nope_pe    - boolean flag; its exact meaning is defined by the
//                     template and cannot be determined from this file.
//
// NOTE(review): the template-argument list after the function name
// (run_mha_fwd_splitkv_mla<...>) appears to be missing, probably lost in the
// same text mangling that corrupted "&params" and fused this line with the
// #include. Unless every template parameter is deducible from the function
// parameters, it must be restored from the original source before building.
// TODO confirm.
template void run_mha_fwd_splitkv_mla(Flash_fwd_mla_params &params,
                                      const std::string& kv_cache_dtype,
                                      cudaStream_t stream,
                                      bool is_q_nope_pe = false);