// splitkv_mla.h
#pragma once

#include "params.h"

// Declaration of the host-side entry point `run_flash_splitkv_mla_kernel`.
//
// Only the declaration lives in this header; the definition (and any explicit
// instantiations for concrete `InputT` types) must be provided elsewhere and
// linked in.
//
// Template parameters:
//   InputT - type the implementation is specialized on.
//            NOTE(review): presumably the element type of the input tensors
//            (e.g. a 16-bit float type) - confirm against the definition.
//
// Parameters:
//   params - taken by non-const reference, so the callee is allowed to modify
//            it. NOTE(review): `Flash_fwd_mla_params` is presumably declared
//            in "params.h" - confirm.
//   stream - a `cudaStream_t` handed to the implementation.
//            NOTE(review): judging by the name, the function presumably
//            launches the split-KV MLA forward kernel on this stream - verify
//            against the definition, including whether it returns before the
//            work has completed.
//
// Returns: nothing (`void`); no status is reported through the return value.
//
// NOTE(review): this header uses `cudaStream_t` without including a CUDA
// runtime header itself; it appears to rely on "params.h" (or the including
// file) to provide it - confirm.
template<typename InputT>
void run_flash_splitkv_mla_kernel(Flash_fwd_mla_params &params, cudaStream_t stream);