splitkv_mla.h 162 Bytes
Newer Older
1
2
3
4
5
6
7
8
9
10
#pragma once

#include "params.h"

namespace sm90 {

// Declaration of the function template run_flash_splitkv_mla_kernel.
// Only the prototype lives in this header; the definition (and any explicit
// instantiations) are located elsewhere.
//
// Template parameter:
//   InputT - type parameter chosen by the caller. It cannot be deduced from
//            the arguments, so it must be spelled explicitly at the call site.
//            NOTE(review): presumably the element type of the kernel inputs
//            (e.g. a half-precision type) - confirm against the definition.
//
// Parameters:
//   params - DecodingParams passed by non-const reference (type declared in
//            "params.h"). Whether the callee modifies it is not visible here.
//   stream - cudaStream_t handle.
//            NOTE(review): presumably the stream the kernel is launched on -
//            confirm against the definition.
//
// NOTE(review): the namespace name suggests an SM90-specific implementation -
// verify the compute-capability requirement where this is defined.
template <class InputT>
void run_flash_splitkv_mla_kernel(DecodingParams& params, cudaStream_t stream);

}  // namespace sm90