// splitkv_mla.h
#pragma once

#include "params.h"

namespace sm90 {

// Host-side entry point for the FP8 sparse split-KV MLA path; only the
// declaration lives in this header, the definition is provided elsewhere.
//
// Parameters:
//   params - decoding parameters, passed by non-const reference (the callee
//            is therefore permitted to modify them; whether it actually does
//            is not visible from this header).
//   stream - CUDA stream handle handed to the implementation. Presumably the
//            kernel work is enqueued on this stream -- TODO confirm against
//            the definition.
//
// NOTE(review): the `sm90` namespace suggests this targets compute
// capability 9.0 devices; confirm in the implementation/build configuration.
// NOTE(review): `cudaStream_t` is not declared by any header included here
// directly; this appears to rely on "params.h" pulling in the CUDA runtime
// header -- verify.
void run_flash_splitkv_mla_fp8_sparse_kernel(
    DecodingParams &params,
    cudaStream_t stream
);

}  // namespace sm90