kernel.h 189 Bytes
Newer Older
1
2
3
4
5
6
7
8
9
10
11
#pragma once

#include "params.h"

namespace sm100::decode::head64 {

template<ModelType MODEL_TYPE>
void run_flash_splitkv_mla_fp8_sparse_kernel(const SparseAttnDecodeParams &params);

}