// splitkv_mla.h
#pragma once

#include "params.h"

5
namespace sm90::decode::sparse_fp8 {
6

7
8
template<ModelType MODEL_TYPE, int NUM_HEADS>
void run_flash_splitkv_mla_fp8_sparse_kernel(const SparseAttnDecodeParams &params);
9
10

}
11