#pragma once #include "params.h" namespace sm90 { template<typename InputT> void run_flash_splitkv_mla_kernel(DecodingParams ¶ms, cudaStream_t stream); }