// Copyright (c) 2024, Tri Dao.// Splitting the different head dimensions to different files to speed up compilation.#include "flash_bwd_launch_template.h"template<>voidrun_mha_bwd_<cutlass::half_t,64>(Flash_bwd_params¶ms,cudaStream_tstream){run_mha_bwd_hdim64<cutlass::half_t>(params,stream);}