// Copyright (c) OpenMMLab. All rights reserved.#include <cuda_runtime.h>namespacefastertransformer{template<typenameT>voidinvokeFusedAddResidualRMSNorm(T*residual,T*inout,constT*scale,floateps,intbatch_size,intn_dims,cudaStream_tstream);}// namespace fastertransformer