// Register the mixed-dtype affine forward entry points on `m`.
// NOTE(review): `m` is presumably the pybind11 module handle declared by the
// enclosing module-definition block, which is outside this view -- confirm.
// Each call passes, in order: the exported name, the address of the C++
// function it is bound to, and the docstring attached to that export.
m.def(
    "forward_affine_mixed_dtypes",
    &layer_norm_affine_mixed_dtypes,
    "LayerNorm forward with mixed dtypes (CUDA) compatible with Megatron's implementation");
m.def(
    "rms_forward_affine_mixed_dtypes",
    &rms_norm_affine_mixed_dtypes,
    "RMSNorm forward with mixed dtypes (CUDA) compatible with Megatron's implementation");