Fix comments.

8f455e57 · Andriy Roshchenko · 94b8c629 · 8f455e57
Commit 8f455e57 authored Jan 31, 2025 by Andriy Roshchenko
Hide whitespace changes
Inline Side-by-side

Showing with 6 additions and 8 deletions

include/ck/utility/amd_xdlops.hpp +6 -8

No files found.
--- a/include/ck/utility/amd_xdlops.hpp
+++ b/include/ck/utility/amd_xdlops.hpp
@@ -482,10 +482,9 @@ struct intrin_mfma_f32_32x32x64f8f6f4;
 /// @brief Performs a matrix fused multiply-accumulate operation on 32x32x64 submatrices for f8, f6,
 /// and f4 data types.
 ///
-/// @note Calls scaled version of the instruction as the original instruction is not supported on
+/// @note Calls scaled version of the instruction as the original instruction is not supported in
-/// the backend. As per Matthew Arsenault: "Use the scaled versions. It's not a workaround, that is
+/// the backend. That is the intended use. There is a backend optimization to select the unscaled
-/// the intended use. There is a backend optimization to select to the unscaled if you use 0
+/// operation if the scale is 0.
-/// scales."
 template <>
 struct intrin_mfma_f32_32x32x64f8f6f4<32, 32>
 {
@@ -590,10 +589,9 @@ struct intrin_mfma_f32_16x16x128f8f6f4;
 /// @brief Performs a matrix fused multiply-accumulate operation on 16x16x128 submatrices for f8f6f4
 /// data types.
 ///
-/// @note Calls scaled version of the instruction as the original instruction is not supported on
+/// @note Calls scaled version of the instruction as the original instruction is not supported in
-/// the backend. As per Matthew Arsenault: "Use the scaled versions. It's not a workaround, that is
+/// the backend. That is the intended use. There is a backend optimization to select the unscaled
-/// the intended use. There is a backend optimization to select to the unscaled if you use 0
+/// operation if the scale is 0.
-/// scales."
 template <>
 struct intrin_mfma_f32_16x16x128f8f6f4<16, 16>
 {