Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
OpenDAS
TransformerEngine
Commits
cbb14a5f
Commit
cbb14a5f
authored
Dec 03, 2025
by
wenjh
Browse files
Fix build error
Signed-off-by:
wenjh
<
wenjh@sugon.com
>
parent
b3dcfc28
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
6 additions
and
0 deletions
+6
-0
transformer_engine/common/swizzle/swizzle_block_scaling.cu
transformer_engine/common/swizzle/swizzle_block_scaling.cu
+6
-0
No files found.
transformer_engine/common/swizzle/swizzle_block_scaling.cu
View file @
cbb14a5f
...
@@ -14,6 +14,7 @@
...
@@ -14,6 +14,7 @@
#include "../util/logging.h"
#include "../util/logging.h"
#include "transformer_engine/transformer_engine.h"
#include "transformer_engine/transformer_engine.h"
#ifdef __HIP_PLATFORM_AMD__
namespace
transformer_engine
{
namespace
transformer_engine
{
namespace
{
namespace
{
constexpr
uint32_t
WARP_SIZE
=
32
;
constexpr
uint32_t
WARP_SIZE
=
32
;
...
@@ -311,11 +312,16 @@ void swizzle_block_scaling_to_mxfp8_scaling_factors(const Tensor* input, Tensor*
...
@@ -311,11 +312,16 @@ void swizzle_block_scaling_to_mxfp8_scaling_factors(const Tensor* input, Tensor*
}
}
}
// namespace transformer_engine
}
// namespace transformer_engine
#endif
void
nvte_swizzle_block_scaling_to_mxfp8_scaling_factors
(
const
NVTETensor
input
,
NVTETensor
output
,
void
nvte_swizzle_block_scaling_to_mxfp8_scaling_factors
(
const
NVTETensor
input
,
NVTETensor
output
,
cudaStream_t
stream
)
{
cudaStream_t
stream
)
{
NVTE_API_CALL
(
nvte_swizzle_block_scaling_to_mxfp8_scaling_factors
);
NVTE_API_CALL
(
nvte_swizzle_block_scaling_to_mxfp8_scaling_factors
);
#ifdef __HIP_PLATFORM_AMD__
NVTE_CHECK
(
false
,
"nvte_swizzle_block_scaling_to_mxfp8_scaling_factors is not supported on rocm"
);
#else
using
namespace
transformer_engine
;
using
namespace
transformer_engine
;
swizzle_block_scaling_to_mxfp8_scaling_factors
(
convertNVTETensorCheck
(
input
),
swizzle_block_scaling_to_mxfp8_scaling_factors
(
convertNVTETensorCheck
(
input
),
convertNVTETensorCheck
(
output
),
stream
);
convertNVTETensorCheck
(
output
),
stream
);
#endif
}
}
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment