Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
OpenDAS
TransformerEngine
Commits
0fce42f7
Commit
0fce42f7
authored
Jan 12, 2026
by
wenjh
Browse files
Fix building on nmz
Signed-off-by:
wenjh
<
wenjh@sugon.com
>
parent
13123839
Changes
9
Hide whitespace changes
Inline
Side-by-side
Showing
9 changed files
with
27 additions
and
1 deletion
+27
-1
tests/cpp/operator/test_cast_float8blockwise.cu
tests/cpp/operator/test_cast_float8blockwise.cu
+3
-0
tests/cpp/operator/test_cast_mxfp8.cu
tests/cpp/operator/test_cast_mxfp8.cu
+3
-0
tests/cpp/operator/test_cast_mxfp8_gated_swiglu.cu
tests/cpp/operator/test_cast_mxfp8_gated_swiglu.cu
+3
-0
tests/cpp/operator/test_dequantize_mxfp8.cu
tests/cpp/operator/test_dequantize_mxfp8.cu
+3
-1
tests/cpp/test_common.h
tests/cpp/test_common.h
+3
-0
transformer_engine/common/multi_tensor/adam.cu
transformer_engine/common/multi_tensor/adam.cu
+3
-0
transformer_engine/common/multi_tensor/compute_scale.cu
transformer_engine/common/multi_tensor/compute_scale.cu
+3
-0
transformer_engine/common/multi_tensor/scale.cu
transformer_engine/common/multi_tensor/scale.cu
+3
-0
transformer_engine/common/multi_tensor/sgd.cu
transformer_engine/common/multi_tensor/sgd.cu
+3
-0
No files found.
tests/cpp/operator/test_cast_float8blockwise.cu
View file @
0fce42f7
...
@@ -4,6 +4,9 @@
...
@@ -4,6 +4,9 @@
* See LICENSE for license information.
* See LICENSE for license information.
************************************************************************/
************************************************************************/
#ifdef __HIP_PLATFORM_AMD__
#include <hip/hip_runtime.h>
#endif
#include <cuda_bf16.h>
#include <cuda_bf16.h>
#include <cuda_fp8.h>
#include <cuda_fp8.h>
#include <cuda_runtime.h>
#include <cuda_runtime.h>
...
...
tests/cpp/operator/test_cast_mxfp8.cu
View file @
0fce42f7
...
@@ -4,6 +4,9 @@
...
@@ -4,6 +4,9 @@
* See LICENSE for license information.
* See LICENSE for license information.
************************************************************************/
************************************************************************/
#ifdef __HIP_PLATFORM_AMD__
#include <hip/hip_runtime.h>
#endif
#include <cuda_bf16.h>
#include <cuda_bf16.h>
#include <cuda_fp8.h>
#include <cuda_fp8.h>
#include <cuda_runtime.h>
#include <cuda_runtime.h>
...
...
tests/cpp/operator/test_cast_mxfp8_gated_swiglu.cu
View file @
0fce42f7
...
@@ -4,6 +4,9 @@
...
@@ -4,6 +4,9 @@
* See LICENSE for license information.
* See LICENSE for license information.
************************************************************************/
************************************************************************/
#ifdef __HIP_PLATFORM_AMD__
#include <hip/hip_runtime.h>
#endif
#include <cuda_bf16.h>
#include <cuda_bf16.h>
#include <cuda_fp8.h>
#include <cuda_fp8.h>
#include <cuda_runtime.h>
#include <cuda_runtime.h>
...
...
tests/cpp/operator/test_dequantize_mxfp8.cu
View file @
0fce42f7
...
@@ -10,7 +10,9 @@
...
@@ -10,7 +10,9 @@
#include <memory>
#include <memory>
#include <random>
#include <random>
#include <limits>
#include <limits>
#ifdef __HIP_PLATFORM_AMD__
#include <hip/hip_runtime.h>
#endif
#include <cuda_bf16.h>
#include <cuda_bf16.h>
#include <cuda_fp8.h>
#include <cuda_fp8.h>
#include <cuda_runtime.h>
#include <cuda_runtime.h>
...
...
tests/cpp/test_common.h
View file @
0fce42f7
...
@@ -15,6 +15,9 @@
...
@@ -15,6 +15,9 @@
#endif
#endif
#define FP4_TYPE_SUPPORTED (CUDA_VERSION >= 12080)
#define FP4_TYPE_SUPPORTED (CUDA_VERSION >= 12080)
#ifdef __HIP_PLATFORM_AMD__
#include <hip/hip_runtime.h>
#endif
#include <cuda_runtime_api.h>
#include <cuda_runtime_api.h>
#include <cuda_bf16.h>
#include <cuda_bf16.h>
#include <cuda_fp16.h>
#include <cuda_fp16.h>
...
...
transformer_engine/common/multi_tensor/adam.cu
View file @
0fce42f7
...
@@ -5,6 +5,9 @@
...
@@ -5,6 +5,9 @@
************************************************************************/
************************************************************************/
#include <assert.h>
#include <assert.h>
#ifdef __HIP_PLATFORM_AMD__
#include <hip/hip_runtime.h>
#endif
#include <cuda_fp8.h>
#include <cuda_fp8.h>
#include <transformer_engine/multi_tensor.h>
#include <transformer_engine/multi_tensor.h>
#include <transformer_engine/transformer_engine.h>
#include <transformer_engine/transformer_engine.h>
...
...
transformer_engine/common/multi_tensor/compute_scale.cu
View file @
0fce42f7
...
@@ -7,6 +7,9 @@
...
@@ -7,6 +7,9 @@
#include <limits>
#include <limits>
// Stringstream is a big hammer, but I want to rely on operator<< for dtype.
// Stringstream is a big hammer, but I want to rely on operator<< for dtype.
#include <assert.h>
#include <assert.h>
#ifdef __HIP_PLATFORM_AMD__
#include <hip/hip_runtime.h>
#endif
#include <cuda_fp8.h>
#include <cuda_fp8.h>
#include <transformer_engine/multi_tensor.h>
#include <transformer_engine/multi_tensor.h>
#include <transformer_engine/transformer_engine.h>
#include <transformer_engine/transformer_engine.h>
...
...
transformer_engine/common/multi_tensor/scale.cu
View file @
0fce42f7
...
@@ -5,6 +5,9 @@
...
@@ -5,6 +5,9 @@
************************************************************************/
************************************************************************/
#include <assert.h>
#include <assert.h>
#ifdef __HIP_PLATFORM_AMD__
#include <hip/hip_runtime.h>
#endif
#include <cuda_fp8.h>
#include <cuda_fp8.h>
// Stringstream is a big hammer, but I want to rely on operator<< for dtype.
// Stringstream is a big hammer, but I want to rely on operator<< for dtype.
#include <transformer_engine/multi_tensor.h>
#include <transformer_engine/multi_tensor.h>
...
...
transformer_engine/common/multi_tensor/sgd.cu
View file @
0fce42f7
...
@@ -5,6 +5,9 @@
...
@@ -5,6 +5,9 @@
************************************************************************/
************************************************************************/
#include <assert.h>
#include <assert.h>
#ifdef __HIP_PLATFORM_AMD__
#include <hip/hip_runtime.h>
#endif
#include <cuda_fp8.h>
#include <cuda_fp8.h>
#include <transformer_engine/multi_tensor.h>
#include <transformer_engine/multi_tensor.h>
#include <transformer_engine/transformer_engine.h>
#include <transformer_engine/transformer_engine.h>
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment