Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
OpenDAS
TransformerEngine
Commits
0d874a4e
Commit
0d874a4e
authored
Mar 03, 2026
by
wenjh
Browse files
Merge branch 'nv_main' of v2.12
parents
a68e5f87
dfdd3820
Changes
646
Show whitespace changes
Inline
Side-by-side
Showing
20 changed files
with
35 additions
and
40 deletions
+35
-40
qa/L0_pytorch_debug_unittest/test.sh
qa/L0_pytorch_debug_unittest/test.sh
+1
-6
qa/L0_pytorch_lint/test.sh
qa/L0_pytorch_lint/test.sh
+1
-1
qa/L0_pytorch_unittest/test.sh
qa/L0_pytorch_unittest/test.sh
+3
-2
qa/L0_pytorch_wheel/test.sh
qa/L0_pytorch_wheel/test.sh
+1
-1
qa/L1_cpp_distributed/test.sh
qa/L1_cpp_distributed/test.sh
+1
-1
qa/L1_jax_distributed_unittest/test.sh
qa/L1_jax_distributed_unittest/test.sh
+4
-1
qa/L1_pytorch_distributed_unittest/test.sh
qa/L1_pytorch_distributed_unittest/test.sh
+2
-8
qa/L1_pytorch_mcore_integration/test.sh
qa/L1_pytorch_mcore_integration/test.sh
+1
-1
qa/L1_pytorch_onnx_unittest/test.sh
qa/L1_pytorch_onnx_unittest/test.sh
+1
-5
qa/L1_pytorch_thunder_integration/test.sh
qa/L1_pytorch_thunder_integration/test.sh
+1
-1
qa/L2_jax_distributed_unittest/test.sh
qa/L2_jax_distributed_unittest/test.sh
+4
-1
qa/L2_jax_unittest/test.sh
qa/L2_jax_unittest/test.sh
+4
-1
qa/L3_pytorch_FA_versions_test/test.sh
qa/L3_pytorch_FA_versions_test/test.sh
+4
-4
qa/format.sh
qa/format.sh
+1
-1
setup.py
setup.py
+1
-1
tests/cpp/CMakeLists.txt
tests/cpp/CMakeLists.txt
+1
-1
tests/cpp/operator/CMakeLists.txt
tests/cpp/operator/CMakeLists.txt
+1
-1
tests/cpp/operator/test_act.cu
tests/cpp/operator/test_act.cu
+1
-1
tests/cpp/operator/test_cast.cu
tests/cpp/operator/test_cast.cu
+1
-1
tests/cpp/operator/test_cast_current_scaling.cu
tests/cpp/operator/test_cast_current_scaling.cu
+1
-1
No files found.
qa/L0_pytorch_debug_unittest/test.sh
View file @
0d874a4e
# Copyright (c) 2022-202
5
, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
# Copyright (c) 2022-202
6
, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
#
# See LICENSE for license information.
...
...
@@ -26,11 +26,6 @@ mkdir -p "$XML_LOG_DIR"
# Nvinspect will be disabled if no feature is active.
:
${
NVTE_TEST_NVINSPECT_DUMMY_CONFIG_FILE
:
=
$TE_PATH
/tests/pytorch/debug/test_configs/dummy_feature.yaml
}
# It is not installed as a requirement,
# because it is not available on PyPI.
pip uninstall
-y
nvdlfw-inspect
pip
install
git+https://github.com/NVIDIA/nvidia-dlfw-inspect.git
pip
install
pytest
==
8.2.1
||
error_exit
"Failed to install pytest"
pytest
-v
-s
--junitxml
=
$XML_LOG_DIR
/test_sanity.xml
$TE_PATH
/tests/pytorch/debug/test_sanity.py
--feature_dirs
=
$NVTE_TEST_NVINSPECT_FEATURE_DIRS
||
test_fail
"test_sanity.py"
...
...
qa/L0_pytorch_lint/test.sh
View file @
0d874a4e
# Copyright (c) 2022-202
5
, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
# Copyright (c) 2022-202
6
, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
#
# See LICENSE for license information.
...
...
qa/L0_pytorch_unittest/test.sh
View file @
0d874a4e
# Copyright (c) 2022-202
5
, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
# Copyright (c) 2022-202
6
, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
#
# See LICENSE for license information.
...
...
@@ -33,7 +33,7 @@ ROCBLAS_ATOMICS_MOD=0 HIPBLASLT_ATOMICS_MOD=0 PYTORCH_JIT=0 NVTE_TORCH_COMPILE=0
python3
-m
pytest
--tb
=
auto
--junitxml
=
$XML_LOG_DIR
/pytest_test_jit.xml
$TE_PATH
/tests/pytorch/test_jit.py
||
test_fail
"test_jit.py"
python3
-m
pytest
--tb
=
auto
--junitxml
=
$XML_LOG_DIR
/pytest_test_fused_rope.xml
$TE_PATH
/tests/pytorch/test_fused_rope.py
||
test_fail
"test_fused_rope.py"
python3
-m
pytest
--tb
=
auto
--junitxml
=
$XML_LOG_DIR
/pytest_test_nvfp4.xml
$TE_PATH
/tests/pytorch/nvfp4
||
test_fail
"test_nvfp4"
python3
-m
pytest
--tb
=
auto
--junitxml
=
$XML_LOG_DIR
/pytest_test_
float8
tensor.xml
$TE_PATH
/tests/pytorch/test_
float8
tensor.py
||
test_fail
"test_
float8
tensor.py"
python3
-m
pytest
--tb
=
auto
--junitxml
=
$XML_LOG_DIR
/pytest_test_
quantized_
tensor.xml
$TE_PATH
/tests/pytorch/test_
quantized_
tensor.py
||
test_fail
"test_
quantized_
tensor.py"
python3
-m
pytest
--tb
=
auto
--junitxml
=
$XML_LOG_DIR
/pytest_test_float8blockwisetensor.xml
$TE_PATH
/tests/pytorch/test_float8blockwisetensor.py
||
test_fail
"test_float8blockwisetensor.py"
python3
-m
pytest
--tb
=
auto
--junitxml
=
$XML_LOG_DIR
/pytest_test_float8_blockwise_scaling_exact.xml
$TE_PATH
/tests/pytorch/test_float8_blockwise_scaling_exact.py
||
test_fail
"test_float8_blockwise_scaling_exact.py"
NVTE_INT8_SIM_FP8
=
1 python3
-m
pytest
-v
-s
--junitxml
=
$XML_LOG_DIR
/pytest_test_float8_blockwise_gemm_exact_int8.xml
$TE_PATH
/tests/pytorch/test_float8_blockwise_gemm_exact.py
||
test_fail
"test_float8_blockwise_gemm_exact.py_int8"
...
...
@@ -57,6 +57,7 @@ mkdir -p $TE_PATH/artifacts/tests/pytorch/test_checkpoint && python $TE_PATH/tes
NVTE_TEST_CHECKPOINT_ARTIFACT_PATH
=
$TE_PATH
/artifacts/tests/pytorch/test_checkpoint python3
-m
pytest
--tb
=
auto
--junitxml
=
$XML_LOG_DIR
/pytest_test_checkpoint.xml
$TE_PATH
/tests/pytorch/test_checkpoint.py
||
test_fail
"test_checkpoint.py"
python3
-m
pytest
--tb
=
auto
--junitxml
=
$XML_LOG_DIR
/pytest_test_batched_linear.xml
$TE_PATH
/tests/pytorch/test_batched_linear.py
||
test_fail
"test_batched_linear.py"
python3
-m
pytest
--tb
=
auto
--junitxml
=
$XML_LOG_DIR
/pytest_test_fused_router.xml
$TE_PATH
/tests/pytorch/test_fused_router.py
||
test_fail
"test_fused_router.py"
python3
-m
pytest
--tb
=
auto
--junitxml
=
$XML_LOG_DIR
/pytest_test_partial_cast.xml
$TE_PATH
/tests/pytorch/test_partial_cast.py
||
test_fail
"test_partial_cast.py"
if
[
"
$RET
"
-ne
0
]
;
then
echo
"Error in the following test cases:
$FAILED_CASES
"
...
...
qa/L0_pytorch_wheel/test.sh
View file @
0d874a4e
# Copyright (c) 2022-202
5
, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
# Copyright (c) 2022-202
6
, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
#
# See LICENSE for license information.
...
...
qa/L1_cpp_distributed/test.sh
View file @
0d874a4e
# Copyright (c) 2022-202
5
, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
# Copyright (c) 2022-202
6
, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
#
# See LICENSE for license information.
...
...
qa/L1_jax_distributed_unittest/test.sh
View file @
0d874a4e
# Copyright (c) 2022-202
5
, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
# Copyright (c) 2022-202
6
, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
#
# See LICENSE for license information.
export
TRITON_PTXAS_PATH
=
/usr/local/cuda/bin/ptxas
function
test_fail
()
{
RET
=
1
...
...
@@ -11,6 +12,8 @@ function test_fail() {
RET
=
0
FAILED_CASES
=
""
export
NVTE_JAX_TEST_TIMING
=
1
:
${
TE_PATH
:
=/opt/transformerengine
}
:
${
XML_LOG_DIR
:
=/logs
}
mkdir
-p
"
$XML_LOG_DIR
"
...
...
qa/L1_pytorch_distributed_unittest/test.sh
View file @
0d874a4e
# Copyright (c) 2022-202
5
, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
# Copyright (c) 2022-202
6
, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
#
# See LICENSE for license information.
...
...
@@ -20,12 +20,6 @@ FAILED_CASES=""
:
${
XML_LOG_DIR
:
=/logs
}
mkdir
-p
"
$XML_LOG_DIR
"
# It is not installed as a requirement,
# because it is not available on PyPI.
pip uninstall
-y
nvdlfw-inspect
pip
install
git+https://github.com/NVIDIA/nvidia-dlfw-inspect.git
pip3
install
pytest
==
8.2.1
||
error_exit
"Failed to install pytest"
python3
-m
pytest
-v
-s
--junitxml
=
$XML_LOG_DIR
/pytest_test_sanity.xml
$TE_PATH
/tests/pytorch/distributed/test_sanity.py
||
test_fail
"test_sanity.py"
...
...
@@ -51,7 +45,7 @@ python3 -m pytest -v -s --junitxml=$XML_LOG_DIR/pytest_test_cast_master_weights_
pytest
-v
-s
--junitxml
=
$XML_LOG_DIR
/pytest_test_distributed.xml
$TE_PATH
/tests/pytorch/debug/test_distributed.py
--feature_dirs
=
$NVTE_TEST_NVINSPECT_FEATURE_DIRS
||
test_fail
"debug test_distributed.py"
# standard numerics tests with initialized debug
NVTE_TEST_NVINSPECT_ENABLED
=
True
NVTE_TEST_NVINSPECT_CONFIG_FILE
=
$NVTE_TEST_NVINSPECT_DUMMY_CONFIG_FILE
NVTE_TEST_NVINSPECT_FEATURE_DIRS
=
$NVTE_TEST_NVINSPECT_FEATURE_DIRS
pytest
-v
-s
--junitxml
=
$XML_LOG_DIR
/pytest_test_numerics_2.xml
$TE_PATH
/tests/pytorch/distributed/test_numerics.py
||
test_fail
"debug test_numerics.py"
NVTE_TEST_NVINSPECT_ENABLED
=
1
NVTE_TEST_NVINSPECT_CONFIG_FILE
=
$NVTE_TEST_NVINSPECT_DUMMY_CONFIG_FILE
NVTE_TEST_NVINSPECT_FEATURE_DIRS
=
$NVTE_TEST_NVINSPECT_FEATURE_DIRS
pytest
-v
-s
--junitxml
=
$XML_LOG_DIR
/pytest_test_numerics_2.xml
$TE_PATH
/tests/pytorch/distributed/test_numerics.py
||
test_fail
"debug test_numerics.py"
if
[
"
$RET
"
-ne
0
]
;
then
echo
"Error in the following test cases:
$FAILED_CASES
"
...
...
qa/L1_pytorch_mcore_integration/test.sh
View file @
0d874a4e
# Copyright (c) 2022-202
5
, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
# Copyright (c) 2022-202
6
, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
#
# See LICENSE for license information.
...
...
qa/L1_pytorch_onnx_unittest/test.sh
View file @
0d874a4e
# Copyright (c) 2022-202
5
, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
# Copyright (c) 2022-202
6
, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
#
# See LICENSE for license information.
pip3
install
onnxruntime
pip3
install
onnxruntime_extensions
:
${
TE_PATH
:
=/opt/transformerengine
}
:
${
XML_LOG_DIR
:
=/logs
}
mkdir
-p
"
$XML_LOG_DIR
"
...
...
qa/L1_pytorch_thunder_integration/test.sh
View file @
0d874a4e
# Copyright (c) 2022-202
5
, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
# Copyright (c) 2022-202
6
, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
#
# See LICENSE for license information.
...
...
qa/L2_jax_distributed_unittest/test.sh
View file @
0d874a4e
# Copyright (c) 2022-202
5
, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
# Copyright (c) 2022-202
6
, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
#
# See LICENSE for license information.
export
TRITON_PTXAS_PATH
=
/usr/local/cuda/bin/ptxas
set
-xe
export
NVTE_JAX_TEST_TIMING
=
1
:
${
TE_PATH
:
=/opt/transformerengine
}
:
${
XML_LOG_DIR
:
=/logs
}
mkdir
-p
"
$XML_LOG_DIR
"
...
...
qa/L2_jax_unittest/test.sh
View file @
0d874a4e
# Copyright (c) 2022-202
5
, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
# Copyright (c) 2022-202
6
, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
#
# See LICENSE for license information.
export
TRITON_PTXAS_PATH
=
/usr/local/cuda/bin/ptxas
set
-x
...
...
@@ -18,6 +19,8 @@ function test_fail() {
RET
=
0
FAILED_CASES
=
""
export
NVTE_JAX_TEST_TIMING
=
1
pip3
install
"nltk>=3.8.2"
||
error_exit
"Failed to install nltk"
pip3
install
pytest
==
8.2.1
||
error_exit
"Failed to install pytest"
...
...
qa/L3_pytorch_FA_versions_test/test.sh
View file @
0d874a4e
# Copyright (c) 2022-202
5
, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
# Copyright (c) 2022-202
6
, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
#
# See LICENSE for license information.
...
...
@@ -30,13 +30,13 @@ do
# Build Flash Attention
if
[
"
${
fa_version
}
"
\<
"3.0.0"
]
then
pip3
install
flash-attn
==
${
fa_version
}
pip3
install
flash-attn
==
${
fa_version
}
--no-build-isolation
else
git clone https://github.com/Dao-AILab/flash-attention.git
cd
flash-attention/
&&
git checkout 27f501d
&&
cd
hopper
/
&&
python setup.py
install
cd
flash-attention/hopper
&&
python setup.py
install
python_path
=
`
python
-c
"import site; print(site.getsitepackages()[0])"
`
mkdir
-p
$python_path
/flash_attn_3
wget
-P
$python_path
/flash_attn_3 https://raw.githubusercontent.com/Dao-AILab/flash-attention/27f501dbe011f4371bff938fe7e09311ab3002fa/hopper/flash_attn_interface.py
cp
flash_attn_interface.py
$python_path
/flash_attn_3/
cd
../../
fi
...
...
qa/format.sh
View file @
0d874a4e
# Copyright (c) 2022-202
5
, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
# Copyright (c) 2022-202
6
, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
#
# See LICENSE for license information.
...
...
setup.py
View file @
0d874a4e
# Copyright (c) 2022-202
5
, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
# Copyright (c) 2022-202
6
, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
#
# See LICENSE for license information.
...
...
tests/cpp/CMakeLists.txt
View file @
0d874a4e
# Copyright (c) 2022-202
5
, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
# Copyright (c) 2022-202
6
, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
#
# See LICENSE for license information.
...
...
tests/cpp/operator/CMakeLists.txt
View file @
0d874a4e
# Copyright (c) 2022-202
5
, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
# Copyright (c) 2022-202
6
, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
#
# See LICENSE for license information.
...
...
tests/cpp/operator/test_act.cu
View file @
0d874a4e
/*************************************************************************
* Copyright (c) 2022-202
5
, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
* Copyright (c) 2022-202
6
, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
*
* See LICENSE for license information.
************************************************************************/
...
...
tests/cpp/operator/test_cast.cu
View file @
0d874a4e
/*************************************************************************
* Copyright (c) 2022-202
5
, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
* Copyright (c) 2022-202
6
, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
*
* See LICENSE for license information.
************************************************************************/
...
...
tests/cpp/operator/test_cast_current_scaling.cu
View file @
0d874a4e
/*************************************************************************
* Copyright (c) 2022-202
5
, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
* Copyright (c) 2022-202
6
, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
*
* See LICENSE for license information.
************************************************************************/
...
...
Prev
1
…
3
4
5
6
7
8
9
10
11
…
33
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment