Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
OpenDAS
TransformerEngine
Commits
40a4d896
Commit
40a4d896
authored Jul 03, 2025 by wenjh
Browse files
Fix kernel crash on block_len=64
Signed-off-by: wenjh <wenjh@sugon.com>
parent
b944277c
Changes
2
Show whitespace changes
Inline
Side-by-side
Showing 2 changed files with 2 additions and 2 deletions
+2
-2
tests/pytorch/distributed/run_cast_master_weights_to_fp8.py
tests/pytorch/distributed/run_cast_master_weights_to_fp8.py
+1
-1
transformer_engine/common/recipe/fp8_block_scaling.cu
transformer_engine/common/recipe/fp8_block_scaling.cu
+1
-1
No files found.
tests/pytorch/distributed/run_cast_master_weights_to_fp8.py
View file @
40a4d896
...
...
@@ -570,7 +570,7 @@ def _test_cast_master_weights_to_fp8(quantization, dp_group):
mock_groups
=
[
dist
.
new_group
(
ranks
=
[
i
])
for
i
in
range
(
world_size
)]
mock_group
=
mock_groups
[
rank
]
linear_kwargs
=
{
"params_dtype"
:
torch
.
bfloat16
,
"bias"
:
False
,
"fuse_wgrad_accumulation"
:
True
}
linear_kwargs
=
{
"params_dtype"
:
torch
.
bfloat16
,
"bias"
:
False
,
"fuse_wgrad_accumulation"
:
False
}
# Create model with FP8 weights
with
te
.
fp8
.
fp8_model_init
(
...
...
transformer_engine/common/recipe/fp8_block_scaling.cu
View file @
40a4d896
...
...
@@ -248,7 +248,7 @@ __global__ void __launch_bounds__(kThreadsPerBlock)
using
transformer_engine
::
Vec
;
static_assert
(
sizeof
(
OType
)
==
1
);
constexpr
int
kNumOutputElemsPerBank
=
4
/
sizeof
(
OType
);
constexpr
int
kNumOutputElemsPerBank
=
2
/
sizeof
(
OType
);
constexpr
int
kThreadsPerWarp
=
32
;
constexpr
int
kLoopsPerRow
=
kTileDim64
/
kThreadsPerWarp
;
constexpr
int
kNumWarps
=
kThreadsPerBlock
/
kThreadsPerWarp
;
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment