Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
chenpangpang
transformers
Commits
476890e9
Unverified
Commit
476890e9
authored
May 28, 2024
by
Jonny Li
Committed by
GitHub
May 28, 2024
Browse files
Fix DeepSpeed compatibility with weight_norm (#30881) (#31018)
parent
aada568f
Changes
10
Show whitespace changes
Inline
Side-by-side
Showing
10 changed files
with
80 additions
and
20 deletions
+80
-20
src/transformers/models/hubert/modeling_hubert.py
src/transformers/models/hubert/modeling_hubert.py
+8
-2
src/transformers/models/seamless_m4t/modeling_seamless_m4t.py
...transformers/models/seamless_m4t/modeling_seamless_m4t.py
+8
-2
src/transformers/models/sew/modeling_sew.py
src/transformers/models/sew/modeling_sew.py
+8
-2
src/transformers/models/sew_d/modeling_sew_d.py
src/transformers/models/sew_d/modeling_sew_d.py
+8
-2
src/transformers/models/speecht5/modeling_speecht5.py
src/transformers/models/speecht5/modeling_speecht5.py
+8
-2
src/transformers/models/unispeech/modeling_unispeech.py
src/transformers/models/unispeech/modeling_unispeech.py
+8
-2
src/transformers/models/unispeech_sat/modeling_unispeech_sat.py
...ansformers/models/unispeech_sat/modeling_unispeech_sat.py
+8
-2
src/transformers/models/wav2vec2/modeling_wav2vec2.py
src/transformers/models/wav2vec2/modeling_wav2vec2.py
+8
-2
src/transformers/models/wav2vec2_conformer/modeling_wav2vec2_conformer.py
.../models/wav2vec2_conformer/modeling_wav2vec2_conformer.py
+8
-2
src/transformers/models/wavlm/modeling_wavlm.py
src/transformers/models/wavlm/modeling_wavlm.py
+8
-2
No files found.
src/transformers/models/hubert/modeling_hubert.py
View file @
476890e9
...
...
@@ -295,8 +295,14 @@ class HubertPositionalConvEmbedding(nn.Module):
with
deepspeed
.
zero
.
GatheredParameters
(
self
.
conv
.
weight
,
modifier_rank
=
0
):
self
.
conv
=
weight_norm
(
self
.
conv
,
name
=
"weight"
,
dim
=
2
)
deepspeed
.
zero
.
register_external_parameter
(
self
,
self
.
conv
.
weight_v
)
deepspeed
.
zero
.
register_external_parameter
(
self
,
self
.
conv
.
weight_g
)
if
hasattr
(
self
.
conv
,
"parametrizations"
):
weight_g
=
self
.
conv
.
parametrizations
.
weight
.
original0
weight_v
=
self
.
conv
.
parametrizations
.
weight
.
original1
else
:
weight_g
=
self
.
conv
.
weight_g
weight_v
=
self
.
conv
.
weight_v
deepspeed
.
zero
.
register_external_parameter
(
self
,
weight_v
)
deepspeed
.
zero
.
register_external_parameter
(
self
,
weight_g
)
else
:
self
.
conv
=
weight_norm
(
self
.
conv
,
name
=
"weight"
,
dim
=
2
)
...
...
src/transformers/models/seamless_m4t/modeling_seamless_m4t.py
View file @
476890e9
...
...
@@ -325,8 +325,14 @@ class SeamlessM4TConformerPositionalConvEmbedding(nn.Module):
with
deepspeed
.
zero
.
GatheredParameters
(
self
.
conv
.
weight
,
modifier_rank
=
0
):
self
.
conv
=
weight_norm
(
self
.
conv
,
name
=
"weight"
,
dim
=
2
)
deepspeed
.
zero
.
register_external_parameter
(
self
,
self
.
conv
.
weight_v
)
deepspeed
.
zero
.
register_external_parameter
(
self
,
self
.
conv
.
weight_g
)
if
hasattr
(
self
.
conv
,
"parametrizations"
):
weight_g
=
self
.
conv
.
parametrizations
.
weight
.
original0
weight_v
=
self
.
conv
.
parametrizations
.
weight
.
original1
else
:
weight_g
=
self
.
conv
.
weight_g
weight_v
=
self
.
conv
.
weight_v
deepspeed
.
zero
.
register_external_parameter
(
self
,
weight_v
)
deepspeed
.
zero
.
register_external_parameter
(
self
,
weight_g
)
else
:
self
.
conv
=
weight_norm
(
self
.
conv
,
name
=
"weight"
,
dim
=
2
)
...
...
src/transformers/models/sew/modeling_sew.py
View file @
476890e9
...
...
@@ -294,8 +294,14 @@ class SEWPositionalConvEmbedding(nn.Module):
with
deepspeed
.
zero
.
GatheredParameters
(
self
.
conv
.
weight
,
modifier_rank
=
0
):
self
.
conv
=
nn
.
utils
.
weight_norm
(
self
.
conv
,
name
=
"weight"
,
dim
=
2
)
deepspeed
.
zero
.
register_external_parameter
(
self
,
self
.
conv
.
weight_v
)
deepspeed
.
zero
.
register_external_parameter
(
self
,
self
.
conv
.
weight_g
)
if
hasattr
(
self
.
conv
,
"parametrizations"
):
weight_g
=
self
.
conv
.
parametrizations
.
weight
.
original0
weight_v
=
self
.
conv
.
parametrizations
.
weight
.
original1
else
:
weight_g
=
self
.
conv
.
weight_g
weight_v
=
self
.
conv
.
weight_v
deepspeed
.
zero
.
register_external_parameter
(
self
,
weight_v
)
deepspeed
.
zero
.
register_external_parameter
(
self
,
weight_g
)
else
:
self
.
conv
=
nn
.
utils
.
weight_norm
(
self
.
conv
,
name
=
"weight"
,
dim
=
2
)
...
...
src/transformers/models/sew_d/modeling_sew_d.py
View file @
476890e9
...
...
@@ -354,8 +354,14 @@ class SEWDPositionalConvEmbedding(nn.Module):
with
deepspeed
.
zero
.
GatheredParameters
(
self
.
conv
.
weight
,
modifier_rank
=
0
):
self
.
conv
=
nn
.
utils
.
weight_norm
(
self
.
conv
,
name
=
"weight"
,
dim
=
2
)
deepspeed
.
zero
.
register_external_parameter
(
self
,
self
.
conv
.
weight_v
)
deepspeed
.
zero
.
register_external_parameter
(
self
,
self
.
conv
.
weight_g
)
if
hasattr
(
self
.
conv
,
"parametrizations"
):
weight_g
=
self
.
conv
.
parametrizations
.
weight
.
original0
weight_v
=
self
.
conv
.
parametrizations
.
weight
.
original1
else
:
weight_g
=
self
.
conv
.
weight_g
weight_v
=
self
.
conv
.
weight_v
deepspeed
.
zero
.
register_external_parameter
(
self
,
weight_v
)
deepspeed
.
zero
.
register_external_parameter
(
self
,
weight_g
)
else
:
self
.
conv
=
nn
.
utils
.
weight_norm
(
self
.
conv
,
name
=
"weight"
,
dim
=
2
)
...
...
src/transformers/models/speecht5/modeling_speecht5.py
View file @
476890e9
...
...
@@ -368,8 +368,14 @@ class SpeechT5PositionalConvEmbedding(nn.Module):
with
deepspeed
.
zero
.
GatheredParameters
(
self
.
conv
.
weight
,
modifier_rank
=
0
):
self
.
conv
=
weight_norm
(
self
.
conv
,
name
=
"weight"
,
dim
=
2
)
deepspeed
.
zero
.
register_external_parameter
(
self
,
self
.
conv
.
weight_v
)
deepspeed
.
zero
.
register_external_parameter
(
self
,
self
.
conv
.
weight_g
)
if
hasattr
(
self
.
conv
,
"parametrizations"
):
weight_g
=
self
.
conv
.
parametrizations
.
weight
.
original0
weight_v
=
self
.
conv
.
parametrizations
.
weight
.
original1
else
:
weight_g
=
self
.
conv
.
weight_g
weight_v
=
self
.
conv
.
weight_v
deepspeed
.
zero
.
register_external_parameter
(
self
,
weight_v
)
deepspeed
.
zero
.
register_external_parameter
(
self
,
weight_g
)
else
:
self
.
conv
=
weight_norm
(
self
.
conv
,
name
=
"weight"
,
dim
=
2
)
...
...
src/transformers/models/unispeech/modeling_unispeech.py
View file @
476890e9
...
...
@@ -330,8 +330,14 @@ class UniSpeechPositionalConvEmbedding(nn.Module):
with
deepspeed
.
zero
.
GatheredParameters
(
self
.
conv
.
weight
,
modifier_rank
=
0
):
self
.
conv
=
weight_norm
(
self
.
conv
,
name
=
"weight"
,
dim
=
2
)
deepspeed
.
zero
.
register_external_parameter
(
self
,
self
.
conv
.
weight_v
)
deepspeed
.
zero
.
register_external_parameter
(
self
,
self
.
conv
.
weight_g
)
if
hasattr
(
self
.
conv
,
"parametrizations"
):
weight_g
=
self
.
conv
.
parametrizations
.
weight
.
original0
weight_v
=
self
.
conv
.
parametrizations
.
weight
.
original1
else
:
weight_g
=
self
.
conv
.
weight_g
weight_v
=
self
.
conv
.
weight_v
deepspeed
.
zero
.
register_external_parameter
(
self
,
weight_v
)
deepspeed
.
zero
.
register_external_parameter
(
self
,
weight_g
)
else
:
self
.
conv
=
weight_norm
(
self
.
conv
,
name
=
"weight"
,
dim
=
2
)
...
...
src/transformers/models/unispeech_sat/modeling_unispeech_sat.py
View file @
476890e9
...
...
@@ -347,8 +347,14 @@ class UniSpeechSatPositionalConvEmbedding(nn.Module):
with
deepspeed
.
zero
.
GatheredParameters
(
self
.
conv
.
weight
,
modifier_rank
=
0
):
self
.
conv
=
weight_norm
(
self
.
conv
,
name
=
"weight"
,
dim
=
2
)
deepspeed
.
zero
.
register_external_parameter
(
self
,
self
.
conv
.
weight_v
)
deepspeed
.
zero
.
register_external_parameter
(
self
,
self
.
conv
.
weight_g
)
if
hasattr
(
self
.
conv
,
"parametrizations"
):
weight_g
=
self
.
conv
.
parametrizations
.
weight
.
original0
weight_v
=
self
.
conv
.
parametrizations
.
weight
.
original1
else
:
weight_g
=
self
.
conv
.
weight_g
weight_v
=
self
.
conv
.
weight_v
deepspeed
.
zero
.
register_external_parameter
(
self
,
weight_v
)
deepspeed
.
zero
.
register_external_parameter
(
self
,
weight_g
)
else
:
self
.
conv
=
weight_norm
(
self
.
conv
,
name
=
"weight"
,
dim
=
2
)
...
...
src/transformers/models/wav2vec2/modeling_wav2vec2.py
View file @
476890e9
...
...
@@ -398,8 +398,14 @@ class Wav2Vec2PositionalConvEmbedding(nn.Module):
with
deepspeed
.
zero
.
GatheredParameters
(
self
.
conv
.
weight
,
modifier_rank
=
0
):
self
.
conv
=
weight_norm
(
self
.
conv
,
name
=
"weight"
,
dim
=
2
)
deepspeed
.
zero
.
register_external_parameter
(
self
,
self
.
conv
.
weight_v
)
deepspeed
.
zero
.
register_external_parameter
(
self
,
self
.
conv
.
weight_g
)
if
hasattr
(
self
.
conv
,
"parametrizations"
):
weight_g
=
self
.
conv
.
parametrizations
.
weight
.
original0
weight_v
=
self
.
conv
.
parametrizations
.
weight
.
original1
else
:
weight_g
=
self
.
conv
.
weight_g
weight_v
=
self
.
conv
.
weight_v
deepspeed
.
zero
.
register_external_parameter
(
self
,
weight_v
)
deepspeed
.
zero
.
register_external_parameter
(
self
,
weight_g
)
else
:
self
.
conv
=
weight_norm
(
self
.
conv
,
name
=
"weight"
,
dim
=
2
)
...
...
src/transformers/models/wav2vec2_conformer/modeling_wav2vec2_conformer.py
View file @
476890e9
...
...
@@ -361,8 +361,14 @@ class Wav2Vec2ConformerPositionalConvEmbedding(nn.Module):
with
deepspeed
.
zero
.
GatheredParameters
(
self
.
conv
.
weight
,
modifier_rank
=
0
):
self
.
conv
=
weight_norm
(
self
.
conv
,
name
=
"weight"
,
dim
=
2
)
deepspeed
.
zero
.
register_external_parameter
(
self
,
self
.
conv
.
weight_v
)
deepspeed
.
zero
.
register_external_parameter
(
self
,
self
.
conv
.
weight_g
)
if
hasattr
(
self
.
conv
,
"parametrizations"
):
weight_g
=
self
.
conv
.
parametrizations
.
weight
.
original0
weight_v
=
self
.
conv
.
parametrizations
.
weight
.
original1
else
:
weight_g
=
self
.
conv
.
weight_g
weight_v
=
self
.
conv
.
weight_v
deepspeed
.
zero
.
register_external_parameter
(
self
,
weight_v
)
deepspeed
.
zero
.
register_external_parameter
(
self
,
weight_g
)
else
:
self
.
conv
=
weight_norm
(
self
.
conv
,
name
=
"weight"
,
dim
=
2
)
...
...
src/transformers/models/wavlm/modeling_wavlm.py
View file @
476890e9
...
...
@@ -287,8 +287,14 @@ class WavLMPositionalConvEmbedding(nn.Module):
with
deepspeed
.
zero
.
GatheredParameters
(
self
.
conv
.
weight
,
modifier_rank
=
0
):
self
.
conv
=
weight_norm
(
self
.
conv
,
name
=
"weight"
,
dim
=
2
)
deepspeed
.
zero
.
register_external_parameter
(
self
,
self
.
conv
.
weight_v
)
deepspeed
.
zero
.
register_external_parameter
(
self
,
self
.
conv
.
weight_g
)
if
hasattr
(
self
.
conv
,
"parametrizations"
):
weight_g
=
self
.
conv
.
parametrizations
.
weight
.
original0
weight_v
=
self
.
conv
.
parametrizations
.
weight
.
original1
else
:
weight_g
=
self
.
conv
.
weight_g
weight_v
=
self
.
conv
.
weight_v
deepspeed
.
zero
.
register_external_parameter
(
self
,
weight_v
)
deepspeed
.
zero
.
register_external_parameter
(
self
,
weight_g
)
else
:
self
.
conv
=
weight_norm
(
self
.
conv
,
name
=
"weight"
,
dim
=
2
)
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment