Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
renzhc
diffusers_dcu
Commits
92fe689f
"docs/vscode:/vscode.git/clone" did not exist on "7ebd359446c2cb31bfbbbd98046cd916de8bdc7b"
Unverified
Commit
92fe689f
authored
May 09, 2025
by
Aryan
Committed by
GitHub
May 09, 2025
Browse files
Change Framepack transformer layer initialization order (#11535)
update
parent
0ba1f76d
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
10 additions
and
7 deletions
+10
-7
src/diffusers/models/transformers/transformer_hunyuan_video_framepack.py
...odels/transformers/transformer_hunyuan_video_framepack.py
+10
-7
No files found.
src/diffusers/models/transformers/transformer_hunyuan_video_framepack.py
View file @
92fe689f
...
@@ -152,9 +152,19 @@ class HunyuanVideoFramepackTransformer3DModel(
...
@@ -152,9 +152,19 @@ class HunyuanVideoFramepackTransformer3DModel(
# 1. Latent and condition embedders
# 1. Latent and condition embedders
self
.
x_embedder
=
HunyuanVideoPatchEmbed
((
patch_size_t
,
patch_size
,
patch_size
),
in_channels
,
inner_dim
)
self
.
x_embedder
=
HunyuanVideoPatchEmbed
((
patch_size_t
,
patch_size
,
patch_size
),
in_channels
,
inner_dim
)
# Framepack history projection embedder
self
.
clean_x_embedder
=
None
if
has_clean_x_embedder
:
self
.
clean_x_embedder
=
HunyuanVideoHistoryPatchEmbed
(
in_channels
,
inner_dim
)
self
.
context_embedder
=
HunyuanVideoTokenRefiner
(
self
.
context_embedder
=
HunyuanVideoTokenRefiner
(
text_embed_dim
,
num_attention_heads
,
attention_head_dim
,
num_layers
=
num_refiner_layers
text_embed_dim
,
num_attention_heads
,
attention_head_dim
,
num_layers
=
num_refiner_layers
)
)
# Framepack image-conditioning embedder
self
.
image_projection
=
FramepackClipVisionProjection
(
image_proj_dim
,
inner_dim
)
if
has_image_proj
else
None
self
.
time_text_embed
=
HunyuanVideoConditionEmbedding
(
self
.
time_text_embed
=
HunyuanVideoConditionEmbedding
(
inner_dim
,
pooled_projection_dim
,
guidance_embeds
,
image_condition_type
inner_dim
,
pooled_projection_dim
,
guidance_embeds
,
image_condition_type
)
)
...
@@ -186,13 +196,6 @@ class HunyuanVideoFramepackTransformer3DModel(
...
@@ -186,13 +196,6 @@ class HunyuanVideoFramepackTransformer3DModel(
self
.
norm_out
=
AdaLayerNormContinuous
(
inner_dim
,
inner_dim
,
elementwise_affine
=
False
,
eps
=
1e-6
)
self
.
norm_out
=
AdaLayerNormContinuous
(
inner_dim
,
inner_dim
,
elementwise_affine
=
False
,
eps
=
1e-6
)
self
.
proj_out
=
nn
.
Linear
(
inner_dim
,
patch_size_t
*
patch_size
*
patch_size
*
out_channels
)
self
.
proj_out
=
nn
.
Linear
(
inner_dim
,
patch_size_t
*
patch_size
*
patch_size
*
out_channels
)
# Framepack specific modules
self
.
image_projection
=
FramepackClipVisionProjection
(
image_proj_dim
,
inner_dim
)
if
has_image_proj
else
None
self
.
clean_x_embedder
=
None
if
has_clean_x_embedder
:
self
.
clean_x_embedder
=
HunyuanVideoHistoryPatchEmbed
(
in_channels
,
inner_dim
)
self
.
use_gradient_checkpointing
=
False
self
.
use_gradient_checkpointing
=
False
def
forward
(
def
forward
(
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment