Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
renzhc
diffusers_dcu
Commits
a4f9c3cb
Unverified
Commit
a4f9c3cb
authored
Apr 24, 2025
by
Ishan Modi
Committed by
GitHub
Apr 23, 2025
Browse files
[Feature] Added Xlab Controlnet support (#11249)
update
parent
4b60f4b6
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
29 additions
and
22 deletions
+29
-22
src/diffusers/pipelines/flux/pipeline_flux_controlnet_image_to_image.py
...pipelines/flux/pipeline_flux_controlnet_image_to_image.py
+29
-22
No files found.
src/diffusers/pipelines/flux/pipeline_flux_controlnet_image_to_image.py
View file @
a4f9c3cb
...
@@ -800,17 +800,20 @@ class FluxControlNetImg2ImgPipeline(DiffusionPipeline, FluxLoraLoaderMixin, From
...
@@ -800,17 +800,20 @@ class FluxControlNetImg2ImgPipeline(DiffusionPipeline, FluxLoraLoaderMixin, From
)
)
height
,
width
=
control_image
.
shape
[
-
2
:]
height
,
width
=
control_image
.
shape
[
-
2
:]
control_image
=
retrieve_latents
(
self
.
vae
.
encode
(
control_image
),
generator
=
generator
)
# xlab controlnet has a input_hint_block and instantx controlnet does not
control_image
=
(
control_image
-
self
.
vae
.
config
.
shift_factor
)
*
self
.
vae
.
config
.
scaling_factor
controlnet_blocks_repeat
=
False
if
self
.
controlnet
.
input_hint_block
is
None
else
True
if
self
.
controlnet
.
input_hint_block
is
None
:
height_control_image
,
width_control_image
=
control_image
.
shape
[
2
:]
control_image
=
retrieve_latents
(
self
.
vae
.
encode
(
control_image
),
generator
=
generator
)
control_image
=
self
.
_pack_latents
(
control_image
=
(
control_image
-
self
.
vae
.
config
.
shift_factor
)
*
self
.
vae
.
config
.
scaling_factor
control_image
,
batch_size
*
num_images_per_prompt
,
height_control_image
,
width_control_image
=
control_image
.
shape
[
2
:]
num_channels_latents
,
control_image
=
self
.
_pack_latents
(
height_control_image
,
control_image
,
width_control_image
,
batch_size
*
num_images_per_prompt
,
)
num_channels_latents
,
height_control_image
,
width_control_image
,
)
if
control_mode
is
not
None
:
if
control_mode
is
not
None
:
control_mode
=
torch
.
tensor
(
control_mode
).
to
(
device
,
dtype
=
torch
.
long
)
control_mode
=
torch
.
tensor
(
control_mode
).
to
(
device
,
dtype
=
torch
.
long
)
...
@@ -819,7 +822,9 @@ class FluxControlNetImg2ImgPipeline(DiffusionPipeline, FluxLoraLoaderMixin, From
...
@@ -819,7 +822,9 @@ class FluxControlNetImg2ImgPipeline(DiffusionPipeline, FluxLoraLoaderMixin, From
elif
isinstance
(
self
.
controlnet
,
FluxMultiControlNetModel
):
elif
isinstance
(
self
.
controlnet
,
FluxMultiControlNetModel
):
control_images
=
[]
control_images
=
[]
for
control_image_
in
control_image
:
# xlab controlnet has a input_hint_block and instantx controlnet does not
controlnet_blocks_repeat
=
False
if
self
.
controlnet
.
nets
[
0
].
input_hint_block
is
None
else
True
for
i
,
control_image_
in
enumerate
(
control_image
):
control_image_
=
self
.
prepare_image
(
control_image_
=
self
.
prepare_image
(
image
=
control_image_
,
image
=
control_image_
,
width
=
width
,
width
=
width
,
...
@@ -831,17 +836,18 @@ class FluxControlNetImg2ImgPipeline(DiffusionPipeline, FluxLoraLoaderMixin, From
...
@@ -831,17 +836,18 @@ class FluxControlNetImg2ImgPipeline(DiffusionPipeline, FluxLoraLoaderMixin, From
)
)
height
,
width
=
control_image_
.
shape
[
-
2
:]
height
,
width
=
control_image_
.
shape
[
-
2
:]
control_image_
=
retrieve_latents
(
self
.
vae
.
encode
(
control_image_
),
generator
=
generator
)
if
self
.
controlnet
.
nets
[
0
].
input_hint_block
is
None
:
control_image_
=
(
control_image_
-
self
.
vae
.
config
.
shift_factor
)
*
self
.
vae
.
config
.
scaling_factor
control_image_
=
retrieve_latents
(
self
.
vae
.
encode
(
control_image_
),
generator
=
generator
)
control_image_
=
(
control_image_
-
self
.
vae
.
config
.
shift_factor
)
*
self
.
vae
.
config
.
scaling_factor
height_control_image
,
width_control_image
=
control_image_
.
shape
[
2
:]
height_control_image
,
width_control_image
=
control_image_
.
shape
[
2
:]
control_image_
=
self
.
_pack_latents
(
control_image_
=
self
.
_pack_latents
(
control_image_
,
control_image_
,
batch_size
*
num_images_per_prompt
,
batch_size
*
num_images_per_prompt
,
num_channels_latents
,
num_channels_latents
,
height_control_image
,
height_control_image
,
width_control_image
,
width_control_image
,
)
)
control_images
.
append
(
control_image_
)
control_images
.
append
(
control_image_
)
...
@@ -955,6 +961,7 @@ class FluxControlNetImg2ImgPipeline(DiffusionPipeline, FluxLoraLoaderMixin, From
...
@@ -955,6 +961,7 @@ class FluxControlNetImg2ImgPipeline(DiffusionPipeline, FluxLoraLoaderMixin, From
img_ids
=
latent_image_ids
,
img_ids
=
latent_image_ids
,
joint_attention_kwargs
=
self
.
joint_attention_kwargs
,
joint_attention_kwargs
=
self
.
joint_attention_kwargs
,
return_dict
=
False
,
return_dict
=
False
,
controlnet_blocks_repeat
=
controlnet_blocks_repeat
,
)[
0
]
)[
0
]
latents_dtype
=
latents
.
dtype
latents_dtype
=
latents
.
dtype
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment