# Copyright 2025 The HuggingFace Team. All rights reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

from typing import TYPE_CHECKING

from ..utils import (
    DIFFUSERS_SLOW_IMPORT,
    _LazyModule,
    is_flax_available,
    is_torch_available,
)


# Registry of this package's public names: each key is a dotted submodule path
# and each value is the list of names that submodule provides. It is filled in
# below depending on which backends are available and is finally handed to
# `_LazyModule` at the bottom of the file.
_import_structure = {}

# Torch-backed models. Each entry maps a dotted submodule path to the public
# names it provides. The eager-import branch further down imports exactly the
# same names, so any addition here needs a matching import there.
if is_torch_available():
    _import_structure["adapter"] = ["MultiAdapter", "T2IAdapter"]
    _import_structure["attention_dispatch"] = ["AttentionBackendName", "attention_backend"]
    _import_structure["auto_model"] = ["AutoModel"]
    _import_structure["autoencoders.autoencoder_asym_kl"] = ["AsymmetricAutoencoderKL"]
    _import_structure["autoencoders.autoencoder_dc"] = ["AutoencoderDC"]
    _import_structure["autoencoders.autoencoder_kl"] = ["AutoencoderKL"]
    _import_structure["autoencoders.autoencoder_kl_allegro"] = ["AutoencoderKLAllegro"]
    _import_structure["autoencoders.autoencoder_kl_cogvideox"] = ["AutoencoderKLCogVideoX"]
    _import_structure["autoencoders.autoencoder_kl_cosmos"] = ["AutoencoderKLCosmos"]
    _import_structure["autoencoders.autoencoder_kl_hunyuan_video"] = ["AutoencoderKLHunyuanVideo"]
    _import_structure["autoencoders.autoencoder_kl_ltx"] = ["AutoencoderKLLTXVideo"]
    _import_structure["autoencoders.autoencoder_kl_magvit"] = ["AutoencoderKLMagvit"]
    _import_structure["autoencoders.autoencoder_kl_mochi"] = ["AutoencoderKLMochi"]
    _import_structure["autoencoders.autoencoder_kl_temporal_decoder"] = ["AutoencoderKLTemporalDecoder"]
    _import_structure["autoencoders.autoencoder_kl_wan"] = ["AutoencoderKLWan"]
    _import_structure["autoencoders.autoencoder_oobleck"] = ["AutoencoderOobleck"]
    _import_structure["autoencoders.autoencoder_tiny"] = ["AutoencoderTiny"]
    _import_structure["autoencoders.consistency_decoder_vae"] = ["ConsistencyDecoderVAE"]
    _import_structure["autoencoders.vq_model"] = ["VQModel"]
    _import_structure["cache_utils"] = ["CacheMixin"]
    _import_structure["controlnets.controlnet"] = ["ControlNetModel"]
    _import_structure["controlnets.controlnet_flux"] = ["FluxControlNetModel", "FluxMultiControlNetModel"]
    _import_structure["controlnets.controlnet_hunyuan"] = [
        "HunyuanDiT2DControlNetModel",
        "HunyuanDiT2DMultiControlNetModel",
    ]
    _import_structure["controlnets.controlnet_sana"] = ["SanaControlNetModel"]
    _import_structure["controlnets.controlnet_sd3"] = ["SD3ControlNetModel", "SD3MultiControlNetModel"]
    _import_structure["controlnets.controlnet_sparsectrl"] = ["SparseControlNetModel"]
    _import_structure["controlnets.controlnet_union"] = ["ControlNetUnionModel"]
    _import_structure["controlnets.controlnet_xs"] = ["ControlNetXSAdapter", "UNetControlNetXSModel"]
    _import_structure["controlnets.multicontrolnet"] = ["MultiControlNetModel"]
    _import_structure["controlnets.multicontrolnet_union"] = ["MultiControlNetUnionModel"]
    _import_structure["embeddings"] = ["ImageProjection"]
    _import_structure["modeling_utils"] = ["ModelMixin"]
    _import_structure["transformers.auraflow_transformer_2d"] = ["AuraFlowTransformer2DModel"]
    _import_structure["transformers.cogvideox_transformer_3d"] = ["CogVideoXTransformer3DModel"]
    _import_structure["transformers.consisid_transformer_3d"] = ["ConsisIDTransformer3DModel"]
    _import_structure["transformers.dit_transformer_2d"] = ["DiTTransformer2DModel"]
    _import_structure["transformers.dual_transformer_2d"] = ["DualTransformer2DModel"]
    _import_structure["transformers.hunyuan_transformer_2d"] = ["HunyuanDiT2DModel"]
    _import_structure["transformers.latte_transformer_3d"] = ["LatteTransformer3DModel"]
    _import_structure["transformers.lumina_nextdit2d"] = ["LuminaNextDiT2DModel"]
    _import_structure["transformers.pixart_transformer_2d"] = ["PixArtTransformer2DModel"]
    _import_structure["transformers.prior_transformer"] = ["PriorTransformer"]
    _import_structure["transformers.sana_transformer"] = ["SanaTransformer2DModel"]
    _import_structure["transformers.stable_audio_transformer"] = ["StableAudioDiTModel"]
    _import_structure["transformers.t5_film_transformer"] = ["T5FilmDecoder"]
    _import_structure["transformers.transformer_2d"] = ["Transformer2DModel"]
    _import_structure["transformers.transformer_allegro"] = ["AllegroTransformer3DModel"]
    _import_structure["transformers.transformer_chroma"] = ["ChromaTransformer2DModel"]
    _import_structure["transformers.transformer_cogview3plus"] = ["CogView3PlusTransformer2DModel"]
    _import_structure["transformers.transformer_cogview4"] = ["CogView4Transformer2DModel"]
    _import_structure["transformers.transformer_cosmos"] = ["CosmosTransformer3DModel"]
    _import_structure["transformers.transformer_easyanimate"] = ["EasyAnimateTransformer3DModel"]
    _import_structure["transformers.transformer_flux"] = ["FluxTransformer2DModel"]
    _import_structure["transformers.transformer_hidream_image"] = ["HiDreamImageTransformer2DModel"]
    _import_structure["transformers.transformer_hunyuan_video"] = ["HunyuanVideoTransformer3DModel"]
    _import_structure["transformers.transformer_hunyuan_video_framepack"] = ["HunyuanVideoFramepackTransformer3DModel"]
    _import_structure["transformers.transformer_ltx"] = ["LTXVideoTransformer3DModel"]
    _import_structure["transformers.transformer_lumina2"] = ["Lumina2Transformer2DModel"]
    _import_structure["transformers.transformer_mochi"] = ["MochiTransformer3DModel"]
    _import_structure["transformers.transformer_omnigen"] = ["OmniGenTransformer2DModel"]
    _import_structure["transformers.transformer_sd3"] = ["SD3Transformer2DModel"]
    _import_structure["transformers.transformer_skyreels_v2"] = ["SkyReelsV2Transformer3DModel"]
    _import_structure["transformers.transformer_temporal"] = ["TransformerTemporalModel"]
    _import_structure["transformers.transformer_wan"] = ["WanTransformer3DModel"]
    _import_structure["transformers.transformer_wan_vace"] = ["WanVACETransformer3DModel"]
    _import_structure["unets.unet_1d"] = ["UNet1DModel"]
    _import_structure["unets.unet_2d"] = ["UNet2DModel"]
    _import_structure["unets.unet_2d_condition"] = ["UNet2DConditionModel"]
    _import_structure["unets.unet_3d_condition"] = ["UNet3DConditionModel"]
    _import_structure["unets.unet_i2vgen_xl"] = ["I2VGenXLUNet"]
    _import_structure["unets.unet_kandinsky3"] = ["Kandinsky3UNet"]
    _import_structure["unets.unet_motion_model"] = ["MotionAdapter", "UNetMotionModel"]
    _import_structure["unets.unet_spatio_temporal_condition"] = ["UNetSpatioTemporalConditionModel"]
    _import_structure["unets.unet_stable_cascade"] = ["StableCascadeUNet"]
    _import_structure["unets.uvit_2d"] = ["UVit2DModel"]

# Flax-backed models, registered only when Flax is available. The eager-import
# branch below imports the same three names under the same guard.
if is_flax_available():
    _import_structure["controlnets.controlnet_flax"] = ["FlaxControlNetModel"]
    _import_structure["unets.unet_2d_condition_flax"] = ["FlaxUNet2DConditionModel"]
    _import_structure["vae_flax"] = ["FlaxAutoencoderKL"]


# Eager path: taken under static type checking or when DIFFUSERS_SLOW_IMPORT is
# truthy. It imports every registered name directly, so the names listed here
# need to stay in sync with the `_import_structure` entries above.
if TYPE_CHECKING or DIFFUSERS_SLOW_IMPORT:
    if is_torch_available():
        from .adapter import MultiAdapter, T2IAdapter
        from .attention_dispatch import AttentionBackendName, attention_backend
        from .auto_model import AutoModel
        from .autoencoders import (
            AsymmetricAutoencoderKL,
            AutoencoderDC,
            AutoencoderKL,
            AutoencoderKLAllegro,
            AutoencoderKLCogVideoX,
            AutoencoderKLCosmos,
            AutoencoderKLHunyuanVideo,
            AutoencoderKLLTXVideo,
            AutoencoderKLMagvit,
            AutoencoderKLMochi,
            AutoencoderKLTemporalDecoder,
            AutoencoderKLWan,
            AutoencoderOobleck,
            AutoencoderTiny,
            ConsistencyDecoderVAE,
            VQModel,
        )
        from .cache_utils import CacheMixin
        from .controlnets import (
            ControlNetModel,
            ControlNetUnionModel,
            ControlNetXSAdapter,
            FluxControlNetModel,
            FluxMultiControlNetModel,
            HunyuanDiT2DControlNetModel,
            HunyuanDiT2DMultiControlNetModel,
            MultiControlNetModel,
            MultiControlNetUnionModel,
            SanaControlNetModel,
            SD3ControlNetModel,
            SD3MultiControlNetModel,
            SparseControlNetModel,
            UNetControlNetXSModel,
        )
        from .embeddings import ImageProjection
        from .modeling_utils import ModelMixin
        from .transformers import (
            AllegroTransformer3DModel,
            AuraFlowTransformer2DModel,
            ChromaTransformer2DModel,
            CogVideoXTransformer3DModel,
            CogView3PlusTransformer2DModel,
            CogView4Transformer2DModel,
            ConsisIDTransformer3DModel,
            CosmosTransformer3DModel,
            DiTTransformer2DModel,
            DualTransformer2DModel,
            EasyAnimateTransformer3DModel,
            FluxTransformer2DModel,
            HiDreamImageTransformer2DModel,
            HunyuanDiT2DModel,
            HunyuanVideoFramepackTransformer3DModel,
            HunyuanVideoTransformer3DModel,
            LatteTransformer3DModel,
            LTXVideoTransformer3DModel,
            Lumina2Transformer2DModel,
            LuminaNextDiT2DModel,
            MochiTransformer3DModel,
            OmniGenTransformer2DModel,
            PixArtTransformer2DModel,
            PriorTransformer,
            SanaTransformer2DModel,
            SD3Transformer2DModel,
            SkyReelsV2Transformer3DModel,
            StableAudioDiTModel,
            T5FilmDecoder,
            Transformer2DModel,
            TransformerTemporalModel,
            WanTransformer3DModel,
            WanVACETransformer3DModel,
        )
        from .unets import (
            I2VGenXLUNet,
            Kandinsky3UNet,
            MotionAdapter,
            StableCascadeUNet,
            UNet1DModel,
            UNet2DConditionModel,
            UNet2DModel,
            UNet3DConditionModel,
            UNetMotionModel,
            UNetSpatioTemporalConditionModel,
            UVit2DModel,
        )

    if is_flax_available():
        from .controlnets import FlaxControlNetModel
        from .unets import FlaxUNet2DConditionModel
        from .vae_flax import FlaxAutoencoderKL

else:
    import sys

    # Lazy path: replace this module's entry in `sys.modules` with a
    # `_LazyModule` built from `_import_structure`.
    # NOTE(review): presumably `_LazyModule` defers importing each submodule
    # until one of its names is first accessed; confirm against `..utils`.
    sys.modules[__name__] = _LazyModule(__name__, globals()["__file__"], _import_structure, module_spec=__spec__)