| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
|
|
| from typing import TYPE_CHECKING |
|
|
| from ..utils import ( |
| DIFFUSERS_SLOW_IMPORT, |
| _LazyModule, |
| is_flax_available, |
| is_torch_available, |
| ) |
|
|
|
|
| _import_structure = {} |
|
|
| if is_torch_available(): |
| _import_structure["_modeling_parallel"] = ["ContextParallelConfig", "ParallelConfig"] |
| _import_structure["adapter"] = ["MultiAdapter", "T2IAdapter"] |
| _import_structure["attention_dispatch"] = ["AttentionBackendName", "attention_backend"] |
| _import_structure["auto_model"] = ["AutoModel"] |
| _import_structure["autoencoders.autoencoder_asym_kl"] = ["AsymmetricAutoencoderKL"] |
| _import_structure["autoencoders.autoencoder_dc"] = ["AutoencoderDC"] |
| _import_structure["autoencoders.autoencoder_kl"] = ["AutoencoderKL"] |
| _import_structure["autoencoders.autoencoder_kl_allegro"] = ["AutoencoderKLAllegro"] |
| _import_structure["autoencoders.autoencoder_kl_cogvideox"] = ["AutoencoderKLCogVideoX"] |
| _import_structure["autoencoders.autoencoder_kl_cosmos"] = ["AutoencoderKLCosmos"] |
| _import_structure["autoencoders.autoencoder_kl_flux2"] = ["AutoencoderKLFlux2"] |
| _import_structure["autoencoders.autoencoder_kl_hunyuan_video"] = ["AutoencoderKLHunyuanVideo"] |
| _import_structure["autoencoders.autoencoder_kl_hunyuanimage"] = ["AutoencoderKLHunyuanImage"] |
| _import_structure["autoencoders.autoencoder_kl_hunyuanimage_refiner"] = ["AutoencoderKLHunyuanImageRefiner"] |
| _import_structure["autoencoders.autoencoder_kl_hunyuanvideo15"] = ["AutoencoderKLHunyuanVideo15"] |
| _import_structure["autoencoders.autoencoder_kl_ltx"] = ["AutoencoderKLLTXVideo"] |
| _import_structure["autoencoders.autoencoder_kl_ltx2"] = ["AutoencoderKLLTX2Video"] |
| _import_structure["autoencoders.autoencoder_kl_ltx2_audio"] = ["AutoencoderKLLTX2Audio"] |
| _import_structure["autoencoders.autoencoder_kl_magvit"] = ["AutoencoderKLMagvit"] |
| _import_structure["autoencoders.autoencoder_kl_mochi"] = ["AutoencoderKLMochi"] |
| _import_structure["autoencoders.autoencoder_kl_qwenimage"] = ["AutoencoderKLQwenImage"] |
| _import_structure["autoencoders.autoencoder_kl_temporal_decoder"] = ["AutoencoderKLTemporalDecoder"] |
| _import_structure["autoencoders.autoencoder_kl_wan"] = ["AutoencoderKLWan"] |
| _import_structure["autoencoders.autoencoder_oobleck"] = ["AutoencoderOobleck"] |
| _import_structure["autoencoders.autoencoder_rae"] = ["AutoencoderRAE"] |
| _import_structure["autoencoders.autoencoder_tiny"] = ["AutoencoderTiny"] |
| _import_structure["autoencoders.consistency_decoder_vae"] = ["ConsistencyDecoderVAE"] |
| _import_structure["autoencoders.vq_model"] = ["VQModel"] |
| _import_structure["cache_utils"] = ["CacheMixin"] |
| _import_structure["controlnets.controlnet"] = ["ControlNetModel"] |
| _import_structure["controlnets.controlnet_cosmos"] = ["CosmosControlNetModel"] |
| _import_structure["controlnets.controlnet_flux"] = ["FluxControlNetModel", "FluxMultiControlNetModel"] |
| _import_structure["controlnets.controlnet_hunyuan"] = [ |
| "HunyuanDiT2DControlNetModel", |
| "HunyuanDiT2DMultiControlNetModel", |
| ] |
| _import_structure["controlnets.controlnet_qwenimage"] = [ |
| "QwenImageControlNetModel", |
| "QwenImageMultiControlNetModel", |
| ] |
| _import_structure["controlnets.controlnet_sana"] = ["SanaControlNetModel"] |
| _import_structure["controlnets.controlnet_sd3"] = ["SD3ControlNetModel", "SD3MultiControlNetModel"] |
| _import_structure["controlnets.controlnet_sparsectrl"] = ["SparseControlNetModel"] |
| _import_structure["controlnets.controlnet_union"] = ["ControlNetUnionModel"] |
| _import_structure["controlnets.controlnet_xs"] = ["ControlNetXSAdapter", "UNetControlNetXSModel"] |
| _import_structure["controlnets.controlnet_z_image"] = ["ZImageControlNetModel"] |
| _import_structure["controlnets.multicontrolnet"] = ["MultiControlNetModel"] |
| _import_structure["controlnets.multicontrolnet_union"] = ["MultiControlNetUnionModel"] |
| _import_structure["embeddings"] = ["ImageProjection"] |
| _import_structure["modeling_utils"] = ["ModelMixin"] |
| _import_structure["transformers.auraflow_transformer_2d"] = ["AuraFlowTransformer2DModel"] |
| _import_structure["transformers.cogvideox_transformer_3d"] = ["CogVideoXTransformer3DModel"] |
| _import_structure["transformers.consisid_transformer_3d"] = ["ConsisIDTransformer3DModel"] |
| _import_structure["transformers.dit_transformer_2d"] = ["DiTTransformer2DModel"] |
| _import_structure["transformers.dual_transformer_2d"] = ["DualTransformer2DModel"] |
| _import_structure["transformers.hunyuan_transformer_2d"] = ["HunyuanDiT2DModel"] |
| _import_structure["transformers.latte_transformer_3d"] = ["LatteTransformer3DModel"] |
| _import_structure["transformers.lumina_nextdit2d"] = ["LuminaNextDiT2DModel"] |
| _import_structure["transformers.pixart_transformer_2d"] = ["PixArtTransformer2DModel"] |
| _import_structure["transformers.prior_transformer"] = ["PriorTransformer"] |
| _import_structure["transformers.sana_transformer"] = ["SanaTransformer2DModel"] |
| _import_structure["transformers.stable_audio_transformer"] = ["StableAudioDiTModel"] |
| _import_structure["transformers.t5_film_transformer"] = ["T5FilmDecoder"] |
| _import_structure["transformers.transformer_2d"] = ["Transformer2DModel"] |
| _import_structure["transformers.transformer_allegro"] = ["AllegroTransformer3DModel"] |
| _import_structure["transformers.transformer_bria"] = ["BriaTransformer2DModel"] |
| _import_structure["transformers.transformer_bria_fibo"] = ["BriaFiboTransformer2DModel"] |
| _import_structure["transformers.transformer_chroma"] = ["ChromaTransformer2DModel"] |
| _import_structure["transformers.transformer_chronoedit"] = ["ChronoEditTransformer3DModel"] |
| _import_structure["transformers.transformer_cogview3plus"] = ["CogView3PlusTransformer2DModel"] |
| _import_structure["transformers.transformer_cogview4"] = ["CogView4Transformer2DModel"] |
| _import_structure["transformers.transformer_cosmos"] = ["CosmosTransformer3DModel"] |
| _import_structure["transformers.transformer_easyanimate"] = ["EasyAnimateTransformer3DModel"] |
| _import_structure["transformers.transformer_flux"] = ["FluxTransformer2DModel"] |
| _import_structure["transformers.transformer_flux2"] = ["Flux2Transformer2DModel"] |
| _import_structure["transformers.transformer_glm_image"] = ["GlmImageTransformer2DModel"] |
| _import_structure["transformers.transformer_helios"] = ["HeliosTransformer3DModel"] |
| _import_structure["transformers.transformer_hidream_image"] = ["HiDreamImageTransformer2DModel"] |
| _import_structure["transformers.transformer_hunyuan_video"] = ["HunyuanVideoTransformer3DModel"] |
| _import_structure["transformers.transformer_hunyuan_video15"] = ["HunyuanVideo15Transformer3DModel"] |
| _import_structure["transformers.transformer_hunyuan_video_framepack"] = ["HunyuanVideoFramepackTransformer3DModel"] |
| _import_structure["transformers.transformer_hunyuanimage"] = ["HunyuanImageTransformer2DModel"] |
| _import_structure["transformers.transformer_kandinsky"] = ["Kandinsky5Transformer3DModel"] |
| _import_structure["transformers.transformer_longcat_image"] = ["LongCatImageTransformer2DModel"] |
| _import_structure["transformers.transformer_ltx"] = ["LTXVideoTransformer3DModel"] |
| _import_structure["transformers.transformer_ltx2"] = ["LTX2VideoTransformer3DModel"] |
| _import_structure["transformers.transformer_lumina2"] = ["Lumina2Transformer2DModel"] |
| _import_structure["transformers.transformer_mochi"] = ["MochiTransformer3DModel"] |
| _import_structure["transformers.transformer_omnigen"] = ["OmniGenTransformer2DModel"] |
| _import_structure["transformers.transformer_ovis_image"] = ["OvisImageTransformer2DModel"] |
| _import_structure["transformers.transformer_prx"] = ["PRXTransformer2DModel"] |
| _import_structure["transformers.transformer_qwenimage"] = ["QwenImageTransformer2DModel"] |
| _import_structure["transformers.transformer_sana_video"] = ["SanaVideoTransformer3DModel"] |
| _import_structure["transformers.transformer_sd3"] = ["SD3Transformer2DModel"] |
| _import_structure["transformers.transformer_skyreels_v2"] = ["SkyReelsV2Transformer3DModel"] |
| _import_structure["transformers.transformer_temporal"] = ["TransformerTemporalModel"] |
| _import_structure["transformers.transformer_wan"] = ["WanTransformer3DModel"] |
| _import_structure["transformers.transformer_wan_animate"] = ["WanAnimateTransformer3DModel"] |
| _import_structure["transformers.transformer_wan_vace"] = ["WanVACETransformer3DModel"] |
| _import_structure["transformers.transformer_z_image"] = ["ZImageTransformer2DModel"] |
| _import_structure["unets.unet_1d"] = ["UNet1DModel"] |
| _import_structure["unets.unet_2d"] = ["UNet2DModel"] |
| _import_structure["unets.unet_2d_condition"] = ["UNet2DConditionModel"] |
| _import_structure["unets.unet_3d_condition"] = ["UNet3DConditionModel"] |
| _import_structure["unets.unet_i2vgen_xl"] = ["I2VGenXLUNet"] |
| _import_structure["unets.unet_kandinsky3"] = ["Kandinsky3UNet"] |
| _import_structure["unets.unet_motion_model"] = ["MotionAdapter", "UNetMotionModel"] |
| _import_structure["unets.unet_spatio_temporal_condition"] = ["UNetSpatioTemporalConditionModel"] |
| _import_structure["unets.unet_stable_cascade"] = ["StableCascadeUNet"] |
| _import_structure["unets.uvit_2d"] = ["UVit2DModel"] |
|
|
| if is_flax_available(): |
| _import_structure["controlnets.controlnet_flax"] = ["FlaxControlNetModel"] |
| _import_structure["unets.unet_2d_condition_flax"] = ["FlaxUNet2DConditionModel"] |
| _import_structure["vae_flax"] = ["FlaxAutoencoderKL"] |
|
|
|
|
| if TYPE_CHECKING or DIFFUSERS_SLOW_IMPORT: |
| if is_torch_available(): |
| from ._modeling_parallel import ContextParallelConfig, ParallelConfig |
| from .adapter import MultiAdapter, T2IAdapter |
| from .attention_dispatch import AttentionBackendName, attention_backend |
| from .auto_model import AutoModel |
| from .autoencoders import ( |
| AsymmetricAutoencoderKL, |
| AutoencoderDC, |
| AutoencoderKL, |
| AutoencoderKLAllegro, |
| AutoencoderKLCogVideoX, |
| AutoencoderKLCosmos, |
| AutoencoderKLFlux2, |
| AutoencoderKLHunyuanImage, |
| AutoencoderKLHunyuanImageRefiner, |
| AutoencoderKLHunyuanVideo, |
| AutoencoderKLHunyuanVideo15, |
| AutoencoderKLLTX2Audio, |
| AutoencoderKLLTX2Video, |
| AutoencoderKLLTXVideo, |
| AutoencoderKLMagvit, |
| AutoencoderKLMochi, |
| AutoencoderKLQwenImage, |
| AutoencoderKLTemporalDecoder, |
| AutoencoderKLWan, |
| AutoencoderOobleck, |
| AutoencoderRAE, |
| AutoencoderTiny, |
| ConsistencyDecoderVAE, |
| VQModel, |
| ) |
| from .cache_utils import CacheMixin |
| from .controlnets import ( |
| ControlNetModel, |
| ControlNetUnionModel, |
| ControlNetXSAdapter, |
| CosmosControlNetModel, |
| FluxControlNetModel, |
| FluxMultiControlNetModel, |
| HunyuanDiT2DControlNetModel, |
| HunyuanDiT2DMultiControlNetModel, |
| MultiControlNetModel, |
| MultiControlNetUnionModel, |
| QwenImageControlNetModel, |
| QwenImageMultiControlNetModel, |
| SanaControlNetModel, |
| SD3ControlNetModel, |
| SD3MultiControlNetModel, |
| SparseControlNetModel, |
| UNetControlNetXSModel, |
| ZImageControlNetModel, |
| ) |
| from .embeddings import ImageProjection |
| from .modeling_utils import ModelMixin |
| from .transformers import ( |
| AllegroTransformer3DModel, |
| AuraFlowTransformer2DModel, |
| BriaFiboTransformer2DModel, |
| BriaTransformer2DModel, |
| ChromaTransformer2DModel, |
| ChronoEditTransformer3DModel, |
| CogVideoXTransformer3DModel, |
| CogView3PlusTransformer2DModel, |
| CogView4Transformer2DModel, |
| ConsisIDTransformer3DModel, |
| CosmosTransformer3DModel, |
| DiTTransformer2DModel, |
| DualTransformer2DModel, |
| EasyAnimateTransformer3DModel, |
| Flux2Transformer2DModel, |
| FluxTransformer2DModel, |
| GlmImageTransformer2DModel, |
| HeliosTransformer3DModel, |
| HiDreamImageTransformer2DModel, |
| HunyuanDiT2DModel, |
| HunyuanImageTransformer2DModel, |
| HunyuanVideo15Transformer3DModel, |
| HunyuanVideoFramepackTransformer3DModel, |
| HunyuanVideoTransformer3DModel, |
| Kandinsky5Transformer3DModel, |
| LatteTransformer3DModel, |
| LongCatImageTransformer2DModel, |
| LTX2VideoTransformer3DModel, |
| LTXVideoTransformer3DModel, |
| Lumina2Transformer2DModel, |
| LuminaNextDiT2DModel, |
| MochiTransformer3DModel, |
| OmniGenTransformer2DModel, |
| OvisImageTransformer2DModel, |
| PixArtTransformer2DModel, |
| PriorTransformer, |
| PRXTransformer2DModel, |
| QwenImageTransformer2DModel, |
| SanaTransformer2DModel, |
| SanaVideoTransformer3DModel, |
| SD3Transformer2DModel, |
| SkyReelsV2Transformer3DModel, |
| StableAudioDiTModel, |
| T5FilmDecoder, |
| Transformer2DModel, |
| TransformerTemporalModel, |
| WanAnimateTransformer3DModel, |
| WanTransformer3DModel, |
| WanVACETransformer3DModel, |
| ZImageTransformer2DModel, |
| ) |
| from .unets import ( |
| I2VGenXLUNet, |
| Kandinsky3UNet, |
| MotionAdapter, |
| StableCascadeUNet, |
| UNet1DModel, |
| UNet2DConditionModel, |
| UNet2DModel, |
| UNet3DConditionModel, |
| UNetMotionModel, |
| UNetSpatioTemporalConditionModel, |
| UVit2DModel, |
| ) |
|
|
| if is_flax_available(): |
| from .controlnets import FlaxControlNetModel |
| from .unets import FlaxUNet2DConditionModel |
| from .vae_flax import FlaxAutoencoderKL |
|
|
| else: |
| import sys |
|
|
| sys.modules[__name__] = _LazyModule(__name__, globals()["__file__"], _import_structure, module_spec=__spec__) |
|
|