diffusers 0.27.0__py3-none-any.whl → 0.32.2__py3-none-any.whl

Sign up to get free protection for your applications and to get access to all the features.
Files changed (445) hide show
  1. diffusers/__init__.py +233 -6
  2. diffusers/callbacks.py +209 -0
  3. diffusers/commands/env.py +102 -6
  4. diffusers/configuration_utils.py +45 -16
  5. diffusers/dependency_versions_table.py +4 -3
  6. diffusers/image_processor.py +434 -110
  7. diffusers/loaders/__init__.py +42 -9
  8. diffusers/loaders/ip_adapter.py +626 -36
  9. diffusers/loaders/lora_base.py +900 -0
  10. diffusers/loaders/lora_conversion_utils.py +991 -125
  11. diffusers/loaders/lora_pipeline.py +3812 -0
  12. diffusers/loaders/peft.py +571 -7
  13. diffusers/loaders/single_file.py +405 -173
  14. diffusers/loaders/single_file_model.py +385 -0
  15. diffusers/loaders/single_file_utils.py +1783 -713
  16. diffusers/loaders/textual_inversion.py +41 -23
  17. diffusers/loaders/transformer_flux.py +181 -0
  18. diffusers/loaders/transformer_sd3.py +89 -0
  19. diffusers/loaders/unet.py +464 -540
  20. diffusers/loaders/unet_loader_utils.py +163 -0
  21. diffusers/models/__init__.py +76 -7
  22. diffusers/models/activations.py +65 -10
  23. diffusers/models/adapter.py +53 -53
  24. diffusers/models/attention.py +605 -18
  25. diffusers/models/attention_flax.py +1 -1
  26. diffusers/models/attention_processor.py +4304 -687
  27. diffusers/models/autoencoders/__init__.py +8 -0
  28. diffusers/models/autoencoders/autoencoder_asym_kl.py +15 -17
  29. diffusers/models/autoencoders/autoencoder_dc.py +620 -0
  30. diffusers/models/autoencoders/autoencoder_kl.py +110 -28
  31. diffusers/models/autoencoders/autoencoder_kl_allegro.py +1149 -0
  32. diffusers/models/autoencoders/autoencoder_kl_cogvideox.py +1482 -0
  33. diffusers/models/autoencoders/autoencoder_kl_hunyuan_video.py +1176 -0
  34. diffusers/models/autoencoders/autoencoder_kl_ltx.py +1338 -0
  35. diffusers/models/autoencoders/autoencoder_kl_mochi.py +1166 -0
  36. diffusers/models/autoencoders/autoencoder_kl_temporal_decoder.py +19 -24
  37. diffusers/models/autoencoders/autoencoder_oobleck.py +464 -0
  38. diffusers/models/autoencoders/autoencoder_tiny.py +21 -18
  39. diffusers/models/autoencoders/consistency_decoder_vae.py +45 -20
  40. diffusers/models/autoencoders/vae.py +41 -29
  41. diffusers/models/autoencoders/vq_model.py +182 -0
  42. diffusers/models/controlnet.py +47 -800
  43. diffusers/models/controlnet_flux.py +70 -0
  44. diffusers/models/controlnet_sd3.py +68 -0
  45. diffusers/models/controlnet_sparsectrl.py +116 -0
  46. diffusers/models/controlnets/__init__.py +23 -0
  47. diffusers/models/controlnets/controlnet.py +872 -0
  48. diffusers/models/{controlnet_flax.py → controlnets/controlnet_flax.py} +9 -9
  49. diffusers/models/controlnets/controlnet_flux.py +536 -0
  50. diffusers/models/controlnets/controlnet_hunyuan.py +401 -0
  51. diffusers/models/controlnets/controlnet_sd3.py +489 -0
  52. diffusers/models/controlnets/controlnet_sparsectrl.py +788 -0
  53. diffusers/models/controlnets/controlnet_union.py +832 -0
  54. diffusers/models/controlnets/controlnet_xs.py +1946 -0
  55. diffusers/models/controlnets/multicontrolnet.py +183 -0
  56. diffusers/models/downsampling.py +85 -18
  57. diffusers/models/embeddings.py +1856 -158
  58. diffusers/models/embeddings_flax.py +23 -9
  59. diffusers/models/model_loading_utils.py +480 -0
  60. diffusers/models/modeling_flax_pytorch_utils.py +2 -1
  61. diffusers/models/modeling_flax_utils.py +2 -7
  62. diffusers/models/modeling_outputs.py +14 -0
  63. diffusers/models/modeling_pytorch_flax_utils.py +1 -1
  64. diffusers/models/modeling_utils.py +611 -146
  65. diffusers/models/normalization.py +361 -20
  66. diffusers/models/resnet.py +18 -23
  67. diffusers/models/transformers/__init__.py +16 -0
  68. diffusers/models/transformers/auraflow_transformer_2d.py +544 -0
  69. diffusers/models/transformers/cogvideox_transformer_3d.py +542 -0
  70. diffusers/models/transformers/dit_transformer_2d.py +240 -0
  71. diffusers/models/transformers/dual_transformer_2d.py +9 -8
  72. diffusers/models/transformers/hunyuan_transformer_2d.py +578 -0
  73. diffusers/models/transformers/latte_transformer_3d.py +327 -0
  74. diffusers/models/transformers/lumina_nextdit2d.py +340 -0
  75. diffusers/models/transformers/pixart_transformer_2d.py +445 -0
  76. diffusers/models/transformers/prior_transformer.py +13 -13
  77. diffusers/models/transformers/sana_transformer.py +488 -0
  78. diffusers/models/transformers/stable_audio_transformer.py +458 -0
  79. diffusers/models/transformers/t5_film_transformer.py +17 -19
  80. diffusers/models/transformers/transformer_2d.py +297 -187
  81. diffusers/models/transformers/transformer_allegro.py +422 -0
  82. diffusers/models/transformers/transformer_cogview3plus.py +386 -0
  83. diffusers/models/transformers/transformer_flux.py +593 -0
  84. diffusers/models/transformers/transformer_hunyuan_video.py +791 -0
  85. diffusers/models/transformers/transformer_ltx.py +469 -0
  86. diffusers/models/transformers/transformer_mochi.py +499 -0
  87. diffusers/models/transformers/transformer_sd3.py +461 -0
  88. diffusers/models/transformers/transformer_temporal.py +21 -19
  89. diffusers/models/unets/unet_1d.py +8 -8
  90. diffusers/models/unets/unet_1d_blocks.py +31 -31
  91. diffusers/models/unets/unet_2d.py +17 -10
  92. diffusers/models/unets/unet_2d_blocks.py +225 -149
  93. diffusers/models/unets/unet_2d_condition.py +50 -53
  94. diffusers/models/unets/unet_2d_condition_flax.py +6 -5
  95. diffusers/models/unets/unet_3d_blocks.py +192 -1057
  96. diffusers/models/unets/unet_3d_condition.py +22 -27
  97. diffusers/models/unets/unet_i2vgen_xl.py +22 -18
  98. diffusers/models/unets/unet_kandinsky3.py +2 -2
  99. diffusers/models/unets/unet_motion_model.py +1413 -89
  100. diffusers/models/unets/unet_spatio_temporal_condition.py +40 -16
  101. diffusers/models/unets/unet_stable_cascade.py +19 -18
  102. diffusers/models/unets/uvit_2d.py +2 -2
  103. diffusers/models/upsampling.py +95 -26
  104. diffusers/models/vq_model.py +12 -164
  105. diffusers/optimization.py +1 -1
  106. diffusers/pipelines/__init__.py +202 -3
  107. diffusers/pipelines/allegro/__init__.py +48 -0
  108. diffusers/pipelines/allegro/pipeline_allegro.py +938 -0
  109. diffusers/pipelines/allegro/pipeline_output.py +23 -0
  110. diffusers/pipelines/amused/pipeline_amused.py +12 -12
  111. diffusers/pipelines/amused/pipeline_amused_img2img.py +14 -12
  112. diffusers/pipelines/amused/pipeline_amused_inpaint.py +13 -11
  113. diffusers/pipelines/animatediff/__init__.py +8 -0
  114. diffusers/pipelines/animatediff/pipeline_animatediff.py +122 -109
  115. diffusers/pipelines/animatediff/pipeline_animatediff_controlnet.py +1106 -0
  116. diffusers/pipelines/animatediff/pipeline_animatediff_sdxl.py +1288 -0
  117. diffusers/pipelines/animatediff/pipeline_animatediff_sparsectrl.py +1010 -0
  118. diffusers/pipelines/animatediff/pipeline_animatediff_video2video.py +236 -180
  119. diffusers/pipelines/animatediff/pipeline_animatediff_video2video_controlnet.py +1341 -0
  120. diffusers/pipelines/animatediff/pipeline_output.py +3 -2
  121. diffusers/pipelines/audioldm/pipeline_audioldm.py +14 -14
  122. diffusers/pipelines/audioldm2/modeling_audioldm2.py +58 -39
  123. diffusers/pipelines/audioldm2/pipeline_audioldm2.py +121 -36
  124. diffusers/pipelines/aura_flow/__init__.py +48 -0
  125. diffusers/pipelines/aura_flow/pipeline_aura_flow.py +584 -0
  126. diffusers/pipelines/auto_pipeline.py +196 -28
  127. diffusers/pipelines/blip_diffusion/blip_image_processing.py +1 -1
  128. diffusers/pipelines/blip_diffusion/modeling_blip2.py +6 -6
  129. diffusers/pipelines/blip_diffusion/modeling_ctx_clip.py +1 -1
  130. diffusers/pipelines/blip_diffusion/pipeline_blip_diffusion.py +2 -2
  131. diffusers/pipelines/cogvideo/__init__.py +54 -0
  132. diffusers/pipelines/cogvideo/pipeline_cogvideox.py +772 -0
  133. diffusers/pipelines/cogvideo/pipeline_cogvideox_fun_control.py +825 -0
  134. diffusers/pipelines/cogvideo/pipeline_cogvideox_image2video.py +885 -0
  135. diffusers/pipelines/cogvideo/pipeline_cogvideox_video2video.py +851 -0
  136. diffusers/pipelines/cogvideo/pipeline_output.py +20 -0
  137. diffusers/pipelines/cogview3/__init__.py +47 -0
  138. diffusers/pipelines/cogview3/pipeline_cogview3plus.py +674 -0
  139. diffusers/pipelines/cogview3/pipeline_output.py +21 -0
  140. diffusers/pipelines/consistency_models/pipeline_consistency_models.py +6 -6
  141. diffusers/pipelines/controlnet/__init__.py +86 -80
  142. diffusers/pipelines/controlnet/multicontrolnet.py +7 -182
  143. diffusers/pipelines/controlnet/pipeline_controlnet.py +134 -87
  144. diffusers/pipelines/controlnet/pipeline_controlnet_blip_diffusion.py +2 -2
  145. diffusers/pipelines/controlnet/pipeline_controlnet_img2img.py +93 -77
  146. diffusers/pipelines/controlnet/pipeline_controlnet_inpaint.py +88 -197
  147. diffusers/pipelines/controlnet/pipeline_controlnet_inpaint_sd_xl.py +136 -90
  148. diffusers/pipelines/controlnet/pipeline_controlnet_sd_xl.py +176 -80
  149. diffusers/pipelines/controlnet/pipeline_controlnet_sd_xl_img2img.py +125 -89
  150. diffusers/pipelines/controlnet/pipeline_controlnet_union_inpaint_sd_xl.py +1790 -0
  151. diffusers/pipelines/controlnet/pipeline_controlnet_union_sd_xl.py +1501 -0
  152. diffusers/pipelines/controlnet/pipeline_controlnet_union_sd_xl_img2img.py +1627 -0
  153. diffusers/pipelines/controlnet/pipeline_flax_controlnet.py +2 -2
  154. diffusers/pipelines/controlnet_hunyuandit/__init__.py +48 -0
  155. diffusers/pipelines/controlnet_hunyuandit/pipeline_hunyuandit_controlnet.py +1060 -0
  156. diffusers/pipelines/controlnet_sd3/__init__.py +57 -0
  157. diffusers/pipelines/controlnet_sd3/pipeline_stable_diffusion_3_controlnet.py +1133 -0
  158. diffusers/pipelines/controlnet_sd3/pipeline_stable_diffusion_3_controlnet_inpainting.py +1153 -0
  159. diffusers/pipelines/controlnet_xs/__init__.py +68 -0
  160. diffusers/pipelines/controlnet_xs/pipeline_controlnet_xs.py +916 -0
  161. diffusers/pipelines/controlnet_xs/pipeline_controlnet_xs_sd_xl.py +1111 -0
  162. diffusers/pipelines/ddpm/pipeline_ddpm.py +2 -2
  163. diffusers/pipelines/deepfloyd_if/pipeline_if.py +16 -30
  164. diffusers/pipelines/deepfloyd_if/pipeline_if_img2img.py +20 -35
  165. diffusers/pipelines/deepfloyd_if/pipeline_if_img2img_superresolution.py +23 -41
  166. diffusers/pipelines/deepfloyd_if/pipeline_if_inpainting.py +22 -38
  167. diffusers/pipelines/deepfloyd_if/pipeline_if_inpainting_superresolution.py +25 -41
  168. diffusers/pipelines/deepfloyd_if/pipeline_if_superresolution.py +19 -34
  169. diffusers/pipelines/deepfloyd_if/pipeline_output.py +6 -5
  170. diffusers/pipelines/deepfloyd_if/watermark.py +1 -1
  171. diffusers/pipelines/deprecated/alt_diffusion/modeling_roberta_series.py +11 -11
  172. diffusers/pipelines/deprecated/alt_diffusion/pipeline_alt_diffusion.py +70 -30
  173. diffusers/pipelines/deprecated/alt_diffusion/pipeline_alt_diffusion_img2img.py +48 -25
  174. diffusers/pipelines/deprecated/repaint/pipeline_repaint.py +2 -2
  175. diffusers/pipelines/deprecated/spectrogram_diffusion/pipeline_spectrogram_diffusion.py +7 -7
  176. diffusers/pipelines/deprecated/stable_diffusion_variants/pipeline_cycle_diffusion.py +21 -20
  177. diffusers/pipelines/deprecated/stable_diffusion_variants/pipeline_stable_diffusion_inpaint_legacy.py +27 -29
  178. diffusers/pipelines/deprecated/stable_diffusion_variants/pipeline_stable_diffusion_model_editing.py +33 -27
  179. diffusers/pipelines/deprecated/stable_diffusion_variants/pipeline_stable_diffusion_paradigms.py +33 -23
  180. diffusers/pipelines/deprecated/stable_diffusion_variants/pipeline_stable_diffusion_pix2pix_zero.py +36 -30
  181. diffusers/pipelines/deprecated/versatile_diffusion/modeling_text_unet.py +102 -69
  182. diffusers/pipelines/deprecated/versatile_diffusion/pipeline_versatile_diffusion.py +13 -13
  183. diffusers/pipelines/deprecated/versatile_diffusion/pipeline_versatile_diffusion_dual_guided.py +10 -5
  184. diffusers/pipelines/deprecated/versatile_diffusion/pipeline_versatile_diffusion_image_variation.py +11 -6
  185. diffusers/pipelines/deprecated/versatile_diffusion/pipeline_versatile_diffusion_text_to_image.py +10 -5
  186. diffusers/pipelines/deprecated/vq_diffusion/pipeline_vq_diffusion.py +5 -5
  187. diffusers/pipelines/dit/pipeline_dit.py +7 -4
  188. diffusers/pipelines/flux/__init__.py +69 -0
  189. diffusers/pipelines/flux/modeling_flux.py +47 -0
  190. diffusers/pipelines/flux/pipeline_flux.py +957 -0
  191. diffusers/pipelines/flux/pipeline_flux_control.py +889 -0
  192. diffusers/pipelines/flux/pipeline_flux_control_img2img.py +945 -0
  193. diffusers/pipelines/flux/pipeline_flux_control_inpaint.py +1141 -0
  194. diffusers/pipelines/flux/pipeline_flux_controlnet.py +1006 -0
  195. diffusers/pipelines/flux/pipeline_flux_controlnet_image_to_image.py +998 -0
  196. diffusers/pipelines/flux/pipeline_flux_controlnet_inpainting.py +1204 -0
  197. diffusers/pipelines/flux/pipeline_flux_fill.py +969 -0
  198. diffusers/pipelines/flux/pipeline_flux_img2img.py +856 -0
  199. diffusers/pipelines/flux/pipeline_flux_inpaint.py +1022 -0
  200. diffusers/pipelines/flux/pipeline_flux_prior_redux.py +492 -0
  201. diffusers/pipelines/flux/pipeline_output.py +37 -0
  202. diffusers/pipelines/free_init_utils.py +41 -38
  203. diffusers/pipelines/free_noise_utils.py +596 -0
  204. diffusers/pipelines/hunyuan_video/__init__.py +48 -0
  205. diffusers/pipelines/hunyuan_video/pipeline_hunyuan_video.py +687 -0
  206. diffusers/pipelines/hunyuan_video/pipeline_output.py +20 -0
  207. diffusers/pipelines/hunyuandit/__init__.py +48 -0
  208. diffusers/pipelines/hunyuandit/pipeline_hunyuandit.py +916 -0
  209. diffusers/pipelines/i2vgen_xl/pipeline_i2vgen_xl.py +33 -48
  210. diffusers/pipelines/kandinsky/pipeline_kandinsky.py +8 -8
  211. diffusers/pipelines/kandinsky/pipeline_kandinsky_combined.py +32 -29
  212. diffusers/pipelines/kandinsky/pipeline_kandinsky_img2img.py +11 -11
  213. diffusers/pipelines/kandinsky/pipeline_kandinsky_inpaint.py +12 -12
  214. diffusers/pipelines/kandinsky/pipeline_kandinsky_prior.py +10 -10
  215. diffusers/pipelines/kandinsky2_2/pipeline_kandinsky2_2.py +6 -6
  216. diffusers/pipelines/kandinsky2_2/pipeline_kandinsky2_2_combined.py +34 -31
  217. diffusers/pipelines/kandinsky2_2/pipeline_kandinsky2_2_controlnet.py +10 -10
  218. diffusers/pipelines/kandinsky2_2/pipeline_kandinsky2_2_controlnet_img2img.py +10 -10
  219. diffusers/pipelines/kandinsky2_2/pipeline_kandinsky2_2_img2img.py +6 -6
  220. diffusers/pipelines/kandinsky2_2/pipeline_kandinsky2_2_inpainting.py +8 -8
  221. diffusers/pipelines/kandinsky2_2/pipeline_kandinsky2_2_prior.py +7 -7
  222. diffusers/pipelines/kandinsky2_2/pipeline_kandinsky2_2_prior_emb2emb.py +6 -6
  223. diffusers/pipelines/kandinsky3/convert_kandinsky3_unet.py +3 -3
  224. diffusers/pipelines/kandinsky3/pipeline_kandinsky3.py +22 -35
  225. diffusers/pipelines/kandinsky3/pipeline_kandinsky3_img2img.py +26 -37
  226. diffusers/pipelines/kolors/__init__.py +54 -0
  227. diffusers/pipelines/kolors/pipeline_kolors.py +1070 -0
  228. diffusers/pipelines/kolors/pipeline_kolors_img2img.py +1250 -0
  229. diffusers/pipelines/kolors/pipeline_output.py +21 -0
  230. diffusers/pipelines/kolors/text_encoder.py +889 -0
  231. diffusers/pipelines/kolors/tokenizer.py +338 -0
  232. diffusers/pipelines/latent_consistency_models/pipeline_latent_consistency_img2img.py +82 -62
  233. diffusers/pipelines/latent_consistency_models/pipeline_latent_consistency_text2img.py +77 -60
  234. diffusers/pipelines/latent_diffusion/pipeline_latent_diffusion.py +12 -12
  235. diffusers/pipelines/latte/__init__.py +48 -0
  236. diffusers/pipelines/latte/pipeline_latte.py +881 -0
  237. diffusers/pipelines/ledits_pp/pipeline_leditspp_stable_diffusion.py +80 -74
  238. diffusers/pipelines/ledits_pp/pipeline_leditspp_stable_diffusion_xl.py +85 -76
  239. diffusers/pipelines/ledits_pp/pipeline_output.py +2 -2
  240. diffusers/pipelines/ltx/__init__.py +50 -0
  241. diffusers/pipelines/ltx/pipeline_ltx.py +789 -0
  242. diffusers/pipelines/ltx/pipeline_ltx_image2video.py +885 -0
  243. diffusers/pipelines/ltx/pipeline_output.py +20 -0
  244. diffusers/pipelines/lumina/__init__.py +48 -0
  245. diffusers/pipelines/lumina/pipeline_lumina.py +890 -0
  246. diffusers/pipelines/marigold/__init__.py +50 -0
  247. diffusers/pipelines/marigold/marigold_image_processing.py +576 -0
  248. diffusers/pipelines/marigold/pipeline_marigold_depth.py +813 -0
  249. diffusers/pipelines/marigold/pipeline_marigold_normals.py +690 -0
  250. diffusers/pipelines/mochi/__init__.py +48 -0
  251. diffusers/pipelines/mochi/pipeline_mochi.py +748 -0
  252. diffusers/pipelines/mochi/pipeline_output.py +20 -0
  253. diffusers/pipelines/musicldm/pipeline_musicldm.py +14 -14
  254. diffusers/pipelines/pag/__init__.py +80 -0
  255. diffusers/pipelines/pag/pag_utils.py +243 -0
  256. diffusers/pipelines/pag/pipeline_pag_controlnet_sd.py +1328 -0
  257. diffusers/pipelines/pag/pipeline_pag_controlnet_sd_inpaint.py +1543 -0
  258. diffusers/pipelines/pag/pipeline_pag_controlnet_sd_xl.py +1610 -0
  259. diffusers/pipelines/pag/pipeline_pag_controlnet_sd_xl_img2img.py +1683 -0
  260. diffusers/pipelines/pag/pipeline_pag_hunyuandit.py +969 -0
  261. diffusers/pipelines/pag/pipeline_pag_kolors.py +1136 -0
  262. diffusers/pipelines/pag/pipeline_pag_pixart_sigma.py +865 -0
  263. diffusers/pipelines/pag/pipeline_pag_sana.py +886 -0
  264. diffusers/pipelines/pag/pipeline_pag_sd.py +1062 -0
  265. diffusers/pipelines/pag/pipeline_pag_sd_3.py +994 -0
  266. diffusers/pipelines/pag/pipeline_pag_sd_3_img2img.py +1058 -0
  267. diffusers/pipelines/pag/pipeline_pag_sd_animatediff.py +866 -0
  268. diffusers/pipelines/pag/pipeline_pag_sd_img2img.py +1094 -0
  269. diffusers/pipelines/pag/pipeline_pag_sd_inpaint.py +1356 -0
  270. diffusers/pipelines/pag/pipeline_pag_sd_xl.py +1345 -0
  271. diffusers/pipelines/pag/pipeline_pag_sd_xl_img2img.py +1544 -0
  272. diffusers/pipelines/pag/pipeline_pag_sd_xl_inpaint.py +1776 -0
  273. diffusers/pipelines/paint_by_example/pipeline_paint_by_example.py +17 -12
  274. diffusers/pipelines/pia/pipeline_pia.py +74 -164
  275. diffusers/pipelines/pipeline_flax_utils.py +5 -10
  276. diffusers/pipelines/pipeline_loading_utils.py +515 -53
  277. diffusers/pipelines/pipeline_utils.py +411 -222
  278. diffusers/pipelines/pixart_alpha/__init__.py +8 -1
  279. diffusers/pipelines/pixart_alpha/pipeline_pixart_alpha.py +76 -93
  280. diffusers/pipelines/pixart_alpha/pipeline_pixart_sigma.py +873 -0
  281. diffusers/pipelines/sana/__init__.py +47 -0
  282. diffusers/pipelines/sana/pipeline_output.py +21 -0
  283. diffusers/pipelines/sana/pipeline_sana.py +884 -0
  284. diffusers/pipelines/semantic_stable_diffusion/pipeline_semantic_stable_diffusion.py +27 -23
  285. diffusers/pipelines/shap_e/pipeline_shap_e.py +3 -3
  286. diffusers/pipelines/shap_e/pipeline_shap_e_img2img.py +14 -14
  287. diffusers/pipelines/shap_e/renderer.py +1 -1
  288. diffusers/pipelines/stable_audio/__init__.py +50 -0
  289. diffusers/pipelines/stable_audio/modeling_stable_audio.py +158 -0
  290. diffusers/pipelines/stable_audio/pipeline_stable_audio.py +756 -0
  291. diffusers/pipelines/stable_cascade/pipeline_stable_cascade.py +71 -25
  292. diffusers/pipelines/stable_cascade/pipeline_stable_cascade_combined.py +23 -19
  293. diffusers/pipelines/stable_cascade/pipeline_stable_cascade_prior.py +35 -34
  294. diffusers/pipelines/stable_diffusion/__init__.py +0 -1
  295. diffusers/pipelines/stable_diffusion/convert_from_ckpt.py +20 -11
  296. diffusers/pipelines/stable_diffusion/pipeline_flax_stable_diffusion.py +1 -1
  297. diffusers/pipelines/stable_diffusion/pipeline_onnx_stable_diffusion.py +2 -2
  298. diffusers/pipelines/stable_diffusion/pipeline_onnx_stable_diffusion_upscale.py +6 -6
  299. diffusers/pipelines/stable_diffusion/pipeline_stable_diffusion.py +145 -79
  300. diffusers/pipelines/stable_diffusion/pipeline_stable_diffusion_depth2img.py +43 -28
  301. diffusers/pipelines/stable_diffusion/pipeline_stable_diffusion_image_variation.py +13 -8
  302. diffusers/pipelines/stable_diffusion/pipeline_stable_diffusion_img2img.py +100 -68
  303. diffusers/pipelines/stable_diffusion/pipeline_stable_diffusion_inpaint.py +109 -201
  304. diffusers/pipelines/stable_diffusion/pipeline_stable_diffusion_instruct_pix2pix.py +131 -32
  305. diffusers/pipelines/stable_diffusion/pipeline_stable_diffusion_latent_upscale.py +247 -87
  306. diffusers/pipelines/stable_diffusion/pipeline_stable_diffusion_upscale.py +30 -29
  307. diffusers/pipelines/stable_diffusion/pipeline_stable_unclip.py +35 -27
  308. diffusers/pipelines/stable_diffusion/pipeline_stable_unclip_img2img.py +49 -42
  309. diffusers/pipelines/stable_diffusion/safety_checker.py +2 -1
  310. diffusers/pipelines/stable_diffusion_3/__init__.py +54 -0
  311. diffusers/pipelines/stable_diffusion_3/pipeline_output.py +21 -0
  312. diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3.py +1140 -0
  313. diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3_img2img.py +1036 -0
  314. diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3_inpaint.py +1250 -0
  315. diffusers/pipelines/stable_diffusion_attend_and_excite/pipeline_stable_diffusion_attend_and_excite.py +29 -20
  316. diffusers/pipelines/stable_diffusion_diffedit/pipeline_stable_diffusion_diffedit.py +59 -58
  317. diffusers/pipelines/stable_diffusion_gligen/pipeline_stable_diffusion_gligen.py +31 -25
  318. diffusers/pipelines/stable_diffusion_gligen/pipeline_stable_diffusion_gligen_text_image.py +38 -22
  319. diffusers/pipelines/stable_diffusion_k_diffusion/pipeline_stable_diffusion_k_diffusion.py +30 -24
  320. diffusers/pipelines/stable_diffusion_k_diffusion/pipeline_stable_diffusion_xl_k_diffusion.py +24 -23
  321. diffusers/pipelines/stable_diffusion_ldm3d/pipeline_stable_diffusion_ldm3d.py +107 -67
  322. diffusers/pipelines/stable_diffusion_panorama/pipeline_stable_diffusion_panorama.py +316 -69
  323. diffusers/pipelines/stable_diffusion_safe/pipeline_stable_diffusion_safe.py +10 -5
  324. diffusers/pipelines/stable_diffusion_safe/safety_checker.py +1 -1
  325. diffusers/pipelines/stable_diffusion_sag/pipeline_stable_diffusion_sag.py +98 -30
  326. diffusers/pipelines/stable_diffusion_xl/pipeline_stable_diffusion_xl.py +121 -83
  327. diffusers/pipelines/stable_diffusion_xl/pipeline_stable_diffusion_xl_img2img.py +161 -105
  328. diffusers/pipelines/stable_diffusion_xl/pipeline_stable_diffusion_xl_inpaint.py +142 -218
  329. diffusers/pipelines/stable_diffusion_xl/pipeline_stable_diffusion_xl_instruct_pix2pix.py +45 -29
  330. diffusers/pipelines/stable_diffusion_xl/watermark.py +9 -3
  331. diffusers/pipelines/stable_video_diffusion/pipeline_stable_video_diffusion.py +110 -57
  332. diffusers/pipelines/t2i_adapter/pipeline_stable_diffusion_adapter.py +69 -39
  333. diffusers/pipelines/t2i_adapter/pipeline_stable_diffusion_xl_adapter.py +105 -74
  334. diffusers/pipelines/text_to_video_synthesis/pipeline_output.py +3 -2
  335. diffusers/pipelines/text_to_video_synthesis/pipeline_text_to_video_synth.py +29 -49
  336. diffusers/pipelines/text_to_video_synthesis/pipeline_text_to_video_synth_img2img.py +32 -93
  337. diffusers/pipelines/text_to_video_synthesis/pipeline_text_to_video_zero.py +37 -25
  338. diffusers/pipelines/text_to_video_synthesis/pipeline_text_to_video_zero_sdxl.py +54 -40
  339. diffusers/pipelines/unclip/pipeline_unclip.py +6 -6
  340. diffusers/pipelines/unclip/pipeline_unclip_image_variation.py +6 -6
  341. diffusers/pipelines/unidiffuser/modeling_text_decoder.py +1 -1
  342. diffusers/pipelines/unidiffuser/modeling_uvit.py +12 -12
  343. diffusers/pipelines/unidiffuser/pipeline_unidiffuser.py +29 -28
  344. diffusers/pipelines/wuerstchen/modeling_paella_vq_model.py +5 -5
  345. diffusers/pipelines/wuerstchen/modeling_wuerstchen_common.py +5 -10
  346. diffusers/pipelines/wuerstchen/modeling_wuerstchen_prior.py +6 -8
  347. diffusers/pipelines/wuerstchen/pipeline_wuerstchen.py +4 -4
  348. diffusers/pipelines/wuerstchen/pipeline_wuerstchen_combined.py +12 -12
  349. diffusers/pipelines/wuerstchen/pipeline_wuerstchen_prior.py +15 -14
  350. diffusers/{models/dual_transformer_2d.py → quantizers/__init__.py} +2 -6
  351. diffusers/quantizers/auto.py +139 -0
  352. diffusers/quantizers/base.py +233 -0
  353. diffusers/quantizers/bitsandbytes/__init__.py +2 -0
  354. diffusers/quantizers/bitsandbytes/bnb_quantizer.py +561 -0
  355. diffusers/quantizers/bitsandbytes/utils.py +306 -0
  356. diffusers/quantizers/gguf/__init__.py +1 -0
  357. diffusers/quantizers/gguf/gguf_quantizer.py +159 -0
  358. diffusers/quantizers/gguf/utils.py +456 -0
  359. diffusers/quantizers/quantization_config.py +669 -0
  360. diffusers/quantizers/torchao/__init__.py +15 -0
  361. diffusers/quantizers/torchao/torchao_quantizer.py +292 -0
  362. diffusers/schedulers/__init__.py +12 -2
  363. diffusers/schedulers/deprecated/__init__.py +1 -1
  364. diffusers/schedulers/deprecated/scheduling_karras_ve.py +25 -25
  365. diffusers/schedulers/scheduling_amused.py +5 -5
  366. diffusers/schedulers/scheduling_consistency_decoder.py +11 -11
  367. diffusers/schedulers/scheduling_consistency_models.py +23 -25
  368. diffusers/schedulers/scheduling_cosine_dpmsolver_multistep.py +572 -0
  369. diffusers/schedulers/scheduling_ddim.py +27 -26
  370. diffusers/schedulers/scheduling_ddim_cogvideox.py +452 -0
  371. diffusers/schedulers/scheduling_ddim_flax.py +2 -1
  372. diffusers/schedulers/scheduling_ddim_inverse.py +16 -16
  373. diffusers/schedulers/scheduling_ddim_parallel.py +32 -31
  374. diffusers/schedulers/scheduling_ddpm.py +27 -30
  375. diffusers/schedulers/scheduling_ddpm_flax.py +7 -3
  376. diffusers/schedulers/scheduling_ddpm_parallel.py +33 -36
  377. diffusers/schedulers/scheduling_ddpm_wuerstchen.py +14 -14
  378. diffusers/schedulers/scheduling_deis_multistep.py +150 -50
  379. diffusers/schedulers/scheduling_dpm_cogvideox.py +489 -0
  380. diffusers/schedulers/scheduling_dpmsolver_multistep.py +221 -84
  381. diffusers/schedulers/scheduling_dpmsolver_multistep_flax.py +2 -2
  382. diffusers/schedulers/scheduling_dpmsolver_multistep_inverse.py +158 -52
  383. diffusers/schedulers/scheduling_dpmsolver_sde.py +153 -34
  384. diffusers/schedulers/scheduling_dpmsolver_singlestep.py +275 -86
  385. diffusers/schedulers/scheduling_edm_dpmsolver_multistep.py +81 -57
  386. diffusers/schedulers/scheduling_edm_euler.py +62 -39
  387. diffusers/schedulers/scheduling_euler_ancestral_discrete.py +30 -29
  388. diffusers/schedulers/scheduling_euler_discrete.py +255 -74
  389. diffusers/schedulers/scheduling_flow_match_euler_discrete.py +458 -0
  390. diffusers/schedulers/scheduling_flow_match_heun_discrete.py +320 -0
  391. diffusers/schedulers/scheduling_heun_discrete.py +174 -46
  392. diffusers/schedulers/scheduling_ipndm.py +9 -9
  393. diffusers/schedulers/scheduling_k_dpm_2_ancestral_discrete.py +138 -29
  394. diffusers/schedulers/scheduling_k_dpm_2_discrete.py +132 -26
  395. diffusers/schedulers/scheduling_karras_ve_flax.py +6 -6
  396. diffusers/schedulers/scheduling_lcm.py +23 -29
  397. diffusers/schedulers/scheduling_lms_discrete.py +105 -28
  398. diffusers/schedulers/scheduling_pndm.py +20 -20
  399. diffusers/schedulers/scheduling_repaint.py +21 -21
  400. diffusers/schedulers/scheduling_sasolver.py +157 -60
  401. diffusers/schedulers/scheduling_sde_ve.py +19 -19
  402. diffusers/schedulers/scheduling_tcd.py +41 -36
  403. diffusers/schedulers/scheduling_unclip.py +19 -16
  404. diffusers/schedulers/scheduling_unipc_multistep.py +243 -47
  405. diffusers/schedulers/scheduling_utils.py +12 -5
  406. diffusers/schedulers/scheduling_utils_flax.py +1 -3
  407. diffusers/schedulers/scheduling_vq_diffusion.py +10 -10
  408. diffusers/training_utils.py +214 -30
  409. diffusers/utils/__init__.py +17 -1
  410. diffusers/utils/constants.py +3 -0
  411. diffusers/utils/doc_utils.py +1 -0
  412. diffusers/utils/dummy_pt_objects.py +592 -7
  413. diffusers/utils/dummy_torch_and_torchsde_objects.py +15 -0
  414. diffusers/utils/dummy_torch_and_transformers_and_sentencepiece_objects.py +47 -0
  415. diffusers/utils/dummy_torch_and_transformers_objects.py +1001 -71
  416. diffusers/utils/dynamic_modules_utils.py +34 -29
  417. diffusers/utils/export_utils.py +50 -6
  418. diffusers/utils/hub_utils.py +131 -17
  419. diffusers/utils/import_utils.py +210 -8
  420. diffusers/utils/loading_utils.py +118 -5
  421. diffusers/utils/logging.py +4 -2
  422. diffusers/utils/peft_utils.py +37 -7
  423. diffusers/utils/state_dict_utils.py +13 -2
  424. diffusers/utils/testing_utils.py +193 -11
  425. diffusers/utils/torch_utils.py +4 -0
  426. diffusers/video_processor.py +113 -0
  427. {diffusers-0.27.0.dist-info → diffusers-0.32.2.dist-info}/METADATA +82 -91
  428. diffusers-0.32.2.dist-info/RECORD +550 -0
  429. {diffusers-0.27.0.dist-info → diffusers-0.32.2.dist-info}/WHEEL +1 -1
  430. diffusers/loaders/autoencoder.py +0 -146
  431. diffusers/loaders/controlnet.py +0 -136
  432. diffusers/loaders/lora.py +0 -1349
  433. diffusers/models/prior_transformer.py +0 -12
  434. diffusers/models/t5_film_transformer.py +0 -70
  435. diffusers/models/transformer_2d.py +0 -25
  436. diffusers/models/transformer_temporal.py +0 -34
  437. diffusers/models/unet_1d.py +0 -26
  438. diffusers/models/unet_1d_blocks.py +0 -203
  439. diffusers/models/unet_2d.py +0 -27
  440. diffusers/models/unet_2d_blocks.py +0 -375
  441. diffusers/models/unet_2d_condition.py +0 -25
  442. diffusers-0.27.0.dist-info/RECORD +0 -399
  443. {diffusers-0.27.0.dist-info → diffusers-0.32.2.dist-info}/LICENSE +0 -0
  444. {diffusers-0.27.0.dist-info → diffusers-0.32.2.dist-info}/entry_points.txt +0 -0
  445. {diffusers-0.27.0.dist-info → diffusers-0.32.2.dist-info}/top_level.txt +0 -0
@@ -131,7 +131,6 @@ try:
131
131
  except importlib_metadata.PackageNotFoundError:
132
132
  _unidecode_available = False
133
133
 
134
-
135
134
  _onnxruntime_version = "N/A"
136
135
  _onnx_available = importlib.util.find_spec("onnxruntime") is not None
137
136
  if _onnx_available:
@@ -295,6 +294,68 @@ try:
295
294
  except importlib_metadata.PackageNotFoundError:
296
295
  _torchvision_available = False
297
296
 
297
+ _sentencepiece_available = importlib.util.find_spec("sentencepiece") is not None
298
+ try:
299
+ _sentencepiece_version = importlib_metadata.version("sentencepiece")
300
+ logger.info(f"Successfully imported sentencepiece version {_sentencepiece_version}")
301
+ except importlib_metadata.PackageNotFoundError:
302
+ _sentencepiece_available = False
303
+
304
+ _matplotlib_available = importlib.util.find_spec("matplotlib") is not None
305
+ try:
306
+ _matplotlib_version = importlib_metadata.version("matplotlib")
307
+ logger.debug(f"Successfully imported matplotlib version {_matplotlib_version}")
308
+ except importlib_metadata.PackageNotFoundError:
309
+ _matplotlib_available = False
310
+
311
+ _timm_available = importlib.util.find_spec("timm") is not None
312
+ if _timm_available:
313
+ try:
314
+ _timm_version = importlib_metadata.version("timm")
315
+ logger.info(f"Timm version {_timm_version} available.")
316
+ except importlib_metadata.PackageNotFoundError:
317
+ _timm_available = False
318
+
319
+
320
+ def is_timm_available():
321
+ return _timm_available
322
+
323
+
324
+ _bitsandbytes_available = importlib.util.find_spec("bitsandbytes") is not None
325
+ try:
326
+ _bitsandbytes_version = importlib_metadata.version("bitsandbytes")
327
+ logger.debug(f"Successfully imported bitsandbytes version {_bitsandbytes_version}")
328
+ except importlib_metadata.PackageNotFoundError:
329
+ _bitsandbytes_available = False
330
+
331
+ _is_google_colab = "google.colab" in sys.modules or any(k.startswith("COLAB_") for k in os.environ)
332
+
333
+ _imageio_available = importlib.util.find_spec("imageio") is not None
334
+ if _imageio_available:
335
+ try:
336
+ _imageio_version = importlib_metadata.version("imageio")
337
+ logger.debug(f"Successfully imported imageio version {_imageio_version}")
338
+
339
+ except importlib_metadata.PackageNotFoundError:
340
+ _imageio_available = False
341
+
342
+ _is_gguf_available = importlib.util.find_spec("gguf") is not None
343
+ if _is_gguf_available:
344
+ try:
345
+ _gguf_version = importlib_metadata.version("gguf")
346
+ logger.debug(f"Successfully import gguf version {_gguf_version}")
347
+ except importlib_metadata.PackageNotFoundError:
348
+ _is_gguf_available = False
349
+
350
+
351
+ _is_torchao_available = importlib.util.find_spec("torchao") is not None
352
+ if _is_torchao_available:
353
+ try:
354
+ _torchao_version = importlib_metadata.version("torchao")
355
+ logger.debug(f"Successfully import torchao version {_torchao_version}")
356
+ except importlib_metadata.PackageNotFoundError:
357
+ _is_torchao_available = False
358
+
298
359
 
299
360
  def is_torch_available():
300
361
  return _torch_available
@@ -392,6 +453,38 @@ def is_torchvision_available():
392
453
  return _torchvision_available
393
454
 
394
455
 
456
+ def is_matplotlib_available():
457
+ return _matplotlib_available
458
+
459
+
460
+ def is_safetensors_available():
461
+ return _safetensors_available
462
+
463
+
464
+ def is_bitsandbytes_available():
465
+ return _bitsandbytes_available
466
+
467
+
468
+ def is_google_colab():
469
+ return _is_google_colab
470
+
471
+
472
+ def is_sentencepiece_available():
473
+ return _sentencepiece_available
474
+
475
+
476
+ def is_imageio_available():
477
+ return _imageio_available
478
+
479
+
480
+ def is_gguf_available():
481
+ return _is_gguf_available
482
+
483
+
484
+ def is_torchao_available():
485
+ return _is_torchao_available
486
+
487
+
395
488
  # docstyle-ignore
396
489
  FLAX_IMPORT_ERROR = """
397
490
  {0} requires the FLAX library but it was not found in your environment. Checkout the instructions on the
@@ -499,6 +592,41 @@ INVISIBLE_WATERMARK_IMPORT_ERROR = """
499
592
  {0} requires the invisible-watermark library but it was not found in your environment. You can install it with pip: `pip install invisible-watermark>=0.2.0`
500
593
  """
501
594
 
595
+ # docstyle-ignore
596
+ PEFT_IMPORT_ERROR = """
597
+ {0} requires the peft library but it was not found in your environment. You can install it with pip: `pip install peft`
598
+ """
599
+
600
+ # docstyle-ignore
601
+ SAFETENSORS_IMPORT_ERROR = """
602
+ {0} requires the safetensors library but it was not found in your environment. You can install it with pip: `pip install safetensors`
603
+ """
604
+
605
+ # docstyle-ignore
606
+ SENTENCEPIECE_IMPORT_ERROR = """
607
+ {0} requires the sentencepiece library but it was not found in your environment. You can install it with pip: `pip install sentencepiece`
608
+ """
609
+
610
+
611
+ # docstyle-ignore
612
+ BITSANDBYTES_IMPORT_ERROR = """
613
+ {0} requires the bitsandbytes library but it was not found in your environment. You can install it with pip: `pip install bitsandbytes`
614
+ """
615
+
616
+ # docstyle-ignore
617
+ IMAGEIO_IMPORT_ERROR = """
618
+ {0} requires the imageio library and ffmpeg but it was not found in your environment. You can install it with pip: `pip install imageio imageio-ffmpeg`
619
+ """
620
+
621
+ # docstyle-ignore
622
+ GGUF_IMPORT_ERROR = """
623
+ {0} requires the gguf library but it was not found in your environment. You can install it with pip: `pip install gguf`
624
+ """
625
+
626
+ TORCHAO_IMPORT_ERROR = """
627
+ {0} requires the torchao library but it was not found in your environment. You can install it with pip: `pip install
628
+ torchao`
629
+ """
502
630
 
503
631
  BACKENDS_MAPPING = OrderedDict(
504
632
  [
@@ -520,6 +648,13 @@ BACKENDS_MAPPING = OrderedDict(
520
648
  ("ftfy", (is_ftfy_available, FTFY_IMPORT_ERROR)),
521
649
  ("torchsde", (is_torchsde_available, TORCHSDE_IMPORT_ERROR)),
522
650
  ("invisible_watermark", (is_invisible_watermark_available, INVISIBLE_WATERMARK_IMPORT_ERROR)),
651
+ ("peft", (is_peft_available, PEFT_IMPORT_ERROR)),
652
+ ("safetensors", (is_safetensors_available, SAFETENSORS_IMPORT_ERROR)),
653
+ ("bitsandbytes", (is_bitsandbytes_available, BITSANDBYTES_IMPORT_ERROR)),
654
+ ("sentencepiece", (is_sentencepiece_available, SENTENCEPIECE_IMPORT_ERROR)),
655
+ ("imageio", (is_imageio_available, IMAGEIO_IMPORT_ERROR)),
656
+ ("gguf", (is_gguf_available, GGUF_IMPORT_ERROR)),
657
+ ("torchao", (is_torchao_available, TORCHAO_IMPORT_ERROR)),
523
658
  ]
524
659
  )
525
660
 
@@ -570,8 +705,9 @@ class DummyObject(type):
570
705
  # This function was copied from: https://github.com/huggingface/accelerate/blob/874c4967d94badd24f893064cc3bef45f57cadf7/src/accelerate/utils/versions.py#L319
571
706
  def compare_versions(library_or_version: Union[str, Version], operation: str, requirement_version: str):
572
707
  """
573
- Args:
574
708
  Compares a library version to some requirement using a given operation.
709
+
710
+ Args:
575
711
  library_or_version (`str` or `packaging.version.Version`):
576
712
  A library name or a version to check.
577
713
  operation (`str`):
@@ -590,8 +726,9 @@ def compare_versions(library_or_version: Union[str, Version], operation: str, re
590
726
  # This function was copied from: https://github.com/huggingface/accelerate/blob/874c4967d94badd24f893064cc3bef45f57cadf7/src/accelerate/utils/versions.py#L338
591
727
  def is_torch_version(operation: str, version: str):
592
728
  """
593
- Args:
594
729
  Compares the current PyTorch version to a given reference with an operation.
730
+
731
+ Args:
595
732
  operation (`str`):
596
733
  A string representation of an operator, such as `">"` or `"<="`
597
734
  version (`str`):
@@ -600,10 +737,26 @@ def is_torch_version(operation: str, version: str):
600
737
  return compare_versions(parse(_torch_version), operation, version)
601
738
 
602
739
 
603
- def is_transformers_version(operation: str, version: str):
740
+ def is_torch_xla_version(operation: str, version: str):
604
741
  """
742
+ Compares the current torch_xla version to a given reference with an operation.
743
+
605
744
  Args:
745
+ operation (`str`):
746
+ A string representation of an operator, such as `">"` or `"<="`
747
+ version (`str`):
748
+ A string version of torch_xla
749
+ """
750
+ if not is_torch_xla_available:
751
+ return False
752
+ return compare_versions(parse(_torch_xla_version), operation, version)
753
+
754
+
755
+ def is_transformers_version(operation: str, version: str):
756
+ """
606
757
  Compares the current Transformers version to a given reference with an operation.
758
+
759
+ Args:
607
760
  operation (`str`):
608
761
  A string representation of an operator, such as `">"` or `"<="`
609
762
  version (`str`):
@@ -616,8 +769,9 @@ def is_transformers_version(operation: str, version: str):
616
769
 
617
770
  def is_accelerate_version(operation: str, version: str):
618
771
  """
619
- Args:
620
772
  Compares the current Accelerate version to a given reference with an operation.
773
+
774
+ Args:
621
775
  operation (`str`):
622
776
  A string representation of an operator, such as `">"` or `"<="`
623
777
  version (`str`):
@@ -628,10 +782,55 @@ def is_accelerate_version(operation: str, version: str):
628
782
  return compare_versions(parse(_accelerate_version), operation, version)
629
783
 
630
784
 
631
- def is_k_diffusion_version(operation: str, version: str):
785
+ def is_peft_version(operation: str, version: str):
632
786
  """
787
+ Compares the current PEFT version to a given reference with an operation.
788
+
633
789
  Args:
790
+ operation (`str`):
791
+ A string representation of an operator, such as `">"` or `"<="`
792
+ version (`str`):
793
+ A version string
794
+ """
795
+ if not _peft_version:
796
+ return False
797
+ return compare_versions(parse(_peft_version), operation, version)
798
+
799
+
800
+ def is_bitsandbytes_version(operation: str, version: str):
801
+ """
802
+ Args:
803
+ Compares the current bitsandbytes version to a given reference with an operation.
804
+ operation (`str`):
805
+ A string representation of an operator, such as `">"` or `"<="`
806
+ version (`str`):
807
+ A version string
808
+ """
809
+ if not _bitsandbytes_version:
810
+ return False
811
+ return compare_versions(parse(_bitsandbytes_version), operation, version)
812
+
813
+
814
+ def is_gguf_version(operation: str, version: str):
815
+ """
816
+ Compares the current Accelerate version to a given reference with an operation.
817
+
818
+ Args:
819
+ operation (`str`):
820
+ A string representation of an operator, such as `">"` or `"<="`
821
+ version (`str`):
822
+ A version string
823
+ """
824
+ if not _is_gguf_available:
825
+ return False
826
+ return compare_versions(parse(_gguf_version), operation, version)
827
+
828
+
829
+ def is_k_diffusion_version(operation: str, version: str):
830
+ """
634
831
  Compares the current k-diffusion version to a given reference with an operation.
832
+
833
+ Args:
635
834
  operation (`str`):
636
835
  A string representation of an operator, such as `">"` or `"<="`
637
836
  version (`str`):
@@ -644,8 +843,9 @@ def is_k_diffusion_version(operation: str, version: str):
644
843
 
645
844
  def get_objects_from_module(module):
646
845
  """
647
- Args:
648
846
  Returns a dict of object names and values in a module, while skipping private/internal objects
847
+
848
+ Args:
649
849
  module (ModuleType):
650
850
  Module to extract the objects from.
651
851
 
@@ -663,7 +863,9 @@ def get_objects_from_module(module):
663
863
 
664
864
 
665
865
  class OptionalDependencyNotAvailable(BaseException):
666
- """An error indicating that an optional dependency of Diffusers was not found in the environment."""
866
+ """
867
+ An error indicating that an optional dependency of Diffusers was not found in the environment.
868
+ """
667
869
 
668
870
 
669
871
  class _LazyModule(ModuleType):
@@ -1,13 +1,17 @@
1
1
  import os
2
- from typing import Callable, Union
2
+ import tempfile
3
+ from typing import Any, Callable, List, Optional, Tuple, Union
4
+ from urllib.parse import unquote, urlparse
3
5
 
4
6
  import PIL.Image
5
7
  import PIL.ImageOps
6
8
  import requests
7
9
 
10
+ from .import_utils import BACKENDS_MAPPING, is_imageio_available
11
+
8
12
 
9
13
  def load_image(
10
- image: Union[str, PIL.Image.Image], convert_method: Callable[[PIL.Image.Image], PIL.Image.Image] = None
14
+ image: Union[str, PIL.Image.Image], convert_method: Optional[Callable[[PIL.Image.Image], PIL.Image.Image]] = None
11
15
  ) -> PIL.Image.Image:
12
16
  """
13
17
  Loads `image` to a PIL Image.
@@ -15,9 +19,9 @@ def load_image(
15
19
  Args:
16
20
  image (`str` or `PIL.Image.Image`):
17
21
  The image to convert to the PIL Image format.
18
- convert_method (Callable[[PIL.Image.Image], PIL.Image.Image], optional):
19
- A conversion method to apply to the image after loading it.
20
- When set to `None` the image will be converted "RGB".
22
+ convert_method (Callable[[PIL.Image.Image], PIL.Image.Image], *optional*):
23
+ A conversion method to apply to the image after loading it. When set to `None` the image will be converted
24
+ "RGB".
21
25
 
22
26
  Returns:
23
27
  `PIL.Image.Image`:
@@ -47,3 +51,112 @@ def load_image(
47
51
  image = image.convert("RGB")
48
52
 
49
53
  return image
54
+
55
+
56
+ def load_video(
57
+ video: str,
58
+ convert_method: Optional[Callable[[List[PIL.Image.Image]], List[PIL.Image.Image]]] = None,
59
+ ) -> List[PIL.Image.Image]:
60
+ """
61
+ Loads `video` to a list of PIL Image.
62
+
63
+ Args:
64
+ video (`str`):
65
+ A URL or Path to a video to convert to a list of PIL Image format.
66
+ convert_method (Callable[[List[PIL.Image.Image]], List[PIL.Image.Image]], *optional*):
67
+ A conversion method to apply to the video after loading it. When set to `None` the images will be converted
68
+ to "RGB".
69
+
70
+ Returns:
71
+ `List[PIL.Image.Image]`:
72
+ The video as a list of PIL images.
73
+ """
74
+ is_url = video.startswith("http://") or video.startswith("https://")
75
+ is_file = os.path.isfile(video)
76
+ was_tempfile_created = False
77
+
78
+ if not (is_url or is_file):
79
+ raise ValueError(
80
+ f"Incorrect path or URL. URLs must start with `http://` or `https://`, and {video} is not a valid path."
81
+ )
82
+
83
+ if is_url:
84
+ response = requests.get(video, stream=True)
85
+ if response.status_code != 200:
86
+ raise ValueError(f"Failed to download video. Status code: {response.status_code}")
87
+
88
+ parsed_url = urlparse(video)
89
+ file_name = os.path.basename(unquote(parsed_url.path))
90
+
91
+ suffix = os.path.splitext(file_name)[1] or ".mp4"
92
+ video_path = tempfile.NamedTemporaryFile(suffix=suffix, delete=False).name
93
+
94
+ was_tempfile_created = True
95
+
96
+ video_data = response.iter_content(chunk_size=8192)
97
+ with open(video_path, "wb") as f:
98
+ for chunk in video_data:
99
+ f.write(chunk)
100
+
101
+ video = video_path
102
+
103
+ pil_images = []
104
+ if video.endswith(".gif"):
105
+ gif = PIL.Image.open(video)
106
+ try:
107
+ while True:
108
+ pil_images.append(gif.copy())
109
+ gif.seek(gif.tell() + 1)
110
+ except EOFError:
111
+ pass
112
+
113
+ else:
114
+ if is_imageio_available():
115
+ import imageio
116
+ else:
117
+ raise ImportError(BACKENDS_MAPPING["imageio"][1].format("load_video"))
118
+
119
+ try:
120
+ imageio.plugins.ffmpeg.get_exe()
121
+ except AttributeError:
122
+ raise AttributeError(
123
+ "`Unable to find an ffmpeg installation on your machine. Please install via `pip install imageio-ffmpeg"
124
+ )
125
+
126
+ with imageio.get_reader(video) as reader:
127
+ # Read all frames
128
+ for frame in reader:
129
+ pil_images.append(PIL.Image.fromarray(frame))
130
+
131
+ if was_tempfile_created:
132
+ os.remove(video_path)
133
+
134
+ if convert_method is not None:
135
+ pil_images = convert_method(pil_images)
136
+
137
+ return pil_images
138
+
139
+
140
+ # Taken from `transformers`.
141
+ def get_module_from_name(module, tensor_name: str) -> Tuple[Any, str]:
142
+ if "." in tensor_name:
143
+ splits = tensor_name.split(".")
144
+ for split in splits[:-1]:
145
+ new_module = getattr(module, split)
146
+ if new_module is None:
147
+ raise ValueError(f"{module} has no attribute {split}.")
148
+ module = new_module
149
+ tensor_name = splits[-1]
150
+ return module, tensor_name
151
+
152
+
153
+ def get_submodule_by_name(root_module, module_path: str):
154
+ current = root_module
155
+ parts = module_path.split(".")
156
+ for part in parts:
157
+ if part.isdigit():
158
+ idx = int(part)
159
+ current = current[idx] # e.g., for nn.ModuleList or nn.Sequential
160
+ else:
161
+ current = getattr(current, part)
162
+ return current
@@ -12,7 +12,7 @@
12
12
  # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
13
  # See the License for the specific language governing permissions and
14
14
  # limitations under the License.
15
- """ Logging utilities."""
15
+ """Logging utilities."""
16
16
 
17
17
  import logging
18
18
  import os
@@ -82,7 +82,9 @@ def _configure_library_root_logger() -> None:
82
82
  # This library has already configured the library root logger.
83
83
  return
84
84
  _default_handler = logging.StreamHandler() # Set sys.stderr as stream.
85
- _default_handler.flush = sys.stderr.flush
85
+
86
+ if sys.stderr: # only if sys.stderr exists, e.g. when not using pythonw in windows
87
+ _default_handler.flush = sys.stderr.flush
86
88
 
87
89
  # Apply our default configuration to the library root logger.
88
90
  library_root_logger = _get_library_root_logger()
@@ -14,6 +14,7 @@
14
14
  """
15
15
  PEFT utilities: Utilities related to peft library
16
16
  """
17
+
17
18
  import collections
18
19
  import importlib
19
20
  from typing import Optional
@@ -63,9 +64,11 @@ def recurse_remove_peft_layers(model):
63
64
  module_replaced = False
64
65
 
65
66
  if isinstance(module, LoraLayer) and isinstance(module, torch.nn.Linear):
66
- new_module = torch.nn.Linear(module.in_features, module.out_features, bias=module.bias is not None).to(
67
- module.weight.device
68
- )
67
+ new_module = torch.nn.Linear(
68
+ module.in_features,
69
+ module.out_features,
70
+ bias=module.bias is not None,
71
+ ).to(module.weight.device)
69
72
  new_module.weight = module.weight
70
73
  if module.bias is not None:
71
74
  new_module.bias = module.bias
@@ -109,6 +112,9 @@ def scale_lora_layers(model, weight):
109
112
  """
110
113
  from peft.tuners.tuners_utils import BaseTunerLayer
111
114
 
115
+ if weight == 1.0:
116
+ return
117
+
112
118
  for module in model.modules():
113
119
  if isinstance(module, BaseTunerLayer):
114
120
  module.scale_layer(weight)
@@ -128,11 +134,14 @@ def unscale_lora_layers(model, weight: Optional[float] = None):
128
134
  """
129
135
  from peft.tuners.tuners_utils import BaseTunerLayer
130
136
 
137
+ if weight is None or weight == 1.0:
138
+ return
139
+
131
140
  for module in model.modules():
132
141
  if isinstance(module, BaseTunerLayer):
133
- if weight is not None and weight != 0:
142
+ if weight != 0:
134
143
  module.unscale_layer(weight)
135
- elif weight is not None and weight == 0:
144
+ else:
136
145
  for adapter_name in module.active_adapters:
137
146
  # if weight == 0 unscale should re-set the scale to the original value.
138
147
  module.set_scale(adapter_name, 1.0)
@@ -170,6 +179,9 @@ def get_peft_kwargs(rank_dict, network_alpha_dict, peft_state_dict, is_unet=True
170
179
 
171
180
  # layer names without the Diffusers specific
172
181
  target_modules = list({name.split(".lora")[0] for name in peft_state_dict.keys()})
182
+ use_dora = any("lora_magnitude_vector" in k for k in peft_state_dict)
183
+ # for now we know that the "bias" keys are only associated with `lora_B`.
184
+ lora_bias = any("lora_B" in k and k.endswith(".bias") for k in peft_state_dict)
173
185
 
174
186
  lora_config_kwargs = {
175
187
  "r": r,
@@ -177,6 +189,8 @@ def get_peft_kwargs(rank_dict, network_alpha_dict, peft_state_dict, is_unet=True
177
189
  "rank_pattern": rank_pattern,
178
190
  "alpha_pattern": alpha_pattern,
179
191
  "target_modules": target_modules,
192
+ "use_dora": use_dora,
193
+ "lora_bias": lora_bias,
180
194
  }
181
195
  return lora_config_kwargs
182
196
 
@@ -227,16 +241,32 @@ def delete_adapter_layers(model, adapter_name):
227
241
  def set_weights_and_activate_adapters(model, adapter_names, weights):
228
242
  from peft.tuners.tuners_utils import BaseTunerLayer
229
243
 
244
+ def get_module_weight(weight_for_adapter, module_name):
245
+ if not isinstance(weight_for_adapter, dict):
246
+ # If weight_for_adapter is a single number, always return it.
247
+ return weight_for_adapter
248
+
249
+ for layer_name, weight_ in weight_for_adapter.items():
250
+ if layer_name in module_name:
251
+ return weight_
252
+
253
+ parts = module_name.split(".")
254
+ # e.g. key = "down_blocks.1.attentions.0"
255
+ key = f"{parts[0]}.{parts[1]}.attentions.{parts[3]}"
256
+ block_weight = weight_for_adapter.get(key, 1.0)
257
+
258
+ return block_weight
259
+
230
260
  # iterate over each adapter, make it active and set the corresponding scaling weight
231
261
  for adapter_name, weight in zip(adapter_names, weights):
232
- for module in model.modules():
262
+ for module_name, module in model.named_modules():
233
263
  if isinstance(module, BaseTunerLayer):
234
264
  # For backward compatbility with previous PEFT versions
235
265
  if hasattr(module, "set_adapter"):
236
266
  module.set_adapter(adapter_name)
237
267
  else:
238
268
  module.active_adapter = adapter_name
239
- module.set_scale(adapter_name, weight)
269
+ module.set_scale(adapter_name, get_module_weight(weight, module_name))
240
270
 
241
271
  # set multiple active adapters
242
272
  for module in model.modules():
@@ -14,6 +14,7 @@
14
14
  """
15
15
  State dict utilities: utility methods for converting state dicts easily
16
16
  """
17
+
17
18
  import enum
18
19
 
19
20
  from .logging import get_logger
@@ -46,6 +47,7 @@ UNET_TO_DIFFUSERS = {
46
47
  ".to_v_lora.up": ".to_v.lora_B",
47
48
  ".lora.up": ".lora_B",
48
49
  ".lora.down": ".lora_A",
50
+ ".to_out.lora_magnitude_vector": ".to_out.0.lora_magnitude_vector",
49
51
  }
50
52
 
51
53
 
@@ -60,6 +62,8 @@ DIFFUSERS_TO_PEFT = {
60
62
  ".out_proj.lora_linear_layer.down": ".out_proj.lora_A",
61
63
  ".lora_linear_layer.up": ".lora_B",
62
64
  ".lora_linear_layer.down": ".lora_A",
65
+ "text_projection.lora.down.weight": "text_projection.lora_A.weight",
66
+ "text_projection.lora.up.weight": "text_projection.lora_B.weight",
63
67
  }
64
68
 
65
69
  DIFFUSERS_OLD_TO_PEFT = {
@@ -103,6 +107,10 @@ DIFFUSERS_OLD_TO_DIFFUSERS = {
103
107
  ".to_v_lora.down": ".v_proj.lora_linear_layer.down",
104
108
  ".to_out_lora.up": ".out_proj.lora_linear_layer.up",
105
109
  ".to_out_lora.down": ".out_proj.lora_linear_layer.down",
110
+ ".to_k.lora_magnitude_vector": ".k_proj.lora_magnitude_vector",
111
+ ".to_v.lora_magnitude_vector": ".v_proj.lora_magnitude_vector",
112
+ ".to_q.lora_magnitude_vector": ".q_proj.lora_magnitude_vector",
113
+ ".to_out.lora_magnitude_vector": ".out_proj.lora_magnitude_vector",
106
114
  }
107
115
 
108
116
  PEFT_TO_KOHYA_SS = {
@@ -247,8 +255,8 @@ def convert_unet_state_dict_to_peft(state_dict):
247
255
 
248
256
  def convert_all_state_dict_to_peft(state_dict):
249
257
  r"""
250
- Attempts to first `convert_state_dict_to_peft`, and if it doesn't detect `lora_linear_layer`
251
- for a valid `DIFFUSERS` LoRA for example, attempts to exclusively convert the Unet `convert_unet_state_dict_to_peft`
258
+ Attempts to first `convert_state_dict_to_peft`, and if it doesn't detect `lora_linear_layer` for a valid
259
+ `DIFFUSERS` LoRA for example, attempts to exclusively convert the Unet `convert_unet_state_dict_to_peft`
252
260
  """
253
261
  try:
254
262
  peft_dict = convert_state_dict_to_peft(state_dict)
@@ -314,6 +322,9 @@ def convert_state_dict_to_kohya(state_dict, original_type=None, **kwargs):
314
322
  kohya_key = kohya_key.replace("text_encoder.", "lora_te1.")
315
323
  elif "unet" in kohya_key:
316
324
  kohya_key = kohya_key.replace("unet", "lora_unet")
325
+ elif "lora_magnitude_vector" in kohya_key:
326
+ kohya_key = kohya_key.replace("lora_magnitude_vector", "dora_scale")
327
+
317
328
  kohya_key = kohya_key.replace(".", "_", kohya_key.count(".") - 2)
318
329
  kohya_key = kohya_key.replace(peft_adapter_name, "") # Kohya doesn't take names
319
330
  kohya_ss_state_dict[kohya_key] = weight