diffsynth-engine 0.4.0__tar.gz → 0.4.1__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (192) hide show
  1. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/PKG-INFO +2 -1
  2. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/README.md +8 -4
  3. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/__init__.py +4 -0
  4. diffsynth_engine-0.4.1/diffsynth_engine/conf/models/qwen_image/qwen2_5_vl_config.json +25 -0
  5. diffsynth_engine-0.4.1/diffsynth_engine/conf/models/qwen_image/qwen2_5_vl_vision_config.json +19 -0
  6. diffsynth_engine-0.4.1/diffsynth_engine/conf/models/qwen_image/qwen_image_vae_keymap.json +244 -0
  7. diffsynth_engine-0.4.1/diffsynth_engine/conf/models/wan/vae/wan-vae-keymap.json +244 -0
  8. diffsynth_engine-0.4.1/diffsynth_engine/conf/models/wan/vae/wan2.1-vae.json +48 -0
  9. diffsynth_engine-0.4.1/diffsynth_engine/conf/tokenizers/qwen_image/tokenizer/added_tokens.json +24 -0
  10. diffsynth_engine-0.4.1/diffsynth_engine/conf/tokenizers/qwen_image/tokenizer/merges.txt +151388 -0
  11. diffsynth_engine-0.4.1/diffsynth_engine/conf/tokenizers/qwen_image/tokenizer/special_tokens_map.json +31 -0
  12. diffsynth_engine-0.4.1/diffsynth_engine/conf/tokenizers/qwen_image/tokenizer/tokenizer.json +757444 -0
  13. diffsynth_engine-0.4.1/diffsynth_engine/conf/tokenizers/qwen_image/tokenizer/tokenizer_config.json +209 -0
  14. diffsynth_engine-0.4.1/diffsynth_engine/conf/tokenizers/qwen_image/tokenizer/vocab.json +1 -0
  15. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/configs/__init__.py +12 -0
  16. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/configs/pipeline.py +68 -2
  17. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/basic/transformer_helper.py +33 -0
  18. diffsynth_engine-0.4.1/diffsynth_engine/models/qwen_image/__init__.py +13 -0
  19. diffsynth_engine-0.4.1/diffsynth_engine/models/qwen_image/qwen2_5_vl.py +1243 -0
  20. diffsynth_engine-0.4.1/diffsynth_engine/models/qwen_image/qwen_image_dit.py +425 -0
  21. diffsynth_engine-0.4.1/diffsynth_engine/models/qwen_image/qwen_image_dit_fbcache.py +133 -0
  22. diffsynth_engine-0.4.1/diffsynth_engine/models/qwen_image/qwen_image_vae.py +1082 -0
  23. diffsynth_engine-0.4.1/diffsynth_engine/models/wan/__init__.py +11 -0
  24. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/wan/wan_vae.py +16 -3
  25. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/pipelines/__init__.py +2 -0
  26. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/pipelines/base.py +11 -4
  27. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/pipelines/flux_image.py +46 -44
  28. diffsynth_engine-0.4.1/diffsynth_engine/pipelines/qwen_image.py +416 -0
  29. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/pipelines/sd_image.py +2 -4
  30. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/pipelines/sdxl_image.py +2 -4
  31. diffsynth_engine-0.4.1/diffsynth_engine/pipelines/utils.py +19 -0
  32. diffsynth_engine-0.4.1/diffsynth_engine/tokenizers/__init__.py +13 -0
  33. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/tokenizers/clip.py +1 -1
  34. diffsynth_engine-0.4.1/diffsynth_engine/tokenizers/qwen2.py +210 -0
  35. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/tokenizers/t5.py +1 -1
  36. diffsynth_engine-0.4.1/diffsynth_engine/utils/cache.py +55 -0
  37. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/utils/constants.py +7 -0
  38. diffsynth_engine-0.4.1/diffsynth_engine/utils/offload.py +52 -0
  39. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine.egg-info/PKG-INFO +2 -1
  40. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine.egg-info/SOURCES.txt +19 -0
  41. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine.egg-info/requires.txt +1 -0
  42. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/docs/tutorial.md +33 -42
  43. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/docs/tutorial_zh.md +45 -54
  44. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/pyproject.toml +1 -0
  45. diffsynth_engine-0.4.0/diffsynth_engine/pipelines/utils.py +0 -6
  46. diffsynth_engine-0.4.0/diffsynth_engine/tokenizers/__init__.py +0 -6
  47. diffsynth_engine-0.4.0/diffsynth_engine/utils/__init__.py +0 -0
  48. diffsynth_engine-0.4.0/diffsynth_engine/utils/offload.py +0 -36
  49. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/.gitignore +0 -0
  50. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/.pre-commit-config.yaml +0 -0
  51. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/LICENSE +0 -0
  52. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/MANIFEST.in +0 -0
  53. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/assets/dingtalk.png +0 -0
  54. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/assets/showcase.jpeg +0 -0
  55. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/__init__.py +0 -0
  56. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/noise_scheduler/__init__.py +0 -0
  57. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/noise_scheduler/base_scheduler.py +0 -0
  58. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/noise_scheduler/flow_match/__init__.py +0 -0
  59. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/noise_scheduler/flow_match/flow_beta.py +0 -0
  60. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/noise_scheduler/flow_match/flow_ddim.py +0 -0
  61. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/noise_scheduler/flow_match/recifited_flow.py +0 -0
  62. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/noise_scheduler/stable_diffusion/__init__.py +0 -0
  63. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/noise_scheduler/stable_diffusion/beta.py +0 -0
  64. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/noise_scheduler/stable_diffusion/ddim.py +0 -0
  65. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/noise_scheduler/stable_diffusion/exponential.py +0 -0
  66. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/noise_scheduler/stable_diffusion/karras.py +0 -0
  67. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/noise_scheduler/stable_diffusion/linear.py +0 -0
  68. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/noise_scheduler/stable_diffusion/sgm_uniform.py +0 -0
  69. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/sampler/__init__.py +0 -0
  70. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/sampler/flow_match/__init__.py +0 -0
  71. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/sampler/flow_match/flow_match_euler.py +0 -0
  72. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/sampler/stable_diffusion/__init__.py +0 -0
  73. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/sampler/stable_diffusion/brownian_tree.py +0 -0
  74. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/sampler/stable_diffusion/ddpm.py +0 -0
  75. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/sampler/stable_diffusion/deis.py +0 -0
  76. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/sampler/stable_diffusion/dpmpp_2m.py +0 -0
  77. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/sampler/stable_diffusion/dpmpp_2m_sde.py +0 -0
  78. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/sampler/stable_diffusion/dpmpp_3m_sde.py +0 -0
  79. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/sampler/stable_diffusion/epsilon.py +0 -0
  80. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/sampler/stable_diffusion/euler.py +0 -0
  81. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/sampler/stable_diffusion/euler_ancestral.py +0 -0
  82. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/models/components/vae.json +0 -0
  83. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/models/flux/flux_dit.json +0 -0
  84. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/models/flux/flux_text_encoder.json +0 -0
  85. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/models/flux/flux_vae.json +0 -0
  86. /diffsynth_engine-0.4.0/diffsynth_engine/conf/models/wan/vae/wan2.1-vae.json → /diffsynth_engine-0.4.1/diffsynth_engine/conf/models/qwen_image/qwen_image_vae.json +0 -0
  87. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/models/sd/sd_text_encoder.json +0 -0
  88. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/models/sd/sd_unet.json +0 -0
  89. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/models/sd3/sd3_dit.json +0 -0
  90. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/models/sd3/sd3_text_encoder.json +0 -0
  91. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/models/sdxl/sdxl_text_encoder.json +0 -0
  92. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/models/sdxl/sdxl_unet.json +0 -0
  93. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/models/wan/dit/wan2.1-flf2v-14b.json +0 -0
  94. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/models/wan/dit/wan2.1-i2v-14b.json +0 -0
  95. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/models/wan/dit/wan2.1-t2v-1.3b.json +0 -0
  96. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/models/wan/dit/wan2.1-t2v-14b.json +0 -0
  97. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/models/wan/dit/wan2.2-i2v-a14b.json +0 -0
  98. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/models/wan/dit/wan2.2-t2v-a14b.json +0 -0
  99. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/models/wan/dit/wan2.2-ti2v-5b.json +0 -0
  100. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/models/wan/vae/wan2.2-vae.json +0 -0
  101. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/tokenizers/flux/tokenizer_1/merges.txt +0 -0
  102. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/tokenizers/flux/tokenizer_1/special_tokens_map.json +0 -0
  103. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/tokenizers/flux/tokenizer_1/tokenizer_config.json +0 -0
  104. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/tokenizers/flux/tokenizer_1/vocab.json +0 -0
  105. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/tokenizers/flux/tokenizer_2/special_tokens_map.json +0 -0
  106. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/tokenizers/flux/tokenizer_2/spiece.model +0 -0
  107. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/tokenizers/flux/tokenizer_2/tokenizer.json +0 -0
  108. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/tokenizers/flux/tokenizer_2/tokenizer_config.json +0 -0
  109. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/tokenizers/sdxl/tokenizer/merges.txt +0 -0
  110. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/tokenizers/sdxl/tokenizer/special_tokens_map.json +0 -0
  111. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/tokenizers/sdxl/tokenizer/tokenizer_config.json +0 -0
  112. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/tokenizers/sdxl/tokenizer/vocab.json +0 -0
  113. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/tokenizers/sdxl/tokenizer_2/merges.txt +0 -0
  114. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/tokenizers/sdxl/tokenizer_2/special_tokens_map.json +0 -0
  115. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/tokenizers/sdxl/tokenizer_2/tokenizer_config.json +0 -0
  116. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/tokenizers/sdxl/tokenizer_2/vocab.json +0 -0
  117. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/tokenizers/wan/umt5-xxl/special_tokens_map.json +0 -0
  118. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/tokenizers/wan/umt5-xxl/spiece.model +0 -0
  119. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/tokenizers/wan/umt5-xxl/tokenizer.json +0 -0
  120. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/tokenizers/wan/umt5-xxl/tokenizer_config.json +0 -0
  121. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/configs/controlnet.py +0 -0
  122. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/kernels/__init__.py +0 -0
  123. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/__init__.py +0 -0
  124. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/base.py +0 -0
  125. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/basic/__init__.py +0 -0
  126. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/basic/attention.py +0 -0
  127. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/basic/lora.py +0 -0
  128. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/basic/relative_position_emb.py +0 -0
  129. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/basic/timestep.py +0 -0
  130. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/basic/unet_helper.py +0 -0
  131. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/flux/__init__.py +0 -0
  132. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/flux/flux_controlnet.py +0 -0
  133. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/flux/flux_dit.py +0 -0
  134. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/flux/flux_dit_fbcache.py +0 -0
  135. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/flux/flux_ipadapter.py +0 -0
  136. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/flux/flux_redux.py +0 -0
  137. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/flux/flux_text_encoder.py +0 -0
  138. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/flux/flux_vae.py +0 -0
  139. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/sd/__init__.py +0 -0
  140. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/sd/sd_controlnet.py +0 -0
  141. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/sd/sd_text_encoder.py +0 -0
  142. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/sd/sd_unet.py +0 -0
  143. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/sd/sd_vae.py +0 -0
  144. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/sd3/__init__.py +0 -0
  145. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/sd3/sd3_dit.py +0 -0
  146. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/sd3/sd3_text_encoder.py +0 -0
  147. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/sd3/sd3_vae.py +0 -0
  148. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/sdxl/__init__.py +0 -0
  149. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/sdxl/sdxl_controlnet.py +0 -0
  150. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/sdxl/sdxl_text_encoder.py +0 -0
  151. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/sdxl/sdxl_unet.py +0 -0
  152. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/sdxl/sdxl_vae.py +0 -0
  153. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/text_encoder/__init__.py +0 -0
  154. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/text_encoder/clip.py +0 -0
  155. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/text_encoder/siglip.py +0 -0
  156. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/text_encoder/t5.py +0 -0
  157. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/utils.py +0 -0
  158. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/vae/__init__.py +0 -0
  159. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/vae/vae.py +0 -0
  160. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/wan/wan_dit.py +0 -0
  161. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/wan/wan_image_encoder.py +0 -0
  162. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/wan/wan_text_encoder.py +0 -0
  163. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/pipelines/wan_video.py +0 -0
  164. {diffsynth_engine-0.4.0/diffsynth_engine/models/wan → diffsynth_engine-0.4.1/diffsynth_engine/processor}/__init__.py +0 -0
  165. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/processor/canny_processor.py +0 -0
  166. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/processor/depth_processor.py +0 -0
  167. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/tokenizers/base.py +0 -0
  168. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/tokenizers/wan.py +0 -0
  169. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/tools/__init__.py +0 -0
  170. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/tools/flux_inpainting_tool.py +0 -0
  171. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/tools/flux_outpainting_tool.py +0 -0
  172. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/tools/flux_reference_tool.py +0 -0
  173. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/tools/flux_replace_tool.py +0 -0
  174. {diffsynth_engine-0.4.0/diffsynth_engine/processor → diffsynth_engine-0.4.1/diffsynth_engine/utils}/__init__.py +0 -0
  175. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/utils/download.py +0 -0
  176. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/utils/env.py +0 -0
  177. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/utils/flag.py +0 -0
  178. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/utils/fp8_linear.py +0 -0
  179. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/utils/gguf.py +0 -0
  180. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/utils/image.py +0 -0
  181. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/utils/loader.py +0 -0
  182. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/utils/lock.py +0 -0
  183. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/utils/logging.py +0 -0
  184. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/utils/onnx.py +0 -0
  185. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/utils/parallel.py +0 -0
  186. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/utils/platform.py +0 -0
  187. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/utils/prompt.py +0 -0
  188. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/utils/video.py +0 -0
  189. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine.egg-info/dependency_links.txt +0 -0
  190. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine.egg-info/top_level.txt +0 -0
  191. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/setup.cfg +0 -0
  192. {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/setup.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: diffsynth_engine
3
- Version: 0.4.0
3
+ Version: 0.4.1
4
4
  Author: MuseAI x ModelScope
5
5
  Classifier: Programming Language :: Python :: 3
6
6
  Classifier: Operating System :: OS Independent
@@ -28,6 +28,7 @@ Requires-Dist: opencv-python
28
28
  Provides-Extra: dev
29
29
  Requires-Dist: diffusers==0.31.0; extra == "dev"
30
30
  Requires-Dist: transformers==4.45.2; extra == "dev"
31
+ Requires-Dist: accelerate; extra == "dev"
31
32
  Requires-Dist: build; extra == "dev"
32
33
  Requires-Dist: ruff; extra == "dev"
33
34
  Requires-Dist: scikit-image; extra == "dev"
@@ -23,6 +23,7 @@ and offloading strategies, enabling loading of larger diffusion models (e.g., Fl
23
23
 
24
24
  ## News
25
25
 
26
+ - **[v0.4.1](https://github.com/modelscope/DiffSynth-Engine/releases/tag/v0.4.1)** | **August 4, 2025**: 🔥Supports [Qwen-Image](https://www.modelscope.cn/models/Qwen/Qwen-Image), an image generation model that excels at complex text rendering and creating images in a wide range of artistic styles.
26
27
  - **[v0.4.0](https://github.com/modelscope/DiffSynth-Engine/releases/tag/v0.4.0)** | **August 1, 2025**:
27
28
  - 🔥Supports [Wan2.2](https://modelscope.cn/collections/tongyiwanxiang-22--shipinshengcheng-2bb5b1adef2840) video generation model
28
29
  - ⚠️[**Breaking Change**] Improved `from_pretrained` method pipeline initialization
@@ -49,21 +50,24 @@ pip3 install -e .
49
50
  ### Usage
50
51
  Text to image
51
52
  ```python
52
- from diffsynth_engine import fetch_model, FluxImagePipeline
53
+ from diffsynth_engine import fetch_model, FluxImagePipeline, FluxPipelineConfig
53
54
 
54
55
  model_path = fetch_model("muse/flux-with-vae", path="flux1-dev-with-vae.safetensors")
55
- pipe = FluxImagePipeline.from_pretrained(model_path, device='cuda:0')
56
+
57
+ config = FluxPipelineConfig.basic_config(model_path=model_path, device="cuda:0")
58
+ pipe = FluxImagePipeline.from_pretrained(config)
56
59
  image = pipe(prompt="a cat")
57
60
  image.save("image.png")
58
61
  ```
59
62
  Text to image with LoRA
60
63
  ```python
61
- from diffsynth_engine import fetch_model, FluxImagePipeline
64
+ from diffsynth_engine import fetch_model, FluxImagePipeline, FluxPipelineConfig
62
65
 
63
66
  model_path = fetch_model("muse/flux-with-vae", path="flux1-dev-with-vae.safetensors")
64
67
  lora_path = fetch_model("DonRat/MAJICFLUS_SuperChinesestyleheongsam", path="麦橘超国风旗袍.safetensors")
65
68
 
66
- pipe = FluxImagePipeline.from_pretrained(model_path, device='cuda:0')
69
+ config = FluxPipelineConfig.basic_config(model_path=model_path, device="cuda:0")
70
+ pipe = FluxImagePipeline.from_pretrained(config)
67
71
  pipe.load_lora(path=lora_path, scale=1.0)
68
72
  image = pipe(prompt="a girl, qipao")
69
73
  image.save("image.png")
@@ -3,6 +3,7 @@ from .configs import (
3
3
  SDXLPipelineConfig,
4
4
  FluxPipelineConfig,
5
5
  WanPipelineConfig,
6
+ QwenImagePipelineConfig,
6
7
  ControlNetParams,
7
8
  ControlType,
8
9
  )
@@ -11,6 +12,7 @@ from .pipelines import (
11
12
  SDXLImagePipeline,
12
13
  SDImagePipeline,
13
14
  WanVideoPipeline,
15
+ QwenImagePipeline,
14
16
  )
15
17
  from .models.flux import FluxControlNet, FluxIPAdapter, FluxRedux
16
18
  from .models.sd import SDControlNet
@@ -31,6 +33,7 @@ __all__ = [
31
33
  "FluxPipelineConfig",
32
34
  "WanPipelineConfig",
33
35
  "FluxImagePipeline",
36
+ "QwenImagePipelineConfig",
34
37
  "FluxControlNet",
35
38
  "FluxIPAdapter",
36
39
  "FluxRedux",
@@ -39,6 +42,7 @@ __all__ = [
39
42
  "SDXLImagePipeline",
40
43
  "SDImagePipeline",
41
44
  "WanVideoPipeline",
45
+ "QwenImagePipeline",
42
46
  "FluxInpaintingTool",
43
47
  "FluxOutpaintingTool",
44
48
  "FluxIPAdapterRefTool",
@@ -0,0 +1,25 @@
1
+ {
2
+ "hidden_size": 3584,
3
+ "intermediate_size": 18944,
4
+ "num_hidden_layers": 28,
5
+ "num_attention_heads": 28,
6
+ "num_key_value_heads": 4,
7
+ "mrope_section": [
8
+ 16,
9
+ 24,
10
+ 24
11
+ ],
12
+ "rms_norm_eps": 1e-6,
13
+ "use_cache": true,
14
+ "use_sliding_window": false,
15
+ "sliding_window": 32768,
16
+ "max_window_layers": 28,
17
+ "vocab_size": 152064,
18
+ "pad_token_id": 151643,
19
+ "im_start_token_id": 151644,
20
+ "im_end_token_id": 151645,
21
+ "vision_start_token_id": 151652,
22
+ "vision_end_token_id": 151653,
23
+ "image_token_id": 151655,
24
+ "video_token_id": 151656
25
+ }
@@ -0,0 +1,19 @@
1
+ {
2
+ "in_channels": 3,
3
+ "hidden_size": 1280,
4
+ "intermediate_size": 3420,
5
+ "out_hidden_size": 3584,
6
+ "num_heads": 16,
7
+ "depth": 32,
8
+ "patch_size": 14,
9
+ "temporal_patch_size": 2,
10
+ "spatial_merge_size": 2,
11
+ "tokens_per_second": 2,
12
+ "window_size": 112,
13
+ "fullatt_block_indexes": [
14
+ 7,
15
+ 15,
16
+ 23,
17
+ 31
18
+ ]
19
+ }
@@ -0,0 +1,244 @@
1
+ {
2
+ "diffusers": {
3
+ "rename_dict": {
4
+ "model.post_quant_conv.bias": "model.conv2.bias",
5
+ "model.post_quant_conv.weight": "model.conv2.weight",
6
+ "model.quant_conv.bias": "model.conv1.bias",
7
+ "model.quant_conv.weight": "model.conv1.weight",
8
+ "model.encoder.conv_in.bias": "model.encoder.conv1.bias",
9
+ "model.encoder.conv_in.weight": "model.encoder.conv1.weight",
10
+ "model.encoder.down_blocks.0.conv_shortcut.bias": "model.encoder.downsamples.0.shortcut.bias",
11
+ "model.encoder.down_blocks.0.conv_shortcut.weight": "model.encoder.downsamples.0.shortcut.weight",
12
+ "model.encoder.down_blocks.0.conv1.bias": "model.encoder.downsamples.0.residual.2.bias",
13
+ "model.encoder.down_blocks.0.conv1.weight": "model.encoder.downsamples.0.residual.2.weight",
14
+ "model.encoder.down_blocks.0.conv2.bias": "model.encoder.downsamples.0.residual.6.bias",
15
+ "model.encoder.down_blocks.0.conv2.weight": "model.encoder.downsamples.0.residual.6.weight",
16
+ "model.encoder.down_blocks.0.norm1.gamma": "model.encoder.downsamples.0.residual.0.gamma",
17
+ "model.encoder.down_blocks.0.norm2.gamma": "model.encoder.downsamples.0.residual.3.gamma",
18
+ "model.encoder.down_blocks.1.conv_shortcut.bias": "model.encoder.downsamples.1.shortcut.bias",
19
+ "model.encoder.down_blocks.1.conv_shortcut.weight": "model.encoder.downsamples.1.shortcut.weight",
20
+ "model.encoder.down_blocks.1.conv1.bias": "model.encoder.downsamples.1.residual.2.bias",
21
+ "model.encoder.down_blocks.1.conv1.weight": "model.encoder.downsamples.1.residual.2.weight",
22
+ "model.encoder.down_blocks.1.conv2.bias": "model.encoder.downsamples.1.residual.6.bias",
23
+ "model.encoder.down_blocks.1.conv2.weight": "model.encoder.downsamples.1.residual.6.weight",
24
+ "model.encoder.down_blocks.1.norm1.gamma": "model.encoder.downsamples.1.residual.0.gamma",
25
+ "model.encoder.down_blocks.1.norm2.gamma": "model.encoder.downsamples.1.residual.3.gamma",
26
+ "model.encoder.down_blocks.2.resample.1.bias": "model.encoder.downsamples.2.resample.1.bias",
27
+ "model.encoder.down_blocks.2.resample.1.weight": "model.encoder.downsamples.2.resample.1.weight",
28
+ "model.encoder.down_blocks.2.time_conv.bias": "model.encoder.downsamples.2.time_conv.bias",
29
+ "model.encoder.down_blocks.2.time_conv.weight": "model.encoder.downsamples.2.time_conv.weight",
30
+ "model.encoder.down_blocks.3.conv_shortcut.bias": "model.encoder.downsamples.3.shortcut.bias",
31
+ "model.encoder.down_blocks.3.conv_shortcut.weight": "model.encoder.downsamples.3.shortcut.weight",
32
+ "model.encoder.down_blocks.3.conv1.bias": "model.encoder.downsamples.3.residual.2.bias",
33
+ "model.encoder.down_blocks.3.conv1.weight": "model.encoder.downsamples.3.residual.2.weight",
34
+ "model.encoder.down_blocks.3.conv2.bias": "model.encoder.downsamples.3.residual.6.bias",
35
+ "model.encoder.down_blocks.3.conv2.weight": "model.encoder.downsamples.3.residual.6.weight",
36
+ "model.encoder.down_blocks.3.norm1.gamma": "model.encoder.downsamples.3.residual.0.gamma",
37
+ "model.encoder.down_blocks.3.norm2.gamma": "model.encoder.downsamples.3.residual.3.gamma",
38
+ "model.encoder.down_blocks.4.conv_shortcut.bias": "model.encoder.downsamples.4.shortcut.bias",
39
+ "model.encoder.down_blocks.4.conv_shortcut.weight": "model.encoder.downsamples.4.shortcut.weight",
40
+ "model.encoder.down_blocks.4.conv1.bias": "model.encoder.downsamples.4.residual.2.bias",
41
+ "model.encoder.down_blocks.4.conv1.weight": "model.encoder.downsamples.4.residual.2.weight",
42
+ "model.encoder.down_blocks.4.conv2.bias": "model.encoder.downsamples.4.residual.6.bias",
43
+ "model.encoder.down_blocks.4.conv2.weight": "model.encoder.downsamples.4.residual.6.weight",
44
+ "model.encoder.down_blocks.4.norm1.gamma": "model.encoder.downsamples.4.residual.0.gamma",
45
+ "model.encoder.down_blocks.4.norm2.gamma": "model.encoder.downsamples.4.residual.3.gamma",
46
+ "model.encoder.down_blocks.5.resample.1.bias": "model.encoder.downsamples.5.resample.1.bias",
47
+ "model.encoder.down_blocks.5.resample.1.weight": "model.encoder.downsamples.5.resample.1.weight",
48
+ "model.encoder.down_blocks.5.time_conv.bias": "model.encoder.downsamples.5.time_conv.bias",
49
+ "model.encoder.down_blocks.5.time_conv.weight": "model.encoder.downsamples.5.time_conv.weight",
50
+ "model.encoder.down_blocks.6.conv_shortcut.bias": "model.encoder.downsamples.6.shortcut.bias",
51
+ "model.encoder.down_blocks.6.conv_shortcut.weight": "model.encoder.downsamples.6.shortcut.weight",
52
+ "model.encoder.down_blocks.6.conv1.bias": "model.encoder.downsamples.6.residual.2.bias",
53
+ "model.encoder.down_blocks.6.conv1.weight": "model.encoder.downsamples.6.residual.2.weight",
54
+ "model.encoder.down_blocks.6.conv2.bias": "model.encoder.downsamples.6.residual.6.bias",
55
+ "model.encoder.down_blocks.6.conv2.weight": "model.encoder.downsamples.6.residual.6.weight",
56
+ "model.encoder.down_blocks.6.norm1.gamma": "model.encoder.downsamples.6.residual.0.gamma",
57
+ "model.encoder.down_blocks.6.norm2.gamma": "model.encoder.downsamples.6.residual.3.gamma",
58
+ "model.encoder.down_blocks.7.conv_shortcut.bias": "model.encoder.downsamples.7.shortcut.bias",
59
+ "model.encoder.down_blocks.7.conv_shortcut.weight": "model.encoder.downsamples.7.shortcut.weight",
60
+ "model.encoder.down_blocks.7.conv1.bias": "model.encoder.downsamples.7.residual.2.bias",
61
+ "model.encoder.down_blocks.7.conv1.weight": "model.encoder.downsamples.7.residual.2.weight",
62
+ "model.encoder.down_blocks.7.conv2.bias": "model.encoder.downsamples.7.residual.6.bias",
63
+ "model.encoder.down_blocks.7.conv2.weight": "model.encoder.downsamples.7.residual.6.weight",
64
+ "model.encoder.down_blocks.7.norm1.gamma": "model.encoder.downsamples.7.residual.0.gamma",
65
+ "model.encoder.down_blocks.7.norm2.gamma": "model.encoder.downsamples.7.residual.3.gamma",
66
+ "model.encoder.down_blocks.8.resample.1.bias": "model.encoder.downsamples.8.resample.1.bias",
67
+ "model.encoder.down_blocks.8.resample.1.weight": "model.encoder.downsamples.8.resample.1.weight",
68
+ "model.encoder.down_blocks.8.time_conv.bias": "model.encoder.downsamples.8.time_conv.bias",
69
+ "model.encoder.down_blocks.8.time_conv.weight": "model.encoder.downsamples.8.time_conv.weight",
70
+ "model.encoder.down_blocks.9.conv_shortcut.bias": "model.encoder.downsamples.9.shortcut.bias",
71
+ "model.encoder.down_blocks.9.conv_shortcut.weight": "model.encoder.downsamples.9.shortcut.weight",
72
+ "model.encoder.down_blocks.9.conv1.bias": "model.encoder.downsamples.9.residual.2.bias",
73
+ "model.encoder.down_blocks.9.conv1.weight": "model.encoder.downsamples.9.residual.2.weight",
74
+ "model.encoder.down_blocks.9.conv2.bias": "model.encoder.downsamples.9.residual.6.bias",
75
+ "model.encoder.down_blocks.9.conv2.weight": "model.encoder.downsamples.9.residual.6.weight",
76
+ "model.encoder.down_blocks.9.norm1.gamma": "model.encoder.downsamples.9.residual.0.gamma",
77
+ "model.encoder.down_blocks.9.norm2.gamma": "model.encoder.downsamples.9.residual.3.gamma",
78
+ "model.encoder.down_blocks.10.conv_shortcut.bias": "model.encoder.downsamples.10.shortcut.bias",
79
+ "model.encoder.down_blocks.10.conv_shortcut.weight": "model.encoder.downsamples.10.shortcut.weight",
80
+ "model.encoder.down_blocks.10.conv1.bias": "model.encoder.downsamples.10.residual.2.bias",
81
+ "model.encoder.down_blocks.10.conv1.weight": "model.encoder.downsamples.10.residual.2.weight",
82
+ "model.encoder.down_blocks.10.conv2.bias": "model.encoder.downsamples.10.residual.6.bias",
83
+ "model.encoder.down_blocks.10.conv2.weight": "model.encoder.downsamples.10.residual.6.weight",
84
+ "model.encoder.down_blocks.10.norm1.gamma": "model.encoder.downsamples.10.residual.0.gamma",
85
+ "model.encoder.down_blocks.10.norm2.gamma": "model.encoder.downsamples.10.residual.3.gamma",
86
+ "model.encoder.mid_block.attentions.0.norm.gamma": "model.encoder.middle.1.norm.gamma",
87
+ "model.encoder.mid_block.attentions.0.proj.bias": "model.encoder.middle.1.proj.bias",
88
+ "model.encoder.mid_block.attentions.0.proj.weight": "model.encoder.middle.1.proj.weight",
89
+ "model.encoder.mid_block.attentions.0.to_qkv.bias": "model.encoder.middle.1.to_qkv.bias",
90
+ "model.encoder.mid_block.attentions.0.to_qkv.weight": "model.encoder.middle.1.to_qkv.weight",
91
+ "model.encoder.mid_block.resnets.0.conv_shortcut.bias": "model.encoder.middle.0.shortcut.bias",
92
+ "model.encoder.mid_block.resnets.0.conv_shortcut.weight": "model.encoder.middle.0.shortcut.weight",
93
+ "model.encoder.mid_block.resnets.0.conv1.bias": "model.encoder.middle.0.residual.2.bias",
94
+ "model.encoder.mid_block.resnets.0.conv1.weight": "model.encoder.middle.0.residual.2.weight",
95
+ "model.encoder.mid_block.resnets.0.conv2.bias": "model.encoder.middle.0.residual.6.bias",
96
+ "model.encoder.mid_block.resnets.0.conv2.weight": "model.encoder.middle.0.residual.6.weight",
97
+ "model.encoder.mid_block.resnets.0.norm1.gamma": "model.encoder.middle.0.residual.0.gamma",
98
+ "model.encoder.mid_block.resnets.0.norm2.gamma": "model.encoder.middle.0.residual.3.gamma",
99
+ "model.encoder.mid_block.resnets.1.conv_shortcut.bias": "model.encoder.middle.2.shortcut.bias",
100
+ "model.encoder.mid_block.resnets.1.conv_shortcut.weight": "model.encoder.middle.2.shortcut.weight",
101
+ "model.encoder.mid_block.resnets.1.conv1.bias": "model.encoder.middle.2.residual.2.bias",
102
+ "model.encoder.mid_block.resnets.1.conv1.weight": "model.encoder.middle.2.residual.2.weight",
103
+ "model.encoder.mid_block.resnets.1.conv2.bias": "model.encoder.middle.2.residual.6.bias",
104
+ "model.encoder.mid_block.resnets.1.conv2.weight": "model.encoder.middle.2.residual.6.weight",
105
+ "model.encoder.mid_block.resnets.1.norm1.gamma": "model.encoder.middle.2.residual.0.gamma",
106
+ "model.encoder.mid_block.resnets.1.norm2.gamma": "model.encoder.middle.2.residual.3.gamma",
107
+ "model.encoder.norm_out.gamma": "model.encoder.head.0.gamma",
108
+ "model.encoder.conv_out.bias": "model.encoder.head.2.bias",
109
+ "model.encoder.conv_out.weight": "model.encoder.head.2.weight",
110
+ "model.decoder.conv_in.bias": "model.decoder.conv1.bias",
111
+ "model.decoder.conv_in.weight": "model.decoder.conv1.weight",
112
+ "model.decoder.mid_block.attentions.0.norm.gamma": "model.decoder.middle.1.norm.gamma",
113
+ "model.decoder.mid_block.attentions.0.proj.bias": "model.decoder.middle.1.proj.bias",
114
+ "model.decoder.mid_block.attentions.0.proj.weight": "model.decoder.middle.1.proj.weight",
115
+ "model.decoder.mid_block.attentions.0.to_qkv.bias": "model.decoder.middle.1.to_qkv.bias",
116
+ "model.decoder.mid_block.attentions.0.to_qkv.weight": "model.decoder.middle.1.to_qkv.weight",
117
+ "model.decoder.mid_block.resnets.0.conv_shortcut.bias": "model.decoder.middle.0.shortcut.bias",
118
+ "model.decoder.mid_block.resnets.0.conv_shortcut.weight": "model.decoder.middle.0.shortcut.weight",
119
+ "model.decoder.mid_block.resnets.0.conv1.bias": "model.decoder.middle.0.residual.2.bias",
120
+ "model.decoder.mid_block.resnets.0.conv1.weight": "model.decoder.middle.0.residual.2.weight",
121
+ "model.decoder.mid_block.resnets.0.conv2.bias": "model.decoder.middle.0.residual.6.bias",
122
+ "model.decoder.mid_block.resnets.0.conv2.weight": "model.decoder.middle.0.residual.6.weight",
123
+ "model.decoder.mid_block.resnets.0.norm1.gamma": "model.decoder.middle.0.residual.0.gamma",
124
+ "model.decoder.mid_block.resnets.0.norm2.gamma": "model.decoder.middle.0.residual.3.gamma",
125
+ "model.decoder.mid_block.resnets.1.conv_shortcut.bias": "model.decoder.middle.2.shortcut.bias",
126
+ "model.decoder.mid_block.resnets.1.conv_shortcut.weight": "model.decoder.middle.2.shortcut.weight",
127
+ "model.decoder.mid_block.resnets.1.conv1.bias": "model.decoder.middle.2.residual.2.bias",
128
+ "model.decoder.mid_block.resnets.1.conv1.weight": "model.decoder.middle.2.residual.2.weight",
129
+ "model.decoder.mid_block.resnets.1.conv2.bias": "model.decoder.middle.2.residual.6.bias",
130
+ "model.decoder.mid_block.resnets.1.conv2.weight": "model.decoder.middle.2.residual.6.weight",
131
+ "model.decoder.mid_block.resnets.1.norm1.gamma": "model.decoder.middle.2.residual.0.gamma",
132
+ "model.decoder.mid_block.resnets.1.norm2.gamma": "model.decoder.middle.2.residual.3.gamma",
133
+ "model.decoder.up_blocks.0.resnets.0.conv_shortcut.bias": "model.decoder.upsamples.0.shortcut.bias",
134
+ "model.decoder.up_blocks.0.resnets.0.conv_shortcut.weight": "model.decoder.upsamples.0.shortcut.weight",
135
+ "model.decoder.up_blocks.0.resnets.0.conv1.bias": "model.decoder.upsamples.0.residual.2.bias",
136
+ "model.decoder.up_blocks.0.resnets.0.conv1.weight": "model.decoder.upsamples.0.residual.2.weight",
137
+ "model.decoder.up_blocks.0.resnets.0.conv2.bias": "model.decoder.upsamples.0.residual.6.bias",
138
+ "model.decoder.up_blocks.0.resnets.0.conv2.weight": "model.decoder.upsamples.0.residual.6.weight",
139
+ "model.decoder.up_blocks.0.resnets.0.norm1.gamma": "model.decoder.upsamples.0.residual.0.gamma",
140
+ "model.decoder.up_blocks.0.resnets.0.norm2.gamma": "model.decoder.upsamples.0.residual.3.gamma",
141
+ "model.decoder.up_blocks.0.resnets.1.conv_shortcut.bias": "model.decoder.upsamples.1.shortcut.bias",
142
+ "model.decoder.up_blocks.0.resnets.1.conv_shortcut.weight": "model.decoder.upsamples.1.shortcut.weight",
143
+ "model.decoder.up_blocks.0.resnets.1.conv1.bias": "model.decoder.upsamples.1.residual.2.bias",
144
+ "model.decoder.up_blocks.0.resnets.1.conv1.weight": "model.decoder.upsamples.1.residual.2.weight",
145
+ "model.decoder.up_blocks.0.resnets.1.conv2.bias": "model.decoder.upsamples.1.residual.6.bias",
146
+ "model.decoder.up_blocks.0.resnets.1.conv2.weight": "model.decoder.upsamples.1.residual.6.weight",
147
+ "model.decoder.up_blocks.0.resnets.1.norm1.gamma": "model.decoder.upsamples.1.residual.0.gamma",
148
+ "model.decoder.up_blocks.0.resnets.1.norm2.gamma": "model.decoder.upsamples.1.residual.3.gamma",
149
+ "model.decoder.up_blocks.0.resnets.2.conv_shortcut.bias": "model.decoder.upsamples.2.shortcut.bias",
150
+ "model.decoder.up_blocks.0.resnets.2.conv_shortcut.weight": "model.decoder.upsamples.2.shortcut.weight",
151
+ "model.decoder.up_blocks.0.resnets.2.conv1.bias": "model.decoder.upsamples.2.residual.2.bias",
152
+ "model.decoder.up_blocks.0.resnets.2.conv1.weight": "model.decoder.upsamples.2.residual.2.weight",
153
+ "model.decoder.up_blocks.0.resnets.2.conv2.bias": "model.decoder.upsamples.2.residual.6.bias",
154
+ "model.decoder.up_blocks.0.resnets.2.conv2.weight": "model.decoder.upsamples.2.residual.6.weight",
155
+ "model.decoder.up_blocks.0.resnets.2.norm1.gamma": "model.decoder.upsamples.2.residual.0.gamma",
156
+ "model.decoder.up_blocks.0.resnets.2.norm2.gamma": "model.decoder.upsamples.2.residual.3.gamma",
157
+ "model.decoder.up_blocks.0.upsamplers.0.resample.1.bias": "model.decoder.upsamples.3.resample.1.bias",
158
+ "model.decoder.up_blocks.0.upsamplers.0.resample.1.weight": "model.decoder.upsamples.3.resample.1.weight",
159
+ "model.decoder.up_blocks.0.upsamplers.0.time_conv.bias": "model.decoder.upsamples.3.time_conv.bias",
160
+ "model.decoder.up_blocks.0.upsamplers.0.time_conv.weight": "model.decoder.upsamples.3.time_conv.weight",
161
+ "model.decoder.up_blocks.1.resnets.0.conv_shortcut.bias": "model.decoder.upsamples.4.shortcut.bias",
162
+ "model.decoder.up_blocks.1.resnets.0.conv_shortcut.weight": "model.decoder.upsamples.4.shortcut.weight",
163
+ "model.decoder.up_blocks.1.resnets.0.conv1.bias": "model.decoder.upsamples.4.residual.2.bias",
164
+ "model.decoder.up_blocks.1.resnets.0.conv1.weight": "model.decoder.upsamples.4.residual.2.weight",
165
+ "model.decoder.up_blocks.1.resnets.0.conv2.bias": "model.decoder.upsamples.4.residual.6.bias",
166
+ "model.decoder.up_blocks.1.resnets.0.conv2.weight": "model.decoder.upsamples.4.residual.6.weight",
167
+ "model.decoder.up_blocks.1.resnets.0.norm1.gamma": "model.decoder.upsamples.4.residual.0.gamma",
168
+ "model.decoder.up_blocks.1.resnets.0.norm2.gamma": "model.decoder.upsamples.4.residual.3.gamma",
169
+ "model.decoder.up_blocks.1.resnets.1.conv_shortcut.bias": "model.decoder.upsamples.5.shortcut.bias",
170
+ "model.decoder.up_blocks.1.resnets.1.conv_shortcut.weight": "model.decoder.upsamples.5.shortcut.weight",
171
+ "model.decoder.up_blocks.1.resnets.1.conv1.bias": "model.decoder.upsamples.5.residual.2.bias",
172
+ "model.decoder.up_blocks.1.resnets.1.conv1.weight": "model.decoder.upsamples.5.residual.2.weight",
173
+ "model.decoder.up_blocks.1.resnets.1.conv2.bias": "model.decoder.upsamples.5.residual.6.bias",
174
+ "model.decoder.up_blocks.1.resnets.1.conv2.weight": "model.decoder.upsamples.5.residual.6.weight",
175
+ "model.decoder.up_blocks.1.resnets.1.norm1.gamma": "model.decoder.upsamples.5.residual.0.gamma",
176
+ "model.decoder.up_blocks.1.resnets.1.norm2.gamma": "model.decoder.upsamples.5.residual.3.gamma",
177
+ "model.decoder.up_blocks.1.resnets.2.conv_shortcut.bias": "model.decoder.upsamples.6.shortcut.bias",
178
+ "model.decoder.up_blocks.1.resnets.2.conv_shortcut.weight": "model.decoder.upsamples.6.shortcut.weight",
179
+ "model.decoder.up_blocks.1.resnets.2.conv1.bias": "model.decoder.upsamples.6.residual.2.bias",
180
+ "model.decoder.up_blocks.1.resnets.2.conv1.weight": "model.decoder.upsamples.6.residual.2.weight",
181
+ "model.decoder.up_blocks.1.resnets.2.conv2.bias": "model.decoder.upsamples.6.residual.6.bias",
182
+ "model.decoder.up_blocks.1.resnets.2.conv2.weight": "model.decoder.upsamples.6.residual.6.weight",
183
+ "model.decoder.up_blocks.1.resnets.2.norm1.gamma": "model.decoder.upsamples.6.residual.0.gamma",
184
+ "model.decoder.up_blocks.1.resnets.2.norm2.gamma": "model.decoder.upsamples.6.residual.3.gamma",
185
+ "model.decoder.up_blocks.1.upsamplers.0.resample.1.bias": "model.decoder.upsamples.7.resample.1.bias",
186
+ "model.decoder.up_blocks.1.upsamplers.0.resample.1.weight": "model.decoder.upsamples.7.resample.1.weight",
187
+ "model.decoder.up_blocks.1.upsamplers.0.time_conv.bias": "model.decoder.upsamples.7.time_conv.bias",
188
+ "model.decoder.up_blocks.1.upsamplers.0.time_conv.weight": "model.decoder.upsamples.7.time_conv.weight",
189
+ "model.decoder.up_blocks.2.resnets.0.conv_shortcut.bias": "model.decoder.upsamples.8.shortcut.bias",
190
+ "model.decoder.up_blocks.2.resnets.0.conv_shortcut.weight": "model.decoder.upsamples.8.shortcut.weight",
191
+ "model.decoder.up_blocks.2.resnets.0.conv1.bias": "model.decoder.upsamples.8.residual.2.bias",
192
+ "model.decoder.up_blocks.2.resnets.0.conv1.weight": "model.decoder.upsamples.8.residual.2.weight",
193
+ "model.decoder.up_blocks.2.resnets.0.conv2.bias": "model.decoder.upsamples.8.residual.6.bias",
194
+ "model.decoder.up_blocks.2.resnets.0.conv2.weight": "model.decoder.upsamples.8.residual.6.weight",
195
+ "model.decoder.up_blocks.2.resnets.0.norm1.gamma": "model.decoder.upsamples.8.residual.0.gamma",
196
+ "model.decoder.up_blocks.2.resnets.0.norm2.gamma": "model.decoder.upsamples.8.residual.3.gamma",
197
+ "model.decoder.up_blocks.2.resnets.1.conv_shortcut.bias": "model.decoder.upsamples.9.shortcut.bias",
198
+ "model.decoder.up_blocks.2.resnets.1.conv_shortcut.weight": "model.decoder.upsamples.9.shortcut.weight",
199
+ "model.decoder.up_blocks.2.resnets.1.conv1.bias": "model.decoder.upsamples.9.residual.2.bias",
200
+ "model.decoder.up_blocks.2.resnets.1.conv1.weight": "model.decoder.upsamples.9.residual.2.weight",
201
+ "model.decoder.up_blocks.2.resnets.1.conv2.bias": "model.decoder.upsamples.9.residual.6.bias",
202
+ "model.decoder.up_blocks.2.resnets.1.conv2.weight": "model.decoder.upsamples.9.residual.6.weight",
203
+ "model.decoder.up_blocks.2.resnets.1.norm1.gamma": "model.decoder.upsamples.9.residual.0.gamma",
204
+ "model.decoder.up_blocks.2.resnets.1.norm2.gamma": "model.decoder.upsamples.9.residual.3.gamma",
205
+ "model.decoder.up_blocks.2.resnets.2.conv_shortcut.bias": "model.decoder.upsamples.10.shortcut.bias",
206
+ "model.decoder.up_blocks.2.resnets.2.conv_shortcut.weight": "model.decoder.upsamples.10.shortcut.weight",
207
+ "model.decoder.up_blocks.2.resnets.2.conv1.bias": "model.decoder.upsamples.10.residual.2.bias",
208
+ "model.decoder.up_blocks.2.resnets.2.conv1.weight": "model.decoder.upsamples.10.residual.2.weight",
209
+ "model.decoder.up_blocks.2.resnets.2.conv2.bias": "model.decoder.upsamples.10.residual.6.bias",
210
+ "model.decoder.up_blocks.2.resnets.2.conv2.weight": "model.decoder.upsamples.10.residual.6.weight",
211
+ "model.decoder.up_blocks.2.resnets.2.norm1.gamma": "model.decoder.upsamples.10.residual.0.gamma",
212
+ "model.decoder.up_blocks.2.resnets.2.norm2.gamma": "model.decoder.upsamples.10.residual.3.gamma",
213
+ "model.decoder.up_blocks.2.upsamplers.0.resample.1.bias": "model.decoder.upsamples.11.resample.1.bias",
214
+ "model.decoder.up_blocks.2.upsamplers.0.resample.1.weight": "model.decoder.upsamples.11.resample.1.weight",
215
+ "model.decoder.up_blocks.3.resnets.0.conv_shortcut.bias": "model.decoder.upsamples.12.shortcut.bias",
216
+ "model.decoder.up_blocks.3.resnets.0.conv_shortcut.weight": "model.decoder.upsamples.12.shortcut.weight",
217
+ "model.decoder.up_blocks.3.resnets.0.conv1.bias": "model.decoder.upsamples.12.residual.2.bias",
218
+ "model.decoder.up_blocks.3.resnets.0.conv1.weight": "model.decoder.upsamples.12.residual.2.weight",
219
+ "model.decoder.up_blocks.3.resnets.0.conv2.bias": "model.decoder.upsamples.12.residual.6.bias",
220
+ "model.decoder.up_blocks.3.resnets.0.conv2.weight": "model.decoder.upsamples.12.residual.6.weight",
221
+ "model.decoder.up_blocks.3.resnets.0.norm1.gamma": "model.decoder.upsamples.12.residual.0.gamma",
222
+ "model.decoder.up_blocks.3.resnets.0.norm2.gamma": "model.decoder.upsamples.12.residual.3.gamma",
223
+ "model.decoder.up_blocks.3.resnets.1.conv_shortcut.bias": "model.decoder.upsamples.13.shortcut.bias",
224
+ "model.decoder.up_blocks.3.resnets.1.conv_shortcut.weight": "model.decoder.upsamples.13.shortcut.weight",
225
+ "model.decoder.up_blocks.3.resnets.1.conv1.bias": "model.decoder.upsamples.13.residual.2.bias",
226
+ "model.decoder.up_blocks.3.resnets.1.conv1.weight": "model.decoder.upsamples.13.residual.2.weight",
227
+ "model.decoder.up_blocks.3.resnets.1.conv2.bias": "model.decoder.upsamples.13.residual.6.bias",
228
+ "model.decoder.up_blocks.3.resnets.1.conv2.weight": "model.decoder.upsamples.13.residual.6.weight",
229
+ "model.decoder.up_blocks.3.resnets.1.norm1.gamma": "model.decoder.upsamples.13.residual.0.gamma",
230
+ "model.decoder.up_blocks.3.resnets.1.norm2.gamma": "model.decoder.upsamples.13.residual.3.gamma",
231
+ "model.decoder.up_blocks.3.resnets.2.conv_shortcut.bias": "model.decoder.upsamples.14.shortcut.bias",
232
+ "model.decoder.up_blocks.3.resnets.2.conv_shortcut.weight": "model.decoder.upsamples.14.shortcut.weight",
233
+ "model.decoder.up_blocks.3.resnets.2.conv1.bias": "model.decoder.upsamples.14.residual.2.bias",
234
+ "model.decoder.up_blocks.3.resnets.2.conv1.weight": "model.decoder.upsamples.14.residual.2.weight",
235
+ "model.decoder.up_blocks.3.resnets.2.conv2.bias": "model.decoder.upsamples.14.residual.6.bias",
236
+ "model.decoder.up_blocks.3.resnets.2.conv2.weight": "model.decoder.upsamples.14.residual.6.weight",
237
+ "model.decoder.up_blocks.3.resnets.2.norm1.gamma": "model.decoder.upsamples.14.residual.0.gamma",
238
+ "model.decoder.up_blocks.3.resnets.2.norm2.gamma": "model.decoder.upsamples.14.residual.3.gamma",
239
+ "model.decoder.norm_out.gamma": "model.decoder.head.0.gamma",
240
+ "model.decoder.conv_out.bias": "model.decoder.head.2.bias",
241
+ "model.decoder.conv_out.weight": "model.decoder.head.2.weight"
242
+ }
243
+ }
244
+ }