diffsynth-engine 0.4.3.dev10__tar.gz → 0.4.4.dev2__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (203) hide show
  1. diffsynth_engine-0.4.4.dev2/.gitattributes +26 -0
  2. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/PKG-INFO +1 -1
  3. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/models/qwen_image/qwen2_5_vl_vision_config.json +2 -1
  4. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/configs/pipeline.py +5 -0
  5. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/qwen_image/qwen2_5_vl.py +59 -11
  6. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine.egg-info/PKG-INFO +1 -1
  7. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine.egg-info/SOURCES.txt +1 -0
  8. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/.gitignore +0 -0
  9. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/.pre-commit-config.yaml +0 -0
  10. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/LICENSE +0 -0
  11. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/MANIFEST.in +0 -0
  12. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/README.md +0 -0
  13. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/assets/dingtalk.png +0 -0
  14. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/assets/showcase.jpeg +0 -0
  15. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/__init__.py +0 -0
  16. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/algorithm/__init__.py +0 -0
  17. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/algorithm/noise_scheduler/__init__.py +0 -0
  18. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/algorithm/noise_scheduler/base_scheduler.py +0 -0
  19. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/algorithm/noise_scheduler/flow_match/__init__.py +0 -0
  20. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/algorithm/noise_scheduler/flow_match/flow_beta.py +0 -0
  21. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/algorithm/noise_scheduler/flow_match/flow_ddim.py +0 -0
  22. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/algorithm/noise_scheduler/flow_match/recifited_flow.py +0 -0
  23. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/algorithm/noise_scheduler/stable_diffusion/__init__.py +0 -0
  24. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/algorithm/noise_scheduler/stable_diffusion/beta.py +0 -0
  25. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/algorithm/noise_scheduler/stable_diffusion/ddim.py +0 -0
  26. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/algorithm/noise_scheduler/stable_diffusion/exponential.py +0 -0
  27. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/algorithm/noise_scheduler/stable_diffusion/karras.py +0 -0
  28. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/algorithm/noise_scheduler/stable_diffusion/linear.py +0 -0
  29. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/algorithm/noise_scheduler/stable_diffusion/sgm_uniform.py +0 -0
  30. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/algorithm/sampler/__init__.py +0 -0
  31. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/algorithm/sampler/flow_match/__init__.py +0 -0
  32. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/algorithm/sampler/flow_match/flow_match_euler.py +0 -0
  33. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/algorithm/sampler/stable_diffusion/__init__.py +0 -0
  34. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/algorithm/sampler/stable_diffusion/brownian_tree.py +0 -0
  35. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/algorithm/sampler/stable_diffusion/ddpm.py +0 -0
  36. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/algorithm/sampler/stable_diffusion/deis.py +0 -0
  37. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/algorithm/sampler/stable_diffusion/dpmpp_2m.py +0 -0
  38. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/algorithm/sampler/stable_diffusion/dpmpp_2m_sde.py +0 -0
  39. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/algorithm/sampler/stable_diffusion/dpmpp_3m_sde.py +0 -0
  40. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/algorithm/sampler/stable_diffusion/epsilon.py +0 -0
  41. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/algorithm/sampler/stable_diffusion/euler.py +0 -0
  42. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/algorithm/sampler/stable_diffusion/euler_ancestral.py +0 -0
  43. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/models/components/vae.json +0 -0
  44. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/models/flux/flux_dit.json +0 -0
  45. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/models/flux/flux_text_encoder.json +0 -0
  46. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/models/flux/flux_vae.json +0 -0
  47. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/models/qwen_image/qwen2_5_vl_config.json +0 -0
  48. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/models/qwen_image/qwen_image_vae.json +0 -0
  49. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/models/qwen_image/qwen_image_vae_keymap.json +0 -0
  50. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/models/sd/sd_text_encoder.json +0 -0
  51. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/models/sd/sd_unet.json +0 -0
  52. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/models/sd3/sd3_dit.json +0 -0
  53. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/models/sd3/sd3_text_encoder.json +0 -0
  54. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/models/sdxl/sdxl_text_encoder.json +0 -0
  55. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/models/sdxl/sdxl_unet.json +0 -0
  56. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/models/wan/dit/wan2.1-flf2v-14b.json +0 -0
  57. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/models/wan/dit/wan2.1-i2v-14b.json +0 -0
  58. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/models/wan/dit/wan2.1-t2v-1.3b.json +0 -0
  59. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/models/wan/dit/wan2.1-t2v-14b.json +0 -0
  60. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/models/wan/dit/wan2.2-i2v-a14b.json +0 -0
  61. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/models/wan/dit/wan2.2-t2v-a14b.json +0 -0
  62. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/models/wan/dit/wan2.2-ti2v-5b.json +0 -0
  63. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/models/wan/vae/wan-vae-keymap.json +0 -0
  64. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/models/wan/vae/wan2.1-vae.json +0 -0
  65. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/models/wan/vae/wan2.2-vae.json +0 -0
  66. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/tokenizers/flux/tokenizer_1/merges.txt +0 -0
  67. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/tokenizers/flux/tokenizer_1/special_tokens_map.json +0 -0
  68. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/tokenizers/flux/tokenizer_1/tokenizer_config.json +0 -0
  69. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/tokenizers/flux/tokenizer_1/vocab.json +0 -0
  70. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/tokenizers/flux/tokenizer_2/special_tokens_map.json +0 -0
  71. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/tokenizers/flux/tokenizer_2/spiece.model +0 -0
  72. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/tokenizers/flux/tokenizer_2/tokenizer.json +0 -0
  73. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/tokenizers/flux/tokenizer_2/tokenizer_config.json +0 -0
  74. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/tokenizers/qwen_image/qwen2_vl_image_processor.json +0 -0
  75. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/tokenizers/qwen_image/tokenizer/added_tokens.json +0 -0
  76. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/tokenizers/qwen_image/tokenizer/merges.txt +0 -0
  77. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/tokenizers/qwen_image/tokenizer/special_tokens_map.json +0 -0
  78. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/tokenizers/qwen_image/tokenizer/tokenizer.json +0 -0
  79. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/tokenizers/qwen_image/tokenizer/tokenizer_config.json +0 -0
  80. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/tokenizers/qwen_image/tokenizer/vocab.json +0 -0
  81. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/tokenizers/sdxl/tokenizer/merges.txt +0 -0
  82. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/tokenizers/sdxl/tokenizer/special_tokens_map.json +0 -0
  83. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/tokenizers/sdxl/tokenizer/tokenizer_config.json +0 -0
  84. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/tokenizers/sdxl/tokenizer/vocab.json +0 -0
  85. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/tokenizers/sdxl/tokenizer_2/merges.txt +0 -0
  86. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/tokenizers/sdxl/tokenizer_2/special_tokens_map.json +0 -0
  87. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/tokenizers/sdxl/tokenizer_2/tokenizer_config.json +0 -0
  88. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/tokenizers/sdxl/tokenizer_2/vocab.json +0 -0
  89. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/tokenizers/wan/umt5-xxl/special_tokens_map.json +0 -0
  90. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/tokenizers/wan/umt5-xxl/spiece.model +0 -0
  91. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/tokenizers/wan/umt5-xxl/tokenizer.json +0 -0
  92. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/conf/tokenizers/wan/umt5-xxl/tokenizer_config.json +0 -0
  93. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/configs/__init__.py +0 -0
  94. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/configs/controlnet.py +0 -0
  95. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/kernels/__init__.py +0 -0
  96. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/__init__.py +0 -0
  97. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/base.py +0 -0
  98. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/basic/__init__.py +0 -0
  99. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/basic/attention.py +0 -0
  100. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/basic/lora.py +0 -0
  101. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/basic/relative_position_emb.py +0 -0
  102. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/basic/timestep.py +0 -0
  103. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/basic/transformer_helper.py +0 -0
  104. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/basic/unet_helper.py +0 -0
  105. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/flux/__init__.py +0 -0
  106. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/flux/flux_controlnet.py +0 -0
  107. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/flux/flux_dit.py +0 -0
  108. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/flux/flux_dit_fbcache.py +0 -0
  109. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/flux/flux_ipadapter.py +0 -0
  110. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/flux/flux_redux.py +0 -0
  111. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/flux/flux_text_encoder.py +0 -0
  112. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/flux/flux_vae.py +0 -0
  113. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/hunyuan3d/__init__.py +0 -0
  114. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/hunyuan3d/dino_image_encoder.py +0 -0
  115. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/hunyuan3d/hunyuan3d_dit.py +0 -0
  116. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/hunyuan3d/hunyuan3d_vae.py +0 -0
  117. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/hunyuan3d/moe.py +0 -0
  118. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/hunyuan3d/surface_extractor.py +0 -0
  119. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/hunyuan3d/volume_decoder.py +0 -0
  120. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/qwen_image/__init__.py +0 -0
  121. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/qwen_image/qwen_image_dit.py +0 -0
  122. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/qwen_image/qwen_image_dit_fbcache.py +0 -0
  123. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/qwen_image/qwen_image_vae.py +0 -0
  124. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/sd/__init__.py +0 -0
  125. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/sd/sd_controlnet.py +0 -0
  126. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/sd/sd_text_encoder.py +0 -0
  127. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/sd/sd_unet.py +0 -0
  128. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/sd/sd_vae.py +0 -0
  129. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/sd3/__init__.py +0 -0
  130. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/sd3/sd3_dit.py +0 -0
  131. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/sd3/sd3_text_encoder.py +0 -0
  132. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/sd3/sd3_vae.py +0 -0
  133. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/sdxl/__init__.py +0 -0
  134. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/sdxl/sdxl_controlnet.py +0 -0
  135. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/sdxl/sdxl_text_encoder.py +0 -0
  136. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/sdxl/sdxl_unet.py +0 -0
  137. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/sdxl/sdxl_vae.py +0 -0
  138. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/text_encoder/__init__.py +0 -0
  139. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/text_encoder/clip.py +0 -0
  140. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/text_encoder/siglip.py +0 -0
  141. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/text_encoder/t5.py +0 -0
  142. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/utils.py +0 -0
  143. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/vae/__init__.py +0 -0
  144. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/vae/vae.py +0 -0
  145. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/wan/__init__.py +0 -0
  146. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/wan/wan_dit.py +0 -0
  147. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/wan/wan_image_encoder.py +0 -0
  148. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/wan/wan_text_encoder.py +0 -0
  149. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/models/wan/wan_vae.py +0 -0
  150. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/pipelines/__init__.py +0 -0
  151. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/pipelines/base.py +0 -0
  152. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/pipelines/flux_image.py +0 -0
  153. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/pipelines/hunyuan3d_shape.py +0 -0
  154. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/pipelines/qwen_image.py +0 -0
  155. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/pipelines/sd_image.py +0 -0
  156. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/pipelines/sdxl_image.py +0 -0
  157. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/pipelines/utils.py +0 -0
  158. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/pipelines/wan_video.py +0 -0
  159. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/processor/__init__.py +0 -0
  160. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/processor/canny_processor.py +0 -0
  161. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/processor/depth_processor.py +0 -0
  162. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/tokenizers/__init__.py +0 -0
  163. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/tokenizers/base.py +0 -0
  164. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/tokenizers/clip.py +0 -0
  165. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/tokenizers/qwen2.py +0 -0
  166. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/tokenizers/qwen2_vl_image_processor.py +0 -0
  167. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/tokenizers/qwen2_vl_processor.py +0 -0
  168. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/tokenizers/t5.py +0 -0
  169. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/tokenizers/wan.py +0 -0
  170. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/tools/__init__.py +0 -0
  171. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/tools/flux_inpainting_tool.py +0 -0
  172. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/tools/flux_outpainting_tool.py +0 -0
  173. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/tools/flux_reference_tool.py +0 -0
  174. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/tools/flux_replace_tool.py +0 -0
  175. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/utils/__init__.py +0 -0
  176. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/utils/cache.py +0 -0
  177. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/utils/constants.py +0 -0
  178. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/utils/download.py +0 -0
  179. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/utils/env.py +0 -0
  180. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/utils/flag.py +0 -0
  181. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/utils/fp8_linear.py +0 -0
  182. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/utils/gguf.py +0 -0
  183. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/utils/image.py +0 -0
  184. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/utils/loader.py +0 -0
  185. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/utils/lock.py +0 -0
  186. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/utils/logging.py +0 -0
  187. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/utils/memory/__init__.py +0 -0
  188. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/utils/memory/linear_regression.py +0 -0
  189. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/utils/memory/memory_predcit_model.py +0 -0
  190. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/utils/offload.py +0 -0
  191. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/utils/onnx.py +0 -0
  192. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/utils/parallel.py +0 -0
  193. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/utils/platform.py +0 -0
  194. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/utils/prompt.py +0 -0
  195. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine/utils/video.py +0 -0
  196. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine.egg-info/dependency_links.txt +0 -0
  197. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine.egg-info/requires.txt +0 -0
  198. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/diffsynth_engine.egg-info/top_level.txt +0 -0
  199. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/docs/tutorial.md +0 -0
  200. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/docs/tutorial_zh.md +0 -0
  201. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/pyproject.toml +0 -0
  202. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/setup.cfg +0 -0
  203. {diffsynth_engine-0.4.3.dev10 → diffsynth_engine-0.4.4.dev2}/setup.py +0 -0
@@ -0,0 +1,26 @@
1
+ tests/data/expect/sd/sd_unet.safetensors filter=lfs diff=lfs merge=lfs -text
2
+ tests/data/expect/sdxl/sdxl_unet.safetensors filter=lfs diff=lfs merge=lfs -text
3
+ tests/data/expect/algorithm/recifited_flow_20steps_flux.safetensors filter=lfs diff=lfs merge=lfs -text
4
+ tests/data/expect/algorithm/sgm_uniform_20steps.safetensors filter=lfs diff=lfs merge=lfs -text
5
+ tests/data/expect/flux/flux_text_encoder_2.safetensors filter=lfs diff=lfs merge=lfs -text
6
+ tests/data/expect/qwen_image/qwen_image_dit_output.safetensors filter=lfs diff=lfs merge=lfs -text
7
+ tests/data/expect/sd/sd_text_encoder.safetensors filter=lfs diff=lfs merge=lfs -text
8
+ tests/data/expect/sdxl/sdxl_text_encoder_2.safetensors filter=lfs diff=lfs merge=lfs -text
9
+ tests/data/expect/test_siglip_image_encoder.safetensors filter=lfs diff=lfs merge=lfs -text
10
+ tests/data/expect/wan/wan_vae.safetensors filter=lfs diff=lfs merge=lfs -text
11
+ tests/data/expect/algorithm/beta_20steps.safetensors filter=lfs diff=lfs merge=lfs -text
12
+ tests/data/expect/algorithm/karras_20steps.safetensors filter=lfs diff=lfs merge=lfs -text
13
+ tests/data/expect/flux/flux_dit.safetensors filter=lfs diff=lfs merge=lfs -text
14
+ tests/data/expect/flux/flux_vae.safetensors filter=lfs diff=lfs merge=lfs -text
15
+ tests/data/expect/sd/sd_vae.safetensors filter=lfs diff=lfs merge=lfs -text
16
+ tests/data/expect/sdxl/sdxl_text_encoder_1.safetensors filter=lfs diff=lfs merge=lfs -text
17
+ tests/data/expect/sdxl/sdxl_vae.safetensors filter=lfs diff=lfs merge=lfs -text
18
+ tests/data/input/qwen_image/qwen_image_dit_input.safetensors filter=lfs diff=lfs merge=lfs -text
19
+ tests/data/expect/algorithm/euler_i10.safetensors filter=lfs diff=lfs merge=lfs -text
20
+ tests/data/expect/algorithm/exponential_20steps.safetensors filter=lfs diff=lfs merge=lfs -text
21
+ tests/data/expect/algorithm/scaled_linear_20steps.safetensors filter=lfs diff=lfs merge=lfs -text
22
+ tests/data/expect/qwen_image/qwen2_5_vl.safetensors filter=lfs diff=lfs merge=lfs -text
23
+ tests/data/expect/algorithm/ddim_20steps.safetensors filter=lfs diff=lfs merge=lfs -text
24
+ tests/data/expect/algorithm/flow_match_euler_i10.safetensors filter=lfs diff=lfs merge=lfs -text
25
+ tests/data/expect/algorithm/output.safetensors filter=lfs diff=lfs merge=lfs -text
26
+ tests/data/expect/flux/flux_text_encoder_1.safetensors filter=lfs diff=lfs merge=lfs -text
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: diffsynth_engine
3
- Version: 0.4.3.dev10
3
+ Version: 0.4.4.dev2
4
4
  Author: MuseAI x ModelScope
5
5
  Classifier: Programming Language :: Python :: 3
6
6
  Classifier: Operating System :: OS Independent
@@ -206,6 +206,11 @@ class QwenImagePipelineConfig(AttentionConfig, OptimizationConfig, ParallelConfi
206
206
  # override OptimizationConfig
207
207
  fbcache_relative_l1_threshold = 0.009
208
208
 
209
+ # override BaseConfig
210
+ vae_tiled: bool = True
211
+ vae_tile_size: Tuple[int, int] = (34, 34)
212
+ vae_tile_stride: Tuple[int, int] = (18, 16)
213
+
209
214
  @classmethod
210
215
  def basic_config(
211
216
  cls,
@@ -550,9 +550,15 @@ class Qwen2_5_Attention(nn.Module):
550
550
  if attention_mask is not None: # no matter the length, we just slice it
551
551
  causal_mask = attention_mask[:, :, :, : key_states.shape[1]]
552
552
 
553
- # TODO: use is_causal when attention mask is causal
554
553
  if self.attn_impl == "sdpa":
555
- out = attention_ops.sdpa_attn(query_states, key_states, value_states, is_causal=True)
554
+ is_causal = causal_mask is None and query_states.shape[1] > 1
555
+ out = attention_ops.sdpa_attn(
556
+ query_states,
557
+ key_states,
558
+ value_states,
559
+ attn_mask=causal_mask,
560
+ is_causal=is_causal,
561
+ )
556
562
  else:
557
563
  # TODO: attention_mask for flash attention 2
558
564
  out = attention_ops.attention(
@@ -783,6 +789,9 @@ class Qwen2_5_VLModel(nn.Module):
783
789
  else past_seen_tokens + sequence_length + 1
784
790
  )
785
791
 
792
+ if self.config.attn_impl == "sdpa" and self._ignore_causal_mask(attention_mask, input_tensor, past_seen_tokens):
793
+ return None
794
+
786
795
  # In case the provided `attention` mask is 2D, we generate a causal mask here (4D).
787
796
  causal_mask = self._prepare_4d_causal_attention_mask_with_cache_position(
788
797
  attention_mask=attention_mask,
@@ -802,6 +811,32 @@ class Qwen2_5_VLModel(nn.Module):
802
811
 
803
812
  return causal_mask
804
813
 
814
+ @staticmethod
815
+ def _ignore_causal_mask(
816
+ attention_mask: Optional[torch.Tensor],
817
+ inputs_embeds: torch.Tensor,
818
+ past_seen_tokens: int,
819
+ ):
820
+ """
821
+ Detects whether the optional user-specified attention_mask & the automatically created causal mask can be
822
+ ignored in case PyTorch's SDPA is used, rather relying on SDPA's `is_causal` argument.
823
+
824
+ In case no token is masked in the `attention_mask` argument, if `query_length == 1` or
825
+ `key_value_length == query_length`, we rather rely on SDPA `is_causal` argument to use causal/non-causal masks,
826
+ allowing to dispatch to the flash attention kernel (that can otherwise not be used if a custom `attn_mask` is
827
+ passed).
828
+ """
829
+
830
+ _, query_length = inputs_embeds.shape[0], inputs_embeds.shape[1]
831
+ key_value_length = query_length + past_seen_tokens
832
+
833
+ ignore_causal_mask = False
834
+ if (attention_mask is None or (attention_mask.ndim == 2 and torch.all(attention_mask == 1))) and (
835
+ query_length == 1 or key_value_length == query_length
836
+ ):
837
+ ignore_causal_mask = True
838
+ return ignore_causal_mask
839
+
805
840
  @staticmethod
806
841
  def _prepare_4d_causal_attention_mask_with_cache_position(
807
842
  attention_mask: torch.Tensor,
@@ -825,8 +860,6 @@ class Qwen2_5_VLModel(nn.Module):
825
860
  The target length: when generating with static cache, the mask should be as long as the static cache, to account for the 0 padding, the part of the cache that is not filled yet.
826
861
  dtype (`torch.dtype`):
827
862
  The dtype to use for the 4D attention mask.
828
- past_key_values (`Cache`):
829
- The cache class that is being used currently to generate
830
863
  cache_position (`torch.LongTensor`):
831
864
  Indices depicting the position of the input sequence tokens in the sequence.
832
865
  batch_size (`int`):
@@ -1199,14 +1232,29 @@ class Qwen2_5_VLForConditionalGeneration(PreTrainedModel):
1199
1232
  if position_ids is None:
1200
1233
  assert attention_mask is None or attention_mask.ndim == 2, "attention mask must be 2D"
1201
1234
  # calculate RoPE index once per generation in the pre-fill stage only
1202
- position_ids, rope_deltas = self.get_rope_index(
1203
- input_ids,
1204
- image_grid_thw,
1205
- video_grid_thw,
1206
- second_per_grid_ts,
1207
- attention_mask,
1235
+ is_prefill = (
1236
+ (cache_position is None or cache_position[0] == 0)
1237
+ or self.rope_deltas is None
1238
+ or past_key_values is None
1208
1239
  )
1209
- self.rope_deltas = rope_deltas
1240
+ if is_prefill:
1241
+ position_ids, rope_deltas = self.get_rope_index(
1242
+ input_ids,
1243
+ image_grid_thw,
1244
+ video_grid_thw,
1245
+ second_per_grid_ts,
1246
+ attention_mask,
1247
+ )
1248
+ self.rope_deltas = rope_deltas
1249
+ # then use the prev pre-calculated rope-deltas to get the correct position ids
1250
+ else:
1251
+ batch_size, seq_length, _ = inputs_embeds.shape
1252
+ delta = (cache_position[0] + self.rope_deltas).to(inputs_embeds.device)
1253
+ delta = delta.repeat_interleave(batch_size // delta.shape[0], dim=0)
1254
+ position_ids = torch.arange(seq_length, device=inputs_embeds.device)
1255
+ position_ids = position_ids.view(1, -1).expand(batch_size, -1)
1256
+ position_ids = position_ids.add(delta)
1257
+ position_ids = position_ids.unsqueeze(0).expand(3, -1, -1)
1210
1258
 
1211
1259
  hidden_states, present_key_values = self.model(
1212
1260
  input_ids=None,
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: diffsynth_engine
3
- Version: 0.4.3.dev10
3
+ Version: 0.4.4.dev2
4
4
  Author: MuseAI x ModelScope
5
5
  Classifier: Programming Language :: Python :: 3
6
6
  Classifier: Operating System :: OS Independent
@@ -1,3 +1,4 @@
1
+ .gitattributes
1
2
  .gitignore
2
3
  .pre-commit-config.yaml
3
4
  LICENSE