diffsynth-engine 0.4.0__tar.gz → 0.4.1__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/PKG-INFO +2 -1
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/README.md +8 -4
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/__init__.py +4 -0
- diffsynth_engine-0.4.1/diffsynth_engine/conf/models/qwen_image/qwen2_5_vl_config.json +25 -0
- diffsynth_engine-0.4.1/diffsynth_engine/conf/models/qwen_image/qwen2_5_vl_vision_config.json +19 -0
- diffsynth_engine-0.4.1/diffsynth_engine/conf/models/qwen_image/qwen_image_vae_keymap.json +244 -0
- diffsynth_engine-0.4.1/diffsynth_engine/conf/models/wan/vae/wan-vae-keymap.json +244 -0
- diffsynth_engine-0.4.1/diffsynth_engine/conf/models/wan/vae/wan2.1-vae.json +48 -0
- diffsynth_engine-0.4.1/diffsynth_engine/conf/tokenizers/qwen_image/tokenizer/added_tokens.json +24 -0
- diffsynth_engine-0.4.1/diffsynth_engine/conf/tokenizers/qwen_image/tokenizer/merges.txt +151388 -0
- diffsynth_engine-0.4.1/diffsynth_engine/conf/tokenizers/qwen_image/tokenizer/special_tokens_map.json +31 -0
- diffsynth_engine-0.4.1/diffsynth_engine/conf/tokenizers/qwen_image/tokenizer/tokenizer.json +757444 -0
- diffsynth_engine-0.4.1/diffsynth_engine/conf/tokenizers/qwen_image/tokenizer/tokenizer_config.json +209 -0
- diffsynth_engine-0.4.1/diffsynth_engine/conf/tokenizers/qwen_image/tokenizer/vocab.json +1 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/configs/__init__.py +12 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/configs/pipeline.py +68 -2
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/basic/transformer_helper.py +33 -0
- diffsynth_engine-0.4.1/diffsynth_engine/models/qwen_image/__init__.py +13 -0
- diffsynth_engine-0.4.1/diffsynth_engine/models/qwen_image/qwen2_5_vl.py +1243 -0
- diffsynth_engine-0.4.1/diffsynth_engine/models/qwen_image/qwen_image_dit.py +425 -0
- diffsynth_engine-0.4.1/diffsynth_engine/models/qwen_image/qwen_image_dit_fbcache.py +133 -0
- diffsynth_engine-0.4.1/diffsynth_engine/models/qwen_image/qwen_image_vae.py +1082 -0
- diffsynth_engine-0.4.1/diffsynth_engine/models/wan/__init__.py +11 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/wan/wan_vae.py +16 -3
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/pipelines/__init__.py +2 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/pipelines/base.py +11 -4
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/pipelines/flux_image.py +46 -44
- diffsynth_engine-0.4.1/diffsynth_engine/pipelines/qwen_image.py +416 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/pipelines/sd_image.py +2 -4
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/pipelines/sdxl_image.py +2 -4
- diffsynth_engine-0.4.1/diffsynth_engine/pipelines/utils.py +19 -0
- diffsynth_engine-0.4.1/diffsynth_engine/tokenizers/__init__.py +13 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/tokenizers/clip.py +1 -1
- diffsynth_engine-0.4.1/diffsynth_engine/tokenizers/qwen2.py +210 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/tokenizers/t5.py +1 -1
- diffsynth_engine-0.4.1/diffsynth_engine/utils/cache.py +55 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/utils/constants.py +7 -0
- diffsynth_engine-0.4.1/diffsynth_engine/utils/offload.py +52 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine.egg-info/PKG-INFO +2 -1
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine.egg-info/SOURCES.txt +19 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine.egg-info/requires.txt +1 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/docs/tutorial.md +33 -42
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/docs/tutorial_zh.md +45 -54
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/pyproject.toml +1 -0
- diffsynth_engine-0.4.0/diffsynth_engine/pipelines/utils.py +0 -6
- diffsynth_engine-0.4.0/diffsynth_engine/tokenizers/__init__.py +0 -6
- diffsynth_engine-0.4.0/diffsynth_engine/utils/__init__.py +0 -0
- diffsynth_engine-0.4.0/diffsynth_engine/utils/offload.py +0 -36
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/.gitignore +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/.pre-commit-config.yaml +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/LICENSE +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/MANIFEST.in +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/assets/dingtalk.png +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/assets/showcase.jpeg +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/__init__.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/noise_scheduler/__init__.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/noise_scheduler/base_scheduler.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/noise_scheduler/flow_match/__init__.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/noise_scheduler/flow_match/flow_beta.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/noise_scheduler/flow_match/flow_ddim.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/noise_scheduler/flow_match/recifited_flow.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/noise_scheduler/stable_diffusion/__init__.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/noise_scheduler/stable_diffusion/beta.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/noise_scheduler/stable_diffusion/ddim.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/noise_scheduler/stable_diffusion/exponential.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/noise_scheduler/stable_diffusion/karras.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/noise_scheduler/stable_diffusion/linear.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/noise_scheduler/stable_diffusion/sgm_uniform.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/sampler/__init__.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/sampler/flow_match/__init__.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/sampler/flow_match/flow_match_euler.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/sampler/stable_diffusion/__init__.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/sampler/stable_diffusion/brownian_tree.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/sampler/stable_diffusion/ddpm.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/sampler/stable_diffusion/deis.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/sampler/stable_diffusion/dpmpp_2m.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/sampler/stable_diffusion/dpmpp_2m_sde.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/sampler/stable_diffusion/dpmpp_3m_sde.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/sampler/stable_diffusion/epsilon.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/sampler/stable_diffusion/euler.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/algorithm/sampler/stable_diffusion/euler_ancestral.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/models/components/vae.json +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/models/flux/flux_dit.json +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/models/flux/flux_text_encoder.json +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/models/flux/flux_vae.json +0 -0
- /diffsynth_engine-0.4.0/diffsynth_engine/conf/models/wan/vae/wan2.1-vae.json → /diffsynth_engine-0.4.1/diffsynth_engine/conf/models/qwen_image/qwen_image_vae.json +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/models/sd/sd_text_encoder.json +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/models/sd/sd_unet.json +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/models/sd3/sd3_dit.json +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/models/sd3/sd3_text_encoder.json +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/models/sdxl/sdxl_text_encoder.json +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/models/sdxl/sdxl_unet.json +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/models/wan/dit/wan2.1-flf2v-14b.json +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/models/wan/dit/wan2.1-i2v-14b.json +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/models/wan/dit/wan2.1-t2v-1.3b.json +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/models/wan/dit/wan2.1-t2v-14b.json +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/models/wan/dit/wan2.2-i2v-a14b.json +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/models/wan/dit/wan2.2-t2v-a14b.json +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/models/wan/dit/wan2.2-ti2v-5b.json +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/models/wan/vae/wan2.2-vae.json +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/tokenizers/flux/tokenizer_1/merges.txt +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/tokenizers/flux/tokenizer_1/special_tokens_map.json +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/tokenizers/flux/tokenizer_1/tokenizer_config.json +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/tokenizers/flux/tokenizer_1/vocab.json +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/tokenizers/flux/tokenizer_2/special_tokens_map.json +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/tokenizers/flux/tokenizer_2/spiece.model +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/tokenizers/flux/tokenizer_2/tokenizer.json +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/tokenizers/flux/tokenizer_2/tokenizer_config.json +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/tokenizers/sdxl/tokenizer/merges.txt +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/tokenizers/sdxl/tokenizer/special_tokens_map.json +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/tokenizers/sdxl/tokenizer/tokenizer_config.json +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/tokenizers/sdxl/tokenizer/vocab.json +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/tokenizers/sdxl/tokenizer_2/merges.txt +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/tokenizers/sdxl/tokenizer_2/special_tokens_map.json +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/tokenizers/sdxl/tokenizer_2/tokenizer_config.json +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/tokenizers/sdxl/tokenizer_2/vocab.json +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/tokenizers/wan/umt5-xxl/special_tokens_map.json +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/tokenizers/wan/umt5-xxl/spiece.model +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/tokenizers/wan/umt5-xxl/tokenizer.json +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/conf/tokenizers/wan/umt5-xxl/tokenizer_config.json +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/configs/controlnet.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/kernels/__init__.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/__init__.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/base.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/basic/__init__.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/basic/attention.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/basic/lora.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/basic/relative_position_emb.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/basic/timestep.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/basic/unet_helper.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/flux/__init__.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/flux/flux_controlnet.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/flux/flux_dit.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/flux/flux_dit_fbcache.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/flux/flux_ipadapter.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/flux/flux_redux.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/flux/flux_text_encoder.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/flux/flux_vae.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/sd/__init__.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/sd/sd_controlnet.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/sd/sd_text_encoder.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/sd/sd_unet.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/sd/sd_vae.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/sd3/__init__.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/sd3/sd3_dit.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/sd3/sd3_text_encoder.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/sd3/sd3_vae.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/sdxl/__init__.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/sdxl/sdxl_controlnet.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/sdxl/sdxl_text_encoder.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/sdxl/sdxl_unet.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/sdxl/sdxl_vae.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/text_encoder/__init__.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/text_encoder/clip.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/text_encoder/siglip.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/text_encoder/t5.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/utils.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/vae/__init__.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/vae/vae.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/wan/wan_dit.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/wan/wan_image_encoder.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/models/wan/wan_text_encoder.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/pipelines/wan_video.py +0 -0
- {diffsynth_engine-0.4.0/diffsynth_engine/models/wan → diffsynth_engine-0.4.1/diffsynth_engine/processor}/__init__.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/processor/canny_processor.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/processor/depth_processor.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/tokenizers/base.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/tokenizers/wan.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/tools/__init__.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/tools/flux_inpainting_tool.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/tools/flux_outpainting_tool.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/tools/flux_reference_tool.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/tools/flux_replace_tool.py +0 -0
- {diffsynth_engine-0.4.0/diffsynth_engine/processor → diffsynth_engine-0.4.1/diffsynth_engine/utils}/__init__.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/utils/download.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/utils/env.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/utils/flag.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/utils/fp8_linear.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/utils/gguf.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/utils/image.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/utils/loader.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/utils/lock.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/utils/logging.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/utils/onnx.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/utils/parallel.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/utils/platform.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/utils/prompt.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine/utils/video.py +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine.egg-info/dependency_links.txt +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/diffsynth_engine.egg-info/top_level.txt +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/setup.cfg +0 -0
- {diffsynth_engine-0.4.0 → diffsynth_engine-0.4.1}/setup.py +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: diffsynth_engine
|
|
3
|
-
Version: 0.4.0
|
|
3
|
+
Version: 0.4.1
|
|
4
4
|
Author: MuseAI x ModelScope
|
|
5
5
|
Classifier: Programming Language :: Python :: 3
|
|
6
6
|
Classifier: Operating System :: OS Independent
|
|
@@ -28,6 +28,7 @@ Requires-Dist: opencv-python
|
|
|
28
28
|
Provides-Extra: dev
|
|
29
29
|
Requires-Dist: diffusers==0.31.0; extra == "dev"
|
|
30
30
|
Requires-Dist: transformers==4.45.2; extra == "dev"
|
|
31
|
+
Requires-Dist: accelerate; extra == "dev"
|
|
31
32
|
Requires-Dist: build; extra == "dev"
|
|
32
33
|
Requires-Dist: ruff; extra == "dev"
|
|
33
34
|
Requires-Dist: scikit-image; extra == "dev"
|
|
@@ -23,6 +23,7 @@ and offloading strategies, enabling loading of larger diffusion models (e.g., Fl
|
|
|
23
23
|
|
|
24
24
|
## News
|
|
25
25
|
|
|
26
|
+
- **[v0.4.1](https://github.com/modelscope/DiffSynth-Engine/releases/tag/v0.4.1)** | **August 4, 2025**: 🔥Supports [Qwen-Image](https://www.modelscope.cn/models/Qwen/Qwen-Image), an image generation model that excels at complex text rendering and creating images in a wide range of artistic styles.
|
|
26
27
|
- **[v0.4.0](https://github.com/modelscope/DiffSynth-Engine/releases/tag/v0.4.0)** | **August 1, 2025**:
|
|
27
28
|
- 🔥Supports [Wan2.2](https://modelscope.cn/collections/tongyiwanxiang-22--shipinshengcheng-2bb5b1adef2840) video generation model
|
|
28
29
|
- ⚠️[**Breaking Change**] Improved `from_pretrained` method pipeline initialization
|
|
@@ -49,21 +50,24 @@ pip3 install -e .
|
|
|
49
50
|
### Usage
|
|
50
51
|
Text to image
|
|
51
52
|
```python
|
|
52
|
-
from diffsynth_engine import fetch_model, FluxImagePipeline
|
|
53
|
+
from diffsynth_engine import fetch_model, FluxImagePipeline, FluxPipelineConfig
|
|
53
54
|
|
|
54
55
|
model_path = fetch_model("muse/flux-with-vae", path="flux1-dev-with-vae.safetensors")
|
|
55
|
-
|
|
56
|
+
|
|
57
|
+
config = FluxPipelineConfig.basic_config(model_path=model_path, device="cuda:0")
|
|
58
|
+
pipe = FluxImagePipeline.from_pretrained(config)
|
|
56
59
|
image = pipe(prompt="a cat")
|
|
57
60
|
image.save("image.png")
|
|
58
61
|
```
|
|
59
62
|
Text to image with LoRA
|
|
60
63
|
```python
|
|
61
|
-
from diffsynth_engine import fetch_model, FluxImagePipeline
|
|
64
|
+
from diffsynth_engine import fetch_model, FluxImagePipeline, FluxPipelineConfig
|
|
62
65
|
|
|
63
66
|
model_path = fetch_model("muse/flux-with-vae", path="flux1-dev-with-vae.safetensors")
|
|
64
67
|
lora_path = fetch_model("DonRat/MAJICFLUS_SuperChinesestyleheongsam", path="麦橘超国风旗袍.safetensors")
|
|
65
68
|
|
|
66
|
-
|
|
69
|
+
config = FluxPipelineConfig.basic_config(model_path=model_path, device="cuda:0")
|
|
70
|
+
pipe = FluxImagePipeline.from_pretrained(config)
|
|
67
71
|
pipe.load_lora(path=lora_path, scale=1.0)
|
|
68
72
|
image = pipe(prompt="a girl, qipao")
|
|
69
73
|
image.save("image.png")
|
|
@@ -3,6 +3,7 @@ from .configs import (
|
|
|
3
3
|
SDXLPipelineConfig,
|
|
4
4
|
FluxPipelineConfig,
|
|
5
5
|
WanPipelineConfig,
|
|
6
|
+
QwenImagePipelineConfig,
|
|
6
7
|
ControlNetParams,
|
|
7
8
|
ControlType,
|
|
8
9
|
)
|
|
@@ -11,6 +12,7 @@ from .pipelines import (
|
|
|
11
12
|
SDXLImagePipeline,
|
|
12
13
|
SDImagePipeline,
|
|
13
14
|
WanVideoPipeline,
|
|
15
|
+
QwenImagePipeline,
|
|
14
16
|
)
|
|
15
17
|
from .models.flux import FluxControlNet, FluxIPAdapter, FluxRedux
|
|
16
18
|
from .models.sd import SDControlNet
|
|
@@ -31,6 +33,7 @@ __all__ = [
|
|
|
31
33
|
"FluxPipelineConfig",
|
|
32
34
|
"WanPipelineConfig",
|
|
33
35
|
"FluxImagePipeline",
|
|
36
|
+
"QwenImagePipelineConfig",
|
|
34
37
|
"FluxControlNet",
|
|
35
38
|
"FluxIPAdapter",
|
|
36
39
|
"FluxRedux",
|
|
@@ -39,6 +42,7 @@ __all__ = [
|
|
|
39
42
|
"SDXLImagePipeline",
|
|
40
43
|
"SDImagePipeline",
|
|
41
44
|
"WanVideoPipeline",
|
|
45
|
+
"QwenImagePipeline",
|
|
42
46
|
"FluxInpaintingTool",
|
|
43
47
|
"FluxOutpaintingTool",
|
|
44
48
|
"FluxIPAdapterRefTool",
|
|
@@ -0,0 +1,25 @@
|
|
|
1
|
+
{
|
|
2
|
+
"hidden_size": 3584,
|
|
3
|
+
"intermediate_size": 18944,
|
|
4
|
+
"num_hidden_layers": 28,
|
|
5
|
+
"num_attention_heads": 28,
|
|
6
|
+
"num_key_value_heads": 4,
|
|
7
|
+
"mrope_section": [
|
|
8
|
+
16,
|
|
9
|
+
24,
|
|
10
|
+
24
|
|
11
|
+
],
|
|
12
|
+
"rms_norm_eps": 1e-6,
|
|
13
|
+
"use_cache": true,
|
|
14
|
+
"use_sliding_window": false,
|
|
15
|
+
"sliding_window": 32768,
|
|
16
|
+
"max_window_layers": 28,
|
|
17
|
+
"vocab_size": 152064,
|
|
18
|
+
"pad_token_id": 151643,
|
|
19
|
+
"im_start_token_id": 151644,
|
|
20
|
+
"im_end_token_id": 151645,
|
|
21
|
+
"vision_start_token_id": 151652,
|
|
22
|
+
"vision_end_token_id": 151653,
|
|
23
|
+
"image_token_id": 151655,
|
|
24
|
+
"video_token_id": 151656
|
|
25
|
+
}
|
|
@@ -0,0 +1,19 @@
|
|
|
1
|
+
{
|
|
2
|
+
"in_channels": 3,
|
|
3
|
+
"hidden_size": 1280,
|
|
4
|
+
"intermediate_size": 3420,
|
|
5
|
+
"out_hidden_size": 3584,
|
|
6
|
+
"num_heads": 16,
|
|
7
|
+
"depth": 32,
|
|
8
|
+
"patch_size": 14,
|
|
9
|
+
"temporal_patch_size": 2,
|
|
10
|
+
"spatial_merge_size": 2,
|
|
11
|
+
"tokens_per_second": 2,
|
|
12
|
+
"window_size": 112,
|
|
13
|
+
"fullatt_block_indexes": [
|
|
14
|
+
7,
|
|
15
|
+
15,
|
|
16
|
+
23,
|
|
17
|
+
31
|
|
18
|
+
]
|
|
19
|
+
}
|
|
@@ -0,0 +1,244 @@
|
|
|
1
|
+
{
|
|
2
|
+
"diffusers": {
|
|
3
|
+
"rename_dict": {
|
|
4
|
+
"model.post_quant_conv.bias": "model.conv2.bias",
|
|
5
|
+
"model.post_quant_conv.weight": "model.conv2.weight",
|
|
6
|
+
"model.quant_conv.bias": "model.conv1.bias",
|
|
7
|
+
"model.quant_conv.weight": "model.conv1.weight",
|
|
8
|
+
"model.encoder.conv_in.bias": "model.encoder.conv1.bias",
|
|
9
|
+
"model.encoder.conv_in.weight": "model.encoder.conv1.weight",
|
|
10
|
+
"model.encoder.down_blocks.0.conv_shortcut.bias": "model.encoder.downsamples.0.shortcut.bias",
|
|
11
|
+
"model.encoder.down_blocks.0.conv_shortcut.weight": "model.encoder.downsamples.0.shortcut.weight",
|
|
12
|
+
"model.encoder.down_blocks.0.conv1.bias": "model.encoder.downsamples.0.residual.2.bias",
|
|
13
|
+
"model.encoder.down_blocks.0.conv1.weight": "model.encoder.downsamples.0.residual.2.weight",
|
|
14
|
+
"model.encoder.down_blocks.0.conv2.bias": "model.encoder.downsamples.0.residual.6.bias",
|
|
15
|
+
"model.encoder.down_blocks.0.conv2.weight": "model.encoder.downsamples.0.residual.6.weight",
|
|
16
|
+
"model.encoder.down_blocks.0.norm1.gamma": "model.encoder.downsamples.0.residual.0.gamma",
|
|
17
|
+
"model.encoder.down_blocks.0.norm2.gamma": "model.encoder.downsamples.0.residual.3.gamma",
|
|
18
|
+
"model.encoder.down_blocks.1.conv_shortcut.bias": "model.encoder.downsamples.1.shortcut.bias",
|
|
19
|
+
"model.encoder.down_blocks.1.conv_shortcut.weight": "model.encoder.downsamples.1.shortcut.weight",
|
|
20
|
+
"model.encoder.down_blocks.1.conv1.bias": "model.encoder.downsamples.1.residual.2.bias",
|
|
21
|
+
"model.encoder.down_blocks.1.conv1.weight": "model.encoder.downsamples.1.residual.2.weight",
|
|
22
|
+
"model.encoder.down_blocks.1.conv2.bias": "model.encoder.downsamples.1.residual.6.bias",
|
|
23
|
+
"model.encoder.down_blocks.1.conv2.weight": "model.encoder.downsamples.1.residual.6.weight",
|
|
24
|
+
"model.encoder.down_blocks.1.norm1.gamma": "model.encoder.downsamples.1.residual.0.gamma",
|
|
25
|
+
"model.encoder.down_blocks.1.norm2.gamma": "model.encoder.downsamples.1.residual.3.gamma",
|
|
26
|
+
"model.encoder.down_blocks.2.resample.1.bias": "model.encoder.downsamples.2.resample.1.bias",
|
|
27
|
+
"model.encoder.down_blocks.2.resample.1.weight": "model.encoder.downsamples.2.resample.1.weight",
|
|
28
|
+
"model.encoder.down_blocks.2.time_conv.bias": "model.encoder.downsamples.2.time_conv.bias",
|
|
29
|
+
"model.encoder.down_blocks.2.time_conv.weight": "model.encoder.downsamples.2.time_conv.weight",
|
|
30
|
+
"model.encoder.down_blocks.3.conv_shortcut.bias": "model.encoder.downsamples.3.shortcut.bias",
|
|
31
|
+
"model.encoder.down_blocks.3.conv_shortcut.weight": "model.encoder.downsamples.3.shortcut.weight",
|
|
32
|
+
"model.encoder.down_blocks.3.conv1.bias": "model.encoder.downsamples.3.residual.2.bias",
|
|
33
|
+
"model.encoder.down_blocks.3.conv1.weight": "model.encoder.downsamples.3.residual.2.weight",
|
|
34
|
+
"model.encoder.down_blocks.3.conv2.bias": "model.encoder.downsamples.3.residual.6.bias",
|
|
35
|
+
"model.encoder.down_blocks.3.conv2.weight": "model.encoder.downsamples.3.residual.6.weight",
|
|
36
|
+
"model.encoder.down_blocks.3.norm1.gamma": "model.encoder.downsamples.3.residual.0.gamma",
|
|
37
|
+
"model.encoder.down_blocks.3.norm2.gamma": "model.encoder.downsamples.3.residual.3.gamma",
|
|
38
|
+
"model.encoder.down_blocks.4.conv_shortcut.bias": "model.encoder.downsamples.4.shortcut.bias",
|
|
39
|
+
"model.encoder.down_blocks.4.conv_shortcut.weight": "model.encoder.downsamples.4.shortcut.weight",
|
|
40
|
+
"model.encoder.down_blocks.4.conv1.bias": "model.encoder.downsamples.4.residual.2.bias",
|
|
41
|
+
"model.encoder.down_blocks.4.conv1.weight": "model.encoder.downsamples.4.residual.2.weight",
|
|
42
|
+
"model.encoder.down_blocks.4.conv2.bias": "model.encoder.downsamples.4.residual.6.bias",
|
|
43
|
+
"model.encoder.down_blocks.4.conv2.weight": "model.encoder.downsamples.4.residual.6.weight",
|
|
44
|
+
"model.encoder.down_blocks.4.norm1.gamma": "model.encoder.downsamples.4.residual.0.gamma",
|
|
45
|
+
"model.encoder.down_blocks.4.norm2.gamma": "model.encoder.downsamples.4.residual.3.gamma",
|
|
46
|
+
"model.encoder.down_blocks.5.resample.1.bias": "model.encoder.downsamples.5.resample.1.bias",
|
|
47
|
+
"model.encoder.down_blocks.5.resample.1.weight": "model.encoder.downsamples.5.resample.1.weight",
|
|
48
|
+
"model.encoder.down_blocks.5.time_conv.bias": "model.encoder.downsamples.5.time_conv.bias",
|
|
49
|
+
"model.encoder.down_blocks.5.time_conv.weight": "model.encoder.downsamples.5.time_conv.weight",
|
|
50
|
+
"model.encoder.down_blocks.6.conv_shortcut.bias": "model.encoder.downsamples.6.shortcut.bias",
|
|
51
|
+
"model.encoder.down_blocks.6.conv_shortcut.weight": "model.encoder.downsamples.6.shortcut.weight",
|
|
52
|
+
"model.encoder.down_blocks.6.conv1.bias": "model.encoder.downsamples.6.residual.2.bias",
|
|
53
|
+
"model.encoder.down_blocks.6.conv1.weight": "model.encoder.downsamples.6.residual.2.weight",
|
|
54
|
+
"model.encoder.down_blocks.6.conv2.bias": "model.encoder.downsamples.6.residual.6.bias",
|
|
55
|
+
"model.encoder.down_blocks.6.conv2.weight": "model.encoder.downsamples.6.residual.6.weight",
|
|
56
|
+
"model.encoder.down_blocks.6.norm1.gamma": "model.encoder.downsamples.6.residual.0.gamma",
|
|
57
|
+
"model.encoder.down_blocks.6.norm2.gamma": "model.encoder.downsamples.6.residual.3.gamma",
|
|
58
|
+
"model.encoder.down_blocks.7.conv_shortcut.bias": "model.encoder.downsamples.7.shortcut.bias",
|
|
59
|
+
"model.encoder.down_blocks.7.conv_shortcut.weight": "model.encoder.downsamples.7.shortcut.weight",
|
|
60
|
+
"model.encoder.down_blocks.7.conv1.bias": "model.encoder.downsamples.7.residual.2.bias",
|
|
61
|
+
"model.encoder.down_blocks.7.conv1.weight": "model.encoder.downsamples.7.residual.2.weight",
|
|
62
|
+
"model.encoder.down_blocks.7.conv2.bias": "model.encoder.downsamples.7.residual.6.bias",
|
|
63
|
+
"model.encoder.down_blocks.7.conv2.weight": "model.encoder.downsamples.7.residual.6.weight",
|
|
64
|
+
"model.encoder.down_blocks.7.norm1.gamma": "model.encoder.downsamples.7.residual.0.gamma",
|
|
65
|
+
"model.encoder.down_blocks.7.norm2.gamma": "model.encoder.downsamples.7.residual.3.gamma",
|
|
66
|
+
"model.encoder.down_blocks.8.resample.1.bias": "model.encoder.downsamples.8.resample.1.bias",
|
|
67
|
+
"model.encoder.down_blocks.8.resample.1.weight": "model.encoder.downsamples.8.resample.1.weight",
|
|
68
|
+
"model.encoder.down_blocks.8.time_conv.bias": "model.encoder.downsamples.8.time_conv.bias",
|
|
69
|
+
"model.encoder.down_blocks.8.time_conv.weight": "model.encoder.downsamples.8.time_conv.weight",
|
|
70
|
+
"model.encoder.down_blocks.9.conv_shortcut.bias": "model.encoder.downsamples.9.shortcut.bias",
|
|
71
|
+
"model.encoder.down_blocks.9.conv_shortcut.weight": "model.encoder.downsamples.9.shortcut.weight",
|
|
72
|
+
"model.encoder.down_blocks.9.conv1.bias": "model.encoder.downsamples.9.residual.2.bias",
|
|
73
|
+
"model.encoder.down_blocks.9.conv1.weight": "model.encoder.downsamples.9.residual.2.weight",
|
|
74
|
+
"model.encoder.down_blocks.9.conv2.bias": "model.encoder.downsamples.9.residual.6.bias",
|
|
75
|
+
"model.encoder.down_blocks.9.conv2.weight": "model.encoder.downsamples.9.residual.6.weight",
|
|
76
|
+
"model.encoder.down_blocks.9.norm1.gamma": "model.encoder.downsamples.9.residual.0.gamma",
|
|
77
|
+
"model.encoder.down_blocks.9.norm2.gamma": "model.encoder.downsamples.9.residual.3.gamma",
|
|
78
|
+
"model.encoder.down_blocks.10.conv_shortcut.bias": "model.encoder.downsamples.10.shortcut.bias",
|
|
79
|
+
"model.encoder.down_blocks.10.conv_shortcut.weight": "model.encoder.downsamples.10.shortcut.weight",
|
|
80
|
+
"model.encoder.down_blocks.10.conv1.bias": "model.encoder.downsamples.10.residual.2.bias",
|
|
81
|
+
"model.encoder.down_blocks.10.conv1.weight": "model.encoder.downsamples.10.residual.2.weight",
|
|
82
|
+
"model.encoder.down_blocks.10.conv2.bias": "model.encoder.downsamples.10.residual.6.bias",
|
|
83
|
+
"model.encoder.down_blocks.10.conv2.weight": "model.encoder.downsamples.10.residual.6.weight",
|
|
84
|
+
"model.encoder.down_blocks.10.norm1.gamma": "model.encoder.downsamples.10.residual.0.gamma",
|
|
85
|
+
"model.encoder.down_blocks.10.norm2.gamma": "model.encoder.downsamples.10.residual.3.gamma",
|
|
86
|
+
"model.encoder.mid_block.attentions.0.norm.gamma": "model.encoder.middle.1.norm.gamma",
|
|
87
|
+
"model.encoder.mid_block.attentions.0.proj.bias": "model.encoder.middle.1.proj.bias",
|
|
88
|
+
"model.encoder.mid_block.attentions.0.proj.weight": "model.encoder.middle.1.proj.weight",
|
|
89
|
+
"model.encoder.mid_block.attentions.0.to_qkv.bias": "model.encoder.middle.1.to_qkv.bias",
|
|
90
|
+
"model.encoder.mid_block.attentions.0.to_qkv.weight": "model.encoder.middle.1.to_qkv.weight",
|
|
91
|
+
"model.encoder.mid_block.resnets.0.conv_shortcut.bias": "model.encoder.middle.0.shortcut.bias",
|
|
92
|
+
"model.encoder.mid_block.resnets.0.conv_shortcut.weight": "model.encoder.middle.0.shortcut.weight",
|
|
93
|
+
"model.encoder.mid_block.resnets.0.conv1.bias": "model.encoder.middle.0.residual.2.bias",
|
|
94
|
+
"model.encoder.mid_block.resnets.0.conv1.weight": "model.encoder.middle.0.residual.2.weight",
|
|
95
|
+
"model.encoder.mid_block.resnets.0.conv2.bias": "model.encoder.middle.0.residual.6.bias",
|
|
96
|
+
"model.encoder.mid_block.resnets.0.conv2.weight": "model.encoder.middle.0.residual.6.weight",
|
|
97
|
+
"model.encoder.mid_block.resnets.0.norm1.gamma": "model.encoder.middle.0.residual.0.gamma",
|
|
98
|
+
"model.encoder.mid_block.resnets.0.norm2.gamma": "model.encoder.middle.0.residual.3.gamma",
|
|
99
|
+
"model.encoder.mid_block.resnets.1.conv_shortcut.bias": "model.encoder.middle.2.shortcut.bias",
|
|
100
|
+
"model.encoder.mid_block.resnets.1.conv_shortcut.weight": "model.encoder.middle.2.shortcut.weight",
|
|
101
|
+
"model.encoder.mid_block.resnets.1.conv1.bias": "model.encoder.middle.2.residual.2.bias",
|
|
102
|
+
"model.encoder.mid_block.resnets.1.conv1.weight": "model.encoder.middle.2.residual.2.weight",
|
|
103
|
+
"model.encoder.mid_block.resnets.1.conv2.bias": "model.encoder.middle.2.residual.6.bias",
|
|
104
|
+
"model.encoder.mid_block.resnets.1.conv2.weight": "model.encoder.middle.2.residual.6.weight",
|
|
105
|
+
"model.encoder.mid_block.resnets.1.norm1.gamma": "model.encoder.middle.2.residual.0.gamma",
|
|
106
|
+
"model.encoder.mid_block.resnets.1.norm2.gamma": "model.encoder.middle.2.residual.3.gamma",
|
|
107
|
+
"model.encoder.norm_out.gamma": "model.encoder.head.0.gamma",
|
|
108
|
+
"model.encoder.conv_out.bias": "model.encoder.head.2.bias",
|
|
109
|
+
"model.encoder.conv_out.weight": "model.encoder.head.2.weight",
|
|
110
|
+
"model.decoder.conv_in.bias": "model.decoder.conv1.bias",
|
|
111
|
+
"model.decoder.conv_in.weight": "model.decoder.conv1.weight",
|
|
112
|
+
"model.decoder.mid_block.attentions.0.norm.gamma": "model.decoder.middle.1.norm.gamma",
|
|
113
|
+
"model.decoder.mid_block.attentions.0.proj.bias": "model.decoder.middle.1.proj.bias",
|
|
114
|
+
"model.decoder.mid_block.attentions.0.proj.weight": "model.decoder.middle.1.proj.weight",
|
|
115
|
+
"model.decoder.mid_block.attentions.0.to_qkv.bias": "model.decoder.middle.1.to_qkv.bias",
|
|
116
|
+
"model.decoder.mid_block.attentions.0.to_qkv.weight": "model.decoder.middle.1.to_qkv.weight",
|
|
117
|
+
"model.decoder.mid_block.resnets.0.conv_shortcut.bias": "model.decoder.middle.0.shortcut.bias",
|
|
118
|
+
"model.decoder.mid_block.resnets.0.conv_shortcut.weight": "model.decoder.middle.0.shortcut.weight",
|
|
119
|
+
"model.decoder.mid_block.resnets.0.conv1.bias": "model.decoder.middle.0.residual.2.bias",
|
|
120
|
+
"model.decoder.mid_block.resnets.0.conv1.weight": "model.decoder.middle.0.residual.2.weight",
|
|
121
|
+
"model.decoder.mid_block.resnets.0.conv2.bias": "model.decoder.middle.0.residual.6.bias",
|
|
122
|
+
"model.decoder.mid_block.resnets.0.conv2.weight": "model.decoder.middle.0.residual.6.weight",
|
|
123
|
+
"model.decoder.mid_block.resnets.0.norm1.gamma": "model.decoder.middle.0.residual.0.gamma",
|
|
124
|
+
"model.decoder.mid_block.resnets.0.norm2.gamma": "model.decoder.middle.0.residual.3.gamma",
|
|
125
|
+
"model.decoder.mid_block.resnets.1.conv_shortcut.bias": "model.decoder.middle.2.shortcut.bias",
|
|
126
|
+
"model.decoder.mid_block.resnets.1.conv_shortcut.weight": "model.decoder.middle.2.shortcut.weight",
|
|
127
|
+
"model.decoder.mid_block.resnets.1.conv1.bias": "model.decoder.middle.2.residual.2.bias",
|
|
128
|
+
"model.decoder.mid_block.resnets.1.conv1.weight": "model.decoder.middle.2.residual.2.weight",
|
|
129
|
+
"model.decoder.mid_block.resnets.1.conv2.bias": "model.decoder.middle.2.residual.6.bias",
|
|
130
|
+
"model.decoder.mid_block.resnets.1.conv2.weight": "model.decoder.middle.2.residual.6.weight",
|
|
131
|
+
"model.decoder.mid_block.resnets.1.norm1.gamma": "model.decoder.middle.2.residual.0.gamma",
|
|
132
|
+
"model.decoder.mid_block.resnets.1.norm2.gamma": "model.decoder.middle.2.residual.3.gamma",
|
|
133
|
+
"model.decoder.up_blocks.0.resnets.0.conv_shortcut.bias": "model.decoder.upsamples.0.shortcut.bias",
|
|
134
|
+
"model.decoder.up_blocks.0.resnets.0.conv_shortcut.weight": "model.decoder.upsamples.0.shortcut.weight",
|
|
135
|
+
"model.decoder.up_blocks.0.resnets.0.conv1.bias": "model.decoder.upsamples.0.residual.2.bias",
|
|
136
|
+
"model.decoder.up_blocks.0.resnets.0.conv1.weight": "model.decoder.upsamples.0.residual.2.weight",
|
|
137
|
+
"model.decoder.up_blocks.0.resnets.0.conv2.bias": "model.decoder.upsamples.0.residual.6.bias",
|
|
138
|
+
"model.decoder.up_blocks.0.resnets.0.conv2.weight": "model.decoder.upsamples.0.residual.6.weight",
|
|
139
|
+
"model.decoder.up_blocks.0.resnets.0.norm1.gamma": "model.decoder.upsamples.0.residual.0.gamma",
|
|
140
|
+
"model.decoder.up_blocks.0.resnets.0.norm2.gamma": "model.decoder.upsamples.0.residual.3.gamma",
|
|
141
|
+
"model.decoder.up_blocks.0.resnets.1.conv_shortcut.bias": "model.decoder.upsamples.1.shortcut.bias",
|
|
142
|
+
"model.decoder.up_blocks.0.resnets.1.conv_shortcut.weight": "model.decoder.upsamples.1.shortcut.weight",
|
|
143
|
+
"model.decoder.up_blocks.0.resnets.1.conv1.bias": "model.decoder.upsamples.1.residual.2.bias",
|
|
144
|
+
"model.decoder.up_blocks.0.resnets.1.conv1.weight": "model.decoder.upsamples.1.residual.2.weight",
|
|
145
|
+
"model.decoder.up_blocks.0.resnets.1.conv2.bias": "model.decoder.upsamples.1.residual.6.bias",
|
|
146
|
+
"model.decoder.up_blocks.0.resnets.1.conv2.weight": "model.decoder.upsamples.1.residual.6.weight",
|
|
147
|
+
"model.decoder.up_blocks.0.resnets.1.norm1.gamma": "model.decoder.upsamples.1.residual.0.gamma",
|
|
148
|
+
"model.decoder.up_blocks.0.resnets.1.norm2.gamma": "model.decoder.upsamples.1.residual.3.gamma",
|
|
149
|
+
"model.decoder.up_blocks.0.resnets.2.conv_shortcut.bias": "model.decoder.upsamples.2.shortcut.bias",
|
|
150
|
+
"model.decoder.up_blocks.0.resnets.2.conv_shortcut.weight": "model.decoder.upsamples.2.shortcut.weight",
|
|
151
|
+
"model.decoder.up_blocks.0.resnets.2.conv1.bias": "model.decoder.upsamples.2.residual.2.bias",
|
|
152
|
+
"model.decoder.up_blocks.0.resnets.2.conv1.weight": "model.decoder.upsamples.2.residual.2.weight",
|
|
153
|
+
"model.decoder.up_blocks.0.resnets.2.conv2.bias": "model.decoder.upsamples.2.residual.6.bias",
|
|
154
|
+
"model.decoder.up_blocks.0.resnets.2.conv2.weight": "model.decoder.upsamples.2.residual.6.weight",
|
|
155
|
+
"model.decoder.up_blocks.0.resnets.2.norm1.gamma": "model.decoder.upsamples.2.residual.0.gamma",
|
|
156
|
+
"model.decoder.up_blocks.0.resnets.2.norm2.gamma": "model.decoder.upsamples.2.residual.3.gamma",
|
|
157
|
+
"model.decoder.up_blocks.0.upsamplers.0.resample.1.bias": "model.decoder.upsamples.3.resample.1.bias",
|
|
158
|
+
"model.decoder.up_blocks.0.upsamplers.0.resample.1.weight": "model.decoder.upsamples.3.resample.1.weight",
|
|
159
|
+
"model.decoder.up_blocks.0.upsamplers.0.time_conv.bias": "model.decoder.upsamples.3.time_conv.bias",
|
|
160
|
+
"model.decoder.up_blocks.0.upsamplers.0.time_conv.weight": "model.decoder.upsamples.3.time_conv.weight",
|
|
161
|
+
"model.decoder.up_blocks.1.resnets.0.conv_shortcut.bias": "model.decoder.upsamples.4.shortcut.bias",
|
|
162
|
+
"model.decoder.up_blocks.1.resnets.0.conv_shortcut.weight": "model.decoder.upsamples.4.shortcut.weight",
|
|
163
|
+
"model.decoder.up_blocks.1.resnets.0.conv1.bias": "model.decoder.upsamples.4.residual.2.bias",
|
|
164
|
+
"model.decoder.up_blocks.1.resnets.0.conv1.weight": "model.decoder.upsamples.4.residual.2.weight",
|
|
165
|
+
"model.decoder.up_blocks.1.resnets.0.conv2.bias": "model.decoder.upsamples.4.residual.6.bias",
|
|
166
|
+
"model.decoder.up_blocks.1.resnets.0.conv2.weight": "model.decoder.upsamples.4.residual.6.weight",
|
|
167
|
+
"model.decoder.up_blocks.1.resnets.0.norm1.gamma": "model.decoder.upsamples.4.residual.0.gamma",
|
|
168
|
+
"model.decoder.up_blocks.1.resnets.0.norm2.gamma": "model.decoder.upsamples.4.residual.3.gamma",
|
|
169
|
+
"model.decoder.up_blocks.1.resnets.1.conv_shortcut.bias": "model.decoder.upsamples.5.shortcut.bias",
|
|
170
|
+
"model.decoder.up_blocks.1.resnets.1.conv_shortcut.weight": "model.decoder.upsamples.5.shortcut.weight",
|
|
171
|
+
"model.decoder.up_blocks.1.resnets.1.conv1.bias": "model.decoder.upsamples.5.residual.2.bias",
|
|
172
|
+
"model.decoder.up_blocks.1.resnets.1.conv1.weight": "model.decoder.upsamples.5.residual.2.weight",
|
|
173
|
+
"model.decoder.up_blocks.1.resnets.1.conv2.bias": "model.decoder.upsamples.5.residual.6.bias",
|
|
174
|
+
"model.decoder.up_blocks.1.resnets.1.conv2.weight": "model.decoder.upsamples.5.residual.6.weight",
|
|
175
|
+
"model.decoder.up_blocks.1.resnets.1.norm1.gamma": "model.decoder.upsamples.5.residual.0.gamma",
|
|
176
|
+
"model.decoder.up_blocks.1.resnets.1.norm2.gamma": "model.decoder.upsamples.5.residual.3.gamma",
|
|
177
|
+
"model.decoder.up_blocks.1.resnets.2.conv_shortcut.bias": "model.decoder.upsamples.6.shortcut.bias",
|
|
178
|
+
"model.decoder.up_blocks.1.resnets.2.conv_shortcut.weight": "model.decoder.upsamples.6.shortcut.weight",
|
|
179
|
+
"model.decoder.up_blocks.1.resnets.2.conv1.bias": "model.decoder.upsamples.6.residual.2.bias",
|
|
180
|
+
"model.decoder.up_blocks.1.resnets.2.conv1.weight": "model.decoder.upsamples.6.residual.2.weight",
|
|
181
|
+
"model.decoder.up_blocks.1.resnets.2.conv2.bias": "model.decoder.upsamples.6.residual.6.bias",
|
|
182
|
+
"model.decoder.up_blocks.1.resnets.2.conv2.weight": "model.decoder.upsamples.6.residual.6.weight",
|
|
183
|
+
"model.decoder.up_blocks.1.resnets.2.norm1.gamma": "model.decoder.upsamples.6.residual.0.gamma",
|
|
184
|
+
"model.decoder.up_blocks.1.resnets.2.norm2.gamma": "model.decoder.upsamples.6.residual.3.gamma",
|
|
185
|
+
"model.decoder.up_blocks.1.upsamplers.0.resample.1.bias": "model.decoder.upsamples.7.resample.1.bias",
|
|
186
|
+
"model.decoder.up_blocks.1.upsamplers.0.resample.1.weight": "model.decoder.upsamples.7.resample.1.weight",
|
|
187
|
+
"model.decoder.up_blocks.1.upsamplers.0.time_conv.bias": "model.decoder.upsamples.7.time_conv.bias",
|
|
188
|
+
"model.decoder.up_blocks.1.upsamplers.0.time_conv.weight": "model.decoder.upsamples.7.time_conv.weight",
|
|
189
|
+
"model.decoder.up_blocks.2.resnets.0.conv_shortcut.bias": "model.decoder.upsamples.8.shortcut.bias",
|
|
190
|
+
"model.decoder.up_blocks.2.resnets.0.conv_shortcut.weight": "model.decoder.upsamples.8.shortcut.weight",
|
|
191
|
+
"model.decoder.up_blocks.2.resnets.0.conv1.bias": "model.decoder.upsamples.8.residual.2.bias",
|
|
192
|
+
"model.decoder.up_blocks.2.resnets.0.conv1.weight": "model.decoder.upsamples.8.residual.2.weight",
|
|
193
|
+
"model.decoder.up_blocks.2.resnets.0.conv2.bias": "model.decoder.upsamples.8.residual.6.bias",
|
|
194
|
+
"model.decoder.up_blocks.2.resnets.0.conv2.weight": "model.decoder.upsamples.8.residual.6.weight",
|
|
195
|
+
"model.decoder.up_blocks.2.resnets.0.norm1.gamma": "model.decoder.upsamples.8.residual.0.gamma",
|
|
196
|
+
"model.decoder.up_blocks.2.resnets.0.norm2.gamma": "model.decoder.upsamples.8.residual.3.gamma",
|
|
197
|
+
"model.decoder.up_blocks.2.resnets.1.conv_shortcut.bias": "model.decoder.upsamples.9.shortcut.bias",
|
|
198
|
+
"model.decoder.up_blocks.2.resnets.1.conv_shortcut.weight": "model.decoder.upsamples.9.shortcut.weight",
|
|
199
|
+
"model.decoder.up_blocks.2.resnets.1.conv1.bias": "model.decoder.upsamples.9.residual.2.bias",
|
|
200
|
+
"model.decoder.up_blocks.2.resnets.1.conv1.weight": "model.decoder.upsamples.9.residual.2.weight",
|
|
201
|
+
"model.decoder.up_blocks.2.resnets.1.conv2.bias": "model.decoder.upsamples.9.residual.6.bias",
|
|
202
|
+
"model.decoder.up_blocks.2.resnets.1.conv2.weight": "model.decoder.upsamples.9.residual.6.weight",
|
|
203
|
+
"model.decoder.up_blocks.2.resnets.1.norm1.gamma": "model.decoder.upsamples.9.residual.0.gamma",
|
|
204
|
+
"model.decoder.up_blocks.2.resnets.1.norm2.gamma": "model.decoder.upsamples.9.residual.3.gamma",
|
|
205
|
+
"model.decoder.up_blocks.2.resnets.2.conv_shortcut.bias": "model.decoder.upsamples.10.shortcut.bias",
|
|
206
|
+
"model.decoder.up_blocks.2.resnets.2.conv_shortcut.weight": "model.decoder.upsamples.10.shortcut.weight",
|
|
207
|
+
"model.decoder.up_blocks.2.resnets.2.conv1.bias": "model.decoder.upsamples.10.residual.2.bias",
|
|
208
|
+
"model.decoder.up_blocks.2.resnets.2.conv1.weight": "model.decoder.upsamples.10.residual.2.weight",
|
|
209
|
+
"model.decoder.up_blocks.2.resnets.2.conv2.bias": "model.decoder.upsamples.10.residual.6.bias",
|
|
210
|
+
"model.decoder.up_blocks.2.resnets.2.conv2.weight": "model.decoder.upsamples.10.residual.6.weight",
|
|
211
|
+
"model.decoder.up_blocks.2.resnets.2.norm1.gamma": "model.decoder.upsamples.10.residual.0.gamma",
|
|
212
|
+
"model.decoder.up_blocks.2.resnets.2.norm2.gamma": "model.decoder.upsamples.10.residual.3.gamma",
|
|
213
|
+
"model.decoder.up_blocks.2.upsamplers.0.resample.1.bias": "model.decoder.upsamples.11.resample.1.bias",
|
|
214
|
+
"model.decoder.up_blocks.2.upsamplers.0.resample.1.weight": "model.decoder.upsamples.11.resample.1.weight",
|
|
215
|
+
"model.decoder.up_blocks.3.resnets.0.conv_shortcut.bias": "model.decoder.upsamples.12.shortcut.bias",
|
|
216
|
+
"model.decoder.up_blocks.3.resnets.0.conv_shortcut.weight": "model.decoder.upsamples.12.shortcut.weight",
|
|
217
|
+
"model.decoder.up_blocks.3.resnets.0.conv1.bias": "model.decoder.upsamples.12.residual.2.bias",
|
|
218
|
+
"model.decoder.up_blocks.3.resnets.0.conv1.weight": "model.decoder.upsamples.12.residual.2.weight",
|
|
219
|
+
"model.decoder.up_blocks.3.resnets.0.conv2.bias": "model.decoder.upsamples.12.residual.6.bias",
|
|
220
|
+
"model.decoder.up_blocks.3.resnets.0.conv2.weight": "model.decoder.upsamples.12.residual.6.weight",
|
|
221
|
+
"model.decoder.up_blocks.3.resnets.0.norm1.gamma": "model.decoder.upsamples.12.residual.0.gamma",
|
|
222
|
+
"model.decoder.up_blocks.3.resnets.0.norm2.gamma": "model.decoder.upsamples.12.residual.3.gamma",
|
|
223
|
+
"model.decoder.up_blocks.3.resnets.1.conv_shortcut.bias": "model.decoder.upsamples.13.shortcut.bias",
|
|
224
|
+
"model.decoder.up_blocks.3.resnets.1.conv_shortcut.weight": "model.decoder.upsamples.13.shortcut.weight",
|
|
225
|
+
"model.decoder.up_blocks.3.resnets.1.conv1.bias": "model.decoder.upsamples.13.residual.2.bias",
|
|
226
|
+
"model.decoder.up_blocks.3.resnets.1.conv1.weight": "model.decoder.upsamples.13.residual.2.weight",
|
|
227
|
+
"model.decoder.up_blocks.3.resnets.1.conv2.bias": "model.decoder.upsamples.13.residual.6.bias",
|
|
228
|
+
"model.decoder.up_blocks.3.resnets.1.conv2.weight": "model.decoder.upsamples.13.residual.6.weight",
|
|
229
|
+
"model.decoder.up_blocks.3.resnets.1.norm1.gamma": "model.decoder.upsamples.13.residual.0.gamma",
|
|
230
|
+
"model.decoder.up_blocks.3.resnets.1.norm2.gamma": "model.decoder.upsamples.13.residual.3.gamma",
|
|
231
|
+
"model.decoder.up_blocks.3.resnets.2.conv_shortcut.bias": "model.decoder.upsamples.14.shortcut.bias",
|
|
232
|
+
"model.decoder.up_blocks.3.resnets.2.conv_shortcut.weight": "model.decoder.upsamples.14.shortcut.weight",
|
|
233
|
+
"model.decoder.up_blocks.3.resnets.2.conv1.bias": "model.decoder.upsamples.14.residual.2.bias",
|
|
234
|
+
"model.decoder.up_blocks.3.resnets.2.conv1.weight": "model.decoder.upsamples.14.residual.2.weight",
|
|
235
|
+
"model.decoder.up_blocks.3.resnets.2.conv2.bias": "model.decoder.upsamples.14.residual.6.bias",
|
|
236
|
+
"model.decoder.up_blocks.3.resnets.2.conv2.weight": "model.decoder.upsamples.14.residual.6.weight",
|
|
237
|
+
"model.decoder.up_blocks.3.resnets.2.norm1.gamma": "model.decoder.upsamples.14.residual.0.gamma",
|
|
238
|
+
"model.decoder.up_blocks.3.resnets.2.norm2.gamma": "model.decoder.upsamples.14.residual.3.gamma",
|
|
239
|
+
"model.decoder.norm_out.gamma": "model.decoder.head.0.gamma",
|
|
240
|
+
"model.decoder.conv_out.bias": "model.decoder.head.2.bias",
|
|
241
|
+
"model.decoder.conv_out.weight": "model.decoder.head.2.weight"
|
|
242
|
+
}
|
|
243
|
+
}
|
|
244
|
+
}
|