diffsynth 2.0.8__tar.gz → 2.0.9__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (152)
  1. {diffsynth-2.0.8 → diffsynth-2.0.9}/PKG-INFO +1 -1
  2. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/core/data/operators.py +17 -13
  3. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth.egg-info/PKG-INFO +1 -1
  4. {diffsynth-2.0.8 → diffsynth-2.0.9}/pyproject.toml +1 -1
  5. {diffsynth-2.0.8 → diffsynth-2.0.9}/LICENSE +0 -0
  6. {diffsynth-2.0.8 → diffsynth-2.0.9}/README.md +0 -0
  7. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/__init__.py +0 -0
  8. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/configs/__init__.py +0 -0
  9. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/configs/model_configs.py +0 -0
  10. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/configs/vram_management_module_maps.py +0 -0
  11. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/core/__init__.py +0 -0
  12. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/core/attention/__init__.py +0 -0
  13. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/core/attention/attention.py +0 -0
  14. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/core/data/__init__.py +0 -0
  15. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/core/data/unified_dataset.py +0 -0
  16. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/core/device/__init__.py +0 -0
  17. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/core/device/npu_compatible_device.py +0 -0
  18. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/core/gradient/__init__.py +0 -0
  19. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/core/gradient/gradient_checkpoint.py +0 -0
  20. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/core/loader/__init__.py +0 -0
  21. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/core/loader/config.py +0 -0
  22. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/core/loader/file.py +0 -0
  23. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/core/loader/model.py +0 -0
  24. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/core/npu_patch/npu_fused_operator.py +0 -0
  25. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/core/vram/__init__.py +0 -0
  26. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/core/vram/disk_map.py +0 -0
  27. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/core/vram/initialization.py +0 -0
  28. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/core/vram/layers.py +0 -0
  29. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/diffusion/__init__.py +0 -0
  30. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/diffusion/base_pipeline.py +0 -0
  31. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/diffusion/flow_match.py +0 -0
  32. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/diffusion/logger.py +0 -0
  33. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/diffusion/loss.py +0 -0
  34. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/diffusion/parsers.py +0 -0
  35. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/diffusion/runner.py +0 -0
  36. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/diffusion/training_module.py +0 -0
  37. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/anima_dit.py +0 -0
  38. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/dinov3_image_encoder.py +0 -0
  39. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/ernie_image_dit.py +0 -0
  40. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/ernie_image_text_encoder.py +0 -0
  41. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/flux2_dit.py +0 -0
  42. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/flux2_text_encoder.py +0 -0
  43. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/flux2_vae.py +0 -0
  44. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/flux_controlnet.py +0 -0
  45. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/flux_dit.py +0 -0
  46. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/flux_infiniteyou.py +0 -0
  47. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/flux_ipadapter.py +0 -0
  48. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/flux_lora_encoder.py +0 -0
  49. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/flux_lora_patcher.py +0 -0
  50. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/flux_text_encoder_clip.py +0 -0
  51. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/flux_text_encoder_t5.py +0 -0
  52. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/flux_vae.py +0 -0
  53. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/flux_value_control.py +0 -0
  54. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/general_modules.py +0 -0
  55. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/longcat_video_dit.py +0 -0
  56. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/ltx2_audio_vae.py +0 -0
  57. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/ltx2_common.py +0 -0
  58. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/ltx2_dit.py +0 -0
  59. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/ltx2_text_encoder.py +0 -0
  60. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/ltx2_upsampler.py +0 -0
  61. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/ltx2_video_vae.py +0 -0
  62. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/model_loader.py +0 -0
  63. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/mova_audio_dit.py +0 -0
  64. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/mova_audio_vae.py +0 -0
  65. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/mova_dual_tower_bridge.py +0 -0
  66. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/nexus_gen.py +0 -0
  67. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/nexus_gen_ar_model.py +0 -0
  68. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/nexus_gen_projector.py +0 -0
  69. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/qwen_image_controlnet.py +0 -0
  70. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/qwen_image_dit.py +0 -0
  71. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/qwen_image_image2lora.py +0 -0
  72. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/qwen_image_text_encoder.py +0 -0
  73. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/qwen_image_vae.py +0 -0
  74. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/sd_text_encoder.py +0 -0
  75. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/siglip2_image_encoder.py +0 -0
  76. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/step1x_connector.py +0 -0
  77. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/step1x_text_encoder.py +0 -0
  78. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/wan_video_animate_adapter.py +0 -0
  79. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/wan_video_camera_controller.py +0 -0
  80. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/wan_video_dit.py +0 -0
  81. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/wan_video_dit_s2v.py +0 -0
  82. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/wan_video_image_encoder.py +0 -0
  83. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/wan_video_mot.py +0 -0
  84. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/wan_video_motion_controller.py +0 -0
  85. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/wan_video_text_encoder.py +0 -0
  86. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/wan_video_vace.py +0 -0
  87. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/wan_video_vae.py +0 -0
  88. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/wantodance.py +0 -0
  89. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/wav2vec.py +0 -0
  90. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/z_image_controlnet.py +0 -0
  91. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/z_image_dit.py +0 -0
  92. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/z_image_image2lora.py +0 -0
  93. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/models/z_image_text_encoder.py +0 -0
  94. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/pipelines/anima_image.py +0 -0
  95. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/pipelines/ernie_image.py +0 -0
  96. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/pipelines/flux2_image.py +0 -0
  97. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/pipelines/flux_image.py +0 -0
  98. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/pipelines/ltx2_audio_video.py +0 -0
  99. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/pipelines/mova_audio_video.py +0 -0
  100. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/pipelines/qwen_image.py +0 -0
  101. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/pipelines/wan_video.py +0 -0
  102. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/pipelines/z_image.py +0 -0
  103. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/utils/controlnet/__init__.py +0 -0
  104. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/utils/controlnet/annotator.py +0 -0
  105. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/utils/controlnet/controlnet_input.py +0 -0
  106. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/utils/data/__init__.py +0 -0
  107. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/utils/data/audio.py +0 -0
  108. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/utils/data/audio_video.py +0 -0
  109. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/utils/data/media_io_ltx2.py +0 -0
  110. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/utils/lora/__init__.py +0 -0
  111. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/utils/lora/flux.py +0 -0
  112. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/utils/lora/general.py +0 -0
  113. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/utils/lora/merge.py +0 -0
  114. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/utils/lora/reset_rank.py +0 -0
  115. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/utils/ses/__init__.py +0 -0
  116. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/utils/ses/ses.py +0 -0
  117. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/utils/state_dict_converters/__init__.py +0 -0
  118. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/utils/state_dict_converters/anima_dit.py +0 -0
  119. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/utils/state_dict_converters/ernie_image_text_encoder.py +0 -0
  120. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/utils/state_dict_converters/flux2_text_encoder.py +0 -0
  121. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/utils/state_dict_converters/flux_controlnet.py +0 -0
  122. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/utils/state_dict_converters/flux_dit.py +0 -0
  123. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/utils/state_dict_converters/flux_infiniteyou.py +0 -0
  124. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/utils/state_dict_converters/flux_ipadapter.py +0 -0
  125. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/utils/state_dict_converters/flux_text_encoder_clip.py +0 -0
  126. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/utils/state_dict_converters/flux_text_encoder_t5.py +0 -0
  127. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/utils/state_dict_converters/flux_vae.py +0 -0
  128. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/utils/state_dict_converters/ltx2_audio_vae.py +0 -0
  129. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/utils/state_dict_converters/ltx2_dit.py +0 -0
  130. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/utils/state_dict_converters/ltx2_text_encoder.py +0 -0
  131. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/utils/state_dict_converters/ltx2_video_vae.py +0 -0
  132. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/utils/state_dict_converters/nexus_gen.py +0 -0
  133. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/utils/state_dict_converters/nexus_gen_projector.py +0 -0
  134. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/utils/state_dict_converters/qwen_image_text_encoder.py +0 -0
  135. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/utils/state_dict_converters/step1x_connector.py +0 -0
  136. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/utils/state_dict_converters/wan_video_animate_adapter.py +0 -0
  137. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/utils/state_dict_converters/wan_video_dit.py +0 -0
  138. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/utils/state_dict_converters/wan_video_image_encoder.py +0 -0
  139. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/utils/state_dict_converters/wan_video_mot.py +0 -0
  140. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/utils/state_dict_converters/wan_video_vace.py +0 -0
  141. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/utils/state_dict_converters/wan_video_vae.py +0 -0
  142. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/utils/state_dict_converters/wans2v_audio_encoder.py +0 -0
  143. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/utils/state_dict_converters/z_image_dit.py +0 -0
  144. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/utils/state_dict_converters/z_image_text_encoder.py +0 -0
  145. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/utils/xfuser/__init__.py +0 -0
  146. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/utils/xfuser/xdit_context_parallel.py +0 -0
  147. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth/version.py +0 -0
  148. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth.egg-info/SOURCES.txt +0 -0
  149. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth.egg-info/dependency_links.txt +0 -0
  150. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth.egg-info/requires.txt +0 -0
  151. {diffsynth-2.0.8 → diffsynth-2.0.9}/diffsynth.egg-info/top_level.txt +0 -0
  152. {diffsynth-2.0.8 → diffsynth-2.0.9}/setup.cfg +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: diffsynth
3
- Version: 2.0.8
3
+ Version: 2.0.9
4
4
  Summary: Enjoy the magic of Diffusion models!
5
5
  Author: ModelScope Team
6
6
  License: Apache-2.0
@@ -1,4 +1,4 @@
1
- import math
1
+ import math, warnings
2
2
  import torch, torchvision, imageio, os
3
3
  import imageio.v3 as iio
4
4
  from PIL import Image
@@ -260,15 +260,19 @@ class LoadAudioWithTorchaudio(DataProcessingOperator, FrameSamplerByRateMixin):
260
260
  FrameSamplerByRateMixin.__init__(self, num_frames, time_division_factor, time_division_remainder, frame_rate, fix_frame_rate)
261
261
 
262
262
  def __call__(self, data: str):
263
- reader = self.get_reader(data)
264
- num_frames = self.get_num_frames(reader)
265
- duration = num_frames / self.frame_rate
266
- waveform, sample_rate = torchaudio.load(data)
267
- target_samples = int(duration * sample_rate)
268
- current_samples = waveform.shape[-1]
269
- if current_samples > target_samples:
270
- waveform = waveform[..., :target_samples]
271
- elif current_samples < target_samples:
272
- padding = target_samples - current_samples
273
- waveform = torch.nn.functional.pad(waveform, (0, padding))
274
- return waveform, sample_rate
263
+ try:
264
+ reader = self.get_reader(data)
265
+ num_frames = self.get_num_frames(reader)
266
+ duration = num_frames / self.frame_rate
267
+ waveform, sample_rate = torchaudio.load(data)
268
+ target_samples = int(duration * sample_rate)
269
+ current_samples = waveform.shape[-1]
270
+ if current_samples > target_samples:
271
+ waveform = waveform[..., :target_samples]
272
+ elif current_samples < target_samples:
273
+ padding = target_samples - current_samples
274
+ waveform = torch.nn.functional.pad(waveform, (0, padding))
275
+ return waveform, sample_rate
276
+ except:
277
+ warnings.warn(f"Cannot load audio in {data}. The audio will be `None`.")
278
+ return None
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: diffsynth
3
- Version: 2.0.8
3
+ Version: 2.0.9
4
4
  Summary: Enjoy the magic of Diffusion models!
5
5
  Author: ModelScope Team
6
6
  License: Apache-2.0
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
4
4
 
5
5
  [project]
6
6
  name = "diffsynth"
7
- version = "2.0.8"
7
+ version = "2.0.9"
8
8
  description = "Enjoy the magic of Diffusion models!"
9
9
  authors = [{name = "ModelScope Team"}]
10
10
  license = {text = "Apache-2.0"}
File without changes
File without changes
File without changes