minicpmo-utils 0.0.5__tar.gz → 0.0.9__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (153)
  1. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/PKG-INFO +11 -15
  2. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/pyproject.toml +26 -20
  3. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/minicpmo/utils.py +1 -88
  4. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/minicpmo_utils.egg-info/PKG-INFO +11 -15
  5. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/minicpmo_utils.egg-info/requires.txt +10 -20
  6. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/README.md +0 -0
  7. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/setup.cfg +0 -0
  8. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/__init__.py +0 -0
  9. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/bin/average_model.py +0 -0
  10. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/bin/export_jit.py +0 -0
  11. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/bin/export_onnx.py +0 -0
  12. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/bin/inference_deprecated.py +0 -0
  13. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/bin/train.py +0 -0
  14. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/cli/__init__.py +0 -0
  15. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/cli/cosyvoice.py +0 -0
  16. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/cli/frontend.py +0 -0
  17. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/cli/model.py +0 -0
  18. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/dataset/__init__.py +0 -0
  19. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/dataset/dataset.py +0 -0
  20. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/dataset/processor.py +0 -0
  21. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/flow/decoder.py +0 -0
  22. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/flow/flow.py +0 -0
  23. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/flow/flow_matching.py +0 -0
  24. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/flow/length_regulator.py +0 -0
  25. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/hifigan/discriminator.py +0 -0
  26. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/hifigan/f0_predictor.py +0 -0
  27. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/hifigan/generator.py +0 -0
  28. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/hifigan/hifigan.py +0 -0
  29. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/llm/llm.py +0 -0
  30. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/tokenizer/assets/multilingual_zh_ja_yue_char_del.tiktoken +0 -0
  31. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/tokenizer/tokenizer.py +0 -0
  32. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/transformer/__init__.py +0 -0
  33. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/transformer/activation.py +0 -0
  34. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/transformer/attention.py +0 -0
  35. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/transformer/convolution.py +0 -0
  36. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/transformer/decoder.py +0 -0
  37. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/transformer/decoder_layer.py +0 -0
  38. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/transformer/embedding.py +0 -0
  39. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/transformer/encoder.py +0 -0
  40. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/transformer/encoder_layer.py +0 -0
  41. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/transformer/label_smoothing_loss.py +0 -0
  42. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/transformer/positionwise_feed_forward.py +0 -0
  43. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/transformer/subsampling.py +0 -0
  44. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/transformer/upsample_encoder.py +0 -0
  45. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/utils/__init__.py +0 -0
  46. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/utils/class_utils.py +0 -0
  47. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/utils/common.py +0 -0
  48. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/utils/executor.py +0 -0
  49. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/utils/file_utils.py +0 -0
  50. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/utils/frontend_utils.py +0 -0
  51. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/utils/losses.py +0 -0
  52. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/utils/mask.py +0 -0
  53. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/utils/scheduler.py +0 -0
  54. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/utils/train_utils.py +0 -0
  55. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/cosyvoice/vllm/cosyvoice2.py +0 -0
  56. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/matcha/__init__.py +0 -0
  57. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/matcha/app.py +0 -0
  58. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/matcha/cli.py +0 -0
  59. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/matcha/hifigan/__init__.py +0 -0
  60. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/matcha/hifigan/config.py +0 -0
  61. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/matcha/hifigan/denoiser.py +0 -0
  62. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/matcha/hifigan/env.py +0 -0
  63. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/matcha/hifigan/meldataset.py +0 -0
  64. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/matcha/hifigan/models.py +0 -0
  65. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/matcha/hifigan/xutils.py +0 -0
  66. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/matcha/models/__init__.py +0 -0
  67. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/matcha/models/baselightningmodule.py +0 -0
  68. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/matcha/models/components/__init__.py +0 -0
  69. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/matcha/models/components/decoder.py +0 -0
  70. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/matcha/models/components/flow_matching.py +0 -0
  71. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/matcha/models/components/text_encoder.py +0 -0
  72. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/matcha/models/components/transformer.py +0 -0
  73. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/matcha/models/matcha_tts.py +0 -0
  74. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/matcha/onnx/__init__.py +0 -0
  75. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/matcha/onnx/export.py +0 -0
  76. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/matcha/onnx/infer.py +0 -0
  77. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/matcha/text/__init__.py +0 -0
  78. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/matcha/text/cleaners.py +0 -0
  79. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/matcha/text/numbers.py +0 -0
  80. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/matcha/text/symbols.py +0 -0
  81. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/matcha/train.py +0 -0
  82. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/matcha/utils/__init__.py +0 -0
  83. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/matcha/utils/audio.py +0 -0
  84. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/matcha/utils/generate_data_statistics.py +0 -0
  85. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/matcha/utils/instantiators.py +0 -0
  86. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/matcha/utils/logging_utils.py +0 -0
  87. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/matcha/utils/model.py +0 -0
  88. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/matcha/utils/monotonic_align/__init__.py +0 -0
  89. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/matcha/utils/monotonic_align/setup.py +0 -0
  90. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/matcha/utils/pylogger.py +0 -0
  91. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/matcha/utils/rich_utils.py +0 -0
  92. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/matcha/utils/utils.py +0 -0
  93. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/minicpmo/__init__.py +0 -0
  94. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/minicpmo/version.py +0 -0
  95. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/minicpmo_utils.egg-info/SOURCES.txt +0 -0
  96. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/minicpmo_utils.egg-info/dependency_links.txt +0 -0
  97. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/minicpmo_utils.egg-info/top_level.txt +0 -0
  98. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/s3tokenizer/__init__.py +0 -0
  99. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/s3tokenizer/assets/BAC009S0764W0121.wav +0 -0
  100. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/s3tokenizer/assets/BAC009S0764W0122.wav +0 -0
  101. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/s3tokenizer/assets/mel_filters.npz +0 -0
  102. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/s3tokenizer/cli.py +0 -0
  103. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/s3tokenizer/model.py +0 -0
  104. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/s3tokenizer/model_v2.py +0 -0
  105. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/s3tokenizer/utils.py +0 -0
  106. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/__init__.py +0 -0
  107. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/cosyvoice2/__init__.py +0 -0
  108. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/cosyvoice2/flow/__init__.py +0 -0
  109. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/cosyvoice2/flow/decoder_dit.py +0 -0
  110. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/cosyvoice2/flow/flow.py +0 -0
  111. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/cosyvoice2/flow/flow_matching.py +0 -0
  112. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/cosyvoice2/transformer/__init__.py +0 -0
  113. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/cosyvoice2/transformer/attention.py +0 -0
  114. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/cosyvoice2/transformer/embedding.py +0 -0
  115. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/cosyvoice2/transformer/encoder_layer.py +0 -0
  116. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/cosyvoice2/transformer/positionwise_feed_forward.py +0 -0
  117. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/cosyvoice2/transformer/subsampling.py +0 -0
  118. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/cosyvoice2/transformer/upsample_encoder_v2.py +0 -0
  119. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/cosyvoice2/utils/__init__.py +0 -0
  120. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/cosyvoice2/utils/class_utils.py +0 -0
  121. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/cosyvoice2/utils/common.py +0 -0
  122. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/cosyvoice2/utils/mask.py +0 -0
  123. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/flashcosyvoice/__init__.py +0 -0
  124. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/flashcosyvoice/cli.py +0 -0
  125. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/flashcosyvoice/config.py +0 -0
  126. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/flashcosyvoice/cosyvoice2.py +0 -0
  127. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/flashcosyvoice/cosyvoice3.py +0 -0
  128. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/flashcosyvoice/engine/__init__.py +0 -0
  129. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/flashcosyvoice/engine/block_manager.py +0 -0
  130. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/flashcosyvoice/engine/llm_engine.py +0 -0
  131. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/flashcosyvoice/engine/model_runner.py +0 -0
  132. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/flashcosyvoice/engine/scheduler.py +0 -0
  133. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/flashcosyvoice/engine/sequence.py +0 -0
  134. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/flashcosyvoice/modules/__init__.py +0 -0
  135. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/flashcosyvoice/modules/flow.py +0 -0
  136. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/flashcosyvoice/modules/flow_components/__init__.py +0 -0
  137. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/flashcosyvoice/modules/flow_components/estimator.py +0 -0
  138. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/flashcosyvoice/modules/flow_components/upsample_encoder.py +0 -0
  139. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/flashcosyvoice/modules/hifigan.py +0 -0
  140. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/flashcosyvoice/modules/hifigan_components/__init__.py +0 -0
  141. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/flashcosyvoice/modules/hifigan_components/layers.py +0 -0
  142. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/flashcosyvoice/modules/qwen2.py +0 -0
  143. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/flashcosyvoice/modules/qwen2_components/__init__.py +0 -0
  144. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/flashcosyvoice/modules/qwen2_components/layers.py +0 -0
  145. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/flashcosyvoice/modules/sampler.py +0 -0
  146. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/flashcosyvoice/utils/__init__.py +0 -0
  147. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/flashcosyvoice/utils/audio.py +0 -0
  148. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/flashcosyvoice/utils/context.py +0 -0
  149. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/flashcosyvoice/utils/loader.py +0 -0
  150. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/flashcosyvoice/utils/memory.py +0 -0
  151. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/stepaudio2.py +0 -0
  152. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/token2wav.py +0 -0
  153. {minicpmo_utils-0.0.5 → minicpmo_utils-0.0.9}/src/stepaudio2/utils.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: minicpmo-utils
3
- Version: 0.0.5
3
+ Version: 0.0.9
4
4
  Summary: Unified utilities package for MiniCPM-o: includes cosyvoice + stepaudio2 and extensible utils.
5
5
  Author: MiniCPM-o Utils Maintainers
6
6
  License: Apache-2.0
@@ -14,7 +14,11 @@ Classifier: Programming Language :: Python :: 3.11
14
14
  Classifier: Programming Language :: Python :: 3.12
15
15
  Requires-Python: >=3.10
16
16
  Description-Content-Type: text/markdown
17
- Requires-Dist: numpy
17
+ Requires-Dist: MarkupSafe>=2.1.0
18
+ Requires-Dist: Jinja2>=3.1.0
19
+ Requires-Dist: typing-extensions>=4.12.0
20
+ Requires-Dist: packaging>=23.0
21
+ Requires-Dist: numpy>=1.24.0
18
22
  Requires-Dist: pillow==10.4.0
19
23
  Requires-Dist: librosa==0.9.0
20
24
  Requires-Dist: decord==0.6.0
@@ -24,11 +28,12 @@ Provides-Extra: tts
24
28
  Requires-Dist: torch>=2.3.0; extra == "tts"
25
29
  Requires-Dist: torchaudio>=2.3.0; extra == "tts"
26
30
  Requires-Dist: transformers<4.53.0,>=4.51.0; extra == "tts"
31
+ Requires-Dist: safetensors>=0.4.3; extra == "tts"
27
32
  Requires-Dist: onnxruntime<=1.21.0,>=1.18.0; extra == "tts"
28
33
  Requires-Dist: onnx; extra == "tts"
29
34
  Requires-Dist: hyperpyyaml; extra == "tts"
30
- Requires-Dist: openai-whisper==20231117; extra == "tts"
31
- Requires-Dist: tqdm; extra == "tts"
35
+ Requires-Dist: openai-whisper; extra == "tts"
36
+ Requires-Dist: tqdm>=4.66.0; extra == "tts"
32
37
  Requires-Dist: tiktoken; extra == "tts"
33
38
  Requires-Dist: inflect; extra == "tts"
34
39
  Requires-Dist: omegaconf>=2.0.6; extra == "tts"
@@ -42,24 +47,15 @@ Requires-Dist: matplotlib; extra == "tts"
42
47
  Requires-Dist: wget; extra == "tts"
43
48
  Requires-Dist: pyarrow; extra == "tts"
44
49
  Requires-Dist: pyworld; extra == "tts"
45
- Requires-Dist: scipy; extra == "tts"
50
+ Requires-Dist: scipy>=1.10.0; extra == "tts"
46
51
  Requires-Dist: pyyaml; extra == "tts"
47
52
  Requires-Dist: regex; extra == "tts"
48
53
  Requires-Dist: soundfile==0.12.1; extra == "tts"
49
54
  Requires-Dist: diffusers==0.29.0; extra == "tts"
50
55
  Provides-Extra: streaming
51
56
  Requires-Dist: minicpmo-utils[tts]; extra == "streaming"
52
- Provides-Extra: streaming-flash
53
- Requires-Dist: minicpmo-utils[streaming]; extra == "streaming-flash"
54
- Requires-Dist: flash-attn>=2.6.0; sys_platform == "linux" and extra == "streaming-flash"
55
- Requires-Dist: triton>=2.3.0; sys_platform == "linux" and extra == "streaming-flash"
56
- Requires-Dist: safetensors; extra == "streaming-flash"
57
- Requires-Dist: pynvml; extra == "streaming-flash"
58
- Requires-Dist: xxhash; extra == "streaming-flash"
59
- Provides-Extra: gpu
60
- Requires-Dist: onnxruntime-gpu<=1.23.2,>=1.18.0; sys_platform == "linux" and extra == "gpu"
61
57
  Provides-Extra: all
62
- Requires-Dist: minicpmo-utils[gpu,streaming,tts]; extra == "all"
58
+ Requires-Dist: minicpmo-utils[streaming,tts]; extra == "all"
63
59
 
64
60
  ## minicpmo-utils
65
61
 
@@ -1,10 +1,10 @@
1
1
  [build-system]
2
- requires = ["setuptools>=69", "wheel"]
2
+ requires = ["setuptools>=65", "wheel"]
3
3
  build-backend = "setuptools.build_meta"
4
4
 
5
5
  [project]
6
6
  name = "minicpmo-utils"
7
- version = "0.0.5"
7
+ version = "0.0.9"
8
8
  description = "Unified utilities package for MiniCPM-o: includes cosyvoice + stepaudio2 and extensible utils."
9
9
  readme = "README.md"
10
10
  requires-python = ">=3.10"
@@ -31,7 +31,12 @@ classifiers = [
31
31
  # - s3tokenizer (来自 S3Tokenizer-main)
32
32
  # - minicpmo (本项目扩展 utils 的统一入口:from minicpmo.utils import ...)
33
33
  dependencies = [
34
- "numpy",
34
+ # 锁定下限,避免 pip 回退到旧版本,加速依赖解析
35
+ "MarkupSafe>=2.1.0",
36
+ "Jinja2>=3.1.0",
37
+ "typing-extensions>=4.12.0",
38
+ "packaging>=23.0",
39
+ "numpy>=1.24.0",
35
40
  "pillow==10.4.0",
36
41
  "librosa==0.9.0",
37
42
  "decord==0.6.0",
@@ -45,11 +50,12 @@ tts = [
45
50
  "torch>=2.3.0",
46
51
  "torchaudio>=2.3.0",
47
52
  "transformers>=4.51.0,<4.53.0", # 4.52+ 有兼容性问题
53
+ "safetensors>=0.4.3",
48
54
  "onnxruntime>=1.18.0,<=1.21.0",
49
55
  "onnx",
50
56
  "hyperpyyaml",
51
- "openai-whisper==20231117",
52
- "tqdm",
57
+ "openai-whisper",
58
+ "tqdm>=4.66.0",
53
59
  "tiktoken",
54
60
  "inflect",
55
61
  "omegaconf>=2.0.6",
@@ -64,7 +70,7 @@ tts = [
64
70
  "pyarrow",
65
71
  "pyworld",
66
72
  # 新增依赖
67
- "scipy",
73
+ "scipy>=1.10.0",
68
74
  "pyyaml",
69
75
  "regex",
70
76
  "soundfile==0.12.1",
@@ -76,23 +82,23 @@ streaming = [
76
82
  "minicpmo-utils[tts]", # streaming 依赖 tts
77
83
  ]
78
84
 
79
- # stepaudio2 Flash 推理引擎依赖(flashcosyvoice.engine 模块需要)
80
- streaming-flash = [
81
- "minicpmo-utils[streaming]",
82
- "flash-attn>=2.6.0; sys_platform == 'linux'",
83
- "triton>=2.3.0; sys_platform == 'linux'",
84
- "safetensors",
85
- "pynvml",
86
- "xxhash",
87
- ]
85
+ # # stepaudio2 Flash 推理引擎依赖(flashcosyvoice.engine 模块需要)
86
+ # streaming-flash = [
87
+ # "minicpmo-utils[streaming]",
88
+ # "flash-attn>=2.6.0; sys_platform == 'linux'",
89
+ # "triton>=2.3.0; sys_platform == 'linux'",
90
+ # "safetensors>=0.4.3",
91
+ # "pynvml",
92
+ # "xxhash",
93
+ # ]
88
94
 
89
- # Linux GPU onnxruntime 可以很重,且与环境强相关,保留为可选 extra
90
- gpu = [
91
- "onnxruntime-gpu>=1.18.0,<=1.23.2; sys_platform == 'linux'",
92
- ]
95
+ # # Linux GPU onnxruntime 可以很重,且与环境强相关,保留为可选 extra
96
+ # gpu = [
97
+ # "onnxruntime-gpu>=1.18.0,<=1.23.2; sys_platform == 'linux'",
98
+ # ]
93
99
 
94
100
  all = [
95
- "minicpmo-utils[tts,streaming,gpu]",
101
+ "minicpmo-utils[tts,streaming]",
96
102
  ]
97
103
 
98
104
  [tool.setuptools]
@@ -26,84 +26,6 @@ MAX_NUM_FRAMES = int(os.getenv("MAX_NUM_FRAMES", 64))
26
26
  VIDEO_MME_DURATION = os.getenv("VIDEO_MME_DURATION", "ALL")
27
27
 
28
28
 
29
- def find_cjk_font():
30
- """
31
- 查找支持中文的字体。
32
- 按优先级返回字体名称或路径,如果找不到则返回 None。
33
- """
34
- # 常见的中文字体名称(按优先级排列)
35
- font_names = [
36
- # Noto CJK 字体(推荐)
37
- "Noto Sans CJK SC",
38
- "Noto Sans CJK",
39
- "NotoSansCJK-Regular",
40
- # 文泉驿字体
41
- "WenQuanYi Zen Hei",
42
- "WenQuanYi Micro Hei",
43
- "文泉驿正黑",
44
- "文泉驿微米黑",
45
- # 思源字体
46
- "Source Han Sans SC",
47
- "Source Han Sans CN",
48
- # 其他常见中文字体
49
- "SimHei",
50
- "Microsoft YaHei",
51
- "PingFang SC",
52
- "Hiragino Sans GB",
53
- "STHeiti",
54
- "AR PL UMing CN",
55
- "AR PL UKai CN",
56
- ]
57
-
58
- # 常见的中文字体文件路径
59
- font_paths = [
60
- # Noto CJK
61
- "/usr/share/fonts/opentype/noto/NotoSansCJK-Regular.ttc",
62
- "/usr/share/fonts/noto-cjk/NotoSansCJK-Regular.ttc",
63
- "/usr/share/fonts/google-noto-cjk/NotoSansCJK-Regular.ttc",
64
- "/usr/share/fonts/truetype/noto/NotoSansCJK-Regular.ttc",
65
- # 文泉驿
66
- "/usr/share/fonts/truetype/wqy/wqy-zenhei.ttc",
67
- "/usr/share/fonts/truetype/wqy/wqy-microhei.ttc",
68
- "/usr/share/fonts/wenquanyi/wqy-zenhei/wqy-zenhei.ttc",
69
- "/usr/share/fonts/wenquanyi/wqy-microhei/wqy-microhei.ttc",
70
- # macOS
71
- "/System/Library/Fonts/PingFang.ttc",
72
- "/Library/Fonts/Arial Unicode.ttf",
73
- # Windows (WSL)
74
- "/mnt/c/Windows/Fonts/msyh.ttc",
75
- "/mnt/c/Windows/Fonts/simhei.ttf",
76
- ]
77
-
78
- # 首先尝试使用 fc-list 查找已安装的中文字体
79
- try:
80
- result = subprocess.run(
81
- ["fc-list", ":lang=zh", "-f", "%{family}\n"],
82
- capture_output=True,
83
- text=True,
84
- timeout=5,
85
- )
86
- if result.returncode == 0:
87
- installed_fonts = set(result.stdout.strip().split("\n"))
88
- for font_name in font_names:
89
- for installed in installed_fonts:
90
- if font_name.lower() in installed.lower():
91
- logger.info(f"Found CJK font via fc-list: {installed}")
92
- return installed.split(",")[0] # 取第一个名称
93
- except Exception as e:
94
- logger.debug(f"fc-list failed: {e}")
95
-
96
- # 然后检查常见的字体文件路径
97
- for path in font_paths:
98
- if os.path.exists(path):
99
- logger.info(f"Found CJK font file: {path}")
100
- return path
101
-
102
- logger.warning("No CJK font found. Chinese subtitles may display as boxes/garbled text.")
103
- logger.warning("Install Chinese fonts with: sudo apt-get install fonts-noto-cjk")
104
- return None
105
-
106
-
107
29
  def concat_images(images, bg_color=(255, 255, 255), cell_size=None, line_color=(0, 0, 0), line_width=6):
108
30
  """
109
31
  images: List[PIL.Image.Image]
@@ -649,18 +571,9 @@ def generate_duplex_video(
649
571
 
650
572
  if has_subtitles:
651
573
  srt_path_escaped = srt_path.replace("\\", "\\\\").replace("'", "'\\''").replace(":", "\\:")
652
-
653
- # 查找支持中文的字体
654
- cjk_font = find_cjk_font()
655
- font_style = ""
656
- if cjk_font:
657
- # 转义字体路径/名称中的特殊字符
658
- font_escaped = cjk_font.replace("\\", "\\\\").replace("'", "'\\''").replace(":", "\\:")
659
- font_style = f"FontName={font_escaped},"
660
-
661
574
  subtitle_filter = (
662
575
  f"subtitles='{srt_path_escaped}':"
663
- f"force_style='{font_style}FontSize=28,"
576
+ f"force_style='FontSize=28,"
664
577
  f"PrimaryColour=&H00FFFFFF,"
665
578
  f"OutlineColour=&H00000000,"
666
579
  f"BorderStyle=3,"
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: minicpmo-utils
3
- Version: 0.0.5
3
+ Version: 0.0.9
4
4
  Summary: Unified utilities package for MiniCPM-o: includes cosyvoice + stepaudio2 and extensible utils.
5
5
  Author: MiniCPM-o Utils Maintainers
6
6
  License: Apache-2.0
@@ -14,7 +14,11 @@ Classifier: Programming Language :: Python :: 3.11
14
14
  Classifier: Programming Language :: Python :: 3.12
15
15
  Requires-Python: >=3.10
16
16
  Description-Content-Type: text/markdown
17
- Requires-Dist: numpy
17
+ Requires-Dist: MarkupSafe>=2.1.0
18
+ Requires-Dist: Jinja2>=3.1.0
19
+ Requires-Dist: typing-extensions>=4.12.0
20
+ Requires-Dist: packaging>=23.0
21
+ Requires-Dist: numpy>=1.24.0
18
22
  Requires-Dist: pillow==10.4.0
19
23
  Requires-Dist: librosa==0.9.0
20
24
  Requires-Dist: decord==0.6.0
@@ -24,11 +28,12 @@ Provides-Extra: tts
24
28
  Requires-Dist: torch>=2.3.0; extra == "tts"
25
29
  Requires-Dist: torchaudio>=2.3.0; extra == "tts"
26
30
  Requires-Dist: transformers<4.53.0,>=4.51.0; extra == "tts"
31
+ Requires-Dist: safetensors>=0.4.3; extra == "tts"
27
32
  Requires-Dist: onnxruntime<=1.21.0,>=1.18.0; extra == "tts"
28
33
  Requires-Dist: onnx; extra == "tts"
29
34
  Requires-Dist: hyperpyyaml; extra == "tts"
30
- Requires-Dist: openai-whisper==20231117; extra == "tts"
31
- Requires-Dist: tqdm; extra == "tts"
35
+ Requires-Dist: openai-whisper; extra == "tts"
36
+ Requires-Dist: tqdm>=4.66.0; extra == "tts"
32
37
  Requires-Dist: tiktoken; extra == "tts"
33
38
  Requires-Dist: inflect; extra == "tts"
34
39
  Requires-Dist: omegaconf>=2.0.6; extra == "tts"
@@ -42,24 +47,15 @@ Requires-Dist: matplotlib; extra == "tts"
42
47
  Requires-Dist: wget; extra == "tts"
43
48
  Requires-Dist: pyarrow; extra == "tts"
44
49
  Requires-Dist: pyworld; extra == "tts"
45
- Requires-Dist: scipy; extra == "tts"
50
+ Requires-Dist: scipy>=1.10.0; extra == "tts"
46
51
  Requires-Dist: pyyaml; extra == "tts"
47
52
  Requires-Dist: regex; extra == "tts"
48
53
  Requires-Dist: soundfile==0.12.1; extra == "tts"
49
54
  Requires-Dist: diffusers==0.29.0; extra == "tts"
50
55
  Provides-Extra: streaming
51
56
  Requires-Dist: minicpmo-utils[tts]; extra == "streaming"
52
- Provides-Extra: streaming-flash
53
- Requires-Dist: minicpmo-utils[streaming]; extra == "streaming-flash"
54
- Requires-Dist: flash-attn>=2.6.0; sys_platform == "linux" and extra == "streaming-flash"
55
- Requires-Dist: triton>=2.3.0; sys_platform == "linux" and extra == "streaming-flash"
56
- Requires-Dist: safetensors; extra == "streaming-flash"
57
- Requires-Dist: pynvml; extra == "streaming-flash"
58
- Requires-Dist: xxhash; extra == "streaming-flash"
59
- Provides-Extra: gpu
60
- Requires-Dist: onnxruntime-gpu<=1.23.2,>=1.18.0; sys_platform == "linux" and extra == "gpu"
61
57
  Provides-Extra: all
62
- Requires-Dist: minicpmo-utils[gpu,streaming,tts]; extra == "all"
58
+ Requires-Dist: minicpmo-utils[streaming,tts]; extra == "all"
63
59
 
64
60
  ## minicpmo-utils
65
61
 
@@ -1,4 +1,8 @@
1
- numpy
1
+ MarkupSafe>=2.1.0
2
+ Jinja2>=3.1.0
3
+ typing-extensions>=4.12.0
4
+ packaging>=23.0
5
+ numpy>=1.24.0
2
6
  pillow==10.4.0
3
7
  librosa==0.9.0
4
8
  decord==0.6.0
@@ -6,35 +10,21 @@ moviepy==2.1.2
6
10
  numba==0.61.2
7
11
 
8
12
  [all]
9
- minicpmo-utils[gpu,streaming,tts]
10
-
11
- [gpu]
12
-
13
- [gpu:sys_platform == "linux"]
14
- onnxruntime-gpu<=1.23.2,>=1.18.0
13
+ minicpmo-utils[streaming,tts]
15
14
 
16
15
  [streaming]
17
16
  minicpmo-utils[tts]
18
17
 
19
- [streaming-flash]
20
- minicpmo-utils[streaming]
21
- safetensors
22
- pynvml
23
- xxhash
24
-
25
- [streaming-flash:sys_platform == "linux"]
26
- flash-attn>=2.6.0
27
- triton>=2.3.0
28
-
29
18
  [tts]
30
19
  torch>=2.3.0
31
20
  torchaudio>=2.3.0
32
21
  transformers<4.53.0,>=4.51.0
22
+ safetensors>=0.4.3
33
23
  onnxruntime<=1.21.0,>=1.18.0
34
24
  onnx
35
25
  hyperpyyaml
36
- openai-whisper==20231117
37
- tqdm
26
+ openai-whisper
27
+ tqdm>=4.66.0
38
28
  tiktoken
39
29
  inflect
40
30
  omegaconf>=2.0.6
@@ -48,7 +38,7 @@ matplotlib
48
38
  wget
49
39
  pyarrow
50
40
  pyworld
51
- scipy
41
+ scipy>=1.10.0
52
42
  pyyaml
53
43
  regex
54
44
  soundfile==0.12.1
File without changes
File without changes