minicpmo-utils 0.1.0.tar.gz → 0.1.1.tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (153)
  1. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/PKG-INFO +37 -16
  2. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/README.md +17 -2
  3. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/pyproject.toml +19 -12
  4. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/cli/cosyvoice.py +0 -5
  5. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/minicpmo_utils.egg-info/PKG-INFO +37 -16
  6. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/minicpmo_utils.egg-info/requires.txt +19 -10
  7. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/token2wav.py +0 -1
  8. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/setup.cfg +0 -0
  9. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/__init__.py +0 -0
  10. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/bin/average_model.py +0 -0
  11. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/bin/export_jit.py +0 -0
  12. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/bin/export_onnx.py +0 -0
  13. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/bin/inference_deprecated.py +0 -0
  14. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/bin/train.py +0 -0
  15. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/cli/__init__.py +0 -0
  16. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/cli/frontend.py +0 -0
  17. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/cli/model.py +0 -0
  18. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/dataset/__init__.py +0 -0
  19. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/dataset/dataset.py +0 -0
  20. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/dataset/processor.py +0 -0
  21. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/flow/decoder.py +0 -0
  22. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/flow/flow.py +0 -0
  23. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/flow/flow_matching.py +0 -0
  24. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/flow/length_regulator.py +0 -0
  25. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/hifigan/discriminator.py +0 -0
  26. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/hifigan/f0_predictor.py +0 -0
  27. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/hifigan/generator.py +0 -0
  28. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/hifigan/hifigan.py +0 -0
  29. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/llm/llm.py +0 -0
  30. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/tokenizer/assets/multilingual_zh_ja_yue_char_del.tiktoken +0 -0
  31. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/tokenizer/tokenizer.py +0 -0
  32. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/transformer/__init__.py +0 -0
  33. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/transformer/activation.py +0 -0
  34. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/transformer/attention.py +0 -0
  35. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/transformer/convolution.py +0 -0
  36. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/transformer/decoder.py +0 -0
  37. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/transformer/decoder_layer.py +0 -0
  38. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/transformer/embedding.py +0 -0
  39. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/transformer/encoder.py +0 -0
  40. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/transformer/encoder_layer.py +0 -0
  41. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/transformer/label_smoothing_loss.py +0 -0
  42. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/transformer/positionwise_feed_forward.py +0 -0
  43. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/transformer/subsampling.py +0 -0
  44. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/transformer/upsample_encoder.py +0 -0
  45. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/utils/__init__.py +0 -0
  46. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/utils/class_utils.py +0 -0
  47. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/utils/common.py +0 -0
  48. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/utils/executor.py +0 -0
  49. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/utils/file_utils.py +0 -0
  50. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/utils/frontend_utils.py +0 -0
  51. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/utils/losses.py +0 -0
  52. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/utils/mask.py +0 -0
  53. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/utils/scheduler.py +0 -0
  54. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/utils/train_utils.py +0 -0
  55. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/cosyvoice/vllm/cosyvoice2.py +0 -0
  56. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/matcha/__init__.py +0 -0
  57. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/matcha/app.py +0 -0
  58. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/matcha/cli.py +0 -0
  59. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/matcha/hifigan/__init__.py +0 -0
  60. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/matcha/hifigan/config.py +0 -0
  61. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/matcha/hifigan/denoiser.py +0 -0
  62. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/matcha/hifigan/env.py +0 -0
  63. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/matcha/hifigan/meldataset.py +0 -0
  64. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/matcha/hifigan/models.py +0 -0
  65. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/matcha/hifigan/xutils.py +0 -0
  66. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/matcha/models/__init__.py +0 -0
  67. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/matcha/models/baselightningmodule.py +0 -0
  68. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/matcha/models/components/__init__.py +0 -0
  69. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/matcha/models/components/decoder.py +0 -0
  70. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/matcha/models/components/flow_matching.py +0 -0
  71. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/matcha/models/components/text_encoder.py +0 -0
  72. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/matcha/models/components/transformer.py +0 -0
  73. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/matcha/models/matcha_tts.py +0 -0
  74. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/matcha/onnx/__init__.py +0 -0
  75. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/matcha/onnx/export.py +0 -0
  76. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/matcha/onnx/infer.py +0 -0
  77. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/matcha/text/__init__.py +0 -0
  78. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/matcha/text/cleaners.py +0 -0
  79. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/matcha/text/numbers.py +0 -0
  80. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/matcha/text/symbols.py +0 -0
  81. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/matcha/train.py +0 -0
  82. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/matcha/utils/__init__.py +0 -0
  83. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/matcha/utils/audio.py +0 -0
  84. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/matcha/utils/generate_data_statistics.py +0 -0
  85. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/matcha/utils/instantiators.py +0 -0
  86. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/matcha/utils/logging_utils.py +0 -0
  87. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/matcha/utils/model.py +0 -0
  88. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/matcha/utils/monotonic_align/__init__.py +0 -0
  89. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/matcha/utils/monotonic_align/setup.py +0 -0
  90. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/matcha/utils/pylogger.py +0 -0
  91. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/matcha/utils/rich_utils.py +0 -0
  92. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/matcha/utils/utils.py +0 -0
  93. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/minicpmo/__init__.py +0 -0
  94. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/minicpmo/utils.py +0 -0
  95. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/minicpmo/version.py +0 -0
  96. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/minicpmo_utils.egg-info/SOURCES.txt +0 -0
  97. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/minicpmo_utils.egg-info/dependency_links.txt +0 -0
  98. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/minicpmo_utils.egg-info/top_level.txt +0 -0
  99. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/s3tokenizer/__init__.py +0 -0
  100. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/s3tokenizer/assets/BAC009S0764W0121.wav +0 -0
  101. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/s3tokenizer/assets/BAC009S0764W0122.wav +0 -0
  102. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/s3tokenizer/assets/mel_filters.npz +0 -0
  103. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/s3tokenizer/cli.py +0 -0
  104. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/s3tokenizer/model.py +0 -0
  105. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/s3tokenizer/model_v2.py +0 -0
  106. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/s3tokenizer/utils.py +0 -0
  107. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/__init__.py +0 -0
  108. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/cosyvoice2/__init__.py +0 -0
  109. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/cosyvoice2/flow/__init__.py +0 -0
  110. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/cosyvoice2/flow/decoder_dit.py +0 -0
  111. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/cosyvoice2/flow/flow.py +0 -0
  112. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/cosyvoice2/flow/flow_matching.py +0 -0
  113. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/cosyvoice2/transformer/__init__.py +0 -0
  114. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/cosyvoice2/transformer/attention.py +0 -0
  115. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/cosyvoice2/transformer/embedding.py +0 -0
  116. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/cosyvoice2/transformer/encoder_layer.py +0 -0
  117. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/cosyvoice2/transformer/positionwise_feed_forward.py +0 -0
  118. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/cosyvoice2/transformer/subsampling.py +0 -0
  119. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/cosyvoice2/transformer/upsample_encoder_v2.py +0 -0
  120. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/cosyvoice2/utils/__init__.py +0 -0
  121. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/cosyvoice2/utils/class_utils.py +0 -0
  122. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/cosyvoice2/utils/common.py +0 -0
  123. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/cosyvoice2/utils/mask.py +0 -0
  124. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/flashcosyvoice/__init__.py +0 -0
  125. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/flashcosyvoice/cli.py +0 -0
  126. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/flashcosyvoice/config.py +0 -0
  127. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/flashcosyvoice/cosyvoice2.py +0 -0
  128. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/flashcosyvoice/cosyvoice3.py +0 -0
  129. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/flashcosyvoice/engine/__init__.py +0 -0
  130. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/flashcosyvoice/engine/block_manager.py +0 -0
  131. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/flashcosyvoice/engine/llm_engine.py +0 -0
  132. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/flashcosyvoice/engine/model_runner.py +0 -0
  133. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/flashcosyvoice/engine/scheduler.py +0 -0
  134. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/flashcosyvoice/engine/sequence.py +0 -0
  135. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/flashcosyvoice/modules/__init__.py +0 -0
  136. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/flashcosyvoice/modules/flow.py +0 -0
  137. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/flashcosyvoice/modules/flow_components/__init__.py +0 -0
  138. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/flashcosyvoice/modules/flow_components/estimator.py +0 -0
  139. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/flashcosyvoice/modules/flow_components/upsample_encoder.py +0 -0
  140. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/flashcosyvoice/modules/hifigan.py +0 -0
  141. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/flashcosyvoice/modules/hifigan_components/__init__.py +0 -0
  142. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/flashcosyvoice/modules/hifigan_components/layers.py +0 -0
  143. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/flashcosyvoice/modules/qwen2.py +0 -0
  144. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/flashcosyvoice/modules/qwen2_components/__init__.py +0 -0
  145. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/flashcosyvoice/modules/qwen2_components/layers.py +0 -0
  146. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/flashcosyvoice/modules/sampler.py +0 -0
  147. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/flashcosyvoice/utils/__init__.py +0 -0
  148. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/flashcosyvoice/utils/audio.py +0 -0
  149. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/flashcosyvoice/utils/context.py +0 -0
  150. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/flashcosyvoice/utils/loader.py +0 -0
  151. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/flashcosyvoice/utils/memory.py +0 -0
  152. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/stepaudio2.py +0 -0
  153. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.1}/src/stepaudio2/utils.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: minicpmo-utils
3
- Version: 0.1.0
3
+ Version: 0.1.1
4
4
  Summary: Unified utilities package for MiniCPM-o: includes cosyvoice + stepaudio2 and extensible utils.
5
5
  Author: MiniCPM-o Utils Maintainers
6
6
  License: Apache-2.0
@@ -14,23 +14,29 @@ Classifier: Programming Language :: Python :: 3.11
14
14
  Classifier: Programming Language :: Python :: 3.12
15
15
  Requires-Python: >=3.10
16
16
  Description-Content-Type: text/markdown
17
- Requires-Dist: torch>=2.3.0
18
- Requires-Dist: torchaudio>=2.3.0
19
- Requires-Dist: transformers>=4.49.0
20
17
  Requires-Dist: numpy
21
- Requires-Dist: hyperpyyaml
22
- Requires-Dist: modelscope
23
- Requires-Dist: openai-whisper
24
- Requires-Dist: tqdm
25
- Requires-Dist: tiktoken
26
- Requires-Dist: inflect
27
- Requires-Dist: omegaconf
28
- Requires-Dist: einops
18
+ Requires-Dist: pillow
29
19
  Requires-Dist: librosa
30
- Requires-Dist: onnxruntime>=1.18.0
31
- Requires-Dist: diffusers
20
+ Requires-Dist: decord
21
+ Provides-Extra: tts
22
+ Requires-Dist: torch>=2.3.0; extra == "tts"
23
+ Requires-Dist: torchaudio>=2.3.0; extra == "tts"
24
+ Requires-Dist: transformers>=4.49.0; extra == "tts"
25
+ Requires-Dist: hyperpyyaml; extra == "tts"
26
+ Requires-Dist: openai-whisper; extra == "tts"
27
+ Requires-Dist: tqdm; extra == "tts"
28
+ Requires-Dist: tiktoken; extra == "tts"
29
+ Requires-Dist: inflect; extra == "tts"
30
+ Requires-Dist: omegaconf; extra == "tts"
31
+ Requires-Dist: einops; extra == "tts"
32
+ Provides-Extra: streaming
33
+ Requires-Dist: minicpmo-utils[tts]; extra == "streaming"
34
+ Requires-Dist: onnxruntime>=1.18.0; extra == "streaming"
35
+ Requires-Dist: diffusers; extra == "streaming"
32
36
  Provides-Extra: gpu
33
37
  Requires-Dist: onnxruntime-gpu>=1.18.0; sys_platform == "linux" and extra == "gpu"
38
+ Provides-Extra: all
39
+ Requires-Dist: minicpmo-utils[gpu,streaming,tts]; extra == "all"
34
40
 
35
41
  ## minicpmo-utils
36
42
 
@@ -38,17 +44,32 @@ Requires-Dist: onnxruntime-gpu>=1.18.0; sys_platform == "linux" and extra == "gp
38
44
 
39
45
  ### 安装方式
40
46
 
41
- - 从源码本地安装(开发态,可编辑):
47
+ - 从源码本地安装(开发态,可编辑,默认只装公共依赖):
42
48
  ```bash
43
49
  cd minicpmo-utils
44
50
  pip install -e .
45
51
  ```
46
52
 
53
+ - 如果只想安装 cosyvoice 相关依赖(TTS):
54
+ ```bash
55
+ pip install -e .[tts]
56
+ ```
57
+
58
+ - 如果只想安装 stepaudio2 / streaming 相关依赖:
59
+ ```bash
60
+ pip install -e .[streaming]
61
+ ```
62
+
63
+ - 同时安装 cosyvoice + stepaudio2 相关依赖:
64
+ ```bash
65
+ pip install -e .[tts,streaming]
66
+ ```
67
+
47
68
  - 构建并安装 wheel(推荐分发):
48
69
  ```bash
49
70
  cd minicpmo-utils
50
71
  python -m build # 生成 dist/*.whl
51
- pip install dist/minicpmo_utils-0.1.0-py3-none-any.whl
72
+ pip install "dist/minicpmo_utils-0.1.1-py3-none-any.whl[tts,streaming]"
52
73
  ```
53
74
 
54
75
  ### 导入方式
@@ -4,17 +4,32 @@
4
4
 
5
5
  ### 安装方式
6
6
 
7
- - 从源码本地安装(开发态,可编辑):
7
+ - 从源码本地安装(开发态,可编辑,默认只装公共依赖):
8
8
  ```bash
9
9
  cd minicpmo-utils
10
10
  pip install -e .
11
11
  ```
12
12
 
13
+ - 如果只想安装 cosyvoice 相关依赖(TTS):
14
+ ```bash
15
+ pip install -e .[tts]
16
+ ```
17
+
18
+ - 如果只想安装 stepaudio2 / streaming 相关依赖:
19
+ ```bash
20
+ pip install -e .[streaming]
21
+ ```
22
+
23
+ - 同时安装 cosyvoice + stepaudio2 相关依赖:
24
+ ```bash
25
+ pip install -e .[tts,streaming]
26
+ ```
27
+
13
28
  - 构建并安装 wheel(推荐分发):
14
29
  ```bash
15
30
  cd minicpmo-utils
16
31
  python -m build # 生成 dist/*.whl
17
- pip install dist/minicpmo_utils-0.1.0-py3-none-any.whl
32
+ pip install "dist/minicpmo_utils-0.1.1-py3-none-any.whl[tts,streaming]"
18
33
  ```
19
34
 
20
35
  ### 导入方式
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
4
4
 
5
5
  [project]
6
6
  name = "minicpmo-utils"
7
- version = "0.1.0"
7
+ version = "0.1.1"
8
8
  description = "Unified utilities package for MiniCPM-o: includes cosyvoice + stepaudio2 and extensible utils."
9
9
  readme = "README.md"
10
10
  requires-python = ">=3.10"
@@ -31,36 +31,43 @@ classifiers = [
31
31
  # - s3tokenizer (来自 S3Tokenizer-main)
32
32
  # - minicpmo (本项目扩展 utils 的统一入口:from minicpmo.utils import ...)
33
33
  dependencies = [
34
- # Core ML frameworks (align to stepaudio2's requirements)
34
+ "numpy",
35
+ "pillow",
36
+ "librosa",
37
+ "decord",
38
+ ]
39
+
40
+ [project.optional-dependencies]
41
+ # cosyvoice TTS 相关依赖
42
+ tts = [
35
43
  "torch>=2.3.0",
36
44
  "torchaudio>=2.3.0",
37
45
  "transformers>=4.49.0",
38
-
39
- # Shared / common
40
- "numpy",
41
46
  "hyperpyyaml",
42
-
43
- # cosyvoice side
44
- "modelscope",
45
47
  "openai-whisper",
46
48
  "tqdm",
47
49
  "tiktoken",
48
50
  "inflect",
49
51
  "omegaconf",
50
52
  "einops",
53
+ ]
51
54
 
52
- # stepaudio2 side
53
- "librosa",
55
+ # stepaudio2 / streaming 相关依赖
56
+ streaming = [
57
+ "minicpmo-utils[tts]", # streaming 依赖 tts
54
58
  "onnxruntime>=1.18.0",
55
59
  "diffusers",
56
60
  ]
57
61
 
58
- [project.optional-dependencies]
59
- # Linux GPU onnxruntime can be heavy and environment-specific; keep as an opt-in extra.
62
+ # Linux GPU onnxruntime 可以很重,且与环境强相关,保留为可选 extra
60
63
  gpu = [
61
64
  "onnxruntime-gpu>=1.18.0; sys_platform == 'linux'",
62
65
  ]
63
66
 
67
+ all = [
68
+ "minicpmo-utils[tts,streaming,gpu]",
69
+ ]
70
+
64
71
  [tool.setuptools]
65
72
  include-package-data = true
66
73
 
@@ -16,7 +16,6 @@ import time
16
16
  from typing import Generator
17
17
  from tqdm import tqdm
18
18
  from hyperpyyaml import load_hyperpyyaml
19
- from modelscope import snapshot_download
20
19
  import torch
21
20
  from cosyvoice.cli.frontend import CosyVoiceFrontEnd
22
21
  from cosyvoice.cli.model import CosyVoiceModel, CosyVoice2Model
@@ -30,8 +29,6 @@ class CosyVoice:
30
29
  self.instruct = True if '-Instruct' in model_dir else False
31
30
  self.model_dir = model_dir
32
31
  self.fp16 = fp16
33
- if not os.path.exists(model_dir):
34
- model_dir = snapshot_download(model_dir)
35
32
  hyper_yaml_path = '{}/cosyvoice.yaml'.format(model_dir)
36
33
  if not os.path.exists(hyper_yaml_path):
37
34
  raise ValueError('{} not found!'.format(hyper_yaml_path))
@@ -154,8 +151,6 @@ class CosyVoice2(CosyVoice):
154
151
  self.instruct = True if '-Instruct' in model_dir else False
155
152
  self.model_dir = model_dir
156
153
  self.fp16 = fp16
157
- if not os.path.exists(model_dir):
158
- model_dir = snapshot_download(model_dir)
159
154
 
160
155
  if config_path is None:
161
156
  config_path = f'{model_dir}/cosyvoice2.yaml'
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: minicpmo-utils
3
- Version: 0.1.0
3
+ Version: 0.1.1
4
4
  Summary: Unified utilities package for MiniCPM-o: includes cosyvoice + stepaudio2 and extensible utils.
5
5
  Author: MiniCPM-o Utils Maintainers
6
6
  License: Apache-2.0
@@ -14,23 +14,29 @@ Classifier: Programming Language :: Python :: 3.11
14
14
  Classifier: Programming Language :: Python :: 3.12
15
15
  Requires-Python: >=3.10
16
16
  Description-Content-Type: text/markdown
17
- Requires-Dist: torch>=2.3.0
18
- Requires-Dist: torchaudio>=2.3.0
19
- Requires-Dist: transformers>=4.49.0
20
17
  Requires-Dist: numpy
21
- Requires-Dist: hyperpyyaml
22
- Requires-Dist: modelscope
23
- Requires-Dist: openai-whisper
24
- Requires-Dist: tqdm
25
- Requires-Dist: tiktoken
26
- Requires-Dist: inflect
27
- Requires-Dist: omegaconf
28
- Requires-Dist: einops
18
+ Requires-Dist: pillow
29
19
  Requires-Dist: librosa
30
- Requires-Dist: onnxruntime>=1.18.0
31
- Requires-Dist: diffusers
20
+ Requires-Dist: decord
21
+ Provides-Extra: tts
22
+ Requires-Dist: torch>=2.3.0; extra == "tts"
23
+ Requires-Dist: torchaudio>=2.3.0; extra == "tts"
24
+ Requires-Dist: transformers>=4.49.0; extra == "tts"
25
+ Requires-Dist: hyperpyyaml; extra == "tts"
26
+ Requires-Dist: openai-whisper; extra == "tts"
27
+ Requires-Dist: tqdm; extra == "tts"
28
+ Requires-Dist: tiktoken; extra == "tts"
29
+ Requires-Dist: inflect; extra == "tts"
30
+ Requires-Dist: omegaconf; extra == "tts"
31
+ Requires-Dist: einops; extra == "tts"
32
+ Provides-Extra: streaming
33
+ Requires-Dist: minicpmo-utils[tts]; extra == "streaming"
34
+ Requires-Dist: onnxruntime>=1.18.0; extra == "streaming"
35
+ Requires-Dist: diffusers; extra == "streaming"
32
36
  Provides-Extra: gpu
33
37
  Requires-Dist: onnxruntime-gpu>=1.18.0; sys_platform == "linux" and extra == "gpu"
38
+ Provides-Extra: all
39
+ Requires-Dist: minicpmo-utils[gpu,streaming,tts]; extra == "all"
34
40
 
35
41
  ## minicpmo-utils
36
42
 
@@ -38,17 +44,32 @@ Requires-Dist: onnxruntime-gpu>=1.18.0; sys_platform == "linux" and extra == "gp
38
44
 
39
45
  ### 安装方式
40
46
 
41
- - 从源码本地安装(开发态,可编辑):
47
+ - 从源码本地安装(开发态,可编辑,默认只装公共依赖):
42
48
  ```bash
43
49
  cd minicpmo-utils
44
50
  pip install -e .
45
51
  ```
46
52
 
53
+ - 如果只想安装 cosyvoice 相关依赖(TTS):
54
+ ```bash
55
+ pip install -e .[tts]
56
+ ```
57
+
58
+ - 如果只想安装 stepaudio2 / streaming 相关依赖:
59
+ ```bash
60
+ pip install -e .[streaming]
61
+ ```
62
+
63
+ - 同时安装 cosyvoice + stepaudio2 相关依赖:
64
+ ```bash
65
+ pip install -e .[tts,streaming]
66
+ ```
67
+
47
68
  - 构建并安装 wheel(推荐分发):
48
69
  ```bash
49
70
  cd minicpmo-utils
50
71
  python -m build # 生成 dist/*.whl
51
- pip install dist/minicpmo_utils-0.1.0-py3-none-any.whl
72
+ pip install "dist/minicpmo_utils-0.1.1-py3-none-any.whl[tts,streaming]"
52
73
  ```
53
74
 
54
75
  ### 导入方式
@@ -1,20 +1,29 @@
1
+ numpy
2
+ pillow
3
+ librosa
4
+ decord
5
+
6
+ [all]
7
+ minicpmo-utils[gpu,streaming,tts]
8
+
9
+ [gpu]
10
+
11
+ [gpu:sys_platform == "linux"]
12
+ onnxruntime-gpu>=1.18.0
13
+
14
+ [streaming]
15
+ minicpmo-utils[tts]
16
+ onnxruntime>=1.18.0
17
+ diffusers
18
+
19
+ [tts]
1
20
  torch>=2.3.0
2
21
  torchaudio>=2.3.0
3
22
  transformers>=4.49.0
4
- numpy
5
23
  hyperpyyaml
6
- modelscope
7
24
  openai-whisper
8
25
  tqdm
9
26
  tiktoken
10
27
  inflect
11
28
  omegaconf
12
29
  einops
13
- librosa
14
- onnxruntime>=1.18.0
15
- diffusers
16
-
17
- [gpu]
18
-
19
- [gpu:sys_platform == "linux"]
20
- onnxruntime-gpu>=1.18.0
@@ -7,7 +7,6 @@ import torchaudio
7
7
  import s3tokenizer
8
8
  import onnxruntime
9
9
  import numpy as np
10
- from copy import deepcopy
11
10
 
12
11
  import torchaudio.compliance.kaldi as kaldi
13
12
  from stepaudio2.flashcosyvoice.modules.hifigan import HiFTGenerator
File without changes