minicpmo-utils 0.1.0__tar.gz → 0.1.2__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (154) hide show
  1. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/PKG-INFO +41 -18
  2. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/README.md +17 -2
  3. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/pyproject.toml +23 -14
  4. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/cli/cosyvoice.py +0 -5
  5. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/minicpmo_utils.egg-info/PKG-INFO +41 -18
  6. minicpmo_utils-0.1.2/src/minicpmo_utils.egg-info/requires.txt +31 -0
  7. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/token2wav.py +0 -1
  8. minicpmo_utils-0.1.0/src/minicpmo_utils.egg-info/requires.txt +0 -20
  9. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/setup.cfg +0 -0
  10. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/__init__.py +0 -0
  11. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/bin/average_model.py +0 -0
  12. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/bin/export_jit.py +0 -0
  13. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/bin/export_onnx.py +0 -0
  14. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/bin/inference_deprecated.py +0 -0
  15. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/bin/train.py +0 -0
  16. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/cli/__init__.py +0 -0
  17. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/cli/frontend.py +0 -0
  18. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/cli/model.py +0 -0
  19. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/dataset/__init__.py +0 -0
  20. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/dataset/dataset.py +0 -0
  21. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/dataset/processor.py +0 -0
  22. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/flow/decoder.py +0 -0
  23. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/flow/flow.py +0 -0
  24. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/flow/flow_matching.py +0 -0
  25. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/flow/length_regulator.py +0 -0
  26. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/hifigan/discriminator.py +0 -0
  27. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/hifigan/f0_predictor.py +0 -0
  28. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/hifigan/generator.py +0 -0
  29. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/hifigan/hifigan.py +0 -0
  30. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/llm/llm.py +0 -0
  31. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/tokenizer/assets/multilingual_zh_ja_yue_char_del.tiktoken +0 -0
  32. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/tokenizer/tokenizer.py +0 -0
  33. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/transformer/__init__.py +0 -0
  34. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/transformer/activation.py +0 -0
  35. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/transformer/attention.py +0 -0
  36. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/transformer/convolution.py +0 -0
  37. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/transformer/decoder.py +0 -0
  38. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/transformer/decoder_layer.py +0 -0
  39. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/transformer/embedding.py +0 -0
  40. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/transformer/encoder.py +0 -0
  41. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/transformer/encoder_layer.py +0 -0
  42. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/transformer/label_smoothing_loss.py +0 -0
  43. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/transformer/positionwise_feed_forward.py +0 -0
  44. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/transformer/subsampling.py +0 -0
  45. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/transformer/upsample_encoder.py +0 -0
  46. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/utils/__init__.py +0 -0
  47. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/utils/class_utils.py +0 -0
  48. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/utils/common.py +0 -0
  49. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/utils/executor.py +0 -0
  50. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/utils/file_utils.py +0 -0
  51. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/utils/frontend_utils.py +0 -0
  52. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/utils/losses.py +0 -0
  53. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/utils/mask.py +0 -0
  54. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/utils/scheduler.py +0 -0
  55. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/utils/train_utils.py +0 -0
  56. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/vllm/cosyvoice2.py +0 -0
  57. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/__init__.py +0 -0
  58. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/app.py +0 -0
  59. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/cli.py +0 -0
  60. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/hifigan/__init__.py +0 -0
  61. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/hifigan/config.py +0 -0
  62. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/hifigan/denoiser.py +0 -0
  63. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/hifigan/env.py +0 -0
  64. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/hifigan/meldataset.py +0 -0
  65. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/hifigan/models.py +0 -0
  66. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/hifigan/xutils.py +0 -0
  67. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/models/__init__.py +0 -0
  68. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/models/baselightningmodule.py +0 -0
  69. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/models/components/__init__.py +0 -0
  70. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/models/components/decoder.py +0 -0
  71. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/models/components/flow_matching.py +0 -0
  72. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/models/components/text_encoder.py +0 -0
  73. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/models/components/transformer.py +0 -0
  74. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/models/matcha_tts.py +0 -0
  75. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/onnx/__init__.py +0 -0
  76. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/onnx/export.py +0 -0
  77. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/onnx/infer.py +0 -0
  78. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/text/__init__.py +0 -0
  79. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/text/cleaners.py +0 -0
  80. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/text/numbers.py +0 -0
  81. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/text/symbols.py +0 -0
  82. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/train.py +0 -0
  83. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/utils/__init__.py +0 -0
  84. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/utils/audio.py +0 -0
  85. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/utils/generate_data_statistics.py +0 -0
  86. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/utils/instantiators.py +0 -0
  87. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/utils/logging_utils.py +0 -0
  88. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/utils/model.py +0 -0
  89. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/utils/monotonic_align/__init__.py +0 -0
  90. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/utils/monotonic_align/setup.py +0 -0
  91. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/utils/pylogger.py +0 -0
  92. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/utils/rich_utils.py +0 -0
  93. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/utils/utils.py +0 -0
  94. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/minicpmo/__init__.py +0 -0
  95. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/minicpmo/utils.py +0 -0
  96. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/minicpmo/version.py +0 -0
  97. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/minicpmo_utils.egg-info/SOURCES.txt +0 -0
  98. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/minicpmo_utils.egg-info/dependency_links.txt +0 -0
  99. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/minicpmo_utils.egg-info/top_level.txt +0 -0
  100. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/s3tokenizer/__init__.py +0 -0
  101. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/s3tokenizer/assets/BAC009S0764W0121.wav +0 -0
  102. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/s3tokenizer/assets/BAC009S0764W0122.wav +0 -0
  103. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/s3tokenizer/assets/mel_filters.npz +0 -0
  104. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/s3tokenizer/cli.py +0 -0
  105. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/s3tokenizer/model.py +0 -0
  106. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/s3tokenizer/model_v2.py +0 -0
  107. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/s3tokenizer/utils.py +0 -0
  108. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/__init__.py +0 -0
  109. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/cosyvoice2/__init__.py +0 -0
  110. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/cosyvoice2/flow/__init__.py +0 -0
  111. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/cosyvoice2/flow/decoder_dit.py +0 -0
  112. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/cosyvoice2/flow/flow.py +0 -0
  113. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/cosyvoice2/flow/flow_matching.py +0 -0
  114. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/cosyvoice2/transformer/__init__.py +0 -0
  115. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/cosyvoice2/transformer/attention.py +0 -0
  116. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/cosyvoice2/transformer/embedding.py +0 -0
  117. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/cosyvoice2/transformer/encoder_layer.py +0 -0
  118. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/cosyvoice2/transformer/positionwise_feed_forward.py +0 -0
  119. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/cosyvoice2/transformer/subsampling.py +0 -0
  120. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/cosyvoice2/transformer/upsample_encoder_v2.py +0 -0
  121. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/cosyvoice2/utils/__init__.py +0 -0
  122. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/cosyvoice2/utils/class_utils.py +0 -0
  123. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/cosyvoice2/utils/common.py +0 -0
  124. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/cosyvoice2/utils/mask.py +0 -0
  125. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/__init__.py +0 -0
  126. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/cli.py +0 -0
  127. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/config.py +0 -0
  128. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/cosyvoice2.py +0 -0
  129. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/cosyvoice3.py +0 -0
  130. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/engine/__init__.py +0 -0
  131. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/engine/block_manager.py +0 -0
  132. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/engine/llm_engine.py +0 -0
  133. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/engine/model_runner.py +0 -0
  134. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/engine/scheduler.py +0 -0
  135. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/engine/sequence.py +0 -0
  136. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/modules/__init__.py +0 -0
  137. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/modules/flow.py +0 -0
  138. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/modules/flow_components/__init__.py +0 -0
  139. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/modules/flow_components/estimator.py +0 -0
  140. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/modules/flow_components/upsample_encoder.py +0 -0
  141. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/modules/hifigan.py +0 -0
  142. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/modules/hifigan_components/__init__.py +0 -0
  143. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/modules/hifigan_components/layers.py +0 -0
  144. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/modules/qwen2.py +0 -0
  145. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/modules/qwen2_components/__init__.py +0 -0
  146. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/modules/qwen2_components/layers.py +0 -0
  147. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/modules/sampler.py +0 -0
  148. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/utils/__init__.py +0 -0
  149. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/utils/audio.py +0 -0
  150. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/utils/context.py +0 -0
  151. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/utils/loader.py +0 -0
  152. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/utils/memory.py +0 -0
  153. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/stepaudio2.py +0 -0
  154. {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/utils.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: minicpmo-utils
3
- Version: 0.1.0
3
+ Version: 0.1.2
4
4
  Summary: Unified utilities package for MiniCPM-o: includes cosyvoice + stepaudio2 and extensible utils.
5
5
  Author: MiniCPM-o Utils Maintainers
6
6
  License: Apache-2.0
@@ -14,23 +14,31 @@ Classifier: Programming Language :: Python :: 3.11
14
14
  Classifier: Programming Language :: Python :: 3.12
15
15
  Requires-Python: >=3.10
16
16
  Description-Content-Type: text/markdown
17
- Requires-Dist: torch>=2.3.0
18
- Requires-Dist: torchaudio>=2.3.0
19
- Requires-Dist: transformers>=4.49.0
20
17
  Requires-Dist: numpy
21
- Requires-Dist: hyperpyyaml
22
- Requires-Dist: modelscope
23
- Requires-Dist: openai-whisper
24
- Requires-Dist: tqdm
25
- Requires-Dist: tiktoken
26
- Requires-Dist: inflect
27
- Requires-Dist: omegaconf
28
- Requires-Dist: einops
29
- Requires-Dist: librosa
30
- Requires-Dist: onnxruntime>=1.18.0
31
- Requires-Dist: diffusers
18
+ Requires-Dist: pillow==10.4.0
19
+ Requires-Dist: librosa==0.9.0
20
+ Requires-Dist: decord==0.6.0
21
+ Requires-Dist: moviepy==2.1.2
22
+ Provides-Extra: tts
23
+ Requires-Dist: torch>=2.3.0; extra == "tts"
24
+ Requires-Dist: torchaudio>=2.3.0; extra == "tts"
25
+ Requires-Dist: transformers>=4.49.0; extra == "tts"
26
+ Requires-Dist: hyperpyyaml; extra == "tts"
27
+ Requires-Dist: openai-whisper; extra == "tts"
28
+ Requires-Dist: tqdm; extra == "tts"
29
+ Requires-Dist: tiktoken; extra == "tts"
30
+ Requires-Dist: inflect; extra == "tts"
31
+ Requires-Dist: omegaconf; extra == "tts"
32
+ Requires-Dist: einops; extra == "tts"
33
+ Provides-Extra: streaming
34
+ Requires-Dist: minicpmo-utils[tts]; extra == "streaming"
35
+ Requires-Dist: onnxruntime<=1.21.0,>=1.18.0; extra == "streaming"
36
+ Requires-Dist: onnx; extra == "streaming"
37
+ Requires-Dist: diffusers; extra == "streaming"
32
38
  Provides-Extra: gpu
33
- Requires-Dist: onnxruntime-gpu>=1.18.0; sys_platform == "linux" and extra == "gpu"
39
+ Requires-Dist: onnxruntime-gpu<=1.23.2,>=1.18.0; sys_platform == "linux" and extra == "gpu"
40
+ Provides-Extra: all
41
+ Requires-Dist: minicpmo-utils[gpu,streaming,tts]; extra == "all"
34
42
 
35
43
  ## minicpmo-utils
36
44
 
@@ -38,17 +46,32 @@ Requires-Dist: onnxruntime-gpu>=1.18.0; sys_platform == "linux" and extra == "gp
38
46
 
39
47
  ### 安装方式
40
48
 
41
- - 从源码本地安装(开发态,可编辑):
49
+ - 从源码本地安装(开发态,可编辑,默认只装公共依赖):
42
50
  ```bash
43
51
  cd minicpmo-utils
44
52
  pip install -e .
45
53
  ```
46
54
 
55
+ - 如果只想安装 cosyvoice 相关依赖(TTS):
56
+ ```bash
57
+ pip install -e .[tts]
58
+ ```
59
+
60
+ - 如果只想安装 stepaudio2 / streaming 相关依赖:
61
+ ```bash
62
+ pip install -e .[streaming]
63
+ ```
64
+
65
+ - 同时安装 cosyvoice + stepaudio2 相关依赖:
66
+ ```bash
67
+ pip install -e .[tts,streaming]
68
+ ```
69
+
47
70
  - 构建并安装 wheel(推荐分发):
48
71
  ```bash
49
72
  cd minicpmo-utils
50
73
  python -m build # 生成 dist/*.whl
51
- pip install dist/minicpmo_utils-0.1.0-py3-none-any.whl
74
+ pip install "dist/minicpmo_utils-0.1.2-py3-none-any.whl[tts,streaming]"
52
75
  ```
53
76
 
54
77
  ### 导入方式
@@ -4,17 +4,32 @@
4
4
 
5
5
  ### 安装方式
6
6
 
7
- - 从源码本地安装(开发态,可编辑):
7
+ - 从源码本地安装(开发态,可编辑,默认只装公共依赖):
8
8
  ```bash
9
9
  cd minicpmo-utils
10
10
  pip install -e .
11
11
  ```
12
12
 
13
+ - 如果只想安装 cosyvoice 相关依赖(TTS):
14
+ ```bash
15
+ pip install -e .[tts]
16
+ ```
17
+
18
+ - 如果只想安装 stepaudio2 / streaming 相关依赖:
19
+ ```bash
20
+ pip install -e .[streaming]
21
+ ```
22
+
23
+ - 同时安装 cosyvoice + stepaudio2 相关依赖:
24
+ ```bash
25
+ pip install -e .[tts,streaming]
26
+ ```
27
+
13
28
  - 构建并安装 wheel(推荐分发):
14
29
  ```bash
15
30
  cd minicpmo-utils
16
31
  python -m build # 生成 dist/*.whl
17
- pip install dist/minicpmo_utils-0.1.0-py3-none-any.whl
32
+ pip install "dist/minicpmo_utils-0.1.2-py3-none-any.whl[tts,streaming]"
18
33
  ```
19
34
 
20
35
  ### 导入方式
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
4
4
 
5
5
  [project]
6
6
  name = "minicpmo-utils"
7
- version = "0.1.0"
7
+ version = "0.1.2"
8
8
  description = "Unified utilities package for MiniCPM-o: includes cosyvoice + stepaudio2 and extensible utils."
9
9
  readme = "README.md"
10
10
  requires-python = ">=3.10"
@@ -31,34 +31,43 @@ classifiers = [
31
31
  # - s3tokenizer (来自 S3Tokenizer-main)
32
32
  # - minicpmo (本项目扩展 utils 的统一入口:from minicpmo.utils import ...)
33
33
  dependencies = [
34
- # Core ML frameworks (align to stepaudio2's requirements)
34
+ "numpy",
35
+ "pillow==10.4.0",
36
+ "librosa==0.9.0",
37
+ "decord==0.6.0",
38
+ "moviepy==2.1.2"
39
+ ]
40
+
41
+ [project.optional-dependencies]
42
+ # cosyvoice TTS 相关依赖
43
+ tts = [
35
44
  "torch>=2.3.0",
36
45
  "torchaudio>=2.3.0",
37
46
  "transformers>=4.49.0",
38
-
39
- # Shared / common
40
- "numpy",
41
47
  "hyperpyyaml",
42
-
43
- # cosyvoice side
44
- "modelscope",
45
48
  "openai-whisper",
46
49
  "tqdm",
47
50
  "tiktoken",
48
51
  "inflect",
49
52
  "omegaconf",
50
53
  "einops",
54
+ ]
51
55
 
52
- # stepaudio2 side
53
- "librosa",
54
- "onnxruntime>=1.18.0",
56
+ # stepaudio2 / streaming 相关依赖
57
+ streaming = [
58
+ "minicpmo-utils[tts]", # streaming 依赖 tts
59
+ "onnxruntime>=1.18.0,<=1.21.0",
60
+ "onnx",
55
61
  "diffusers",
56
62
  ]
57
63
 
58
- [project.optional-dependencies]
59
- # Linux GPU onnxruntime can be heavy and environment-specific; keep as an opt-in extra.
64
+ # Linux GPU onnxruntime 可以很重,且与环境强相关,保留为可选 extra
60
65
  gpu = [
61
- "onnxruntime-gpu>=1.18.0; sys_platform == 'linux'",
66
+ "onnxruntime-gpu>=1.18.0,<=1.23.2; sys_platform == 'linux'",
67
+ ]
68
+
69
+ all = [
70
+ "minicpmo-utils[tts,streaming,gpu]",
62
71
  ]
63
72
 
64
73
  [tool.setuptools]
@@ -16,7 +16,6 @@ import time
16
16
  from typing import Generator
17
17
  from tqdm import tqdm
18
18
  from hyperpyyaml import load_hyperpyyaml
19
- from modelscope import snapshot_download
20
19
  import torch
21
20
  from cosyvoice.cli.frontend import CosyVoiceFrontEnd
22
21
  from cosyvoice.cli.model import CosyVoiceModel, CosyVoice2Model
@@ -30,8 +29,6 @@ class CosyVoice:
30
29
  self.instruct = True if '-Instruct' in model_dir else False
31
30
  self.model_dir = model_dir
32
31
  self.fp16 = fp16
33
- if not os.path.exists(model_dir):
34
- model_dir = snapshot_download(model_dir)
35
32
  hyper_yaml_path = '{}/cosyvoice.yaml'.format(model_dir)
36
33
  if not os.path.exists(hyper_yaml_path):
37
34
  raise ValueError('{} not found!'.format(hyper_yaml_path))
@@ -154,8 +151,6 @@ class CosyVoice2(CosyVoice):
154
151
  self.instruct = True if '-Instruct' in model_dir else False
155
152
  self.model_dir = model_dir
156
153
  self.fp16 = fp16
157
- if not os.path.exists(model_dir):
158
- model_dir = snapshot_download(model_dir)
159
154
 
160
155
  if config_path is None:
161
156
  config_path = f'{model_dir}/cosyvoice2.yaml'
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: minicpmo-utils
3
- Version: 0.1.0
3
+ Version: 0.1.2
4
4
  Summary: Unified utilities package for MiniCPM-o: includes cosyvoice + stepaudio2 and extensible utils.
5
5
  Author: MiniCPM-o Utils Maintainers
6
6
  License: Apache-2.0
@@ -14,23 +14,31 @@ Classifier: Programming Language :: Python :: 3.11
14
14
  Classifier: Programming Language :: Python :: 3.12
15
15
  Requires-Python: >=3.10
16
16
  Description-Content-Type: text/markdown
17
- Requires-Dist: torch>=2.3.0
18
- Requires-Dist: torchaudio>=2.3.0
19
- Requires-Dist: transformers>=4.49.0
20
17
  Requires-Dist: numpy
21
- Requires-Dist: hyperpyyaml
22
- Requires-Dist: modelscope
23
- Requires-Dist: openai-whisper
24
- Requires-Dist: tqdm
25
- Requires-Dist: tiktoken
26
- Requires-Dist: inflect
27
- Requires-Dist: omegaconf
28
- Requires-Dist: einops
29
- Requires-Dist: librosa
30
- Requires-Dist: onnxruntime>=1.18.0
31
- Requires-Dist: diffusers
18
+ Requires-Dist: pillow==10.4.0
19
+ Requires-Dist: librosa==0.9.0
20
+ Requires-Dist: decord==0.6.0
21
+ Requires-Dist: moviepy==2.1.2
22
+ Provides-Extra: tts
23
+ Requires-Dist: torch>=2.3.0; extra == "tts"
24
+ Requires-Dist: torchaudio>=2.3.0; extra == "tts"
25
+ Requires-Dist: transformers>=4.49.0; extra == "tts"
26
+ Requires-Dist: hyperpyyaml; extra == "tts"
27
+ Requires-Dist: openai-whisper; extra == "tts"
28
+ Requires-Dist: tqdm; extra == "tts"
29
+ Requires-Dist: tiktoken; extra == "tts"
30
+ Requires-Dist: inflect; extra == "tts"
31
+ Requires-Dist: omegaconf; extra == "tts"
32
+ Requires-Dist: einops; extra == "tts"
33
+ Provides-Extra: streaming
34
+ Requires-Dist: minicpmo-utils[tts]; extra == "streaming"
35
+ Requires-Dist: onnxruntime<=1.21.0,>=1.18.0; extra == "streaming"
36
+ Requires-Dist: onnx; extra == "streaming"
37
+ Requires-Dist: diffusers; extra == "streaming"
32
38
  Provides-Extra: gpu
33
- Requires-Dist: onnxruntime-gpu>=1.18.0; sys_platform == "linux" and extra == "gpu"
39
+ Requires-Dist: onnxruntime-gpu<=1.23.2,>=1.18.0; sys_platform == "linux" and extra == "gpu"
40
+ Provides-Extra: all
41
+ Requires-Dist: minicpmo-utils[gpu,streaming,tts]; extra == "all"
34
42
 
35
43
  ## minicpmo-utils
36
44
 
@@ -38,17 +46,32 @@ Requires-Dist: onnxruntime-gpu>=1.18.0; sys_platform == "linux" and extra == "gp
38
46
 
39
47
  ### 安装方式
40
48
 
41
- - 从源码本地安装(开发态,可编辑):
49
+ - 从源码本地安装(开发态,可编辑,默认只装公共依赖):
42
50
  ```bash
43
51
  cd minicpmo-utils
44
52
  pip install -e .
45
53
  ```
46
54
 
55
+ - 如果只想安装 cosyvoice 相关依赖(TTS):
56
+ ```bash
57
+ pip install -e .[tts]
58
+ ```
59
+
60
+ - 如果只想安装 stepaudio2 / streaming 相关依赖:
61
+ ```bash
62
+ pip install -e .[streaming]
63
+ ```
64
+
65
+ - 同时安装 cosyvoice + stepaudio2 相关依赖:
66
+ ```bash
67
+ pip install -e .[tts,streaming]
68
+ ```
69
+
47
70
  - 构建并安装 wheel(推荐分发):
48
71
  ```bash
49
72
  cd minicpmo-utils
50
73
  python -m build # 生成 dist/*.whl
51
- pip install dist/minicpmo_utils-0.1.0-py3-none-any.whl
74
+ pip install "dist/minicpmo_utils-0.1.2-py3-none-any.whl[tts,streaming]"
52
75
  ```
53
76
 
54
77
  ### 导入方式
@@ -0,0 +1,31 @@
1
+ numpy
2
+ pillow==10.4.0
3
+ librosa==0.9.0
4
+ decord==0.6.0
5
+ moviepy==2.1.2
6
+
7
+ [all]
8
+ minicpmo-utils[gpu,streaming,tts]
9
+
10
+ [gpu]
11
+
12
+ [gpu:sys_platform == "linux"]
13
+ onnxruntime-gpu<=1.23.2,>=1.18.0
14
+
15
+ [streaming]
16
+ minicpmo-utils[tts]
17
+ onnxruntime<=1.21.0,>=1.18.0
18
+ onnx
19
+ diffusers
20
+
21
+ [tts]
22
+ torch>=2.3.0
23
+ torchaudio>=2.3.0
24
+ transformers>=4.49.0
25
+ hyperpyyaml
26
+ openai-whisper
27
+ tqdm
28
+ tiktoken
29
+ inflect
30
+ omegaconf
31
+ einops
@@ -7,7 +7,6 @@ import torchaudio
7
7
  import s3tokenizer
8
8
  import onnxruntime
9
9
  import numpy as np
10
- from copy import deepcopy
11
10
 
12
11
  import torchaudio.compliance.kaldi as kaldi
13
12
  from stepaudio2.flashcosyvoice.modules.hifigan import HiFTGenerator
@@ -1,20 +0,0 @@
1
- torch>=2.3.0
2
- torchaudio>=2.3.0
3
- transformers>=4.49.0
4
- numpy
5
- hyperpyyaml
6
- modelscope
7
- openai-whisper
8
- tqdm
9
- tiktoken
10
- inflect
11
- omegaconf
12
- einops
13
- librosa
14
- onnxruntime>=1.18.0
15
- diffusers
16
-
17
- [gpu]
18
-
19
- [gpu:sys_platform == "linux"]
20
- onnxruntime-gpu>=1.18.0
File without changes