minicpmo-utils 0.1.4__tar.gz → 0.1.6__tar.gz

This diff shows the changes between two publicly available versions of a package that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package versions as they appear in their respective public registries.
Files changed (153)
  1. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/PKG-INFO +25 -6
  2. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/pyproject.toml +31 -8
  3. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/utils/file_utils.py +2 -1
  4. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/minicpmo/__init__.py +0 -10
  5. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/minicpmo_utils.egg-info/PKG-INFO +25 -6
  6. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/minicpmo_utils.egg-info/requires.txt +27 -5
  7. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/README.md +0 -0
  8. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/setup.cfg +0 -0
  9. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/__init__.py +0 -0
  10. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/bin/average_model.py +0 -0
  11. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/bin/export_jit.py +0 -0
  12. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/bin/export_onnx.py +0 -0
  13. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/bin/inference_deprecated.py +0 -0
  14. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/bin/train.py +0 -0
  15. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/cli/__init__.py +0 -0
  16. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/cli/cosyvoice.py +0 -0
  17. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/cli/frontend.py +0 -0
  18. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/cli/model.py +0 -0
  19. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/dataset/__init__.py +0 -0
  20. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/dataset/dataset.py +0 -0
  21. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/dataset/processor.py +0 -0
  22. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/flow/decoder.py +0 -0
  23. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/flow/flow.py +0 -0
  24. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/flow/flow_matching.py +0 -0
  25. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/flow/length_regulator.py +0 -0
  26. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/hifigan/discriminator.py +0 -0
  27. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/hifigan/f0_predictor.py +0 -0
  28. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/hifigan/generator.py +0 -0
  29. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/hifigan/hifigan.py +0 -0
  30. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/llm/llm.py +0 -0
  31. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/tokenizer/assets/multilingual_zh_ja_yue_char_del.tiktoken +0 -0
  32. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/tokenizer/tokenizer.py +0 -0
  33. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/transformer/__init__.py +0 -0
  34. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/transformer/activation.py +0 -0
  35. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/transformer/attention.py +0 -0
  36. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/transformer/convolution.py +0 -0
  37. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/transformer/decoder.py +0 -0
  38. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/transformer/decoder_layer.py +0 -0
  39. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/transformer/embedding.py +0 -0
  40. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/transformer/encoder.py +0 -0
  41. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/transformer/encoder_layer.py +0 -0
  42. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/transformer/label_smoothing_loss.py +0 -0
  43. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/transformer/positionwise_feed_forward.py +0 -0
  44. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/transformer/subsampling.py +0 -0
  45. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/transformer/upsample_encoder.py +0 -0
  46. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/utils/__init__.py +0 -0
  47. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/utils/class_utils.py +0 -0
  48. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/utils/common.py +0 -0
  49. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/utils/executor.py +0 -0
  50. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/utils/frontend_utils.py +0 -0
  51. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/utils/losses.py +0 -0
  52. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/utils/mask.py +0 -0
  53. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/utils/scheduler.py +0 -0
  54. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/utils/train_utils.py +0 -0
  55. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/cosyvoice/vllm/cosyvoice2.py +0 -0
  56. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/matcha/__init__.py +0 -0
  57. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/matcha/app.py +0 -0
  58. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/matcha/cli.py +0 -0
  59. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/matcha/hifigan/__init__.py +0 -0
  60. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/matcha/hifigan/config.py +0 -0
  61. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/matcha/hifigan/denoiser.py +0 -0
  62. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/matcha/hifigan/env.py +0 -0
  63. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/matcha/hifigan/meldataset.py +0 -0
  64. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/matcha/hifigan/models.py +0 -0
  65. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/matcha/hifigan/xutils.py +0 -0
  66. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/matcha/models/__init__.py +0 -0
  67. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/matcha/models/baselightningmodule.py +0 -0
  68. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/matcha/models/components/__init__.py +0 -0
  69. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/matcha/models/components/decoder.py +0 -0
  70. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/matcha/models/components/flow_matching.py +0 -0
  71. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/matcha/models/components/text_encoder.py +0 -0
  72. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/matcha/models/components/transformer.py +0 -0
  73. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/matcha/models/matcha_tts.py +0 -0
  74. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/matcha/onnx/__init__.py +0 -0
  75. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/matcha/onnx/export.py +0 -0
  76. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/matcha/onnx/infer.py +0 -0
  77. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/matcha/text/__init__.py +0 -0
  78. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/matcha/text/cleaners.py +0 -0
  79. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/matcha/text/numbers.py +0 -0
  80. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/matcha/text/symbols.py +0 -0
  81. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/matcha/train.py +0 -0
  82. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/matcha/utils/__init__.py +0 -0
  83. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/matcha/utils/audio.py +0 -0
  84. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/matcha/utils/generate_data_statistics.py +0 -0
  85. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/matcha/utils/instantiators.py +0 -0
  86. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/matcha/utils/logging_utils.py +0 -0
  87. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/matcha/utils/model.py +0 -0
  88. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/matcha/utils/monotonic_align/__init__.py +0 -0
  89. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/matcha/utils/monotonic_align/setup.py +0 -0
  90. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/matcha/utils/pylogger.py +0 -0
  91. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/matcha/utils/rich_utils.py +0 -0
  92. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/matcha/utils/utils.py +0 -0
  93. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/minicpmo/utils.py +0 -0
  94. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/minicpmo/version.py +0 -0
  95. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/minicpmo_utils.egg-info/SOURCES.txt +0 -0
  96. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/minicpmo_utils.egg-info/dependency_links.txt +0 -0
  97. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/minicpmo_utils.egg-info/top_level.txt +0 -0
  98. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/s3tokenizer/__init__.py +0 -0
  99. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/s3tokenizer/assets/BAC009S0764W0121.wav +0 -0
  100. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/s3tokenizer/assets/BAC009S0764W0122.wav +0 -0
  101. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/s3tokenizer/assets/mel_filters.npz +0 -0
  102. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/s3tokenizer/cli.py +0 -0
  103. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/s3tokenizer/model.py +0 -0
  104. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/s3tokenizer/model_v2.py +0 -0
  105. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/s3tokenizer/utils.py +0 -0
  106. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/__init__.py +0 -0
  107. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/cosyvoice2/__init__.py +0 -0
  108. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/cosyvoice2/flow/__init__.py +0 -0
  109. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/cosyvoice2/flow/decoder_dit.py +0 -0
  110. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/cosyvoice2/flow/flow.py +0 -0
  111. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/cosyvoice2/flow/flow_matching.py +0 -0
  112. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/cosyvoice2/transformer/__init__.py +0 -0
  113. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/cosyvoice2/transformer/attention.py +0 -0
  114. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/cosyvoice2/transformer/embedding.py +0 -0
  115. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/cosyvoice2/transformer/encoder_layer.py +0 -0
  116. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/cosyvoice2/transformer/positionwise_feed_forward.py +0 -0
  117. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/cosyvoice2/transformer/subsampling.py +0 -0
  118. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/cosyvoice2/transformer/upsample_encoder_v2.py +0 -0
  119. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/cosyvoice2/utils/__init__.py +0 -0
  120. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/cosyvoice2/utils/class_utils.py +0 -0
  121. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/cosyvoice2/utils/common.py +0 -0
  122. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/cosyvoice2/utils/mask.py +0 -0
  123. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/flashcosyvoice/__init__.py +0 -0
  124. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/flashcosyvoice/cli.py +0 -0
  125. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/flashcosyvoice/config.py +0 -0
  126. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/flashcosyvoice/cosyvoice2.py +0 -0
  127. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/flashcosyvoice/cosyvoice3.py +0 -0
  128. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/flashcosyvoice/engine/__init__.py +0 -0
  129. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/flashcosyvoice/engine/block_manager.py +0 -0
  130. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/flashcosyvoice/engine/llm_engine.py +0 -0
  131. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/flashcosyvoice/engine/model_runner.py +0 -0
  132. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/flashcosyvoice/engine/scheduler.py +0 -0
  133. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/flashcosyvoice/engine/sequence.py +0 -0
  134. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/flashcosyvoice/modules/__init__.py +0 -0
  135. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/flashcosyvoice/modules/flow.py +0 -0
  136. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/flashcosyvoice/modules/flow_components/__init__.py +0 -0
  137. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/flashcosyvoice/modules/flow_components/estimator.py +0 -0
  138. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/flashcosyvoice/modules/flow_components/upsample_encoder.py +0 -0
  139. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/flashcosyvoice/modules/hifigan.py +0 -0
  140. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/flashcosyvoice/modules/hifigan_components/__init__.py +0 -0
  141. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/flashcosyvoice/modules/hifigan_components/layers.py +0 -0
  142. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/flashcosyvoice/modules/qwen2.py +0 -0
  143. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/flashcosyvoice/modules/qwen2_components/__init__.py +0 -0
  144. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/flashcosyvoice/modules/qwen2_components/layers.py +0 -0
  145. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/flashcosyvoice/modules/sampler.py +0 -0
  146. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/flashcosyvoice/utils/__init__.py +0 -0
  147. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/flashcosyvoice/utils/audio.py +0 -0
  148. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/flashcosyvoice/utils/context.py +0 -0
  149. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/flashcosyvoice/utils/loader.py +0 -0
  150. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/flashcosyvoice/utils/memory.py +0 -0
  151. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/stepaudio2.py +0 -0
  152. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/token2wav.py +0 -0
  153. {minicpmo_utils-0.1.4 → minicpmo_utils-0.1.6}/src/stepaudio2/utils.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: minicpmo-utils
3
- Version: 0.1.4
3
+ Version: 0.1.6
4
4
  Summary: Unified utilities package for MiniCPM-o: includes cosyvoice + stepaudio2 and extensible utils.
5
5
  Author: MiniCPM-o Utils Maintainers
6
6
  License: Apache-2.0
@@ -23,23 +23,42 @@ Provides-Extra: tts
23
23
  Requires-Dist: torch>=2.3.0; extra == "tts"
24
24
  Requires-Dist: torchaudio>=2.3.0; extra == "tts"
25
25
  Requires-Dist: transformers>=4.49.0; extra == "tts"
26
+ Requires-Dist: onnxruntime<=1.21.0,>=1.18.0; extra == "tts"
27
+ Requires-Dist: onnx; extra == "tts"
26
28
  Requires-Dist: hyperpyyaml; extra == "tts"
27
29
  Requires-Dist: openai-whisper; extra == "tts"
28
30
  Requires-Dist: tqdm; extra == "tts"
29
31
  Requires-Dist: tiktoken; extra == "tts"
30
32
  Requires-Dist: inflect; extra == "tts"
31
- Requires-Dist: omegaconf; extra == "tts"
32
- Requires-Dist: einops; extra == "tts"
33
+ Requires-Dist: omegaconf>=2.0.6; extra == "tts"
33
34
  Requires-Dist: conformer==0.3.2; extra == "tts"
35
+ Requires-Dist: einops==0.8.1; extra == "tts"
36
+ Requires-Dist: hydra-core; extra == "tts"
37
+ Requires-Dist: lightning==2.2.4; extra == "tts"
38
+ Requires-Dist: rich; extra == "tts"
39
+ Requires-Dist: gdown==5.2.0; extra == "tts"
40
+ Requires-Dist: matplotlib; extra == "tts"
41
+ Requires-Dist: wget; extra == "tts"
42
+ Requires-Dist: pyarrow; extra == "tts"
43
+ Requires-Dist: pyworld; extra == "tts"
44
+ Requires-Dist: scipy; extra == "tts"
45
+ Requires-Dist: pyyaml; extra == "tts"
46
+ Requires-Dist: regex; extra == "tts"
47
+ Requires-Dist: soundfile; extra == "tts"
34
48
  Provides-Extra: streaming
35
49
  Requires-Dist: minicpmo-utils[tts]; extra == "streaming"
36
- Requires-Dist: onnxruntime<=1.21.0,>=1.18.0; extra == "streaming"
37
- Requires-Dist: onnx; extra == "streaming"
38
50
  Requires-Dist: diffusers; extra == "streaming"
51
+ Provides-Extra: streaming-flash
52
+ Requires-Dist: minicpmo-utils[streaming]; extra == "streaming-flash"
53
+ Requires-Dist: flash-attn>=2.6.0; sys_platform == "linux" and extra == "streaming-flash"
54
+ Requires-Dist: triton>=2.3.0; sys_platform == "linux" and extra == "streaming-flash"
55
+ Requires-Dist: safetensors; extra == "streaming-flash"
56
+ Requires-Dist: pynvml; extra == "streaming-flash"
57
+ Requires-Dist: xxhash; extra == "streaming-flash"
39
58
  Provides-Extra: gpu
40
59
  Requires-Dist: onnxruntime-gpu<=1.23.2,>=1.18.0; sys_platform == "linux" and extra == "gpu"
41
60
  Provides-Extra: all
42
- Requires-Dist: minicpmo-utils[gpu,streaming,tts]; extra == "all"
61
+ Requires-Dist: minicpmo-utils[gpu,streaming,streaming-flash,tts]; extra == "all"
43
62
 
44
63
  ## minicpmo-utils
45
64
 
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
4
4
 
5
5
  [project]
6
6
  name = "minicpmo-utils"
7
- version = "0.1.4"
7
+ version = "0.1.6"
8
8
  description = "Unified utilities package for MiniCPM-o: includes cosyvoice + stepaudio2 and extensible utils."
9
9
  readme = "README.md"
10
10
  requires-python = ">=3.10"
@@ -35,7 +35,7 @@ dependencies = [
35
35
  "pillow==10.4.0",
36
36
  "librosa==0.9.0",
37
37
  "decord==0.6.0",
38
- "moviepy==2.1.2"
38
+ "moviepy==2.1.2",
39
39
  ]
40
40
 
41
41
  [project.optional-dependencies]
@@ -44,31 +44,54 @@ tts = [
44
44
  "torch>=2.3.0",
45
45
  "torchaudio>=2.3.0",
46
46
  "transformers>=4.49.0",
47
+ "onnxruntime>=1.18.0,<=1.21.0",
48
+ "onnx",
47
49
  "hyperpyyaml",
48
50
  "openai-whisper",
49
51
  "tqdm",
50
52
  "tiktoken",
51
53
  "inflect",
52
- "omegaconf",
53
- "einops",
54
+ "omegaconf>=2.0.6",
54
55
  "conformer==0.3.2",
56
+ "einops==0.8.1",
57
+ "hydra-core",
58
+ "lightning==2.2.4",
59
+ "rich",
60
+ "gdown==5.2.0",
61
+ "matplotlib",
62
+ "wget",
63
+ "pyarrow",
64
+ "pyworld",
65
+ # 新增依赖
66
+ "scipy",
67
+ "pyyaml",
68
+ "regex",
69
+ "soundfile",
55
70
  ]
56
71
 
57
- # stepaudio2 / streaming 相关依赖
72
+ # stepaudio2 基础依赖(token2wav 等)
58
73
  streaming = [
59
74
  "minicpmo-utils[tts]", # streaming 依赖 tts
60
- "onnxruntime>=1.18.0,<=1.21.0",
61
- "onnx",
62
75
  "diffusers",
63
76
  ]
64
77
 
78
+ # stepaudio2 Flash 推理引擎依赖(flashcosyvoice.engine 模块需要)
79
+ streaming-flash = [
80
+ "minicpmo-utils[streaming]",
81
+ "flash-attn>=2.6.0; sys_platform == 'linux'",
82
+ "triton>=2.3.0; sys_platform == 'linux'",
83
+ "safetensors",
84
+ "pynvml",
85
+ "xxhash",
86
+ ]
87
+
65
88
  # Linux GPU onnxruntime 可以很重,且与环境强相关,保留为可选 extra
66
89
  gpu = [
67
90
  "onnxruntime-gpu>=1.18.0,<=1.23.2; sys_platform == 'linux'",
68
91
  ]
69
92
 
70
93
  all = [
71
- "minicpmo-utils[tts,streaming,gpu]",
94
+ "minicpmo-utils[tts,streaming,streaming-flash,gpu]",
72
95
  ]
73
96
 
74
97
  [tool.setuptools]
@@ -20,7 +20,8 @@ import torch
20
20
  import torchaudio
21
21
  import logging
22
22
  logging.getLogger('matplotlib').setLevel(logging.WARNING)
23
- logging.basicConfig(level=logging.DEBUG,
23
+ logging.getLogger('numba').setLevel(logging.WARNING)
24
+ logging.basicConfig(level=logging.INFO,
24
25
  format='%(asctime)s %(levelname)s %(message)s')
25
26
 
26
27
 
@@ -12,13 +12,3 @@
12
12
  """
13
13
 
14
14
  from .version import __version__
15
-
16
- # Eager re-exports to allow:
17
- # from minicpmo import cosyvoice, stepaudio2, matcha
18
- # 而不需要懒加载。
19
- # import cosyvoice as cosyvoice
20
- # import stepaudio2 as stepaudio2
21
- # import matcha as matcha
22
-
23
- # __all__ = ["__version__", "cosyvoice", "stepaudio2", "matcha"]
24
-
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: minicpmo-utils
3
- Version: 0.1.4
3
+ Version: 0.1.6
4
4
  Summary: Unified utilities package for MiniCPM-o: includes cosyvoice + stepaudio2 and extensible utils.
5
5
  Author: MiniCPM-o Utils Maintainers
6
6
  License: Apache-2.0
@@ -23,23 +23,42 @@ Provides-Extra: tts
23
23
  Requires-Dist: torch>=2.3.0; extra == "tts"
24
24
  Requires-Dist: torchaudio>=2.3.0; extra == "tts"
25
25
  Requires-Dist: transformers>=4.49.0; extra == "tts"
26
+ Requires-Dist: onnxruntime<=1.21.0,>=1.18.0; extra == "tts"
27
+ Requires-Dist: onnx; extra == "tts"
26
28
  Requires-Dist: hyperpyyaml; extra == "tts"
27
29
  Requires-Dist: openai-whisper; extra == "tts"
28
30
  Requires-Dist: tqdm; extra == "tts"
29
31
  Requires-Dist: tiktoken; extra == "tts"
30
32
  Requires-Dist: inflect; extra == "tts"
31
- Requires-Dist: omegaconf; extra == "tts"
32
- Requires-Dist: einops; extra == "tts"
33
+ Requires-Dist: omegaconf>=2.0.6; extra == "tts"
33
34
  Requires-Dist: conformer==0.3.2; extra == "tts"
35
+ Requires-Dist: einops==0.8.1; extra == "tts"
36
+ Requires-Dist: hydra-core; extra == "tts"
37
+ Requires-Dist: lightning==2.2.4; extra == "tts"
38
+ Requires-Dist: rich; extra == "tts"
39
+ Requires-Dist: gdown==5.2.0; extra == "tts"
40
+ Requires-Dist: matplotlib; extra == "tts"
41
+ Requires-Dist: wget; extra == "tts"
42
+ Requires-Dist: pyarrow; extra == "tts"
43
+ Requires-Dist: pyworld; extra == "tts"
44
+ Requires-Dist: scipy; extra == "tts"
45
+ Requires-Dist: pyyaml; extra == "tts"
46
+ Requires-Dist: regex; extra == "tts"
47
+ Requires-Dist: soundfile; extra == "tts"
34
48
  Provides-Extra: streaming
35
49
  Requires-Dist: minicpmo-utils[tts]; extra == "streaming"
36
- Requires-Dist: onnxruntime<=1.21.0,>=1.18.0; extra == "streaming"
37
- Requires-Dist: onnx; extra == "streaming"
38
50
  Requires-Dist: diffusers; extra == "streaming"
51
+ Provides-Extra: streaming-flash
52
+ Requires-Dist: minicpmo-utils[streaming]; extra == "streaming-flash"
53
+ Requires-Dist: flash-attn>=2.6.0; sys_platform == "linux" and extra == "streaming-flash"
54
+ Requires-Dist: triton>=2.3.0; sys_platform == "linux" and extra == "streaming-flash"
55
+ Requires-Dist: safetensors; extra == "streaming-flash"
56
+ Requires-Dist: pynvml; extra == "streaming-flash"
57
+ Requires-Dist: xxhash; extra == "streaming-flash"
39
58
  Provides-Extra: gpu
40
59
  Requires-Dist: onnxruntime-gpu<=1.23.2,>=1.18.0; sys_platform == "linux" and extra == "gpu"
41
60
  Provides-Extra: all
42
- Requires-Dist: minicpmo-utils[gpu,streaming,tts]; extra == "all"
61
+ Requires-Dist: minicpmo-utils[gpu,streaming,streaming-flash,tts]; extra == "all"
43
62
 
44
63
  ## minicpmo-utils
45
64
 
@@ -5,7 +5,7 @@ decord==0.6.0
5
5
  moviepy==2.1.2
6
6
 
7
7
  [all]
8
- minicpmo-utils[gpu,streaming,tts]
8
+ minicpmo-utils[gpu,streaming,streaming-flash,tts]
9
9
 
10
10
  [gpu]
11
11
 
@@ -14,19 +14,41 @@ onnxruntime-gpu<=1.23.2,>=1.18.0
14
14
 
15
15
  [streaming]
16
16
  minicpmo-utils[tts]
17
- onnxruntime<=1.21.0,>=1.18.0
18
- onnx
19
17
  diffusers
20
18
 
19
+ [streaming-flash]
20
+ minicpmo-utils[streaming]
21
+ safetensors
22
+ pynvml
23
+ xxhash
24
+
25
+ [streaming-flash:sys_platform == "linux"]
26
+ flash-attn>=2.6.0
27
+ triton>=2.3.0
28
+
21
29
  [tts]
22
30
  torch>=2.3.0
23
31
  torchaudio>=2.3.0
24
32
  transformers>=4.49.0
33
+ onnxruntime<=1.21.0,>=1.18.0
34
+ onnx
25
35
  hyperpyyaml
26
36
  openai-whisper
27
37
  tqdm
28
38
  tiktoken
29
39
  inflect
30
- omegaconf
31
- einops
40
+ omegaconf>=2.0.6
32
41
  conformer==0.3.2
42
+ einops==0.8.1
43
+ hydra-core
44
+ lightning==2.2.4
45
+ rich
46
+ gdown==5.2.0
47
+ matplotlib
48
+ wget
49
+ pyarrow
50
+ pyworld
51
+ scipy
52
+ pyyaml
53
+ regex
54
+ soundfile
File without changes
File without changes