minicpmo-utils 0.1.0__tar.gz → 0.1.2__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/PKG-INFO +41 -18
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/README.md +17 -2
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/pyproject.toml +23 -14
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/cli/cosyvoice.py +0 -5
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/minicpmo_utils.egg-info/PKG-INFO +41 -18
- minicpmo_utils-0.1.2/src/minicpmo_utils.egg-info/requires.txt +31 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/token2wav.py +0 -1
- minicpmo_utils-0.1.0/src/minicpmo_utils.egg-info/requires.txt +0 -20
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/setup.cfg +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/__init__.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/bin/average_model.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/bin/export_jit.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/bin/export_onnx.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/bin/inference_deprecated.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/bin/train.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/cli/__init__.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/cli/frontend.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/cli/model.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/dataset/__init__.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/dataset/dataset.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/dataset/processor.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/flow/decoder.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/flow/flow.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/flow/flow_matching.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/flow/length_regulator.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/hifigan/discriminator.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/hifigan/f0_predictor.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/hifigan/generator.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/hifigan/hifigan.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/llm/llm.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/tokenizer/assets/multilingual_zh_ja_yue_char_del.tiktoken +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/tokenizer/tokenizer.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/transformer/__init__.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/transformer/activation.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/transformer/attention.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/transformer/convolution.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/transformer/decoder.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/transformer/decoder_layer.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/transformer/embedding.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/transformer/encoder.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/transformer/encoder_layer.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/transformer/label_smoothing_loss.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/transformer/positionwise_feed_forward.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/transformer/subsampling.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/transformer/upsample_encoder.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/utils/__init__.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/utils/class_utils.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/utils/common.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/utils/executor.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/utils/file_utils.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/utils/frontend_utils.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/utils/losses.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/utils/mask.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/utils/scheduler.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/utils/train_utils.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/vllm/cosyvoice2.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/__init__.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/app.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/cli.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/hifigan/__init__.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/hifigan/config.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/hifigan/denoiser.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/hifigan/env.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/hifigan/meldataset.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/hifigan/models.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/hifigan/xutils.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/models/__init__.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/models/baselightningmodule.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/models/components/__init__.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/models/components/decoder.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/models/components/flow_matching.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/models/components/text_encoder.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/models/components/transformer.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/models/matcha_tts.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/onnx/__init__.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/onnx/export.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/onnx/infer.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/text/__init__.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/text/cleaners.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/text/numbers.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/text/symbols.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/train.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/utils/__init__.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/utils/audio.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/utils/generate_data_statistics.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/utils/instantiators.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/utils/logging_utils.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/utils/model.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/utils/monotonic_align/__init__.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/utils/monotonic_align/setup.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/utils/pylogger.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/utils/rich_utils.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/matcha/utils/utils.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/minicpmo/__init__.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/minicpmo/utils.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/minicpmo/version.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/minicpmo_utils.egg-info/SOURCES.txt +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/minicpmo_utils.egg-info/dependency_links.txt +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/minicpmo_utils.egg-info/top_level.txt +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/s3tokenizer/__init__.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/s3tokenizer/assets/BAC009S0764W0121.wav +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/s3tokenizer/assets/BAC009S0764W0122.wav +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/s3tokenizer/assets/mel_filters.npz +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/s3tokenizer/cli.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/s3tokenizer/model.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/s3tokenizer/model_v2.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/s3tokenizer/utils.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/__init__.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/cosyvoice2/__init__.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/cosyvoice2/flow/__init__.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/cosyvoice2/flow/decoder_dit.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/cosyvoice2/flow/flow.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/cosyvoice2/flow/flow_matching.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/cosyvoice2/transformer/__init__.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/cosyvoice2/transformer/attention.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/cosyvoice2/transformer/embedding.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/cosyvoice2/transformer/encoder_layer.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/cosyvoice2/transformer/positionwise_feed_forward.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/cosyvoice2/transformer/subsampling.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/cosyvoice2/transformer/upsample_encoder_v2.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/cosyvoice2/utils/__init__.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/cosyvoice2/utils/class_utils.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/cosyvoice2/utils/common.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/cosyvoice2/utils/mask.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/__init__.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/cli.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/config.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/cosyvoice2.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/cosyvoice3.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/engine/__init__.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/engine/block_manager.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/engine/llm_engine.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/engine/model_runner.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/engine/scheduler.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/engine/sequence.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/modules/__init__.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/modules/flow.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/modules/flow_components/__init__.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/modules/flow_components/estimator.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/modules/flow_components/upsample_encoder.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/modules/hifigan.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/modules/hifigan_components/__init__.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/modules/hifigan_components/layers.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/modules/qwen2.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/modules/qwen2_components/__init__.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/modules/qwen2_components/layers.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/modules/sampler.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/utils/__init__.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/utils/audio.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/utils/context.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/utils/loader.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/utils/memory.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/stepaudio2.py +0 -0
- {minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/utils.py +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: minicpmo-utils
|
|
3
|
-
Version: 0.1.0
|
|
3
|
+
Version: 0.1.2
|
|
4
4
|
Summary: Unified utilities package for MiniCPM-o: includes cosyvoice + stepaudio2 and extensible utils.
|
|
5
5
|
Author: MiniCPM-o Utils Maintainers
|
|
6
6
|
License: Apache-2.0
|
|
@@ -14,23 +14,31 @@ Classifier: Programming Language :: Python :: 3.11
|
|
|
14
14
|
Classifier: Programming Language :: Python :: 3.12
|
|
15
15
|
Requires-Python: >=3.10
|
|
16
16
|
Description-Content-Type: text/markdown
|
|
17
|
-
Requires-Dist: torch>=2.3.0
|
|
18
|
-
Requires-Dist: torchaudio>=2.3.0
|
|
19
|
-
Requires-Dist: transformers>=4.49.0
|
|
20
17
|
Requires-Dist: numpy
|
|
21
|
-
Requires-Dist: hyperpyyaml
|
|
22
|
-
Requires-Dist: modelscope
|
|
23
|
-
Requires-Dist: openai-whisper
|
|
24
|
-
Requires-Dist: tqdm
|
|
25
|
-
|
|
26
|
-
Requires-Dist: inflect
|
|
27
|
-
Requires-Dist: omegaconf
|
|
28
|
-
Requires-Dist: einops
|
|
29
|
-
Requires-Dist: librosa
|
|
30
|
-
Requires-Dist: onnxruntime>=1.18.0
|
|
31
|
-
Requires-Dist: diffusers
|
|
18
|
+
Requires-Dist: pillow==10.4.0
|
|
19
|
+
Requires-Dist: librosa==0.9.0
|
|
20
|
+
Requires-Dist: decord==0.6.0
|
|
21
|
+
Requires-Dist: moviepy==2.1.2
|
|
22
|
+
Provides-Extra: tts
|
|
23
|
+
Requires-Dist: torch>=2.3.0; extra == "tts"
|
|
24
|
+
Requires-Dist: torchaudio>=2.3.0; extra == "tts"
|
|
25
|
+
Requires-Dist: transformers>=4.49.0; extra == "tts"
|
|
26
|
+
Requires-Dist: hyperpyyaml; extra == "tts"
|
|
27
|
+
Requires-Dist: openai-whisper; extra == "tts"
|
|
28
|
+
Requires-Dist: tqdm; extra == "tts"
|
|
29
|
+
Requires-Dist: tiktoken; extra == "tts"
|
|
30
|
+
Requires-Dist: inflect; extra == "tts"
|
|
31
|
+
Requires-Dist: omegaconf; extra == "tts"
|
|
32
|
+
Requires-Dist: einops; extra == "tts"
|
|
33
|
+
Provides-Extra: streaming
|
|
34
|
+
Requires-Dist: minicpmo-utils[tts]; extra == "streaming"
|
|
35
|
+
Requires-Dist: onnxruntime<=1.21.0,>=1.18.0; extra == "streaming"
|
|
36
|
+
Requires-Dist: onnx; extra == "streaming"
|
|
37
|
+
Requires-Dist: diffusers; extra == "streaming"
|
|
32
38
|
Provides-Extra: gpu
|
|
33
|
-
Requires-Dist: onnxruntime-gpu>=1.18.0; sys_platform == "linux" and extra == "gpu"
|
|
39
|
+
Requires-Dist: onnxruntime-gpu<=1.23.2,>=1.18.0; sys_platform == "linux" and extra == "gpu"
|
|
40
|
+
Provides-Extra: all
|
|
41
|
+
Requires-Dist: minicpmo-utils[gpu,streaming,tts]; extra == "all"
|
|
34
42
|
|
|
35
43
|
## minicpmo-utils
|
|
36
44
|
|
|
@@ -38,17 +46,32 @@ Requires-Dist: onnxruntime-gpu>=1.18.0; sys_platform == "linux" and extra == "gp
|
|
|
38
46
|
|
|
39
47
|
### 安装方式
|
|
40
48
|
|
|
41
|
-
-
|
|
49
|
+
- 从源码本地安装(开发态,可编辑,默认只装公共依赖):
|
|
42
50
|
```bash
|
|
43
51
|
cd minicpmo-utils
|
|
44
52
|
pip install -e .
|
|
45
53
|
```
|
|
46
54
|
|
|
55
|
+
- 如果只想安装 cosyvoice 相关依赖(TTS):
|
|
56
|
+
```bash
|
|
57
|
+
pip install -e .[tts]
|
|
58
|
+
```
|
|
59
|
+
|
|
60
|
+
- 如果只想安装 stepaudio2 / streaming 相关依赖:
|
|
61
|
+
```bash
|
|
62
|
+
pip install -e .[streaming]
|
|
63
|
+
```
|
|
64
|
+
|
|
65
|
+
- 同时安装 cosyvoice + stepaudio2 相关依赖:
|
|
66
|
+
```bash
|
|
67
|
+
pip install -e .[tts,streaming]
|
|
68
|
+
```
|
|
69
|
+
|
|
47
70
|
- 构建并安装 wheel(推荐分发):
|
|
48
71
|
```bash
|
|
49
72
|
cd minicpmo-utils
|
|
50
73
|
python -m build # 生成 dist/*.whl
|
|
51
|
-
pip install dist/minicpmo_utils-0.1.0-py3-none-any.whl
|
|
74
|
+
pip install \"dist/minicpmo_utils-0.1.0-py3-none-any.whl[tts,streaming]\"
|
|
52
75
|
```
|
|
53
76
|
|
|
54
77
|
### 导入方式
|
|
@@ -4,17 +4,32 @@
|
|
|
4
4
|
|
|
5
5
|
### 安装方式
|
|
6
6
|
|
|
7
|
-
-
|
|
7
|
+
- 从源码本地安装(开发态,可编辑,默认只装公共依赖):
|
|
8
8
|
```bash
|
|
9
9
|
cd minicpmo-utils
|
|
10
10
|
pip install -e .
|
|
11
11
|
```
|
|
12
12
|
|
|
13
|
+
- 如果只想安装 cosyvoice 相关依赖(TTS):
|
|
14
|
+
```bash
|
|
15
|
+
pip install -e .[tts]
|
|
16
|
+
```
|
|
17
|
+
|
|
18
|
+
- 如果只想安装 stepaudio2 / streaming 相关依赖:
|
|
19
|
+
```bash
|
|
20
|
+
pip install -e .[streaming]
|
|
21
|
+
```
|
|
22
|
+
|
|
23
|
+
- 同时安装 cosyvoice + stepaudio2 相关依赖:
|
|
24
|
+
```bash
|
|
25
|
+
pip install -e .[tts,streaming]
|
|
26
|
+
```
|
|
27
|
+
|
|
13
28
|
- 构建并安装 wheel(推荐分发):
|
|
14
29
|
```bash
|
|
15
30
|
cd minicpmo-utils
|
|
16
31
|
python -m build # 生成 dist/*.whl
|
|
17
|
-
pip install dist/minicpmo_utils-0.1.0-py3-none-any.whl
|
|
32
|
+
pip install \"dist/minicpmo_utils-0.1.0-py3-none-any.whl[tts,streaming]\"
|
|
18
33
|
```
|
|
19
34
|
|
|
20
35
|
### 导入方式
|
|
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
|
|
|
4
4
|
|
|
5
5
|
[project]
|
|
6
6
|
name = "minicpmo-utils"
|
|
7
|
-
version = "0.1.0"
|
|
7
|
+
version = "0.1.2"
|
|
8
8
|
description = "Unified utilities package for MiniCPM-o: includes cosyvoice + stepaudio2 and extensible utils."
|
|
9
9
|
readme = "README.md"
|
|
10
10
|
requires-python = ">=3.10"
|
|
@@ -31,34 +31,43 @@ classifiers = [
|
|
|
31
31
|
# - s3tokenizer (来自 S3Tokenizer-main)
|
|
32
32
|
# - minicpmo (本项目扩展 utils 的统一入口:from minicpmo.utils import ...)
|
|
33
33
|
dependencies = [
|
|
34
|
-
|
|
34
|
+
"numpy",
|
|
35
|
+
"pillow==10.4.0",
|
|
36
|
+
"librosa==0.9.0",
|
|
37
|
+
"decord==0.6.0",
|
|
38
|
+
"moviepy==2.1.2"
|
|
39
|
+
]
|
|
40
|
+
|
|
41
|
+
[project.optional-dependencies]
|
|
42
|
+
# cosyvoice TTS 相关依赖
|
|
43
|
+
tts = [
|
|
35
44
|
"torch>=2.3.0",
|
|
36
45
|
"torchaudio>=2.3.0",
|
|
37
46
|
"transformers>=4.49.0",
|
|
38
|
-
|
|
39
|
-
# Shared / common
|
|
40
|
-
"numpy",
|
|
41
47
|
"hyperpyyaml",
|
|
42
|
-
|
|
43
|
-
# cosyvoice side
|
|
44
|
-
"modelscope",
|
|
45
48
|
"openai-whisper",
|
|
46
49
|
"tqdm",
|
|
47
50
|
"tiktoken",
|
|
48
51
|
"inflect",
|
|
49
52
|
"omegaconf",
|
|
50
53
|
"einops",
|
|
54
|
+
]
|
|
51
55
|
|
|
52
|
-
|
|
53
|
-
|
|
54
|
-
"
|
|
56
|
+
# stepaudio2 / streaming 相关依赖
|
|
57
|
+
streaming = [
|
|
58
|
+
"minicpmo-utils[tts]", # streaming 依赖 tts
|
|
59
|
+
"onnxruntime>=1.18.0,<=1.21.0",
|
|
60
|
+
"onnx",
|
|
55
61
|
"diffusers",
|
|
56
62
|
]
|
|
57
63
|
|
|
58
|
-
|
|
59
|
-
# Linux GPU onnxruntime can be heavy and environment-specific; keep as an opt-in extra.
|
|
64
|
+
# Linux GPU onnxruntime 可以很重,且与环境强相关,保留为可选 extra
|
|
60
65
|
gpu = [
|
|
61
|
-
"onnxruntime-gpu>=1.18.0; sys_platform == 'linux'",
|
|
66
|
+
"onnxruntime-gpu>=1.18.0,<=1.23.2; sys_platform == 'linux'",
|
|
67
|
+
]
|
|
68
|
+
|
|
69
|
+
all = [
|
|
70
|
+
"minicpmo-utils[tts,streaming,gpu]",
|
|
62
71
|
]
|
|
63
72
|
|
|
64
73
|
[tool.setuptools]
|
|
@@ -16,7 +16,6 @@ import time
|
|
|
16
16
|
from typing import Generator
|
|
17
17
|
from tqdm import tqdm
|
|
18
18
|
from hyperpyyaml import load_hyperpyyaml
|
|
19
|
-
from modelscope import snapshot_download
|
|
20
19
|
import torch
|
|
21
20
|
from cosyvoice.cli.frontend import CosyVoiceFrontEnd
|
|
22
21
|
from cosyvoice.cli.model import CosyVoiceModel, CosyVoice2Model
|
|
@@ -30,8 +29,6 @@ class CosyVoice:
|
|
|
30
29
|
self.instruct = True if '-Instruct' in model_dir else False
|
|
31
30
|
self.model_dir = model_dir
|
|
32
31
|
self.fp16 = fp16
|
|
33
|
-
if not os.path.exists(model_dir):
|
|
34
|
-
model_dir = snapshot_download(model_dir)
|
|
35
32
|
hyper_yaml_path = '{}/cosyvoice.yaml'.format(model_dir)
|
|
36
33
|
if not os.path.exists(hyper_yaml_path):
|
|
37
34
|
raise ValueError('{} not found!'.format(hyper_yaml_path))
|
|
@@ -154,8 +151,6 @@ class CosyVoice2(CosyVoice):
|
|
|
154
151
|
self.instruct = True if '-Instruct' in model_dir else False
|
|
155
152
|
self.model_dir = model_dir
|
|
156
153
|
self.fp16 = fp16
|
|
157
|
-
if not os.path.exists(model_dir):
|
|
158
|
-
model_dir = snapshot_download(model_dir)
|
|
159
154
|
|
|
160
155
|
if config_path is None:
|
|
161
156
|
config_path = f'{model_dir}/cosyvoice2.yaml'
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: minicpmo-utils
|
|
3
|
-
Version: 0.1.0
|
|
3
|
+
Version: 0.1.2
|
|
4
4
|
Summary: Unified utilities package for MiniCPM-o: includes cosyvoice + stepaudio2 and extensible utils.
|
|
5
5
|
Author: MiniCPM-o Utils Maintainers
|
|
6
6
|
License: Apache-2.0
|
|
@@ -14,23 +14,31 @@ Classifier: Programming Language :: Python :: 3.11
|
|
|
14
14
|
Classifier: Programming Language :: Python :: 3.12
|
|
15
15
|
Requires-Python: >=3.10
|
|
16
16
|
Description-Content-Type: text/markdown
|
|
17
|
-
Requires-Dist: torch>=2.3.0
|
|
18
|
-
Requires-Dist: torchaudio>=2.3.0
|
|
19
|
-
Requires-Dist: transformers>=4.49.0
|
|
20
17
|
Requires-Dist: numpy
|
|
21
|
-
Requires-Dist: hyperpyyaml
|
|
22
|
-
Requires-Dist: modelscope
|
|
23
|
-
Requires-Dist: openai-whisper
|
|
24
|
-
Requires-Dist: tqdm
|
|
25
|
-
|
|
26
|
-
Requires-Dist: inflect
|
|
27
|
-
Requires-Dist: omegaconf
|
|
28
|
-
Requires-Dist: einops
|
|
29
|
-
Requires-Dist: librosa
|
|
30
|
-
Requires-Dist: onnxruntime>=1.18.0
|
|
31
|
-
Requires-Dist: diffusers
|
|
18
|
+
Requires-Dist: pillow==10.4.0
|
|
19
|
+
Requires-Dist: librosa==0.9.0
|
|
20
|
+
Requires-Dist: decord==0.6.0
|
|
21
|
+
Requires-Dist: moviepy==2.1.2
|
|
22
|
+
Provides-Extra: tts
|
|
23
|
+
Requires-Dist: torch>=2.3.0; extra == "tts"
|
|
24
|
+
Requires-Dist: torchaudio>=2.3.0; extra == "tts"
|
|
25
|
+
Requires-Dist: transformers>=4.49.0; extra == "tts"
|
|
26
|
+
Requires-Dist: hyperpyyaml; extra == "tts"
|
|
27
|
+
Requires-Dist: openai-whisper; extra == "tts"
|
|
28
|
+
Requires-Dist: tqdm; extra == "tts"
|
|
29
|
+
Requires-Dist: tiktoken; extra == "tts"
|
|
30
|
+
Requires-Dist: inflect; extra == "tts"
|
|
31
|
+
Requires-Dist: omegaconf; extra == "tts"
|
|
32
|
+
Requires-Dist: einops; extra == "tts"
|
|
33
|
+
Provides-Extra: streaming
|
|
34
|
+
Requires-Dist: minicpmo-utils[tts]; extra == "streaming"
|
|
35
|
+
Requires-Dist: onnxruntime<=1.21.0,>=1.18.0; extra == "streaming"
|
|
36
|
+
Requires-Dist: onnx; extra == "streaming"
|
|
37
|
+
Requires-Dist: diffusers; extra == "streaming"
|
|
32
38
|
Provides-Extra: gpu
|
|
33
|
-
Requires-Dist: onnxruntime-gpu>=1.18.0; sys_platform == "linux" and extra == "gpu"
|
|
39
|
+
Requires-Dist: onnxruntime-gpu<=1.23.2,>=1.18.0; sys_platform == "linux" and extra == "gpu"
|
|
40
|
+
Provides-Extra: all
|
|
41
|
+
Requires-Dist: minicpmo-utils[gpu,streaming,tts]; extra == "all"
|
|
34
42
|
|
|
35
43
|
## minicpmo-utils
|
|
36
44
|
|
|
@@ -38,17 +46,32 @@ Requires-Dist: onnxruntime-gpu>=1.18.0; sys_platform == "linux" and extra == "gp
|
|
|
38
46
|
|
|
39
47
|
### 安装方式
|
|
40
48
|
|
|
41
|
-
-
|
|
49
|
+
- 从源码本地安装(开发态,可编辑,默认只装公共依赖):
|
|
42
50
|
```bash
|
|
43
51
|
cd minicpmo-utils
|
|
44
52
|
pip install -e .
|
|
45
53
|
```
|
|
46
54
|
|
|
55
|
+
- 如果只想安装 cosyvoice 相关依赖(TTS):
|
|
56
|
+
```bash
|
|
57
|
+
pip install -e .[tts]
|
|
58
|
+
```
|
|
59
|
+
|
|
60
|
+
- 如果只想安装 stepaudio2 / streaming 相关依赖:
|
|
61
|
+
```bash
|
|
62
|
+
pip install -e .[streaming]
|
|
63
|
+
```
|
|
64
|
+
|
|
65
|
+
- 同时安装 cosyvoice + stepaudio2 相关依赖:
|
|
66
|
+
```bash
|
|
67
|
+
pip install -e .[tts,streaming]
|
|
68
|
+
```
|
|
69
|
+
|
|
47
70
|
- 构建并安装 wheel(推荐分发):
|
|
48
71
|
```bash
|
|
49
72
|
cd minicpmo-utils
|
|
50
73
|
python -m build # 生成 dist/*.whl
|
|
51
|
-
pip install dist/minicpmo_utils-0.1.0-py3-none-any.whl
|
|
74
|
+
pip install \"dist/minicpmo_utils-0.1.0-py3-none-any.whl[tts,streaming]\"
|
|
52
75
|
```
|
|
53
76
|
|
|
54
77
|
### 导入方式
|
|
@@ -0,0 +1,31 @@
|
|
|
1
|
+
numpy
|
|
2
|
+
pillow==10.4.0
|
|
3
|
+
librosa==0.9.0
|
|
4
|
+
decord==0.6.0
|
|
5
|
+
moviepy==2.1.2
|
|
6
|
+
|
|
7
|
+
[all]
|
|
8
|
+
minicpmo-utils[gpu,streaming,tts]
|
|
9
|
+
|
|
10
|
+
[gpu]
|
|
11
|
+
|
|
12
|
+
[gpu:sys_platform == "linux"]
|
|
13
|
+
onnxruntime-gpu<=1.23.2,>=1.18.0
|
|
14
|
+
|
|
15
|
+
[streaming]
|
|
16
|
+
minicpmo-utils[tts]
|
|
17
|
+
onnxruntime<=1.21.0,>=1.18.0
|
|
18
|
+
onnx
|
|
19
|
+
diffusers
|
|
20
|
+
|
|
21
|
+
[tts]
|
|
22
|
+
torch>=2.3.0
|
|
23
|
+
torchaudio>=2.3.0
|
|
24
|
+
transformers>=4.49.0
|
|
25
|
+
hyperpyyaml
|
|
26
|
+
openai-whisper
|
|
27
|
+
tqdm
|
|
28
|
+
tiktoken
|
|
29
|
+
inflect
|
|
30
|
+
omegaconf
|
|
31
|
+
einops
|
|
@@ -1,20 +0,0 @@
|
|
|
1
|
-
torch>=2.3.0
|
|
2
|
-
torchaudio>=2.3.0
|
|
3
|
-
transformers>=4.49.0
|
|
4
|
-
numpy
|
|
5
|
-
hyperpyyaml
|
|
6
|
-
modelscope
|
|
7
|
-
openai-whisper
|
|
8
|
-
tqdm
|
|
9
|
-
tiktoken
|
|
10
|
-
inflect
|
|
11
|
-
omegaconf
|
|
12
|
-
einops
|
|
13
|
-
librosa
|
|
14
|
-
onnxruntime>=1.18.0
|
|
15
|
-
diffusers
|
|
16
|
-
|
|
17
|
-
[gpu]
|
|
18
|
-
|
|
19
|
-
[gpu:sys_platform == "linux"]
|
|
20
|
-
onnxruntime-gpu>=1.18.0
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/transformer/label_smoothing_loss.py
RENAMED
|
File without changes
|
{minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/cosyvoice/transformer/positionwise_feed_forward.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/minicpmo_utils.egg-info/dependency_links.txt
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/cosyvoice2/flow/flow_matching.py
RENAMED
|
File without changes
|
{minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/cosyvoice2/transformer/__init__.py
RENAMED
|
File without changes
|
{minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/cosyvoice2/transformer/attention.py
RENAMED
|
File without changes
|
{minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/cosyvoice2/transformer/embedding.py
RENAMED
|
File without changes
|
{minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/cosyvoice2/transformer/encoder_layer.py
RENAMED
|
File without changes
|
|
File without changes
|
{minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/cosyvoice2/transformer/subsampling.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/cosyvoice2/utils/class_utils.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/engine/__init__.py
RENAMED
|
File without changes
|
{minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/engine/block_manager.py
RENAMED
|
File without changes
|
{minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/engine/llm_engine.py
RENAMED
|
File without changes
|
{minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/engine/model_runner.py
RENAMED
|
File without changes
|
{minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/engine/scheduler.py
RENAMED
|
File without changes
|
{minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/engine/sequence.py
RENAMED
|
File without changes
|
{minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/modules/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/modules/hifigan.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/modules/qwen2.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/modules/sampler.py
RENAMED
|
File without changes
|
{minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/utils/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
{minicpmo_utils-0.1.0 → minicpmo_utils-0.1.2}/src/stepaudio2/flashcosyvoice/utils/context.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|