PyPI - abstractvoice - Versions diffs - 0.5.1__py3-none-any.whl → 0.6.1__py3-none-any.whl - Mend

abstractvoice-0.5.1-py3-none-any.whl → abstractvoice-0.6.1-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (51)

abstractvoice/__init__.py +2 -5
abstractvoice/__main__.py +82 -3
abstractvoice/adapters/__init__.py +12 -0
abstractvoice/adapters/base.py +207 -0
abstractvoice/adapters/stt_faster_whisper.py +401 -0
abstractvoice/adapters/tts_piper.py +480 -0
abstractvoice/aec/__init__.py +10 -0
abstractvoice/aec/webrtc_apm.py +56 -0
abstractvoice/artifacts.py +173 -0
abstractvoice/audio/__init__.py +7 -0
abstractvoice/audio/recorder.py +46 -0
abstractvoice/audio/resample.py +25 -0
abstractvoice/cloning/__init__.py +7 -0
abstractvoice/cloning/engine_chroma.py +738 -0
abstractvoice/cloning/engine_f5.py +546 -0
abstractvoice/cloning/manager.py +349 -0
abstractvoice/cloning/store.py +362 -0
abstractvoice/compute/__init__.py +6 -0
abstractvoice/compute/device.py +73 -0
abstractvoice/config/__init__.py +2 -0
abstractvoice/config/voice_catalog.py +19 -0
abstractvoice/dependency_check.py +0 -1
abstractvoice/examples/cli_repl.py +2403 -243
abstractvoice/examples/voice_cli.py +64 -63
abstractvoice/integrations/__init__.py +2 -0
abstractvoice/integrations/abstractcore.py +116 -0
abstractvoice/integrations/abstractcore_plugin.py +253 -0
abstractvoice/prefetch.py +82 -0
abstractvoice/recognition.py +424 -42
abstractvoice/stop_phrase.py +103 -0
abstractvoice/tts/__init__.py +3 -3
abstractvoice/tts/adapter_tts_engine.py +210 -0
abstractvoice/tts/tts_engine.py +257 -1208
abstractvoice/vm/__init__.py +2 -0
abstractvoice/vm/common.py +21 -0
abstractvoice/vm/core.py +139 -0
abstractvoice/vm/manager.py +108 -0
abstractvoice/vm/stt_mixin.py +158 -0
abstractvoice/vm/tts_mixin.py +550 -0
abstractvoice/voice_manager.py +6 -1061
abstractvoice-0.6.1.dist-info/METADATA +213 -0
abstractvoice-0.6.1.dist-info/RECORD +52 -0
{abstractvoice-0.5.1.dist-info → abstractvoice-0.6.1.dist-info}/WHEEL +1 -1
abstractvoice-0.6.1.dist-info/entry_points.txt +6 -0
abstractvoice/instant_setup.py +0 -83
abstractvoice/simple_model_manager.py +0 -539
abstractvoice-0.5.1.dist-info/METADATA +0 -1458
abstractvoice-0.5.1.dist-info/RECORD +0 -23
abstractvoice-0.5.1.dist-info/entry_points.txt +0 -2
{abstractvoice-0.5.1.dist-info → abstractvoice-0.6.1.dist-info}/licenses/LICENSE +0 -0
{abstractvoice-0.5.1.dist-info → abstractvoice-0.6.1.dist-info}/top_level.txt +0 -0

abstractvoice-0.6.1.dist-info/METADATA ADDED Viewed

@@ -0,0 +1,213 @@
+Metadata-Version: 2.4
+Name: abstractvoice
+Version: 0.6.1
+Summary: A modular Python library for voice interactions with AI systems
+Author-email: Laurent-Philippe Albou <contact@abstractcore.ai>
+License-Expression: MIT
+Project-URL: Repository, https://github.com/lpalbou/abstractvoice
+Project-URL: Documentation, https://github.com/lpalbou/abstractvoice#readme
+Classifier: Development Status :: 3 - Alpha
+Classifier: Intended Audience :: Developers
+Classifier: Programming Language :: Python :: 3
+Classifier: Programming Language :: Python :: 3.8
+Classifier: Programming Language :: Python :: 3.9
+Classifier: Programming Language :: Python :: 3.10
+Classifier: Programming Language :: Python :: 3.11
+Classifier: Programming Language :: Python :: 3.12
+Requires-Python: >=3.8
+Description-Content-Type: text/markdown
+License-File: LICENSE
+Requires-Dist: numpy>=1.24.0
+Requires-Dist: requests>=2.31.0
+Requires-Dist: appdirs>=1.4.0
+Requires-Dist: piper-tts>=1.2.0
+Requires-Dist: huggingface_hub>=0.20.0
+Requires-Dist: faster-whisper>=0.10.0
+Requires-Dist: sounddevice>=0.4.6
+Requires-Dist: soundfile>=0.12.1
+Requires-Dist: webrtcvad>=2.0.10
+Provides-Extra: voice
+Requires-Dist: sounddevice>=0.4.6; extra == "voice"
+Requires-Dist: webrtcvad>=2.0.10; extra == "voice"
+Requires-Dist: soundfile>=0.12.1; extra == "voice"
+Provides-Extra: audio-fx
+Requires-Dist: librosa>=0.10.0; extra == "audio-fx"
+Provides-Extra: cloning
+Requires-Dist: f5-tts>=1.1.0; extra == "cloning"
+Provides-Extra: chroma
+Requires-Dist: torch>=2.0.0; extra == "chroma"
+Requires-Dist: torchaudio>=2.0.0; extra == "chroma"
+Requires-Dist: torchvision>=0.15.0; extra == "chroma"
+Requires-Dist: transformers>=5.0.0rc0; extra == "chroma"
+Requires-Dist: accelerate>=1.0.0; extra == "chroma"
+Requires-Dist: av>=14.0.0; extra == "chroma"
+Requires-Dist: librosa>=0.11.0; extra == "chroma"
+Requires-Dist: audioread>=3.0.0; extra == "chroma"
+Requires-Dist: pillow>=11.0.0; extra == "chroma"
+Requires-Dist: safetensors>=0.5.0; extra == "chroma"
+Provides-Extra: aec
+Requires-Dist: aec-audio-processing>=1.0.1; extra == "aec"
+Provides-Extra: stt
+Requires-Dist: openai-whisper>=20230314; extra == "stt"
+Requires-Dist: tiktoken>=0.6.0; extra == "stt"
+Provides-Extra: web
+Requires-Dist: flask>=2.0.0; extra == "web"
+Provides-Extra: all
+Requires-Dist: piper-tts>=1.2.0; extra == "all"
+Requires-Dist: sounddevice>=0.4.6; extra == "all"
+Requires-Dist: webrtcvad>=2.0.10; extra == "all"
+Requires-Dist: openai-whisper>=20230314; extra == "all"
+Requires-Dist: librosa>=0.10.0; extra == "all"
+Requires-Dist: soundfile>=0.12.1; extra == "all"
+Requires-Dist: flask>=2.0.0; extra == "all"
+Requires-Dist: tiktoken>=0.6.0; extra == "all"
+Requires-Dist: f5-tts>=1.1.0; extra == "all"
+Requires-Dist: aec-audio-processing>=1.0.1; extra == "all"
+Provides-Extra: dev
+Requires-Dist: pytest>=7.0.0; extra == "dev"
+Requires-Dist: black>=22.0.0; extra == "dev"
+Requires-Dist: flake8>=5.0.0; extra == "dev"
+Provides-Extra: voice-full
+Requires-Dist: sounddevice>=0.4.6; extra == "voice-full"
+Requires-Dist: webrtcvad>=2.0.10; extra == "voice-full"
+Requires-Dist: openai-whisper>=20230314; extra == "voice-full"
+Requires-Dist: librosa>=0.10.0; extra == "voice-full"
+Requires-Dist: soundfile>=0.12.1; extra == "voice-full"
+Requires-Dist: tiktoken>=0.6.0; extra == "voice-full"
+Provides-Extra: core-stt
+Requires-Dist: openai-whisper>=20230314; extra == "core-stt"
+Requires-Dist: tiktoken>=0.6.0; extra == "core-stt"
+Provides-Extra: audio-only
+Requires-Dist: sounddevice>=0.4.6; extra == "audio-only"
+Requires-Dist: webrtcvad>=2.0.10; extra == "audio-only"
+Requires-Dist: soundfile>=0.12.1; extra == "audio-only"
+Dynamic: license-file
+# AbstractVoice
+A modular Python library for **voice I/O** around AI applications.
+- **TTS (default)**: Piper (cross-platform, no system deps)
+- **STT (default)**: faster-whisper
+- **Local assistant**: `listen()` + `speak()` with playback/listening control
+- **Headless/server**: `speak_to_bytes()` / `speak_to_file()` and `transcribe_*`
+Status: **alpha** (`0.6.1`). The supported integrator surface is documented in `docs/api.md`.
+Next: `docs/getting-started.md` (recommended setup + first smoke tests).
+> AbstractVoice will ultimately be integrated as the voice modality of AbstractFramework.
+> An OpenAI-compatible voice endpoint is an optional demo/integration layer (see backlog).
+---
+## Install
+```bash
+pip install abstractvoice
+```
+Optional extras (feature flags):
+```bash
+pip install "abstractvoice[all]"
+```
+Notes:
+- `abstractvoice[all]` enables most optional features (incl. cloning + AEC + audio-fx), but **does not** include the GPU-heavy Chroma runtime.
+- For the full list of extras (and platform troubleshooting), see `docs/installation.md`.
+### Explicit model downloads (recommended; never implicit in the REPL)
+Some features rely on large model weights/artifacts. AbstractVoice will **not**
+download these implicitly inside the REPL (offline-first).
+After installing, prefetch explicitly (cross-platform):
+```bash
+abstractvoice-prefetch --stt small
+abstractvoice-prefetch --piper en
+abstractvoice-prefetch --openf5
+abstractvoice-prefetch --chroma
+```
+Or equivalently:
+```bash
+python -m abstractvoice download --stt small
+python -m abstractvoice download --piper en
+python -m abstractvoice download --openf5
+python -m abstractvoice download --chroma
+```
+Notes:
+- `--piper <lang>` downloads the Piper ONNX voice for that language into `~/.piper/models`.
+- `--openf5` is ~5.4GB. `--chroma` is very large (GPU-heavy).
+---
+## Quick smoke tests
+### REPL (fastest end-to-end)
+```bash
+abstractvoice --verbose
+# or (from a source checkout):
+python -m abstractvoice cli --verbose
+```
+Notes:
+- Mic voice input is **off by default** for fast startup. Enable with `--voice-mode stop` (or in-session: `/voice stop`).
+- The REPL is **offline-first**: no implicit model downloads. Use the explicit download commands above.
+See `docs/repl_guide.md`.
+### Minimal Python
+```python
+from abstractvoice import VoiceManager
+vm = VoiceManager()
+vm.speak("Hello! This is AbstractVoice.")
+```
+---
+## Public API (stable surface)
+See `docs/api.md` for the supported integrator contract.
+At a glance:
+- **TTS**: `speak()`, `stop_speaking()`, `pause_speaking()`, `resume_speaking()`, `speak_to_bytes()`, `speak_to_file()`
+- **STT**: `transcribe_file()`, `transcribe_from_bytes()`
+- **Mic**: `listen()`, `stop_listening()`, `pause_listening()`, `resume_listening()`
+---
+## Documentation (minimal set)
+- **Docs index**: `docs/README.md`
+- **Getting started**: `docs/getting-started.md`
+- **FAQ**: `docs/faq.md`
+- **Orientation**: `docs/overview.md`
+- **Acronyms**: `docs/acronyms.md`
+- **Public API**: `docs/api.md`
+- **REPL guide**: `docs/repl_guide.md`
+- **Install troubleshooting**: `docs/installation.md`
+- **Multilingual support**: `docs/multilingual.md`
+- **Architecture (internal)**: `docs/architecture.md` + `docs/adr/`
+- **Model management (Piper-first)**: `docs/model-management.md`
+- **Licensing notes**: `docs/voices-and-licenses.md`
+---
+## Project
+- **Changelog**: `CHANGELOG.md`
+- **Contributing**: `CONTRIBUTING.md`
+- **Security**: `SECURITY.md`
+- **Acknowledgments**: `ACKNOWLEDGMENTS.md`
+## License
+MIT. See `LICENSE`.

abstractvoice-0.6.1.dist-info/RECORD ADDED Viewed

@@ -0,0 +1,52 @@
+abstractvoice/__init__.py,sha256=Ce_KZwKQ_4G-elHU6G8cqmPMUKSih9NP0tEjDK7JHR4,817
+abstractvoice/__main__.py,sha256=EVhZgFwWHBaeRcz1cVoILCzibCyxpD9V9nCOQiO1yUU,8357
+abstractvoice/artifacts.py,sha256=jHcOK6q4barEh92og1oy52b5p4IqC9AwyKbZzFIitww,5750
+abstractvoice/dependency_check.py,sha256=3iz5-bwCQOJvh1jeC9NO8mmlKjuN5LKZ7ZKVy7zcjQw,10002
+abstractvoice/prefetch.py,sha256=XciaG-OPuOLbAbVauyWJdcVh2oDHuyBMJ9a9bht0kwA,2939
+abstractvoice/recognition.py,sha256=xkCjKGKIfHKLuvM-rcdVVfVzZqhcVUv1sqABnZokgJU,27623
+abstractvoice/stop_phrase.py,sha256=PLUkL2uM6n0J--uFs_O_VeIWN6k2-jNhVlmKBol02ys,3382
+abstractvoice/voice_manager.py,sha256=6M1yT9etb6TQWoAmgqhfGWSex7Blg2bzlLTJZTytL7s,234
+abstractvoice/adapters/__init__.py,sha256=PRhDqLA6cj_fEYMkp54PJ5xrAiEt2oEvE5yVK1MKbP4,452
+abstractvoice/adapters/base.py,sha256=GXmBcwvrVpCCIsNcnClMdvn--ngxMZxp0zjfFvVHYd4,6212
+abstractvoice/adapters/stt_faster_whisper.py,sha256=tbqeN4hpa4v7fxO5tzIAojYEOHikZ7_-QqqiiC3l4tA,14980
+abstractvoice/adapters/tts_piper.py,sha256=Vr-tO7BwripH0YayAlG6YG9nkl_c4jbLkyzXnKn5vnU,17505
+abstractvoice/aec/__init__.py,sha256=jXolI_HFtvCvGT4hYJWDW2Ny8x86vRN8PN14yyVNufw,229
+abstractvoice/aec/webrtc_apm.py,sha256=RK2tWFB01sWjsn5mi5IQAgWX__Jwn74-vPaQJp2ZLfs,1748
+abstractvoice/audio/__init__.py,sha256=xe_De58G3Tn0YOnDb8NWO5mQkONHzpZ6SMZ6KPzE2no,177
+abstractvoice/audio/recorder.py,sha256=nM5kZxoAsPHoXuZwsNXcSdn-j2NM9m9npyBzy1HNy4w,1154
+abstractvoice/audio/resample.py,sha256=R116UgWUfMx4Q2lGn4ntXgsDDpJkRIsY7TlGG4GZP1s,783
+abstractvoice/cloning/__init__.py,sha256=xQlZscgtqR1jEPvZPNzKeapRRdldbV6GUCulELwgHwA,188
+abstractvoice/cloning/engine_chroma.py,sha256=8Qg2j3H0kelILnXBrCdGiun9Ms4KzgIAUgD8fm59-jM,30888
+abstractvoice/cloning/engine_f5.py,sha256=4jpRpYThjr_EDsLekcydVOu5BRurHCe4yv8ZR7BVmO4,21749
+abstractvoice/cloning/manager.py,sha256=Ib6ltqewV6CyrYrVCymBSGoalOEQ73ZU3mxZRZD_7zk,13478
+abstractvoice/cloning/store.py,sha256=yTh_ifIvfQL4DRdNM4XpDKWUrBQu1ajdjXbWgRJFi9s,12840
+abstractvoice/compute/__init__.py,sha256=h_Syj7jesZyP1OAo5UnsFZUQAAnqLXPkMgCzx0nh0Js,193
+abstractvoice/compute/device.py,sha256=IM4hf45RRs8u-ZJI81PSX5i_vI9YJosvuy-XqCImnUU,1875
+abstractvoice/config/__init__.py,sha256=VK2uK7bMbFDL6-WlZV-FXmKO1Ii-ezbwYN-rHo2lUTQ,54
+abstractvoice/config/voice_catalog.py,sha256=py5D2qO4tL_PezEtDRyS48BzkA6MiX_l06BsE-Xa5NA,496
+abstractvoice/examples/__init__.py,sha256=94vpKJDlfOrEBIUETg-57Q5Z7fYDidg6v4UzV7V_lZA,60
+abstractvoice/examples/cli_repl.py,sha256=dO7aauMB4mJ0_RZTqVKSzJp0L5oR0Id_cO7zKbWoftk,128469
+abstractvoice/examples/voice_cli.py,sha256=jJ27H7VtwFTktEixxt4Ne_u5vwcZoTiL7oninqCmjio,11068
+abstractvoice/examples/web_api.py,sha256=0g5LKJpl7fZepPQJL25AcdaevV-xv34VqqyWGYYchPk,6376
+abstractvoice/integrations/__init__.py,sha256=NsLg9ewvcXwBP118n0BDg4ye5KMWdcsHxikhkfaIs5s,61
+abstractvoice/integrations/abstractcore.py,sha256=o_vYCUYThb51GeCeoM-hQ_zz9S_5clVCLT5OZZ0txok,4282
+abstractvoice/integrations/abstractcore_plugin.py,sha256=GMPhxV3NnN47NfUQNKoPdtnWTv8251uoyxaB7kQRC6Q,9637
+abstractvoice/stt/__init__.py,sha256=PFc6la3tTkxT4TJYwb0PnMIahM_hFtU4pNQdeKmbooo,120
+abstractvoice/stt/transcriber.py,sha256=GdaH1OsCHu4Vu9rUsQlzH6X9bfcnoiK5tGz1AW_uj6Q,5481
+abstractvoice/tts/__init__.py,sha256=ca3_xFGK5DZ5-6ffNf8TPle3B0oKZizaBbcZs-e3QzE,190
+abstractvoice/tts/adapter_tts_engine.py,sha256=BFgwF2HuZr26if3NIucQrK-5mlDX2VhVLSzJWkOeEnw,8123
+abstractvoice/tts/tts_engine.py,sha256=XLIHwgZfY1S_kbRvs7S95pegVcbuxbV-BtuZIXqE-ak,12301
+abstractvoice/vad/__init__.py,sha256=RIIbFw25jNHgel06E4VvTWJnXjwjeFZ98m1Vx9hVjuo,119
+abstractvoice/vad/voice_detector.py,sha256=ghrhpDFlIR5TsMB2gpigXY6t5c_1yZ7vEX1imAMgWjc,3166
+abstractvoice/vm/__init__.py,sha256=1nxB3-bH6o-q68jkmpTKRImps2GcMLCMAUE3ZAlMqR8,71
+abstractvoice/vm/common.py,sha256=siNFBNAmQ4nMsivwXRM3jQXfcDB9UNJPd7sOIXJeL50,693
+abstractvoice/vm/core.py,sha256=UL4dFxnggn7ueEmECGS1vRpW7qZMB2FcZjrn3OWXwgU,5305
+abstractvoice/vm/manager.py,sha256=4yZI-LdBUP3LriEyY3kV3dKF25AO8r-JAR3YV-YLmWY,4158
+abstractvoice/vm/stt_mixin.py,sha256=5VZ7lVwsy1yGt0UVA4Ixfvyp-1pHqAQJjv0QmQXAedo,5932
+abstractvoice/vm/tts_mixin.py,sha256=GvPC73YjfkkoA6rYrHYqf_FhbzRMuZVbzQ88QubjDQs,22525
+abstractvoice-0.6.1.dist-info/licenses/LICENSE,sha256=TiDPM5WcFRQPoC5e46jGMeMppZ-eu0eFx_HytjE49bk,1105
+abstractvoice-0.6.1.dist-info/METADATA,sha256=y_oRXVn3EynZkyHmz2w3wmhqHtEHb9SZ4BjF1-OP6M0,7213
+abstractvoice-0.6.1.dist-info/WHEEL,sha256=wUyA8OaulRlbfwMtmQsvNngGrxQHAvkKcvRmdizlJi0,92
+abstractvoice-0.6.1.dist-info/entry_points.txt,sha256=PT4IchtBfcgcjlhbX_84WKyCpe-HWzjpNgJ24Kordco,234
+abstractvoice-0.6.1.dist-info/top_level.txt,sha256=a1qyxqgF1O8cJtPKpcJuImGZ_uXqPNghbLZ9gp-UiOo,14
+abstractvoice-0.6.1.dist-info/RECORD,,

{abstractvoice-0.5.1.dist-info → abstractvoice-0.6.1.dist-info}/WHEEL RENAMED Viewed

@@ -1,5 +1,5 @@
 Wheel-Version: 1.0
-Generator: setuptools (80.9.0)
+Generator: setuptools (80.10.2)
 Root-Is-Purelib: true
 Tag: py3-none-any

abstractvoice-0.6.1.dist-info/entry_points.txt ADDED Viewed

@@ -0,0 +1,6 @@
+[abstractcore.capabilities_plugins]
+abstractvoice = abstractvoice.integrations.abstractcore_plugin:register
+[console_scripts]
+abstractvoice = abstractvoice.examples.voice_cli:main
+abstractvoice-prefetch = abstractvoice.prefetch:main

abstractvoice/instant_setup.py DELETED Viewed

@@ -1,83 +0,0 @@
-"""
-Instant Setup Module for AbstractVoice
-Provides immediate TTS functionality with seamless model download.
-"""
-import os
-import sys
-from pathlib import Path
-# Essential model for instant functionality (lightweight, reliable)
-ESSENTIAL_MODEL = "tts_models/en/ljspeech/fast_pitch"
-ESSENTIAL_MODEL_SIZE = "~100MB"
-def ensure_instant_tts():
-    """
-    Ensure TTS is ready for immediate use.
-    Downloads essential model if needed with progress indicator.
-    Returns:
-        bool: True if TTS is ready, False if failed
-    """
-    try:
-        from TTS.api import TTS
-        from TTS.utils.manage import ModelManager
-        manager = ModelManager()
-        # Check if essential model is already cached
-        if is_model_cached(ESSENTIAL_MODEL):
-            return True
-        # Download essential model with user-friendly progress
-        print(f"🚀 AbstractVoice: Setting up TTS ({ESSENTIAL_MODEL_SIZE})...")
-        print(f"   This happens once and takes ~30 seconds")
-        try:
-            # Download with progress bar
-            tts = TTS(model_name=ESSENTIAL_MODEL, progress_bar=True)
-            print(f"✅ TTS ready! AbstractVoice is now fully functional.")
-            return True
-        except Exception as e:
-            print(f"❌ Setup failed: {e}")
-            print(f"💡 Try: pip install abstractvoice[all]")
-            return False
-    except ImportError as e:
-        print(f"❌ Missing dependencies: {e}")
-        print(f"💡 Install with: pip install abstractvoice[all]")
-        return False
-def is_model_cached(model_name):
-    """Check if a model is already cached."""
-    try:
-        from TTS.utils.manage import ModelManager
-        manager = ModelManager()
-        # Get cached models list
-        models_file = os.path.join(manager.output_prefix, ".models.json")
-        if os.path.exists(models_file):
-            import json
-            with open(models_file, 'r') as f:
-                cached_models = json.load(f)
-                return model_name in cached_models
-        # Fallback: check if model directory exists and has content
-        model_dir = model_name.replace("/", "--")
-        model_path = os.path.join(manager.output_prefix, model_dir)
-        return os.path.exists(model_path) and bool(os.listdir(model_path))
-    except:
-        # If anything fails, assume not cached
-        return False
-def get_instant_model():
-    """Get the essential model name for instant setup."""
-    return ESSENTIAL_MODEL
-if __name__ == "__main__":
-    # CLI test
-    print("🧪 Testing instant setup...")
-    success = ensure_instant_tts()
-    print(f"Result: {'✅ Ready' if success else '❌ Failed'}")

abstractvoice 0.5.1__py3-none-any.whl → 0.6.1__py3-none-any.whl

abstractvoice-0.5.1-py3-none-any.whl → abstractvoice-0.6.1-py3-none-any.whl