PyPI - abstractvoice - Versions diffs - 0.1.0__py3-none-any.whl → 0.2.0__py3-none-any.whl - Mend

abstractvoice 0.1.0py3-none-any.whl → 0.2.0py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (15) hide show

abstractvoice/__main__.py +20 -10
abstractvoice/examples/cli_repl.py +198 -13
abstractvoice/examples/voice_cli.py +20 -6
abstractvoice/recognition.py +50 -7
abstractvoice/stt/transcriber.py +17 -2
abstractvoice/tts/tts_engine.py +84 -32
abstractvoice/vad/voice_detector.py +16 -2
abstractvoice/voice_manager.py +558 -16
{abstractvoice-0.1.0.dist-info → abstractvoice-0.2.0.dist-info}/METADATA +228 -50
abstractvoice-0.2.0.dist-info/RECORD +20 -0
{abstractvoice-0.1.0.dist-info → abstractvoice-0.2.0.dist-info}/licenses/LICENSE +1 -1
abstractvoice-0.1.0.dist-info/RECORD +0 -20
{abstractvoice-0.1.0.dist-info → abstractvoice-0.2.0.dist-info}/WHEEL +0 -0
{abstractvoice-0.1.0.dist-info → abstractvoice-0.2.0.dist-info}/entry_points.txt +0 -0
{abstractvoice-0.1.0.dist-info → abstractvoice-0.2.0.dist-info}/top_level.txt +0 -0

{abstractvoice-0.1.0.dist-info → abstractvoice-0.2.0.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: abstractvoice
-Version: 0.1.0
+Version: 0.2.0
 Summary: A modular Python library for voice interactions with AI systems
 Author-email: Laurent-Philippe Albou <contact@abstractcore.ai>
 License-Expression: MIT
@@ -18,31 +18,108 @@ Requires-Python: >=3.8
 Description-Content-Type: text/markdown
 License-File: LICENSE
 Requires-Dist: numpy>=1.24.0
-Requires-Dist: sounddevice>=0.4.6
-Requires-Dist: webrtcvad>=2.0.10
-Requires-Dist: PyAudio>=0.2.13
-Requires-Dist: openai-whisper>=20230314
-Requires-Dist: coqui-tts>=0.27.0
-Requires-Dist: torch>=2.0.0
-Requires-Dist: torchaudio>=2.0.0
-Requires-Dist: librosa>=0.10.0
-Requires-Dist: soundfile>=0.12.1
 Requires-Dist: requests>=2.31.0
-Requires-Dist: flask>=2.0.0
-Requires-Dist: tiktoken>=0.6.0
+Provides-Extra: voice
+Requires-Dist: sounddevice>=0.4.6; extra == "voice"
+Requires-Dist: webrtcvad>=2.0.10; extra == "voice"
+Requires-Dist: PyAudio>=0.2.13; extra == "voice"
+Requires-Dist: soundfile>=0.12.1; extra == "voice"
+Provides-Extra: tts
+Requires-Dist: coqui-tts>=0.27.0; extra == "tts"
+Requires-Dist: torch>=2.0.0; extra == "tts"
+Requires-Dist: torchaudio>=2.0.0; extra == "tts"
+Requires-Dist: librosa>=0.10.0; extra == "tts"
+Provides-Extra: stt
+Requires-Dist: openai-whisper>=20230314; extra == "stt"
+Requires-Dist: tiktoken>=0.6.0; extra == "stt"
+Provides-Extra: web
+Requires-Dist: flask>=2.0.0; extra == "web"
+Provides-Extra: all
+Requires-Dist: sounddevice>=0.4.6; extra == "all"
+Requires-Dist: webrtcvad>=2.0.10; extra == "all"
+Requires-Dist: PyAudio>=0.2.13; extra == "all"
+Requires-Dist: openai-whisper>=20230314; extra == "all"
+Requires-Dist: coqui-tts>=0.27.0; extra == "all"
+Requires-Dist: torch>=2.0.0; extra == "all"
+Requires-Dist: torchaudio>=2.0.0; extra == "all"
+Requires-Dist: librosa>=0.10.0; extra == "all"
+Requires-Dist: soundfile>=0.12.1; extra == "all"
+Requires-Dist: flask>=2.0.0; extra == "all"
+Requires-Dist: tiktoken>=0.6.0; extra == "all"
 Provides-Extra: dev
 Requires-Dist: pytest>=7.0.0; extra == "dev"
 Requires-Dist: black>=22.0.0; extra == "dev"
 Requires-Dist: flake8>=5.0.0; extra == "dev"
+Provides-Extra: languages
+Requires-Dist: sounddevice>=0.4.6; extra == "languages"
+Requires-Dist: webrtcvad>=2.0.10; extra == "languages"
+Requires-Dist: PyAudio>=0.2.13; extra == "languages"
+Requires-Dist: openai-whisper>=20230314; extra == "languages"
+Requires-Dist: coqui-tts>=0.27.0; extra == "languages"
+Requires-Dist: torch>=2.0.0; extra == "languages"
+Requires-Dist: torchaudio>=2.0.0; extra == "languages"
+Requires-Dist: librosa>=0.10.0; extra == "languages"
+Requires-Dist: soundfile>=0.12.1; extra == "languages"
+Requires-Dist: flask>=2.0.0; extra == "languages"
+Requires-Dist: tiktoken>=0.6.0; extra == "languages"
+Provides-Extra: fr
+Requires-Dist: sounddevice>=0.4.6; extra == "fr"
+Requires-Dist: webrtcvad>=2.0.10; extra == "fr"
+Requires-Dist: PyAudio>=0.2.13; extra == "fr"
+Requires-Dist: openai-whisper>=20230314; extra == "fr"
+Requires-Dist: coqui-tts>=0.27.0; extra == "fr"
+Requires-Dist: torch>=2.0.0; extra == "fr"
+Requires-Dist: torchaudio>=2.0.0; extra == "fr"
+Requires-Dist: librosa>=0.10.0; extra == "fr"
+Requires-Dist: soundfile>=0.12.1; extra == "fr"
+Requires-Dist: flask>=2.0.0; extra == "fr"
+Requires-Dist: tiktoken>=0.6.0; extra == "fr"
+Provides-Extra: es
+Requires-Dist: sounddevice>=0.4.6; extra == "es"
+Requires-Dist: webrtcvad>=2.0.10; extra == "es"
+Requires-Dist: PyAudio>=0.2.13; extra == "es"
+Requires-Dist: openai-whisper>=20230314; extra == "es"
+Requires-Dist: coqui-tts>=0.27.0; extra == "es"
+Requires-Dist: torch>=2.0.0; extra == "es"
+Requires-Dist: torchaudio>=2.0.0; extra == "es"
+Requires-Dist: librosa>=0.10.0; extra == "es"
+Requires-Dist: soundfile>=0.12.1; extra == "es"
+Requires-Dist: flask>=2.0.0; extra == "es"
+Requires-Dist: tiktoken>=0.6.0; extra == "es"
+Provides-Extra: de
+Requires-Dist: sounddevice>=0.4.6; extra == "de"
+Requires-Dist: webrtcvad>=2.0.10; extra == "de"
+Requires-Dist: PyAudio>=0.2.13; extra == "de"
+Requires-Dist: openai-whisper>=20230314; extra == "de"
+Requires-Dist: coqui-tts>=0.27.0; extra == "de"
+Requires-Dist: torch>=2.0.0; extra == "de"
+Requires-Dist: torchaudio>=2.0.0; extra == "de"
+Requires-Dist: librosa>=0.10.0; extra == "de"
+Requires-Dist: soundfile>=0.12.1; extra == "de"
+Requires-Dist: flask>=2.0.0; extra == "de"
+Requires-Dist: tiktoken>=0.6.0; extra == "de"
+Provides-Extra: it
+Requires-Dist: sounddevice>=0.4.6; extra == "it"
+Requires-Dist: webrtcvad>=2.0.10; extra == "it"
+Requires-Dist: PyAudio>=0.2.13; extra == "it"
+Requires-Dist: openai-whisper>=20230314; extra == "it"
+Requires-Dist: coqui-tts>=0.27.0; extra == "it"
+Requires-Dist: torch>=2.0.0; extra == "it"
+Requires-Dist: torchaudio>=2.0.0; extra == "it"
+Requires-Dist: librosa>=0.10.0; extra == "it"
+Requires-Dist: soundfile>=0.12.1; extra == "it"
+Requires-Dist: flask>=2.0.0; extra == "it"
+Requires-Dist: tiktoken>=0.6.0; extra == "it"
 Dynamic: license-file
 # AbstractVoice
 [![PyPI version](https://img.shields.io/pypi/v/abstractvoice.svg)](https://pypi.org/project/abstractvoice/)
 [![Python Version](https://img.shields.io/pypi/pyversions/abstractvoice)](https://pypi.org/project/abstractvoice/)
-[![License](https://img.shields.io/pypi/l/abstractvoice)](https://github.com/lpalbou/abstractvoice/blob/main/LICENSE)
+[![license](https://img.shields.io/github/license/lpalbou/AbstractVoice)](https://github.com/lpalbou/abstractvoice/blob/main/LICENSE)
 [![GitHub stars](https://img.shields.io/github/stars/lpalbou/abstractvoice?style=social)](https://github.com/lpalbou/abstractvoice/stargazers)
 A modular Python library for voice interactions with AI systems, providing text-to-speech (TTS) and speech-to-text (STT) capabilities with interrupt handling.
 While we provide CLI and web examples, AbstractVoice is designed to be integrated into other projects.
@@ -62,73 +139,174 @@ While we provide CLI and WEB examples, AbstractVoice is designed to be integrate
 - **Interrupt Handling**: Stop TTS by speaking or using stop commands
 - **Modular Design**: Easily integrate with any text generation system
+Note: *the LLM access is rudimentary, and abstractvoice is provided mainly as an example and demonstrator. For a better integration, use this library's functionality directly in combination with [AbstractCore](https://github.com/lpalbou/AbstractCore).*
 ## Installation
-### Prerequisites
+AbstractVoice is designed to **work everywhere, out of the box** with automatic quality upgrades.
+### 🚀 Quick Start (Recommended)
+```bash
+# One command installation - works on all systems
+pip install abstractvoice[all]
-- Python 3.8+ (3.11+ recommended)
-- PortAudio for audio input/output
-- **Recommended**: espeak-ng for best voice quality (VITS model)
+# Verify it works
+python -c "from abstractvoice import VoiceManager; print('✅ Ready to go!')"
+```
-### Installing espeak-ng (Recommended for Best Quality)
+**That's it!** AbstractVoice automatically:
+- ✅ **Works everywhere** - Uses reliable models that run on any system
+- ✅ **Auto-upgrades quality** - Detects when better models are available
+- ✅ **No system dependencies required** - Pure Python installation
+- ✅ **Optional quality boost** - Install `espeak-ng` for premium voices
-AbstractVoice will work without espeak-ng, but voice quality will be significantly better with it:
+### Installation Options
-**macOS:**
 ```bash
-brew install espeak-ng
+# Minimal (just 2 dependencies)
+pip install abstractvoice
+# Add features as needed
+pip install abstractvoice[tts]      # Text-to-speech
+pip install abstractvoice[stt]      # Speech-to-text
+pip install abstractvoice[all]      # Everything (recommended)
+# Language-specific
+pip install abstractvoice[fr]       # French with all features
+pip install abstractvoice[de]       # German with all features
 ```
-**Linux (Ubuntu/Debian):**
+### Optional Quality Upgrade
+For the **absolute best voice quality**, install espeak-ng:
 ```bash
+# macOS
+brew install espeak-ng
+# Linux
 sudo apt-get install espeak-ng
+# Windows
+conda install espeak-ng
 ```
-**Linux (Fedora/RHEL):**
-```bash
-sudo yum install espeak-ng
+AbstractVoice automatically detects espeak-ng and upgrades to premium quality voices when available.
+## Quick Start
+### Basic Usage (Minimal Installation)
+```python
+# First install with minimal dependencies
+# pip install abstractvoice
+from abstractvoice import VoiceManager
+# This will show a helpful error message with installation instructions
+try:
+    vm = VoiceManager()
+except ImportError as e:
+    print(e)  # Shows: "TTS functionality requires optional dependencies..."
+    # Follow the instructions to install: pip install abstractvoice[all]
 ```
-**Windows:**
-```bash
-# Option 1: Using Conda
-conda install -c conda-forge espeak-ng
+### Full Usage Example
-# Option 2: Using Chocolatey
-choco install espeak-ng
+```python
+# After installing with: pip install abstractvoice[all]
-# Option 3: Download installer from https://github.com/espeak-ng/espeak-ng/releases
+from abstractvoice import VoiceManager
+# Initialize voice manager
+vm = VoiceManager(language='en', debug_mode=True)
+# Text-to-speech
+vm.speak("Hello! I can speak text and listen for responses.")
+# Speech-to-text with callbacks
+def on_transcription(text):
+    print(f"You said: {text}")
+    # Process the transcription
+    vm.speak(f"I heard you say: {text}")
+def on_stop():
+    print("Stopping voice interaction")
+# Start listening
+vm.listen(on_transcription, on_stop)
+# The voice manager will automatically pause listening when speaking
+# and resume when done to prevent feedback loops
 ```
-**Without espeak-ng:** AbstractVoice will automatically fall back to a simpler TTS model (fast_pitch) that works everywhere but has lower voice quality.
+## Additional Examples
-### Basic Installation
+### Language-Specific Usage
-```bash
-# Install from PyPI
-pip install abstractvoice
+```python
+# French voice
+vm_fr = VoiceManager(language='fr')
+vm_fr.speak("Bonjour! Je peux parler français.")
-# Or clone the repository
-git clone https://github.com/lpalbou/abstractvoice.git
-cd abstractvoice
-pip install -e .
+# Spanish voice
+vm_es = VoiceManager(language='es')
+vm_es.speak("¡Hola! Puedo hablar español.")
+# Dynamic language switching
+vm.set_language('fr')  # Switch to French
+vm.set_language('en')  # Switch back to English
 ```
-### Development Installation
+### Advanced Configuration
-```bash
-# Install with development dependencies
-pip install "abstractvoice[dev]"
+```python
+from abstractvoice import VoiceManager
+# Custom TTS model selection
+vm = VoiceManager(
+    language='en',
+    tts_model='tts_models/en/ljspeech/fast_pitch',  # Specific model
+    whisper_model='base',  # Larger Whisper model for better accuracy
+    debug_mode=True
+)
+# Speed control
+vm.set_speed(1.5)  # 1.5x speed
+vm.speak("This text will be spoken faster.")
+# Model switching at runtime
+vm.set_tts_model('tts_models/en/ljspeech/vits')  # Switch to VITS
+vm.set_whisper('small')  # Switch to larger Whisper model
 ```
-### From Requirements File
+### Error Handling and Graceful Degradation
-```bash
-# Install all dependencies including the package
-pip install -r requirements.txt
+AbstractVoice is designed to provide helpful error messages and fall back gracefully:
+```python
+# If you install just the basic package
+# pip install abstractvoice
+from abstractvoice import VoiceManager  # This works fine
+try:
+    vm = VoiceManager()  # This will fail with helpful message
+except ImportError as e:
+    print(e)
+    # Output: "TTS functionality requires optional dependencies. Install with:
+    #          pip install abstractvoice[tts]    # For TTS only
+    #          pip install abstractvoice[all]    # For all features"
+# Missing espeak-ng automatically falls back to compatible models
+# Missing dependencies show clear installation instructions
+# All errors are graceful with helpful guidance
 ```
-## Quick Start
+## CLI and Web Examples
+AbstractVoice includes example applications to demonstrate its capabilities:
 ### Using AbstractVoice from the Command Line

abstractvoice-0.2.0.dist-info/RECORD ADDED Viewed

@@ -0,0 +1,20 @@
+abstractvoice/__init__.py,sha256=6GWG6ruCOQ73dOK1-lGB4F8fvjoAtsAP8fIoYCnVuZk,817
+abstractvoice/__main__.py,sha256=RQCoQy-UrYp-f5K2cl6PTXpaJz3Rk0hSOvCWCf3Ql18,4230
+abstractvoice/recognition.py,sha256=4KtDUDFixEYuBUMDH2fWaD9csKlwA9tqXkMAkyQMSMo,11259
+abstractvoice/voice_manager.py,sha256=WYuN949pzf4pw8SE3g40OQZNC1CbgUZ5SzvpAGAIfPI,29995
+abstractvoice/examples/__init__.py,sha256=94vpKJDlfOrEBIUETg-57Q5Z7fYDidg6v4UzV7V_lZA,60
+abstractvoice/examples/cli_repl.py,sha256=uRFqUOVDP6RXrMquB_rQ1_fxdyLn_UHwuiu30XHbYwE,41250
+abstractvoice/examples/voice_cli.py,sha256=mhiO7i0AooPWPZD-K6O-wQUvMFbRFED-dlGNUjDvsUE,3962
+abstractvoice/examples/web_api.py,sha256=0g5LKJpl7fZepPQJL25AcdaevV-xv34VqqyWGYYchPk,6376
+abstractvoice/stt/__init__.py,sha256=PFc6la3tTkxT4TJYwb0PnMIahM_hFtU4pNQdeKmbooo,120
+abstractvoice/stt/transcriber.py,sha256=GdaH1OsCHu4Vu9rUsQlzH6X9bfcnoiK5tGz1AW_uj6Q,5481
+abstractvoice/tts/__init__.py,sha256=WgJrxqdc_qaRyfFt1jbgMQD9S757jYuBpDzMRB02TFs,122
+abstractvoice/tts/tts_engine.py,sha256=eMhOxMdqH7V29TLf-7B44aoafKfRDd3zT2lpSZkvAA0,41692
+abstractvoice/vad/__init__.py,sha256=RIIbFw25jNHgel06E4VvTWJnXjwjeFZ98m1Vx9hVjuo,119
+abstractvoice/vad/voice_detector.py,sha256=ghrhpDFlIR5TsMB2gpigXY6t5c_1yZ7vEX1imAMgWjc,3166
+abstractvoice-0.2.0.dist-info/licenses/LICENSE,sha256=TiDPM5WcFRQPoC5e46jGMeMppZ-eu0eFx_HytjE49bk,1105
+abstractvoice-0.2.0.dist-info/METADATA,sha256=uxKWbHnTylSvI0CFMq6IUjY6MUAjGIGPVf8o9KEjwqY,38738
+abstractvoice-0.2.0.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
+abstractvoice-0.2.0.dist-info/entry_points.txt,sha256=rL63lqtLrbd7w_hGsR_w9Mr5baq4p3Mzwn4_UJqR_nI,120
+abstractvoice-0.2.0.dist-info/top_level.txt,sha256=a1qyxqgF1O8cJtPKpcJuImGZ_uXqPNghbLZ9gp-UiOo,14
+abstractvoice-0.2.0.dist-info/RECORD,,

{abstractvoice-0.1.0.dist-info → abstractvoice-0.2.0.dist-info}/licenses/LICENSE RENAMED Viewed

@@ -1,6 +1,6 @@
 MIT License
-Copyright (c) 2025 Laurent-Philippe Albou (lpalbou@gmail.com)
+Copyright (c) 2025 Laurent-Philippe Albou (contact@abstractcore.ai)
 Permission is hereby granted, free of charge, to any person obtaining a copy
 of this software and associated documentation files (the "Software"), to deal

abstractvoice-0.1.0.dist-info/RECORD DELETED Viewed

@@ -1,20 +0,0 @@
-abstractvoice/__init__.py,sha256=6GWG6ruCOQ73dOK1-lGB4F8fvjoAtsAP8fIoYCnVuZk,817
-abstractvoice/__main__.py,sha256=ZACGwnSWpqyjQ4oDj6IMj0hV8w76UCST5ZVZa8NMdNY,3546
-abstractvoice/recognition.py,sha256=dWAZ-Pxk0GrDurfTEuDRd5f5DjRYq_68qffUMyr0IvY,9487
-abstractvoice/voice_manager.py,sha256=fDDWAXY6K8wv51JFdLfEDR5-1TW8gevFNY7czyMx4FA,9049
-abstractvoice/examples/__init__.py,sha256=94vpKJDlfOrEBIUETg-57Q5Z7fYDidg6v4UzV7V_lZA,60
-abstractvoice/examples/cli_repl.py,sha256=_Pvp6dSkdJz8csQ3YvVAyAOuI3t0GYdp6_2L3uftC4A,33363
-abstractvoice/examples/voice_cli.py,sha256=M3Gf7CN3XJJkIcILfj5141SAMVCCie7yjG_fwHjbiDA,3141
-abstractvoice/examples/web_api.py,sha256=0g5LKJpl7fZepPQJL25AcdaevV-xv34VqqyWGYYchPk,6376
-abstractvoice/stt/__init__.py,sha256=PFc6la3tTkxT4TJYwb0PnMIahM_hFtU4pNQdeKmbooo,120
-abstractvoice/stt/transcriber.py,sha256=DhCT3yXdWr0dsD7ciT2tIa6XAHrIe3ZvuwK8S7pUM2Y,4845
-abstractvoice/tts/__init__.py,sha256=WgJrxqdc_qaRyfFt1jbgMQD9S757jYuBpDzMRB02TFs,122
-abstractvoice/tts/tts_engine.py,sha256=cuoKaMw7MP2PyUFE0LwZZqYI8tcIGIiX2ZzSP1QH4qo,39224
-abstractvoice/vad/__init__.py,sha256=RIIbFw25jNHgel06E4VvTWJnXjwjeFZ98m1Vx9hVjuo,119
-abstractvoice/vad/voice_detector.py,sha256=fR7uNuDVx_0vLzcMa8d1cEYtyAeZ1nW9ao5_V57rW7s,2584
-abstractvoice-0.1.0.dist-info/licenses/LICENSE,sha256=jxyvKKcODBeM8o4aaTjVpeSI74XSjS4zwIu_n-8eNNE,1099
-abstractvoice-0.1.0.dist-info/METADATA,sha256=eV3ReI4fU5men2rofgFTT9_93ENqkOfCL0PdfNX1ouo,31804
-abstractvoice-0.1.0.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
-abstractvoice-0.1.0.dist-info/entry_points.txt,sha256=rL63lqtLrbd7w_hGsR_w9Mr5baq4p3Mzwn4_UJqR_nI,120
-abstractvoice-0.1.0.dist-info/top_level.txt,sha256=a1qyxqgF1O8cJtPKpcJuImGZ_uXqPNghbLZ9gp-UiOo,14
-abstractvoice-0.1.0.dist-info/RECORD,,

{abstractvoice-0.1.0.dist-info → abstractvoice-0.2.0.dist-info}/WHEEL RENAMED Viewed

File without changes

{abstractvoice-0.1.0.dist-info → abstractvoice-0.2.0.dist-info}/entry_points.txt RENAMED Viewed

File without changes

{abstractvoice-0.1.0.dist-info → abstractvoice-0.2.0.dist-info}/top_level.txt RENAMED Viewed

File without changes

abstractvoice 0.1.0__py3-none-any.whl → 0.2.0__py3-none-any.whl

abstractvoice 0.1.0py3-none-any.whl → 0.2.0py3-none-any.whl