PyPI - abstractvoice - Versions diffs - 0.3.0__tar.gz → 0.4.1__tar.gz - Mend

abstractvoice 0.3.0.tar.gz → 0.4.1.tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (28) hide show

{abstractvoice-0.3.0 → abstractvoice-0.4.1}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: abstractvoice
-Version: 0.3.0
+Version: 0.4.1
 Summary: A modular Python library for voice interactions with AI systems
 Author-email: Laurent-Philippe Albou <contact@abstractcore.ai>
 License-Expression: MIT
@@ -29,7 +29,7 @@ Requires-Dist: coqui-tts<0.30.0,>=0.27.0; extra == "tts"
 Requires-Dist: torch<2.4.0,>=2.0.0; extra == "tts"
 Requires-Dist: torchvision<0.19.0,>=0.15.0; extra == "tts"
 Requires-Dist: torchaudio<2.4.0,>=2.0.0; extra == "tts"
-Requires-Dist: librosa<0.11.0,>=0.10.0; extra == "tts"
+Requires-Dist: librosa>=0.10.0; extra == "tts"
 Provides-Extra: stt
 Requires-Dist: openai-whisper>=20230314; extra == "stt"
 Requires-Dist: tiktoken>=0.6.0; extra == "stt"
@@ -44,7 +44,7 @@ Requires-Dist: coqui-tts<0.30.0,>=0.27.0; extra == "all"
 Requires-Dist: torch<2.4.0,>=2.0.0; extra == "all"
 Requires-Dist: torchvision<0.19.0,>=0.15.0; extra == "all"
 Requires-Dist: torchaudio<2.4.0,>=2.0.0; extra == "all"
-Requires-Dist: librosa<0.11.0,>=0.10.0; extra == "all"
+Requires-Dist: librosa>=0.10.0; extra == "all"
 Requires-Dist: soundfile>=0.12.1; extra == "all"
 Requires-Dist: flask>=2.0.0; extra == "all"
 Requires-Dist: tiktoken>=0.6.0; extra == "all"
@@ -61,7 +61,7 @@ Requires-Dist: coqui-tts<0.30.0,>=0.27.0; extra == "voice-full"
 Requires-Dist: torch<2.4.0,>=2.0.0; extra == "voice-full"
 Requires-Dist: torchvision<0.19.0,>=0.15.0; extra == "voice-full"
 Requires-Dist: torchaudio<2.4.0,>=2.0.0; extra == "voice-full"
-Requires-Dist: librosa<0.11.0,>=0.10.0; extra == "voice-full"
+Requires-Dist: librosa>=0.10.0; extra == "voice-full"
 Requires-Dist: soundfile>=0.12.1; extra == "voice-full"
 Requires-Dist: tiktoken>=0.6.0; extra == "voice-full"
 Provides-Extra: core-tts
@@ -69,7 +69,7 @@ Requires-Dist: coqui-tts<0.30.0,>=0.27.0; extra == "core-tts"
 Requires-Dist: torch<2.4.0,>=2.0.0; extra == "core-tts"
 Requires-Dist: torchvision<0.19.0,>=0.15.0; extra == "core-tts"
 Requires-Dist: torchaudio<2.4.0,>=2.0.0; extra == "core-tts"
-Requires-Dist: librosa<0.11.0,>=0.10.0; extra == "core-tts"
+Requires-Dist: librosa>=0.10.0; extra == "core-tts"
 Provides-Extra: core-stt
 Requires-Dist: openai-whisper>=20230314; extra == "core-stt"
 Requires-Dist: tiktoken>=0.6.0; extra == "core-stt"
@@ -164,34 +164,58 @@ AbstractVoice automatically detects espeak-ng and upgrades to premium quality vo
 ## Quick Start
-### Basic Usage (Minimal Installation)
+### ⚡ Instant TTS (v0.4.0+)
 ```python
-# First install with minimal dependencies
-# pip install abstractvoice
 from abstractvoice import VoiceManager
-# This will show a helpful error message with installation instructions
-try:
-    vm = VoiceManager()
-except ImportError as e:
-    print(e)  # Shows: "TTS functionality requires optional dependencies..."
-    # Follow the instructions to install: pip install abstractvoice[all]
+# Initialize voice manager - automatically downloads essential model if needed
+vm = VoiceManager()
+# Text-to-speech works immediately!
+vm.speak("Hello! TTS works out of the box!")
 ```
-### Full Usage Example
+**That's it!** AbstractVoice v0.4.0+ automatically:
+- ✅ Downloads essential English model (107MB) on first use
+- ✅ Caches models permanently for offline use
+- ✅ Works immediately after first setup
+- ✅ No complex configuration needed
-```python
-# After installing with: pip install abstractvoice[all]
+### 🌍 Multi-Language Support
-from abstractvoice import VoiceManager
+```python
+# Download and use French voice
+vm.download_model('fr.css10_vits')  # Downloads automatically
+vm.set_language('fr')
+vm.speak("Bonjour! Je parle français maintenant.")
+# Download and use German voice
+vm.download_model('de.thorsten_vits')
+vm.set_language('de')
+vm.speak("Hallo! Ich spreche jetzt Deutsch.")
+```
-# Initialize voice manager
-vm = VoiceManager(language='en', debug_mode=True)
+### 🔧 Check System Status
-# Text-to-speech
-vm.speak("Hello! I can speak text and listen for responses.")
+```python
+from abstractvoice import is_ready, get_status, list_models
+import json
+# Quick readiness check
+ready = is_ready()
+print(f"TTS ready: {ready}")
+# Get detailed status
+status = json.loads(get_status())
+print(f"Models cached: {status['total_cached']}")
+print(f"Offline ready: {status['ready_for_offline']}")
+# List all available models
+models = json.loads(list_models())
+for lang, voices in models.items():
+    print(f"{lang}: {len(voices)} voices available")
+```
 # Speech-to-text with callbacks
 def on_transcription(text):
@@ -1289,6 +1313,80 @@ voice_manager.listen(
 )
 ```
+## 💻 CLI Commands (v0.4.0+)
+AbstractVoice provides powerful CLI commands for model management and voice interactions.
+### Model Management
+```bash
+# Download essential model for offline use (recommended first step)
+abstractvoice download-models
+# Download models for specific languages
+abstractvoice download-models --language fr    # French
+abstractvoice download-models --language de    # German
+abstractvoice download-models --language it    # Italian
+abstractvoice download-models --language es    # Spanish
+# Download specific model by name
+abstractvoice download-models --model tts_models/fr/css10/vits
+# Download all available models (large download!)
+abstractvoice download-models --all
+# Check current cache status
+abstractvoice download-models --status
+# Clear model cache
+abstractvoice download-models --clear
+```
+### Voice Interface
+```bash
+# Start voice interface (default)
+abstractvoice
+# Start CLI REPL with specific language
+abstractvoice cli --language fr
+# Start with specific model
+abstractvoice --model granite3.3:2b --language de
+# Run simple example
+abstractvoice simple
+# Check dependencies
+abstractvoice check-deps
+```
+### CLI Voice Commands
+In the CLI REPL, use these commands:
+```bash
+# List all available voices with download status
+/setvoice
+# Download and set specific voice
+/setvoice fr.css10_vits      # French CSS10 VITS
+/setvoice de.thorsten_vits   # German Thorsten
+/setvoice it.mai_male_vits   # Italian Male
+# Change language
+/language fr
+/language de
+# Voice controls
+/pause                       # Pause current speech
+/resume                      # Resume speech
+/stop                        # Stop speech
+# Exit
+/exit
+```
 ## Perspectives
 This is a test project that I designed with examples to work with Ollama, but I will adapt the examples and abstractvoice to work with any LLM provider (anthropic, openai, etc).

{abstractvoice-0.3.0 → abstractvoice-0.4.1}/README.md RENAMED Viewed

@@ -82,34 +82,58 @@ AbstractVoice automatically detects espeak-ng and upgrades to premium quality vo
 ## Quick Start
-### Basic Usage (Minimal Installation)
+### ⚡ Instant TTS (v0.4.0+)
 ```python
-# First install with minimal dependencies
-# pip install abstractvoice
 from abstractvoice import VoiceManager
-# This will show a helpful error message with installation instructions
-try:
-    vm = VoiceManager()
-except ImportError as e:
-    print(e)  # Shows: "TTS functionality requires optional dependencies..."
-    # Follow the instructions to install: pip install abstractvoice[all]
+# Initialize voice manager - automatically downloads essential model if needed
+vm = VoiceManager()
+# Text-to-speech works immediately!
+vm.speak("Hello! TTS works out of the box!")
 ```
-### Full Usage Example
+**That's it!** AbstractVoice v0.4.0+ automatically:
+- ✅ Downloads essential English model (107MB) on first use
+- ✅ Caches models permanently for offline use
+- ✅ Works immediately after first setup
+- ✅ No complex configuration needed
-```python
-# After installing with: pip install abstractvoice[all]
+### 🌍 Multi-Language Support
-from abstractvoice import VoiceManager
+```python
+# Download and use French voice
+vm.download_model('fr.css10_vits')  # Downloads automatically
+vm.set_language('fr')
+vm.speak("Bonjour! Je parle français maintenant.")
+# Download and use German voice
+vm.download_model('de.thorsten_vits')
+vm.set_language('de')
+vm.speak("Hallo! Ich spreche jetzt Deutsch.")
+```
-# Initialize voice manager
-vm = VoiceManager(language='en', debug_mode=True)
+### 🔧 Check System Status
-# Text-to-speech
-vm.speak("Hello! I can speak text and listen for responses.")
+```python
+from abstractvoice import is_ready, get_status, list_models
+import json
+# Quick readiness check
+ready = is_ready()
+print(f"TTS ready: {ready}")
+# Get detailed status
+status = json.loads(get_status())
+print(f"Models cached: {status['total_cached']}")
+print(f"Offline ready: {status['ready_for_offline']}")
+# List all available models
+models = json.loads(list_models())
+for lang, voices in models.items():
+    print(f"{lang}: {len(voices)} voices available")
+```
 # Speech-to-text with callbacks
 def on_transcription(text):
@@ -1207,6 +1231,80 @@ voice_manager.listen(
 )
 ```
+## 💻 CLI Commands (v0.4.0+)
+AbstractVoice provides powerful CLI commands for model management and voice interactions.
+### Model Management
+```bash
+# Download essential model for offline use (recommended first step)
+abstractvoice download-models
+# Download models for specific languages
+abstractvoice download-models --language fr    # French
+abstractvoice download-models --language de    # German
+abstractvoice download-models --language it    # Italian
+abstractvoice download-models --language es    # Spanish
+# Download specific model by name
+abstractvoice download-models --model tts_models/fr/css10/vits
+# Download all available models (large download!)
+abstractvoice download-models --all
+# Check current cache status
+abstractvoice download-models --status
+# Clear model cache
+abstractvoice download-models --clear
+```
+### Voice Interface
+```bash
+# Start voice interface (default)
+abstractvoice
+# Start CLI REPL with specific language
+abstractvoice cli --language fr
+# Start with specific model
+abstractvoice --model granite3.3:2b --language de
+# Run simple example
+abstractvoice simple
+# Check dependencies
+abstractvoice check-deps
+```
+### CLI Voice Commands
+In the CLI REPL, use these commands:
+```bash
+# List all available voices with download status
+/setvoice
+# Download and set specific voice
+/setvoice fr.css10_vits      # French CSS10 VITS
+/setvoice de.thorsten_vits   # German Thorsten
+/setvoice it.mai_male_vits   # Italian Male
+# Change language
+/language fr
+/language de
+# Voice controls
+/pause                       # Pause current speech
+/resume                      # Resume speech
+/stop                        # Stop speech
+# Exit
+/exit
+```
 ## Perspectives
 This is a test project that I designed with examples to work with Ollama, but I will adapt the examples and abstractvoice to work with any LLM provider (anthropic, openai, etc).

{abstractvoice-0.3.0 → abstractvoice-0.4.1}/abstractvoice/__init__.py RENAMED Viewed

@@ -29,5 +29,8 @@ warnings.filterwarnings(
 # Import the main class for public API
 from .voice_manager import VoiceManager
-__version__ = "0.2.0"
-__all__ = ['VoiceManager']
+# Import simple APIs for third-party applications
+from .simple_model_manager import list_models, download_model, get_status, is_ready
+__version__ = "0.4.1"
+__all__ = ['VoiceManager', 'list_models', 'download_model', 'get_status', 'is_ready']

{abstractvoice-0.3.0 → abstractvoice-0.4.1}/abstractvoice/examples/cli_repl.py RENAMED Viewed

@@ -38,7 +38,7 @@ class VoiceREPL(cmd.Cmd):
     use_rawinput = True
     def __init__(self, api_url="http://localhost:11434/api/chat",
-                 model="granite3.3:2b", debug_mode=False, language="en", tts_model=None):
+                 model="granite3.3:2b", debug_mode=False, language="en", tts_model=None, disable_tts=False):
         super().__init__()
         # Debug mode
@@ -54,11 +54,15 @@ class VoiceREPL(cmd.Cmd):
         self.current_language = language
         # Initialize voice manager with language support
-        self.voice_manager = VoiceManager(
-            language=language,
-            tts_model=tts_model,
-            debug_mode=debug_mode
-        )
+        if disable_tts:
+            self.voice_manager = None
+            print("🔇 TTS disabled - text-only mode")
+        else:
+            self.voice_manager = VoiceManager(
+                language=language,
+                tts_model=tts_model,
+                debug_mode=debug_mode
+            )
         # Settings
         self.use_tts = True
@@ -90,8 +94,11 @@ class VoiceREPL(cmd.Cmd):
     def _get_intro(self):
         """Generate intro message with help."""
         intro = f"\n{Colors.BOLD}Welcome to AbstractVoice CLI REPL{Colors.END}\n"
-        lang_name = self.voice_manager.get_language_name()
-        intro += f"API: {self.api_url} | Model: {self.model} | Voice: {lang_name}\n"
+        if self.voice_manager:
+            lang_name = self.voice_manager.get_language_name()
+            intro += f"API: {self.api_url} | Model: {self.model} | Voice: {lang_name}\n"
+        else:
+            intro += f"API: {self.api_url} | Model: {self.model} | Voice: Disabled\n"
         intro += f"\n{Colors.CYAN}Quick Start:{Colors.END}\n"
         intro += "  • Type messages to chat with the LLM\n"
         intro += "  • Use /voice <mode> to enable voice input\n"
@@ -232,7 +239,7 @@ class VoiceREPL(cmd.Cmd):
             print(f"{Colors.CYAN}{response_text}{Colors.END}")
             # Speak the response if voice manager is available
-            if self.voice_manager:
+            if self.voice_manager and self.use_tts:
                 self.voice_manager.speak(response_text)
         except requests.exceptions.ConnectionError as e:
@@ -376,18 +383,47 @@ class VoiceREPL(cmd.Cmd):
           /setvoice <voice_id>         # Set voice (format: language.voice_id)
         Examples:
-          /setvoice                    # List all voices
+          /setvoice                    # List all voices with JSON-like info
           /setvoice fr.css10_vits      # Set French CSS10 VITS voice
           /setvoice it.mai_male_vits   # Set Italian male VITS voice
         """
         if not args:
-            # Show all available voices organized by language
+            # Show all available voices with metadata
             print(f"\n{Colors.CYAN}Available Voice Models:{Colors.END}")
-            self.voice_manager.list_voices()
-            print(f"\n{Colors.YELLOW}Usage:{Colors.END}")
-            print("  /setvoice <language>.<voice_id>")
-            print("  Example: /setvoice fr.css10_vits")
+            try:
+                models = self.voice_manager.list_available_models()
+                for language, voices in models.items():
+                    # Get language name
+                    lang_names = {
+                        'en': 'English', 'fr': 'French', 'es': 'Spanish',
+                        'de': 'German', 'it': 'Italian'
+                    }
+                    lang_name = lang_names.get(language, language.upper())
+                    print(f"\n🌍 {lang_name} ({language}):")
+                    for voice_id, voice_info in voices.items():
+                        cached_icon = "✅" if voice_info.get('cached', False) else "📥"
+                        quality_icon = "✨" if voice_info['quality'] == 'excellent' else "🔧"
+                        size_text = f"{voice_info['size_mb']}MB"
+                        print(f"  {cached_icon} {quality_icon} {language}.{voice_id}")
+                        print(f"      {voice_info['name']} ({size_text})")
+                        print(f"      {voice_info['description']}")
+                        if voice_info.get('requires_espeak', False):
+                            print(f"      ⚠️ Requires espeak-ng")
+                print(f"\n{Colors.YELLOW}Usage:{Colors.END}")
+                print("  /setvoice <language>.<voice_id>")
+                print("  Example: /setvoice fr.css10_vits")
+                print("\n📥 = Download needed  ✅ = Ready  ✨ = High quality  🔧 = Good quality")
+            except Exception as e:
+                print(f"❌ Error listing models: {e}")
+                # Fallback to old method
+                self.voice_manager.list_voices()
             return
         voice_spec = args.strip()
@@ -412,45 +448,46 @@ class VoiceREPL(cmd.Cmd):
         else:
             was_active = False
-        # Set the specific voice
+        # Download and set the specific voice using programmatic API
         try:
-            success = self.voice_manager.set_voice(language, voice_id)
+            print(f"🔄 Setting voice {voice_spec}...")
+            # Use the programmatic download API
+            success = self.voice_manager.download_model(voice_spec)
             if success:
-                # Update current language to match the voice
-                self.current_language = language
+                # Now set the language to match
+                success = self.voice_manager.set_language(language)
-                # Get voice info for confirmation
-                voice_info = self.voice_manager.VOICE_CATALOG.get(language, {}).get(voice_id, {})
-                lang_name = self.voice_manager.get_language_name(language)
+                if success:
+                    # Update current language
+                    self.current_language = language
-                print(f"✅ Voice changed successfully!")
-                print(f"   Language: {lang_name} ({language})")
-                print(f"   Voice: {voice_id}")
-                if voice_info:
-                    quality_icon = "✨" if voice_info.get('quality') == 'premium' else "🔧"
-                    gender_icon = {"male": "👨", "female": "👩", "multiple": "👥"}.get(voice_info.get('gender'), "🗣️")
-                    print(f"   Details: {quality_icon} {gender_icon} {voice_info.get('accent', 'Unknown accent')}")
+                    print(f"✅ Voice set to {voice_spec}")
-                # Test the new voice
-                test_messages = {
-                    'en': "Voice changed to English.",
-                    'fr': "Voix changée en français.",
-                    'es': "Voz cambiada al español.",
-                    'de': "Stimme auf Deutsch geändert.",
-                    'it': "Voce cambiata in italiano."
-                }
-                test_msg = test_messages.get(language, "Voice changed successfully.")
-                self.voice_manager.speak(test_msg)
+                    # Test the voice
+                    test_messages = {
+                        'en': 'Voice changed to English.',
+                        'fr': 'Voix changée en français.',
+                        'es': 'Voz cambiada al español.',
+                        'de': 'Stimme auf Deutsch geändert.',
+                        'it': 'Voce cambiata in italiano.'
+                    }
+                    test_msg = test_messages.get(language, f'Voice changed to {language}.')
+                    self.voice_manager.speak(test_msg)
-                # Restart voice mode if it was active
-                if was_active:
-                    self.do_voice(self.voice_mode)
+                    # Restart voice mode if it was active
+                    if was_active:
+                        self.do_voice(self.voice_mode)
+                else:
+                    print(f"❌ Failed to set language: {language}")
             else:
-                print(f"❌ Failed to set voice: {voice_spec}")
-                print(f"   Run '/setvoice' to see available voices")
+                print(f"❌ Failed to download voice: {voice_spec}")
+                print("   Check your internet connection or try a different voice")
         except Exception as e:
             print(f"❌ Error setting voice: {e}")
+            print(f"   Run '/setvoice' to see available voices")
             if self.debug_mode:
                 import traceback
                 traceback.print_exc()

abstractvoice 0.3.0__tar.gz → 0.4.1__tar.gz

abstractvoice 0.3.0.tar.gz → 0.4.1.tar.gz