npm - agentvibes - Versions diffs - 5.7.7 → 5.9.0 - Mend

agentvibes 5.7.7 → 5.9.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (138)

package/.agentvibes/config.json +12 -5
package/.agentvibes/install-manifest.json +188 -300
package/.claude/commands/agent-vibes-bmad-voices.md +117 -117
package/.claude/commands/agent-vibes-rdp.md +24 -24
package/.claude/config/audio-effects.cfg +3 -2
package/.claude/config/audio-effects.cfg.sample +52 -52
package/.claude/config/background-music-enabled.txt +1 -0
package/.claude/config/background-music-position.txt +1 -1
package/.claude/config/language.txt +1 -0
package/.claude/docs/TERMUX_SETUP.md +408 -408
package/.claude/github-star-reminder.txt +1 -1
package/.claude/hooks/audio-cache-utils.sh +0 -0
package/.claude/hooks/audio-processor.sh +0 -0
package/.claude/hooks/background-music-manager.sh +0 -0
package/.claude/hooks/bmad-party-speak.sh +0 -0
package/.claude/hooks/bmad-speak-enhanced.sh +0 -0
package/.claude/hooks/bmad-speak.sh +0 -0
package/.claude/hooks/bmad-tts-injector.sh +0 -0
package/.claude/hooks/bmad-voice-manager.sh +0 -0
package/.claude/hooks/clawdbot-receiver-SECURE.sh +0 -0
package/.claude/hooks/clawdbot-receiver.sh +0 -0
package/.claude/hooks/clean-audio-cache.sh +0 -0
package/.claude/hooks/cleanup-cache.sh +0 -0
package/.claude/hooks/configure-rdp-mode.sh +0 -0
package/.claude/hooks/download-extra-voices.sh +0 -0
package/.claude/hooks/effects-manager.sh +0 -0
package/.claude/hooks/github-star-reminder.sh +0 -0
package/.claude/hooks/language-manager.sh +0 -0
package/.claude/hooks/learn-manager.sh +0 -0
package/.claude/hooks/macos-voice-manager.sh +0 -0
package/.claude/hooks/migrate-background-music.sh +0 -0
package/.claude/hooks/migrate-to-agentvibes.sh +0 -0
package/.claude/hooks/optimize-background-music.sh +0 -0
package/.claude/hooks/path-resolver.sh +0 -0
package/.claude/hooks/personality-manager.sh +0 -0
package/.claude/hooks/piper-download-voices.sh +0 -0
package/.claude/hooks/piper-installer.sh +0 -0
package/.claude/hooks/piper-multispeaker-registry.sh +0 -0
package/.claude/hooks/piper-voice-manager.sh +0 -0
package/.claude/hooks/play-tts-agentvibes-receiver-for-voiceless-connections.sh +0 -0
package/.claude/hooks/play-tts-agentvibes-receiver.sh +1 -0
package/.claude/hooks/play-tts-enhanced.sh +0 -0
package/.claude/hooks/play-tts-macos.sh +0 -0
package/.claude/hooks/play-tts-piper.sh +0 -0
package/.claude/hooks/play-tts-soprano.sh +0 -0
package/.claude/hooks/play-tts-ssh-remote.sh +2 -2
package/.claude/hooks/play-tts-termux-ssh.sh +0 -0
package/.claude/hooks/play-tts-windows-receiver.sh +0 -0
package/.claude/hooks/play-tts.sh +0 -0
package/.claude/hooks/prepare-release.sh +0 -0
package/.claude/hooks/provider-commands.sh +0 -0
package/.claude/hooks/provider-manager.sh +0 -0
package/.claude/hooks/replay-target-audio.sh +0 -0
package/.claude/hooks/requirements.txt +6 -6
package/.claude/hooks/sentiment-manager.sh +0 -0
package/.claude/hooks/session-start-tts.sh +0 -0
package/.claude/hooks/soprano-gradio-synth.py +139 -139
package/.claude/hooks/speed-manager.sh +0 -0
package/.claude/hooks/stop-tts.sh +0 -0
package/.claude/hooks/termux-installer.sh +0 -0
package/.claude/hooks/translate-manager.sh +0 -0
package/.claude/hooks/translator.py +237 -237
package/.claude/hooks/tts-queue-worker.sh +0 -0
package/.claude/hooks/tts-queue.sh +0 -0
package/.claude/hooks/verbosity-manager.sh +0 -0
package/.claude/hooks/voice-manager.sh +0 -0
package/.claude/hooks-windows/audio-cache-utils.ps1 +119 -119
package/.claude/hooks-windows/audio-cache-utils.ps1.user.bak +119 -0
package/.claude/hooks-windows/bmad-speak.ps1 +9 -38
package/.claude/hooks-windows/play-tts-soprano.ps1 +13 -2
package/.claude/hooks-windows/soprano-gradio-synth.py +153 -153
package/.claude/hooks-windows/soprano-gradio-synth.py.user.bak +153 -0
package/.claude/piper-voices-dir.txt +1 -1
package/.claude/verbosity.txt +1 -1
package/.clawdbot/README.md +105 -105
package/.mcp.json +5 -14
package/README.md +33 -2
package/RELEASE_NOTES.md +80 -0
package/WINDOWS-SETUP.md +208 -208
package/bin/agent-vibes +39 -39
package/bin/agentvibes-voice-browser.js +0 -0
package/bin/agentvibes.js +0 -0
package/bin/mcp-server.js +121 -121
package/bin/mcp-server.sh +0 -0
package/bin/test-bmad-pr +78 -78
package/mcp-server/QUICK_START.md +203 -203
package/mcp-server/README.md +345 -345
package/mcp-server/WINDOWS_SETUP.md +0 -0
package/mcp-server/examples/claude_desktop_config.json +11 -11
package/mcp-server/examples/claude_desktop_config_piper.json +9 -9
package/mcp-server/examples/custom_instructions.md +169 -169
package/mcp-server/install-deps.js +0 -0
package/mcp-server/server.py +1797 -1797
package/mcp-server/test_server.py +0 -0
package/package.json +1 -1
package/src/cli/list-personalities.js +110 -110
package/src/cli/list-voices.js +114 -114
package/src/commands/bmad-voices.js +394 -394
package/src/commands/install-mcp.js +476 -476
package/src/console/audio-env.js +4 -1
package/src/console/brand-colors.js +13 -13
package/src/console/constants/personalities.js +44 -44
package/src/console/tabs/agents-tab.js +84 -61
package/src/console/tabs/help-tab.js +314 -314
package/src/console/tabs/music-tab.js +3 -2
package/src/console/tabs/readme-tab.js +272 -272
package/src/console/tabs/setup-tab.js +285 -41
package/src/console/tabs/voices-tab.js +13 -1
package/src/console/widgets/destroy-list.js +25 -25
package/src/console/widgets/notice.js +55 -55
package/src/i18n/de.js +202 -202
package/src/i18n/es.js +202 -202
package/src/i18n/fr.js +202 -202
package/src/i18n/hi.js +202 -202
package/src/i18n/ja.js +202 -202
package/src/i18n/ko.js +202 -202
package/src/i18n/pt.js +202 -202
package/src/i18n/strings.js +54 -54
package/src/i18n/zh-CN.js +202 -202
package/src/installer/language-screen.js +31 -31
package/src/installer/music-file-input.js +304 -304
package/src/installer.js +0 -0
package/src/services/config-service.js +264 -264
package/src/services/language-service.js +47 -47
package/src/services/provider-service.js +143 -143
package/src/utils/audio-duration-validator.js +298 -298
package/src/utils/audio-format-validator.js +277 -277
package/src/utils/dependency-checker.js +469 -469
package/src/utils/file-ownership-verifier.js +358 -358
package/src/utils/list-formatter.js +194 -194
package/src/utils/music-file-validator.js +285 -285
package/src/utils/preview-list-prompt.js +136 -136
package/src/utils/secure-music-storage.js +412 -412
package/templates/agentvibes-receiver.sh +231 -231
package/templates/audio/welcome-music.mp3 +0 -0
package/.claude/hooks/bmad-party-manager.sh +0 -225
package/.claude/hooks/stop.sh +0 -38
package/.claude/audio/tracks/{CelestialVelvet.mp3 → celestial_velvet.mp3} +0 -0

package/.mcp.json CHANGED Viewed

@@ -1,30 +1,21 @@
 {
   "mcpServers": {
-    "agentvibes": {
+    "firecrawl-mcp": {
       "command": "npx",
       "args": [
         "-y",
-        "--package=agentvibes",
-        "agentvibes-mcp-server"
-      ],
-      "env": {
-        "AGENTVIBES_MCP_FALLBACK": "copilot"
-      }
-    },
-    "firecrawl": {
-      "command": "npx",
-      "args": [
         "firecrawl-mcp"
       ]
     },
-    "context7": {
+    "agentvibes": {
       "command": "npx",
       "args": [
         "-y",
-        "@upstash/context7-mcp"
+        "--package=agentvibes",
+        "agentvibes-mcp-server"
       ],
       "env": {
-        "CONTEXT7_API_KEY": "${CONTEXT7_API_KEY}"
+        "AGENTVIBES_MCP_FALLBACK": "copilot"
       }
     }
   }

package/README.md CHANGED Viewed

@@ -11,7 +11,7 @@
 [![Publish](https://github.com/paulpreibisch/AgentVibes/actions/workflows/publish.yml/badge.svg)](https://github.com/paulpreibisch/AgentVibes/actions/workflows/publish.yml)
 [![License](https://img.shields.io/badge/License-Apache_2.0-blue.svg)](https://opensource.org/licenses/Apache-2.0)
-**Author**: Paul Preibisch ([@997Fire](https://x.com/997Fire)) | **Version**: v5.7.7
+**Author**: Paul Preibisch ([@997Fire](https://x.com/997Fire)) | **Version**: v5.9.0
 ---
@@ -40,7 +40,33 @@ Whether you're coding in Claude Code, chatting in Claude Desktop, using Warp Ter
 ---
-## 🌟 NEW IN v5.7.7 — Party Mode Voice Restore + Polish
+## 🌟 NEW IN v5.9.0 — SSH Remote + Windows Home Directory Fixes
+**SSH remote no longer hangs:** The SSH transport now applies a 10-second connection
+timeout, so a stuck or unreachable remote host surfaces an error quickly instead of
+blocking forever.
+**Windows home directory detection fixed:** `detectRemoteLlm()` now uses null-coalescing
+(`??`) to fall back to `os.homedir()` only when `HOME` is genuinely unset — safer than
+the previous `||` which could misfire on an empty string.
+## v5.8.0 — Soprano Now Works + Voice Picker Fixed for All Engines
+**Soprano TTS actually works now:** Soprano (our neural TTS engine) was silently broken
+on Windows since launch — wrong binary name, stripped PATH, wav path sent to the wrong
+output stream, and no auto-start for the WebUI server. All fixed. Install with
+`pip install soprano-tts`, select Soprano in the setup tab, and AgentVibes handles
+the rest.
+**Voice picker now works for Windows SAPI and macOS Say:** Previously the picker showed
+the entire Piper voice catalog even when SAPI or macOS Say was selected, and Space-bar
+preview played through the wrong engine. The picker now shows exactly one item for each
+native engine and previews through the correct binary.
+**Auto-save no longer breaks your engine setting:** Saving an LLM config no longer silently
+overwrites your chosen engine back to Piper.
+## v5.7.7 — Party Mode Voice Restore + Polish
 **Party mode agents now speak again:** BMAD `/party-mode` now reliably invokes the correct AgentVibes skill, and each agent's response is spoken aloud in their unique voice with per-agent music, pretext, and reverb — loaded automatically from `~/.agentvibes/bmad-voice-map.json`.
@@ -220,6 +246,11 @@ Replace the default background tracks with your own audio files for complete son
 - Automatic format detection
 - Duration warnings for non-optimal lengths
+**Custom Track Naming Rules:**
+- Use `snake_case` filenames only — e.g. `my_focus_music.mp3` ✅
+- No spaces or uppercase letters in filenames — e.g. `My Focus Music.mp3` ❌
+- Misnamed files will not appear in the music picker and will be skipped by the audio engine
 **Perfect for:**
 - 🎸 **Team Audio Branding** - Company theme music
 - 🎮 **Gaming Sessions** - Epic background tracks

package/RELEASE_NOTES.md CHANGED Viewed

@@ -1,5 +1,85 @@
 # AgentVibes Release Notes
+## 🔧 v5.9.0 — SSH Remote + Windows Home Directory Fixes
+**Released:** 2026-05-18
+### 🐛 SSH Remote: Connection Timeout Added
+The SSH remote transport could hang indefinitely if the remote host was unreachable or
+slow to respond. A `ConnectTimeout=10` option is now applied to all SSH connections, so
+a stuck session surfaces an error within 10 seconds instead of blocking forever.
+The SSH subshell structure was also cleaned up so the process exit code is reliably
+captured — a previous formatting issue could cause `wait` to report "pid N is not a
+child of this shell" in some shell environments.
+### 🐛 Windows: Home Directory Detection Fixed
+`detectRemoteLlm()` used `process.env.HOME || os.homedir()` to find the AgentVibes
+config directory. On Windows, `HOME` is typically unset, but `||` would fall through to
+`os.homedir()` correctly — however `??` (null-coalescing) is strictly safer since it
+only falls back on `null`/`undefined`, not on an empty string. The fix also adds test
+injectability: passing a fake `HOME` in tests now reliably overrides the system value on
+all platforms.
+---
+## 🎸 v5.8.0 — Soprano Now Works + Voice Picker Fixed for All Engines
+**Released:** 2026-05-18
+### 🐛 Soprano TTS Was Broken — Now Fixed
+Soprano (our 80M-parameter neural TTS engine, introduced in v5.6) was silently failing on
+Windows. Several issues combined to break it end-to-end:
+- The Windows voice picker showed Soprano as an option but launched it with the wrong binary
+  name (`soprano-tts` instead of `soprano`)
+- `play-tts-soprano.ps1` was called from Node.js with a stripped PATH, so the `soprano`
+  and `soprano-webui` executables couldn't be found even when installed
+- The wav file path was written to PowerShell's Information stream (`Write-Host`) instead
+  of stdout, so the reverb/background-music processor couldn't find it and exited with an error
+- The Gradio WebUI was never auto-started — you had to manually run `soprano-webui` before
+  every session
+All of these are now fixed. AgentVibes auto-detects whether the Soprano WebUI server is
+running on port 7860, starts it if not, and polls until it's ready (up to 90 seconds).
+Three modes work in priority order: WebUI (fastest — model stays loaded) → OpenAI-compatible
+API → direct `soprano` CLI.
+### 🐛 Voice Picker Ignored Windows SAPI and macOS Say
+When opening the voice picker for an LLM configured to use **Windows SAPI** or **macOS Say**,
+the picker displayed the full list of Piper voices instead of the engine's built-in voice.
+This was confusing — selecting a Piper voice while using SAPI or macOS Say had no effect,
+and the Space-bar preview played through the wrong engine.
+The picker now adapts to whichever engine is selected:
+- **Windows SAPI / macOS Say / Soprano:** shows exactly one item (the engine's built-in voice),
+  auto-selects it, and the Space-bar preview speaks through the correct engine binary
+- **Piper:** shows the full installed-voice catalog as before
+Additionally, saving the config no longer silently overwrites the `ttsEngine` field to `piper`
+when a native engine is in use.
+### 🔒 Soprano Reliability (9 Adversarial-Review Fixes)
+- **Crash fix:** socket `destroy()` could emit a late `error` event with no listener,
+  crashing the Node.js process — an absorber handler is now in place
+- **Loop cancellation:** the 90-second WebUI polling loop now stops immediately when
+  the modal or voice picker is closed (via AbortController)
+- **No unhandled rejections:** `.catch()` handlers added to all async WebUI-check calls
+- **No duplicate processes:** a 10-second cooldown prevents spawning two `soprano-webui`
+  instances when Preview is clicked rapidly
+- **Better error feedback:** spawn failures and non-zero exit codes now surface a visible
+  error label in the voice picker instead of silently resetting
+- **PATH preserved:** the PowerShell PATH refresh now appends registry entries rather than
+  replacing the whole PATH, so nvm, conda, and pyenv shims continue to work
+---
 ## 🎭 v5.7.7 — Party Mode Voice Restore + Polish
 **Released:** 2026-05-17

package/WINDOWS-SETUP.md CHANGED Viewed

@@ -1,208 +1,208 @@
-# AgentVibes Windows Native Setup
-This folder contains AgentVibes configured for **native Windows** (not WSL) with three TTS providers available.
-## Quick Start
-### 1. Open in VS Code (Native Windows)
-- **File > Open Folder** > Select this folder (`agentvibes-in-windows`)
-- Make sure you're opening in **native Windows VS Code** (not WSL remote)
-### 2. Open PowerShell Terminal
-- **Terminal > New Terminal**
-- Change shell to **PowerShell** (if needed)
-### 3. Run Setup
-```powershell
-.\setup-windows.ps1
-```
-This script will:
-- Check PowerShell version (5.1+)
-- Create `.claude` directories
-- Let you choose TTS provider (Piper or SAPI)
-- Install Piper if you choose it
-- Download a default voice model
-- Test TTS
-- Configure for first use
-### 4. Install Dependencies
-```powershell
-npm install
-```
-### 5. Start Using AgentVibes
-Open a Claude Code session in this project. The SessionStart hook will automatically inject TTS protocol instructions, causing Claude to speak all responses.
-## TTS Providers
-### Option 1: Soprano (Best Quality)
-- **Quality**: Ultra-high (80M parameter neural model)
-- **Voices**: Single high-quality voice (Soprano-1.1-80M)
-- **Download**: `pip install soprano-tts`
-- **Setup**: Start WebUI with `soprano-webui` or API with `uvicorn soprano.server:app`
-- **Speed**: GPU-accelerated, very fast
-- **Features**: Gradio WebUI mode, OpenAI-compatible API mode, CLI fallback
-To set up Soprano:
-```powershell
-# Install Soprano
-pip install soprano-tts
-# Start WebUI (recommended - stays running in background)
-soprano-webui
-# Set provider
-.\.claude\hooks-windows\provider-manager.ps1 set soprano
-# Test
-.\.claude\hooks-windows\play-tts-soprano.ps1 "Hello from Soprano"
-```
-### Option 2: Windows Piper (Recommended for Offline)
-- **Quality**: High (neural voices)
-- **Voices**: 50+ available
-- **Download**: ~100MB
-- **Setup**: Automatic (run `setup-windows.ps1`)
-- **Speed**: Offline synthesis
-- **Features**: All AgentVibes features supported
-### Option 3: Windows SAPI (Built-in, Zero Setup)
-- **Quality**: Basic
-- **Voices**: ~10 built-in (David, Zira, Mark)
-- **Download**: 0 MB (no installation needed)
-- **Setup**: Select during `setup-windows.ps1`
-- **Speed**: Fast
-- **Features**: Core TTS only
-## Claude Code Integration
-AgentVibes hooks into Claude Code via `.claude/settings.json`. The SessionStart hook runs automatically when Claude starts a session:
-```json
-{
-  "hooks": {
-    "SessionStart": [{
-      "hooks": [{
-        "type": "command",
-        "command": "powershell -NoProfile -ExecutionPolicy Bypass -File \"$CLAUDE_PROJECT_DIR\\.claude\\hooks-windows\\session-start-tts.ps1\""
-      }]
-    }]
-  }
-}
-```
-This injects TTS protocol instructions so Claude speaks every response using the configured provider.
-## Manual Commands
-Test TTS manually:
-```powershell
-# Test current provider
-.\.claude\hooks-windows\play-tts.ps1 "Hello from Windows"
-# Test specific providers
-.\.claude\hooks-windows\play-tts-windows-sapi.ps1 "Hello SAPI"
-.\.claude\hooks-windows\play-tts-windows-piper.ps1 "Hello Piper"
-.\.claude\hooks-windows\play-tts-soprano.ps1 "Hello Soprano"
-# List available voices
-.\.claude\hooks-windows\voice-manager-windows.ps1 list
-# Switch voice (for Piper/SAPI)
-.\.claude\hooks-windows\voice-manager-windows.ps1 switch "en_US-lessac-high"
-# List providers
-.\.claude\hooks-windows\provider-manager.ps1 list
-# Switch provider
-.\.claude\hooks-windows\provider-manager.ps1 set soprano
-.\.claude\hooks-windows\provider-manager.ps1 set windows-piper
-.\.claude\hooks-windows\provider-manager.ps1 set windows-sapi
-```
-## Troubleshooting
-### PowerShell Execution Policy Error
-If you get an "execution policy" error, run:
-```powershell
-Set-ExecutionPolicy -ExecutionPolicy RemoteSigned -Scope CurrentUser
-```
-Then try again.
-### No Audio Playing
-1. Check Windows volume isn't muted
-2. Try switching to SAPI provider (zero-setup): `.\.claude\hooks-windows\provider-manager.ps1 set windows-sapi`
-3. Test SAPI directly: `.\.claude\hooks-windows\play-tts-windows-sapi.ps1 "test"`
-### Soprano Not Detected
-1. Ensure soprano-webui is running: `soprano-webui`
-2. Check port 7860 is accessible: `Test-NetConnection -ComputerName 127.0.0.1 -Port 7860`
-3. Set custom port if needed: `$env:SOPRANO_PORT = "8080"` before running TTS
-### Piper Installation Failed
-1. Check internet connection
-2. Run setup again: `.\setup-windows.ps1`
-3. Or manually download from: https://github.com/rhasspy/piper/releases
-### Can't Find Voice
-For Piper, voices are stored in: `%USERPROFILE%\.claude\piper-voices\`
-You can download additional voices with `.\download-piper-voices.ps1`.
-## Architecture
-```
-agentvibes-in-windows/
-├── .claude/
-│   ├── hooks-windows/               # PowerShell TTS scripts
-│   │   ├── play-tts.ps1             # Main router (dispatches to active provider)
-│   │   ├── play-tts-soprano.ps1     # Soprano provider
-│   │   ├── play-tts-windows-piper.ps1  # Piper provider
-│   │   ├── play-tts-windows-sapi.ps1   # SAPI provider
-│   │   ├── soprano-gradio-synth.py  # Python helper for Soprano Gradio API
-│   │   ├── provider-manager.ps1     # Provider switching
-│   │   ├── voice-manager-windows.ps1   # Voice management
-│   │   ├── session-start-tts.ps1    # SessionStart hook (injects TTS protocol)
-│   │   └── audio-cache-utils.ps1    # Audio cache cleanup
-│   ├── settings.json                # Claude Code hooks config
-│   ├── audio/                       # Audio cache (auto-created)
-│   ├── piper-voices/                # Piper voice models (auto-created)
-│   └── tts-provider.txt             # Active provider config
-├── setup-windows.ps1                # Installation script
-├── download-piper-voices.ps1        # Download additional Piper voices
-└── WINDOWS-SETUP.md                 # This file
-```
-## What's Different from WSL
-| Feature | WSL Version | Windows Native |
-|---------|-------------|----------------|
-| **TTS Scripts** | Bash shell scripts (.sh) | PowerShell scripts (.ps1) |
-| **Audio** | PulseAudio/paplay | System.Media.SoundPlayer |
-| **Providers** | Piper, macOS, Termux, Soprano | Piper, SAPI, Soprano |
-| **Setup** | WSL + PulseAudio config | Native Windows only |
-| **Hook Dir** | `.claude/hooks/` | `.claude/hooks-windows/` |
-## Support
-- **Documentation**: https://agentvibes.org
-- **Issues**: https://github.com/paulpreibisch/AgentVibes/issues
----
-**Version**: 2.0 (Windows Native + Soprano)
-**Last Updated**: 2026-02-11
+# AgentVibes Windows Native Setup
+This folder contains AgentVibes configured for **native Windows** (not WSL) with three TTS providers available.
+## Quick Start
+### 1. Open in VS Code (Native Windows)
+- **File > Open Folder** > Select this folder (`agentvibes-in-windows`)
+- Make sure you're opening in **native Windows VS Code** (not WSL remote)
+### 2. Open PowerShell Terminal
+- **Terminal > New Terminal**
+- Change shell to **PowerShell** (if needed)
+### 3. Run Setup
+```powershell
+.\setup-windows.ps1
+```
+This script will:
+- Check PowerShell version (5.1+)
+- Create `.claude` directories
+- Let you choose TTS provider (Piper or SAPI)
+- Install Piper if you choose it
+- Download a default voice model
+- Test TTS
+- Configure for first use
+### 4. Install Dependencies
+```powershell
+npm install
+```
+### 5. Start Using AgentVibes
+Open a Claude Code session in this project. The SessionStart hook will automatically inject TTS protocol instructions, causing Claude to speak all responses.
+## TTS Providers
+### Option 1: Soprano (Best Quality)
+- **Quality**: Ultra-high (80M parameter neural model)
+- **Voices**: Single high-quality voice (Soprano-1.1-80M)
+- **Download**: `pip install soprano-tts`
+- **Setup**: Start WebUI with `soprano-webui` or API with `uvicorn soprano.server:app`
+- **Speed**: GPU-accelerated, very fast
+- **Features**: Gradio WebUI mode, OpenAI-compatible API mode, CLI fallback
+To set up Soprano:
+```powershell
+# Install Soprano
+pip install soprano-tts
+# Start WebUI (recommended - stays running in background)
+soprano-webui
+# Set provider
+.\.claude\hooks-windows\provider-manager.ps1 set soprano
+# Test
+.\.claude\hooks-windows\play-tts-soprano.ps1 "Hello from Soprano"
+```
+### Option 2: Windows Piper (Recommended for Offline)
+- **Quality**: High (neural voices)
+- **Voices**: 50+ available
+- **Download**: ~100MB
+- **Setup**: Automatic (run `setup-windows.ps1`)
+- **Speed**: Offline synthesis
+- **Features**: All AgentVibes features supported
+### Option 3: Windows SAPI (Built-in, Zero Setup)
+- **Quality**: Basic
+- **Voices**: ~10 built-in (David, Zira, Mark)
+- **Download**: 0 MB (no installation needed)
+- **Setup**: Select during `setup-windows.ps1`
+- **Speed**: Fast
+- **Features**: Core TTS only
+## Claude Code Integration
+AgentVibes hooks into Claude Code via `.claude/settings.json`. The SessionStart hook runs automatically when Claude starts a session:
+```json
+{
+  "hooks": {
+    "SessionStart": [{
+      "hooks": [{
+        "type": "command",
+        "command": "powershell -NoProfile -ExecutionPolicy Bypass -File \"$CLAUDE_PROJECT_DIR\\.claude\\hooks-windows\\session-start-tts.ps1\""
+      }]
+    }]
+  }
+}
+```
+This injects TTS protocol instructions so Claude speaks every response using the configured provider.
+## Manual Commands
+Test TTS manually:
+```powershell
+# Test current provider
+.\.claude\hooks-windows\play-tts.ps1 "Hello from Windows"
+# Test specific providers
+.\.claude\hooks-windows\play-tts-windows-sapi.ps1 "Hello SAPI"
+.\.claude\hooks-windows\play-tts-windows-piper.ps1 "Hello Piper"
+.\.claude\hooks-windows\play-tts-soprano.ps1 "Hello Soprano"
+# List available voices
+.\.claude\hooks-windows\voice-manager-windows.ps1 list
+# Switch voice (for Piper/SAPI)
+.\.claude\hooks-windows\voice-manager-windows.ps1 switch "en_US-lessac-high"
+# List providers
+.\.claude\hooks-windows\provider-manager.ps1 list
+# Switch provider
+.\.claude\hooks-windows\provider-manager.ps1 set soprano
+.\.claude\hooks-windows\provider-manager.ps1 set windows-piper
+.\.claude\hooks-windows\provider-manager.ps1 set windows-sapi
+```
+## Troubleshooting
+### PowerShell Execution Policy Error
+If you get an "execution policy" error, run:
+```powershell
+Set-ExecutionPolicy -ExecutionPolicy RemoteSigned -Scope CurrentUser
+```
+Then try again.
+### No Audio Playing
+1. Check Windows volume isn't muted
+2. Try switching to SAPI provider (zero-setup): `.\.claude\hooks-windows\provider-manager.ps1 set windows-sapi`
+3. Test SAPI directly: `.\.claude\hooks-windows\play-tts-windows-sapi.ps1 "test"`
+### Soprano Not Detected
+1. Ensure soprano-webui is running: `soprano-webui`
+2. Check port 7860 is accessible: `Test-NetConnection -ComputerName 127.0.0.1 -Port 7860`
+3. Set custom port if needed: `$env:SOPRANO_PORT = "8080"` before running TTS
+### Piper Installation Failed
+1. Check internet connection
+2. Run setup again: `.\setup-windows.ps1`
+3. Or manually download from: https://github.com/rhasspy/piper/releases
+### Can't Find Voice
+For Piper, voices are stored in: `%USERPROFILE%\.claude\piper-voices\`
+You can download additional voices with `.\download-piper-voices.ps1`.
+## Architecture
+```
+agentvibes-in-windows/
+├── .claude/
+│   ├── hooks-windows/               # PowerShell TTS scripts
+│   │   ├── play-tts.ps1             # Main router (dispatches to active provider)
+│   │   ├── play-tts-soprano.ps1     # Soprano provider
+│   │   ├── play-tts-windows-piper.ps1  # Piper provider
+│   │   ├── play-tts-windows-sapi.ps1   # SAPI provider
+│   │   ├── soprano-gradio-synth.py  # Python helper for Soprano Gradio API
+│   │   ├── provider-manager.ps1     # Provider switching
+│   │   ├── voice-manager-windows.ps1   # Voice management
+│   │   ├── session-start-tts.ps1    # SessionStart hook (injects TTS protocol)
+│   │   └── audio-cache-utils.ps1    # Audio cache cleanup
+│   ├── settings.json                # Claude Code hooks config
+│   ├── audio/                       # Audio cache (auto-created)
+│   ├── piper-voices/                # Piper voice models (auto-created)
+│   └── tts-provider.txt             # Active provider config
+├── setup-windows.ps1                # Installation script
+├── download-piper-voices.ps1        # Download additional Piper voices
+└── WINDOWS-SETUP.md                 # This file
+```
+## What's Different from WSL
+| Feature | WSL Version | Windows Native |
+|---------|-------------|----------------|
+| **TTS Scripts** | Bash shell scripts (.sh) | PowerShell scripts (.ps1) |
+| **Audio** | PulseAudio/paplay | System.Media.SoundPlayer |
+| **Providers** | Piper, macOS, Termux, Soprano | Piper, SAPI, Soprano |
+| **Setup** | WSL + PulseAudio config | Native Windows only |
+| **Hook Dir** | `.claude/hooks/` | `.claude/hooks-windows/` |
+## Support
+- **Documentation**: https://agentvibes.org
+- **Issues**: https://github.com/paulpreibisch/AgentVibes/issues
+---
+**Version**: 2.0 (Windows Native + Soprano)
+**Last Updated**: 2026-02-11

package/bin/agent-vibes CHANGED Viewed

@@ -1,40 +1,40 @@
 #!/usr/bin/env node
-/**
- * AgentVibes - Beautiful ElevenLabs TTS voice commands for Claude Code
- * This file ensures proper execution when run via npx
- */
-import { execFileSync } from 'node:child_process';
-import path from 'node:path';
-import fs from 'node:fs';
-import { fileURLToPath } from 'node:url';
-const __filename = fileURLToPath(import.meta.url);
-const __dirname = path.dirname(__filename);
-// Check if we're running in an npx temporary directory
-const isNpxExecution = __dirname.includes('_npx') || __dirname.includes('.npm');
-// Get CLI arguments
-const arguments_ = process.argv.slice(2);
-// Route through the TUI console (agentvibes.js) which handles install/config/etc
-const installerPath = path.join(__dirname, 'agentvibes.js');
-if (!fs.existsSync(installerPath)) {
-  console.error('Error: Could not find installer.js at', installerPath);
-  console.error('Current directory:', __dirname);
-  process.exit(1);
-}
-try {
-  // Security: Use execFileSync with array args to prevent command injection
-  // Arguments are passed as array elements, not string interpolation
-  execFileSync('node', [installerPath, ...arguments_], {
-    stdio: 'inherit',
-    cwd: path.dirname(__dirname),
-  });
-} catch (error) {
-  process.exit(error.status || 1);
-}
+/**
+ * AgentVibes - Beautiful ElevenLabs TTS voice commands for Claude Code
+ * This file ensures proper execution when run via npx
+ */
+import { execFileSync } from 'node:child_process';
+import path from 'node:path';
+import fs from 'node:fs';
+import { fileURLToPath } from 'node:url';
+const __filename = fileURLToPath(import.meta.url);
+const __dirname = path.dirname(__filename);
+// Check if we're running in an npx temporary directory
+const isNpxExecution = __dirname.includes('_npx') || __dirname.includes('.npm');
+// Get CLI arguments
+const arguments_ = process.argv.slice(2);
+// Route through the TUI console (agentvibes.js) which handles install/config/etc
+const installerPath = path.join(__dirname, 'agentvibes.js');
+if (!fs.existsSync(installerPath)) {
+  console.error('Error: Could not find installer.js at', installerPath);
+  console.error('Current directory:', __dirname);
+  process.exit(1);
+}
+try {
+  // Security: Use execFileSync with array args to prevent command injection
+  // Arguments are passed as array elements, not string interpolation
+  execFileSync('node', [installerPath, ...arguments_], {
+    stdio: 'inherit',
+    cwd: path.dirname(__dirname),
+  });
+} catch (error) {
+  process.exit(error.status || 1);
+}