npm - agentvibes - Versions diffs - 5.9.0 → 5.10.1 - Mend

agentvibes 5.9.0 → 5.10.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (145)

package/.agentvibes/config.json +3 -12
package/.claude/commands/agent-vibes-bmad-voices.md +117 -117
package/.claude/commands/agent-vibes-rdp.md +24 -24
package/.claude/config/audio-effects.cfg +4 -5
package/.claude/config/audio-effects.cfg.sample +52 -52
package/.claude/config/background-music-enabled.txt +1 -1
package/.claude/docs/TERMUX_SETUP.md +408 -408
package/.claude/github-star-reminder.txt +1 -1
package/.claude/hooks/audio-cache-utils.sh +0 -0
package/.claude/hooks/audio-processor.sh +0 -0
package/.claude/hooks/background-music-manager.sh +0 -0
package/.claude/hooks/bmad-party-speak.sh +0 -0
package/.claude/hooks/bmad-speak-enhanced.sh +0 -0
package/.claude/hooks/bmad-speak.sh +0 -0
package/.claude/hooks/bmad-tts-injector.sh +0 -0
package/.claude/hooks/bmad-voice-manager.sh +0 -0
package/.claude/hooks/clawdbot-receiver-SECURE.sh +0 -0
package/.claude/hooks/clawdbot-receiver.sh +0 -0
package/.claude/hooks/clean-audio-cache.sh +0 -0
package/.claude/hooks/cleanup-cache.sh +0 -0
package/.claude/hooks/configure-rdp-mode.sh +0 -0
package/.claude/hooks/download-extra-voices.sh +0 -0
package/.claude/hooks/effects-manager.sh +0 -0
package/.claude/hooks/github-star-reminder.sh +0 -0
package/.claude/hooks/language-manager.sh +0 -0
package/.claude/hooks/learn-manager.sh +0 -0
package/.claude/hooks/macos-voice-manager.sh +0 -0
package/.claude/hooks/migrate-background-music.sh +0 -0
package/.claude/hooks/migrate-to-agentvibes.sh +0 -0
package/.claude/hooks/optimize-background-music.sh +0 -0
package/.claude/hooks/path-resolver.sh +0 -0
package/.claude/hooks/personality-manager.sh +0 -0
package/.claude/hooks/piper-download-voices.sh +0 -0
package/.claude/hooks/piper-installer.sh +0 -0
package/.claude/hooks/piper-multispeaker-registry.sh +0 -0
package/.claude/hooks/piper-voice-manager.sh +0 -0
package/.claude/hooks/play-tts-agentvibes-receiver-for-voiceless-connections.sh +0 -0
package/.claude/hooks/play-tts-enhanced.sh +0 -0
package/.claude/hooks/play-tts-macos.sh +0 -0
package/.claude/hooks/play-tts-piper.sh +20 -13
package/.claude/hooks/play-tts-soprano.sh +0 -0
package/.claude/hooks/play-tts-ssh-remote.sh +0 -0
package/.claude/hooks/play-tts-termux-ssh.sh +0 -0
package/.claude/hooks/play-tts-windows-receiver.sh +0 -0
package/.claude/hooks/play-tts.sh +0 -0
package/.claude/hooks/prepare-release.sh +0 -0
package/.claude/hooks/provider-commands.sh +0 -0
package/.claude/hooks/provider-manager.sh +0 -0
package/.claude/hooks/replay-target-audio.sh +0 -0
package/.claude/hooks/requirements.txt +6 -6
package/.claude/hooks/sentiment-manager.sh +0 -0
package/.claude/hooks/session-start-tts.sh +0 -0
package/.claude/hooks/soprano-gradio-synth.py +139 -139
package/.claude/hooks/speed-manager.sh +0 -0
package/.claude/hooks/stop-tts.sh +0 -0
package/.claude/hooks/termux-installer.sh +0 -0
package/.claude/hooks/translate-manager.sh +0 -0
package/.claude/hooks/translator.py +237 -237
package/.claude/hooks/tts-queue-worker.sh +0 -0
package/.claude/hooks/tts-queue.sh +0 -0
package/.claude/hooks/verbosity-manager.sh +0 -0
package/.claude/hooks/voice-manager.sh +6 -0
package/.claude/hooks-windows/play-tts-windows-piper.ps1 +22 -16
package/.claude/hooks-windows/soprano-gradio-synth.py +153 -153
package/.claude/verbosity.txt +1 -1
package/.clawdbot/README.md +105 -105
package/.mcp.json +19 -6
package/README.md +1 -1
package/WINDOWS-SETUP.md +208 -208
package/bin/agent-vibes +39 -39
package/bin/agentvibes-voice-browser.js +0 -0
package/bin/agentvibes.js +0 -0
package/bin/mcp-server.js +121 -121
package/bin/mcp-server.sh +0 -0
package/bin/test-bmad-pr +78 -78
package/mcp-server/QUICK_START.md +203 -203
package/mcp-server/README.md +345 -345
package/mcp-server/WINDOWS_SETUP.md +0 -0
package/mcp-server/examples/claude_desktop_config.json +11 -11
package/mcp-server/examples/claude_desktop_config_piper.json +9 -9
package/mcp-server/examples/custom_instructions.md +169 -169
package/mcp-server/install-deps.js +0 -0
package/mcp-server/server.py +1807 -1797
package/mcp-server/test_server.py +0 -0
package/package.json +2 -2
package/src/cli/list-personalities.js +110 -110
package/src/cli/list-voices.js +114 -114
package/src/commands/bmad-voices.js +394 -394
package/src/commands/install-mcp.js +730 -476
package/src/console/app.js +3 -3
package/src/console/brand-colors.js +13 -13
package/src/console/constants/personalities.js +44 -44
package/src/console/tabs/agents-tab.js +6 -6
package/src/console/tabs/help-tab.js +314 -314
package/src/console/tabs/music-tab.js +1 -1
package/src/console/tabs/readme-tab.js +272 -272
package/src/console/tabs/receiver-tab.js +13 -13
package/src/console/tabs/settings-tab.js +2 -2
package/src/console/tabs/setup-tab.js +10 -10
package/src/console/tabs/voices-tab.js +4 -4
package/src/console/widgets/destroy-list.js +25 -25
package/src/console/widgets/notice.js +55 -55
package/src/console/widgets/personality-picker.js +2 -2
package/src/console/widgets/reverb-picker.js +1 -1
package/src/i18n/de.js +202 -202
package/src/i18n/es.js +202 -202
package/src/i18n/fr.js +202 -202
package/src/i18n/hi.js +202 -202
package/src/i18n/ja.js +202 -202
package/src/i18n/ko.js +202 -202
package/src/i18n/pt.js +202 -202
package/src/i18n/strings.js +54 -54
package/src/i18n/zh-CN.js +202 -202
package/src/installer/language-screen.js +31 -31
package/src/installer/music-file-input.js +304 -304
package/src/installer.js +32 -27
package/src/services/config-service.js +264 -264
package/src/services/language-service.js +47 -47
package/src/services/provider-service.js +143 -143
package/src/services/tts-engine-service.js +2 -2
package/src/utils/audio-duration-validator.js +298 -298
package/src/utils/audio-format-validator.js +277 -277
package/src/utils/dependency-checker.js +469 -469
package/src/utils/file-ownership-verifier.js +358 -358
package/src/utils/list-formatter.js +200 -194
package/src/utils/music-file-validator.js +285 -285
package/src/utils/platform-resolver.js +369 -0
package/src/utils/preview-list-prompt.js +136 -136
package/src/utils/provider-validator.js +9 -9
package/src/utils/secure-music-storage.js +412 -412
package/templates/agentvibes-receiver.sh +231 -231
package/templates/audio/welcome-music.mp3 +0 -0
package/.agentvibes/install-manifest.json +0 -330
package/.claude/config/background-music-position.txt +0 -27
package/.claude/config/background-music-volume.txt +0 -1
package/.claude/config/background-music.cfg +0 -1
package/.claude/config/background-music.txt +0 -1
package/.claude/config/language.txt +0 -1
package/.claude/config/reverb-level.txt +0 -1
package/.claude/config/tts-speech-rate.txt +0 -1
package/.claude/config/tts-verbosity.txt +0 -1
package/.claude/hooks/play-tts-agentvibes-receiver.sh +0 -1
package/.claude/hooks-windows/audio-cache-utils.ps1.user.bak +0 -119
package/.claude/hooks-windows/soprano-gradio-synth.py.user.bak +0 -153
package/.claude/piper-voices-dir.txt +0 -1

package/.claude/github-star-reminder.txt CHANGED Viewed

	@@ -1 +1 @@
1	- 20260516
1	+ 20260525

package/.claude/hooks/audio-cache-utils.sh CHANGED Viewed

File without changes

package/.claude/hooks/audio-processor.sh CHANGED Viewed

File without changes

package/.claude/hooks/background-music-manager.sh CHANGED Viewed

File without changes

package/.claude/hooks/bmad-party-speak.sh CHANGED Viewed

File without changes

package/.claude/hooks/bmad-speak-enhanced.sh CHANGED Viewed

File without changes

package/.claude/hooks/bmad-speak.sh CHANGED Viewed

File without changes

package/.claude/hooks/bmad-tts-injector.sh CHANGED Viewed

File without changes

package/.claude/hooks/bmad-voice-manager.sh CHANGED Viewed

File without changes

package/.claude/hooks/clawdbot-receiver-SECURE.sh CHANGED Viewed

File without changes

package/.claude/hooks/clawdbot-receiver.sh CHANGED Viewed

File without changes

package/.claude/hooks/clean-audio-cache.sh CHANGED Viewed

File without changes

package/.claude/hooks/cleanup-cache.sh CHANGED Viewed

File without changes

package/.claude/hooks/configure-rdp-mode.sh CHANGED Viewed

File without changes

package/.claude/hooks/download-extra-voices.sh CHANGED Viewed

File without changes

package/.claude/hooks/effects-manager.sh CHANGED Viewed

File without changes

package/.claude/hooks/github-star-reminder.sh CHANGED Viewed

File without changes

package/.claude/hooks/language-manager.sh CHANGED Viewed

File without changes

package/.claude/hooks/learn-manager.sh CHANGED Viewed

File without changes

package/.claude/hooks/macos-voice-manager.sh CHANGED Viewed

File without changes

package/.claude/hooks/migrate-background-music.sh CHANGED Viewed

File without changes

package/.claude/hooks/migrate-to-agentvibes.sh CHANGED Viewed

File without changes

package/.claude/hooks/optimize-background-music.sh CHANGED Viewed

File without changes

package/.claude/hooks/path-resolver.sh CHANGED Viewed

File without changes

package/.claude/hooks/personality-manager.sh CHANGED Viewed

File without changes

package/.claude/hooks/piper-download-voices.sh CHANGED Viewed

File without changes

package/.claude/hooks/piper-installer.sh CHANGED Viewed

File without changes

package/.claude/hooks/piper-multispeaker-registry.sh CHANGED Viewed

File without changes

package/.claude/hooks/piper-voice-manager.sh CHANGED Viewed

File without changes

package/.claude/hooks/play-tts-agentvibes-receiver-for-voiceless-connections.sh CHANGED Viewed

File without changes

package/.claude/hooks/play-tts-enhanced.sh CHANGED Viewed

File without changes

package/.claude/hooks/play-tts-macos.sh CHANGED Viewed

File without changes

package/.claude/hooks/play-tts-piper.sh CHANGED Viewed

@@ -73,10 +73,8 @@ TEXT=$(printf '%s' "$TEXT" | perl -CSD -pe '
   s/^\s*[-]\s*//g;                # list dashes
 ')
-# Source voice manager and language manager
-# Use readlink -f to handle symlinks correctly
-SCRIPT_PATH="$(readlink -f "${BASH_SOURCE[0]}")"
-SCRIPT_DIR="$(dirname "$SCRIPT_PATH")"
+# cd-based resolution works on macOS (BSD readlink lacks -f) and Linux alike
+SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd -P)"
 source "$SCRIPT_DIR/piper-voice-manager.sh"
 source "$SCRIPT_DIR/language-manager.sh"
 source "$SCRIPT_DIR/audio-cache-utils.sh"
@@ -226,11 +224,19 @@ if [[ -z "$TEXT" ]]; then
 fi
 # Augment PATH for non-interactive shells (pipx installs to ~/.local/bin which
-# interactive shells get via .bashrc/.zshrc, but Bash tool calls skip profile)
+# interactive shells get via .bashrc/.zshrc, but Bash tool calls skip profile).
+# Mac: add both Apple Silicon (/opt/homebrew) and Intel (/usr/local) Homebrew locations.
 export PATH="$HOME/.local/bin:$HOME/.local/share/pipx/venvs/piper-tts/bin:$PATH"
+if [[ "$(uname -s 2>/dev/null)" == "Darwin" ]]; then
+  export PATH="/opt/homebrew/bin:/usr/local/bin:$PATH"
+fi
+# Resolve explicit piper binary path — avoids bare `piper` invocation failing when
+# PATH augmentation above hasn't propagated into nested subshells.
+PIPER_BIN=$(command -v piper 2>/dev/null || echo "")
 # Check if Piper is installed
-if ! command -v piper &> /dev/null; then
+if [[ -z "$PIPER_BIN" ]]; then
   echo "❌ Error: Piper TTS not installed"
   echo "Install with: pipx install piper-tts"
   echo "Or run: .claude/hooks/piper-installer.sh"
@@ -309,6 +315,8 @@ else
 fi
 mkdir -p "$AUDIO_DIR"
+# Normalize to canonical path (handles Git Bash /tmp→/c/Users/..., macOS /var→/private/var)
+AUDIO_DIR=$(cd "$AUDIO_DIR" && pwd -P)
 _tmp=$(mktemp "$AUDIO_DIR/tts-XXXXXX"); TEMP_FILE="${_tmp}.wav"; mv "$_tmp" "$TEMP_FILE"
 # @function get_speech_rate
@@ -380,6 +388,10 @@ get_speech_rate() {
 SPEECH_RATE=$(get_speech_rate)
+# Ensure piper log directory exists so stderr redirect never silently fails
+_PIPER_LOG_DIR="${AGENTVIBES_LOG_DIR:-$HOME/.local/state/agentvibes/logs}"
+mkdir -p "$_PIPER_LOG_DIR" 2>/dev/null || true
 # @function synthesize_with_piper
 # @intent Generate speech using Piper TTS
 # @why Provides free, offline TTS alternative
@@ -391,10 +403,10 @@ SPEECH_RATE=$(get_speech_rate)
 if [[ -n "${SPEAKER_ID:-}" ]]; then
   # Multi-speaker voice: Pass speaker ID
   # SECURITY: Use printf instead of echo for pipe safety (#134)
-  printf '%s\n' "$TEXT" | piper --model "$VOICE_PATH" --speaker "$SPEAKER_ID" --length-scale "$SPEECH_RATE" --sentence-silence 2.0 --output_file "$TEMP_FILE" 2>/dev/null
+  printf '%s\n' "$TEXT" | "$PIPER_BIN" --model "$VOICE_PATH" --speaker "$SPEAKER_ID" --length-scale "$SPEECH_RATE" --sentence-silence 2.0 --output_file "$TEMP_FILE" 2>>"$_PIPER_LOG_DIR/piper.log"
 else
   # Single-speaker voice
-  printf '%s\n' "$TEXT" | piper --model "$VOICE_PATH" --length-scale "$SPEECH_RATE" --sentence-silence 2.0 --output_file "$TEMP_FILE" 2>/dev/null
+  printf '%s\n' "$TEXT" | "$PIPER_BIN" --model "$VOICE_PATH" --length-scale "$SPEECH_RATE" --sentence-silence 2.0 --output_file "$TEMP_FILE" 2>>"$_PIPER_LOG_DIR/piper.log"
 fi
 if [[ ! -f "$TEMP_FILE" ]] || [[ ! -s "$TEMP_FILE" ]]; then
@@ -538,11 +550,6 @@ AUDIO_DIR="${TEMP_FILE%/*}"
 WRITE_LOCK_FILE="$AUDIO_DIR/$(basename "$TEMP_FILE" .wav).lock"
 touch "$WRITE_LOCK_FILE"
-# Get audio duration for proper lock timing
-DURATION=$(ffprobe -v error -show_entries format=duration -of default=noprint_wrappers=1:nokey=1 "$TEMP_FILE" 2>/dev/null)
-DURATION=${DURATION%.*}  # Round to integer
-DURATION=${DURATION:-1}   # Default to 1 second if detection fails
 # Get audio duration for proper lock timing
 DURATION=$(ffprobe -v error -show_entries format=duration -of default=noprint_wrappers=1:nokey=1 "$TEMP_FILE" 2>/dev/null || true)
 DURATION=${DURATION%.*}  # Round to integer

package/.claude/hooks/play-tts-soprano.sh CHANGED Viewed

File without changes

package/.claude/hooks/play-tts-ssh-remote.sh CHANGED Viewed

File without changes

package/.claude/hooks/play-tts-termux-ssh.sh CHANGED Viewed

File without changes

package/.claude/hooks/play-tts-windows-receiver.sh CHANGED Viewed

File without changes

package/.claude/hooks/play-tts.sh CHANGED Viewed

File without changes

package/.claude/hooks/prepare-release.sh CHANGED Viewed

File without changes

package/.claude/hooks/provider-commands.sh CHANGED Viewed

File without changes

package/.claude/hooks/provider-manager.sh CHANGED Viewed

File without changes

package/.claude/hooks/replay-target-audio.sh CHANGED Viewed

File without changes

package/.claude/hooks/requirements.txt CHANGED Viewed

@@ -1,6 +1,6 @@
-# AgentVibes TTS Hooks Requirements
-# Install with: pip install -r requirements.txt
-# Translation support for multi-language TTS and learning mode
-deep-translator>=1.11.4
-langdetect>=1.0.9
+# AgentVibes TTS Hooks Requirements
+# Install with: pip install -r requirements.txt
+# Translation support for multi-language TTS and learning mode
+deep-translator>=1.11.4
+langdetect>=1.0.9

package/.claude/hooks/sentiment-manager.sh CHANGED Viewed

File without changes

package/.claude/hooks/session-start-tts.sh CHANGED Viewed

File without changes

package/.claude/hooks/soprano-gradio-synth.py CHANGED Viewed

@@ -1,139 +1,139 @@
-#!/usr/bin/env python3
-#
-# File: .claude/hooks/soprano-gradio-synth.py
-#
-# AgentVibes - Finally, your AI Agents can Talk Back!
-# Website: https://agentvibes.org
-# Repository: https://github.com/paulpreibisch/AgentVibes
-#
-# Co-created by Paul Preibisch with Claude AI
-# Copyright (c) 2025 Paul Preibisch
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-#
-# ---
-#
-# Soprano Gradio WebUI synthesizer helper.
-# Calls the Soprano WebUI's Gradio API and saves the result as a WAV file.
-# Uses only Python stdlib (json, sys, urllib) — no extra dependencies.
-#
-# Usage: python3 soprano-gradio-synth.py "text to speak" output.wav [port]
-#
-"""
-Soprano Gradio WebUI synthesizer helper for AgentVibes.
-Calls the Soprano WebUI's Gradio API via the Server-Sent Events (SSE) protocol
-and downloads the generated audio as a WAV file.
-Flow:
-  1. Submit generation request → get event_id
-  2. Poll SSE stream for audio file URL
-  3. Download WAV file to output path
-See: https://github.com/ekwek1/soprano
-"""
-import json
-import sys
-import urllib.request
-import urllib.error
-def synth(text: str, output_path: str, port: int = 7860) -> None:
-    base = f"http://127.0.0.1:{port}"
-    # Step 1: Submit generation request
-    # Args: text, temperature, top_p, repetition_penalty, chunk_size, streaming
-    payload = json.dumps({
-        "data": [text, 0.0, 0.95, 1.2, 1, False]
-    }).encode()
-    event_id = submit_request(base, payload)
-    # Step 2: Poll SSE stream for audio file URL
-    audio_url = poll_for_result(base, event_id)
-    # Step 3: Download the audio file
-    download_file(audio_url, output_path)
-def submit_request(base: str, payload: bytes) -> str:
-    """Submit generation request to Gradio API, return event_id."""
-    for api_base in ["/gradio_api/call", "/call"]:
-        url = f"{base}{api_base}/generate_speech"
-        req = urllib.request.Request(
-            url,
-            data=payload,
-            headers={"Content-Type": "application/json"},
-        )
-        try:
-            with urllib.request.urlopen(req, timeout=30) as resp:
-                return json.loads(resp.read())["event_id"]
-        except urllib.error.URLError:
-            continue
-    raise RuntimeError("Could not reach Soprano WebUI API")
-def poll_for_result(base: str, event_id: str) -> str:
-    """Poll SSE endpoint until audio file URL is returned."""
-    for api_base in ["/gradio_api/call", "/call"]:
-        url = f"{base}{api_base}/generate_speech/{event_id}"
-        req = urllib.request.Request(url)
-        try:
-            with urllib.request.urlopen(req, timeout=120) as resp:
-                for raw_line in resp:
-                    line = raw_line.decode("utf-8", errors="replace").strip()
-                    if not line.startswith("data: "):
-                        continue
-                    try:
-                        parsed = json.loads(line[6:])
-                    except json.JSONDecodeError:
-                        continue
-                    # Response format: [{"path": "...", "url": "...", ...}, "status string"]
-                    if isinstance(parsed, list) and len(parsed) >= 1:
-                        audio = parsed[0]
-                        if isinstance(audio, dict) and "url" in audio:
-                            return audio["url"]
-            break
-        except urllib.error.URLError:
-            continue
-    raise RuntimeError("No audio URL in Soprano response")
-def download_file(url: str, output_path: str) -> None:
-    """Download audio file from Gradio file server."""
-    req = urllib.request.Request(url)
-    with urllib.request.urlopen(req, timeout=30) as resp:
-        with open(output_path, "wb") as f:
-            while True:
-                chunk = resp.read(8192)
-                if not chunk:
-                    break
-                f.write(chunk)
-if __name__ == "__main__":
-    if len(sys.argv) < 3:
-        print(f"Usage: {sys.argv[0]} \"text\" output.wav [port]", file=sys.stderr)
-        sys.exit(1)
-    text = sys.argv[1]
-    output = sys.argv[2]
-    port = int(sys.argv[3]) if len(sys.argv) > 3 else 7860
-    try:
-        synth(text, output, port)
-    except Exception as e:
-        print(f"Error: {e}", file=sys.stderr)
-        sys.exit(1)
+#!/usr/bin/env python3
+#
+# File: .claude/hooks/soprano-gradio-synth.py
+#
+# AgentVibes - Finally, your AI Agents can Talk Back!
+# Website: https://agentvibes.org
+# Repository: https://github.com/paulpreibisch/AgentVibes
+#
+# Co-created by Paul Preibisch with Claude AI
+# Copyright (c) 2025 Paul Preibisch
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+# ---
+#
+# Soprano Gradio WebUI synthesizer helper.
+# Calls the Soprano WebUI's Gradio API and saves the result as a WAV file.
+# Uses only Python stdlib (json, sys, urllib) — no extra dependencies.
+#
+# Usage: python3 soprano-gradio-synth.py "text to speak" output.wav [port]
+#
+"""
+Soprano Gradio WebUI synthesizer helper for AgentVibes.
+Calls the Soprano WebUI's Gradio API via the Server-Sent Events (SSE) protocol
+and downloads the generated audio as a WAV file.
+Flow:
+  1. Submit generation request → get event_id
+  2. Poll SSE stream for audio file URL
+  3. Download WAV file to output path
+See: https://github.com/ekwek1/soprano
+"""
+import json
+import sys
+import urllib.request
+import urllib.error
+def synth(text: str, output_path: str, port: int = 7860) -> None:
+    base = f"http://127.0.0.1:{port}"
+    # Step 1: Submit generation request
+    # Args: text, temperature, top_p, repetition_penalty, chunk_size, streaming
+    payload = json.dumps({
+        "data": [text, 0.0, 0.95, 1.2, 1, False]
+    }).encode()
+    event_id = submit_request(base, payload)
+    # Step 2: Poll SSE stream for audio file URL
+    audio_url = poll_for_result(base, event_id)
+    # Step 3: Download the audio file
+    download_file(audio_url, output_path)
+def submit_request(base: str, payload: bytes) -> str:
+    """Submit generation request to Gradio API, return event_id."""
+    for api_base in ["/gradio_api/call", "/call"]:
+        url = f"{base}{api_base}/generate_speech"
+        req = urllib.request.Request(
+            url,
+            data=payload,
+            headers={"Content-Type": "application/json"},
+        )
+        try:
+            with urllib.request.urlopen(req, timeout=30) as resp:
+                return json.loads(resp.read())["event_id"]
+        except urllib.error.URLError:
+            continue
+    raise RuntimeError("Could not reach Soprano WebUI API")
+def poll_for_result(base: str, event_id: str) -> str:
+    """Poll SSE endpoint until audio file URL is returned."""
+    for api_base in ["/gradio_api/call", "/call"]:
+        url = f"{base}{api_base}/generate_speech/{event_id}"
+        req = urllib.request.Request(url)
+        try:
+            with urllib.request.urlopen(req, timeout=120) as resp:
+                for raw_line in resp:
+                    line = raw_line.decode("utf-8", errors="replace").strip()
+                    if not line.startswith("data: "):
+                        continue
+                    try:
+                        parsed = json.loads(line[6:])
+                    except json.JSONDecodeError:
+                        continue
+                    # Response format: [{"path": "...", "url": "...", ...}, "status string"]
+                    if isinstance(parsed, list) and len(parsed) >= 1:
+                        audio = parsed[0]
+                        if isinstance(audio, dict) and "url" in audio:
+                            return audio["url"]
+            break
+        except urllib.error.URLError:
+            continue
+    raise RuntimeError("No audio URL in Soprano response")
+def download_file(url: str, output_path: str) -> None:
+    """Download audio file from Gradio file server."""
+    req = urllib.request.Request(url)
+    with urllib.request.urlopen(req, timeout=30) as resp:
+        with open(output_path, "wb") as f:
+            while True:
+                chunk = resp.read(8192)
+                if not chunk:
+                    break
+                f.write(chunk)
+if __name__ == "__main__":
+    if len(sys.argv) < 3:
+        print(f"Usage: {sys.argv[0]} \"text\" output.wav [port]", file=sys.stderr)
+        sys.exit(1)
+    text = sys.argv[1]
+    output = sys.argv[2]
+    port = int(sys.argv[3]) if len(sys.argv) > 3 else 7860
+    try:
+        synth(text, output, port)
+    except Exception as e:
+        print(f"Error: {e}", file=sys.stderr)
+        sys.exit(1)

package/.claude/hooks/speed-manager.sh CHANGED Viewed

File without changes

package/.claude/hooks/stop-tts.sh CHANGED Viewed

File without changes

package/.claude/hooks/termux-installer.sh CHANGED Viewed

File without changes

package/.claude/hooks/translate-manager.sh CHANGED Viewed

File without changes