agentvibes 2.0.3 → 2.0.6

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,54 @@
1
+ ---
2
+ description: Manage TTS providers (list, switch, info, test)
3
+ argument-hint: [command] [args...]
4
+ ---
5
+
6
+ # Provider Management Commands
7
+
8
+ Manage TTS providers (ElevenLabs, Piper) - switch between providers, view details, and test.
9
+
10
+ ## Usage
11
+
12
+ ```bash
13
+ /agent-vibes:provider list # Show all available providers
14
+ /agent-vibes:provider switch <name> # Switch to a different provider
15
+ /agent-vibes:provider info <name> # Show detailed provider information
16
+ /agent-vibes:provider test # Test current provider
17
+ /agent-vibes:provider get # Show current active provider
18
+ /agent-vibes:provider help # Show this help
19
+ ```
20
+
21
+ ## Examples
22
+
23
+ ```bash
24
+ # List available providers
25
+ /agent-vibes:provider list
26
+
27
+ # Switch to Piper (free, offline)
28
+ /agent-vibes:provider switch piper
29
+
30
+ # Switch to ElevenLabs (premium quality)
31
+ /agent-vibes:provider switch elevenlabs
32
+
33
+ # Get info about a provider
34
+ /agent-vibes:provider info piper
35
+
36
+ # Test current provider
37
+ /agent-vibes:provider test
38
+
39
+ # Show current provider
40
+ /agent-vibes:provider get
41
+ ```
42
+
43
+ ## Provider Comparison
44
+
45
+ | Feature | ElevenLabs | Piper |
46
+ |---------|------------|-------|
47
+ | Quality | ⭐⭐⭐⭐⭐ | ⭐⭐⭐⭐ |
48
+ | Cost | Free tier + $5-22/mo | Free forever |
49
+ | Offline | No | Yes |
50
+ | Platform | All | WSL/Linux only |
51
+
52
+ Learn more: agentvibes.org/providers
53
+
54
+ !bash .claude/hooks/provider-commands.sh $ARGUMENTS
@@ -0,0 +1,133 @@
1
+ #!/bin/bash
2
+ #
3
+ # @fileoverview Piper Voice Model Downloader
4
+ # @context Downloads Piper TTS voice models from HuggingFace
5
+ # @purpose Batch download popular voices after installation
6
+ # @dependencies piper-voice-manager.sh, piper binary
7
+ # @usage ./piper-download-voices.sh [--yes|-y]
8
+ # --yes|-y: Skip confirmation prompt (auto-download)
9
+ #
10
+
11
+ SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
12
+ source "$SCRIPT_DIR/piper-voice-manager.sh"
13
+
14
+ # Parse command line arguments
15
+ AUTO_YES=false
16
+ if [[ "$1" == "--yes" ]] || [[ "$1" == "-y" ]]; then
17
+ AUTO_YES=true
18
+ fi
19
+
20
+ # Common voice models to download
21
+ COMMON_VOICES=(
22
+ "en_US-lessac-medium" # Default, clear male
23
+ "en_US-amy-medium" # Warm female
24
+ "en_US-joe-medium" # Professional male
25
+ "en_US-ryan-high" # Expressive male
26
+ "en_US-libritts-high" # Premium quality
27
+ )
28
+
29
+ echo "🎙️ Piper Voice Model Downloader"
30
+ echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
31
+ echo ""
32
+ echo "This will download the most commonly used Piper voice models."
33
+ echo "Each voice is approximately 25MB."
34
+ echo ""
35
+
36
+ # Check if piper is installed
37
+ if ! command -v piper &> /dev/null; then
38
+ echo "❌ Error: Piper TTS not installed"
39
+ echo "Install with: pipx install piper-tts"
40
+ exit 1
41
+ fi
42
+
43
+ # Get storage directory
44
+ VOICE_DIR=$(get_voice_storage_dir)
45
+
46
+ echo "📂 Storage location: $VOICE_DIR"
47
+ echo ""
48
+
49
+ # Count already downloaded
50
+ ALREADY_DOWNLOADED=0
51
+ ALREADY_DOWNLOADED_LIST=()
52
+ NEED_DOWNLOAD=()
53
+
54
+ for voice in "${COMMON_VOICES[@]}"; do
55
+ if verify_voice "$voice" 2>/dev/null; then
56
+ ((ALREADY_DOWNLOADED++))
57
+ ALREADY_DOWNLOADED_LIST+=("$voice")
58
+ else
59
+ NEED_DOWNLOAD+=("$voice")
60
+ fi
61
+ done
62
+
63
+ echo "📊 Status:"
64
+ echo " Already downloaded: $ALREADY_DOWNLOADED voice(s)"
65
+ echo " Need to download: ${#NEED_DOWNLOAD[@]} voice(s)"
66
+ echo ""
67
+
68
+ # Show already downloaded voices
69
+ if [[ $ALREADY_DOWNLOADED -gt 0 ]]; then
70
+ echo "✅ Already downloaded (skipped):"
71
+ for voice in "${ALREADY_DOWNLOADED_LIST[@]}"; do
72
+ echo " ✓ $voice"
73
+ done
74
+ echo ""
75
+ fi
76
+
77
+ if [[ ${#NEED_DOWNLOAD[@]} -eq 0 ]]; then
78
+ echo "🎉 All common voices ready to use!"
79
+ exit 0
80
+ fi
81
+
82
+ echo "Voices to download:"
83
+ for voice in "${NEED_DOWNLOAD[@]}"; do
84
+ echo " • $voice (~25MB)"
85
+ done
86
+ echo ""
87
+
88
+ # Ask for confirmation (skip if --yes flag provided)
89
+ if [[ "$AUTO_YES" == "false" ]]; then
90
+ read -p "Download ${#NEED_DOWNLOAD[@]} voice model(s)? [Y/n]: " -n 1 -r
91
+ echo
92
+
93
+ if [[ ! $REPLY =~ ^[Yy]$ ]] && [[ -n $REPLY ]]; then
94
+ echo "❌ Download cancelled"
95
+ exit 0
96
+ fi
97
+ else
98
+ echo "Auto-downloading ${#NEED_DOWNLOAD[@]} voice model(s)..."
99
+ echo ""
100
+ fi
101
+
102
+ # Download each voice
103
+ DOWNLOADED=0
104
+ FAILED=0
105
+
106
+ for voice in "${NEED_DOWNLOAD[@]}"; do
107
+ echo ""
108
+ echo "📥 Downloading: $voice..."
109
+
110
+ if download_voice "$voice"; then
111
+ ((DOWNLOADED++))
112
+ echo "✅ Downloaded: $voice"
113
+ else
114
+ ((FAILED++))
115
+ echo "❌ Failed: $voice"
116
+ fi
117
+ done
118
+
119
+ echo ""
120
+ echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
121
+ echo "📊 Download Summary:"
122
+ echo " ✅ Successfully downloaded: $DOWNLOADED"
123
+ echo " ❌ Failed: $FAILED"
124
+ echo " 📦 Total voices available: $((ALREADY_DOWNLOADED + DOWNLOADED))"
125
+ echo ""
126
+
127
+ if [[ $DOWNLOADED -gt 0 ]]; then
128
+ echo "✨ Ready to use Piper TTS with downloaded voices!"
129
+ echo ""
130
+ echo "Try it:"
131
+ echo " /agent-vibes:provider switch piper"
132
+ echo " /agent-vibes:preview"
133
+ fi
@@ -0,0 +1,227 @@
1
+ #!/bin/bash
2
+ #
3
+ # @fileoverview Piper Voice Model Management
4
+ # @context Manages downloading, caching, and validating Piper ONNX voice models
5
+ # @architecture Voice model lifecycle management for Piper provider
6
+ # @dependencies curl, piper binary
7
+ # @entrypoints Sourced by play-tts-piper.sh and provider management commands
8
+ # @patterns HuggingFace model repository integration, file-based caching
9
+ # @related play-tts-piper.sh, provider-manager.sh, GitHub Issue #25
10
+ #
11
+
12
+ # Base URL for Piper voice models on HuggingFace
13
+ PIPER_VOICES_BASE_URL="https://huggingface.co/rhasspy/piper-voices/resolve/main"
14
+
15
+ # @function get_voice_storage_dir
16
+ # @intent Determine directory for storing Piper voice models
17
+ # @why Voice models are large (~25MB each) and should be shared globally across all projects
18
+ # @returns Echoes path to voice storage directory (default: $HOME/.claude/piper-voices)
19
+ # @sideeffects Creates directory if it doesn't exist (mkdir -p runs on every call)
20
+ # @architecture Lookup order: PIPER_VOICES_DIR env var, then a piper-voices-dir.txt config file, then the global default
21
+ get_voice_storage_dir() {
22
+ local voice_dir
23
+
24
+ # An explicit PIPER_VOICES_DIR takes precedence over every config file
25
+ if [[ -n "$PIPER_VOICES_DIR" ]]; then
26
+ voice_dir="$PIPER_VOICES_DIR"
27
+ else
28
+ # Check for config file (project-local first, then global)
29
+ local config_file
30
+ if [[ -n "$CLAUDE_PROJECT_DIR" ]] && [[ -f "$CLAUDE_PROJECT_DIR/.claude/piper-voices-dir.txt" ]]; then
31
+ config_file="$CLAUDE_PROJECT_DIR/.claude/piper-voices-dir.txt"
32
+ else
33
+ # Walk from $PWD up towards / looking for .claude/piper-voices-dir.txt (the loop stops before checking / itself)
34
+ local current_dir="$PWD"
35
+ while [[ "$current_dir" != "/" ]]; do
36
+ if [[ -f "$current_dir/.claude/piper-voices-dir.txt" ]]; then
37
+ config_file="$current_dir/.claude/piper-voices-dir.txt"
38
+ break
39
+ fi
40
+ current_dir=$(dirname "$current_dir")
41
+ done
42
+
43
+ # Check global config (only when the upward search found nothing)
44
+ if [[ -z "$config_file" ]] && [[ -f "$HOME/.claude/piper-voices-dir.txt" ]]; then
45
+ config_file="$HOME/.claude/piper-voices-dir.txt"
46
+ fi
47
+ fi
48
+
49
+ if [[ -n "$config_file" ]]; then
50
+ voice_dir=$(cat "$config_file" | tr -d '[:space:]') # NOTE(review): removes ALL whitespace, including spaces inside the path
51
+ fi
52
+ fi
53
+
54
+ # Fallback to default global storage (also reached when the config file yields an empty value)
55
+ if [[ -z "$voice_dir" ]]; then
56
+ voice_dir="$HOME/.claude/piper-voices"
57
+ fi
58
+
59
+ mkdir -p "$voice_dir"
60
+ echo "$voice_dir"
61
+ }
62
+
63
+ # @function verify_voice
64
+ # @intent Check if voice model files exist locally
65
+ # @why Avoid redundant downloads, detect missing models
66
+ # @param $1 {string} voice_name - Voice model name (e.g., en_US-lessac-medium)
67
+ # @returns None
68
+ # @exitcode 0=both the .onnx and .onnx.json files exist, 1=either file is missing
69
+ # @sideeffects Calls get_voice_storage_dir, which creates the storage directory if it is missing
70
+ verify_voice() {
71
+ local voice_name="$1"
72
+ local voice_dir
73
+ voice_dir=$(get_voice_storage_dir)
74
+
75
+ local onnx_file="$voice_dir/${voice_name}.onnx"
76
+ local json_file="$voice_dir/${voice_name}.onnx.json"
77
+
78
+ [[ -f "$onnx_file" ]] && [[ -f "$json_file" ]] # status of this test is the function's return value
79
+ }
80
+
81
+ # @function get_voice_path
82
+ # @intent Get absolute path to voice model ONNX file
83
+ # @why Piper binary requires full path to model file
84
+ # @param $1 {string} voice_name - Voice model name
85
+ # @returns Echoes path to .onnx file on stdout; the not-found message goes to stderr
86
+ # @exitcode 0=success, 1=voice not found
87
+ # @sideeffects Calls get_voice_storage_dir, which creates the storage directory if it is missing
88
+ get_voice_path() {
89
+ local voice_name="$1"
90
+ local voice_dir
91
+ voice_dir=$(get_voice_storage_dir)
92
+
93
+ local onnx_file="$voice_dir/${voice_name}.onnx"
94
+
95
+ if [[ ! -f "$onnx_file" ]]; then # only the .onnx file is checked here, not the .onnx.json config
96
+ echo "❌ Voice model not found: $voice_name" >&2
97
+ return 1
98
+ fi
99
+
100
+ echo "$onnx_file"
101
+ }
102
+
103
+ # @function parse_voice_components
104
+ # @intent Extract language, locale, speaker, quality from voice name
105
+ # @why HuggingFace uses directory structure: lang/lang_LOCALE/speaker/quality
106
+ # @param $1 {string} voice_name - Voice name (e.g., en_US-lessac-medium)
107
+ # @returns Sets global variables: LANG, LOCALE, SPEAKER, QUALITY
108
+ # @sideeffects Sets global variables. NOTE(review): LANG is also the POSIX locale variable, so the caller's locale setting is overwritten (e.g. with "en") - confirm this is intended
109
+ # AI NOTE: Voice name format is: lang_LOCALE-speaker-quality
110
+ parse_voice_components() {
111
+ local voice_name="$1"
112
+
113
+ # Extract components from voice name
114
+ # Format: en_US-lessac-medium
115
+ # lang_LOCALE-speaker-quality
116
+
117
+ local lang_locale="${voice_name%%-*}" # en_US (everything before the first hyphen)
118
+ local speaker_quality="${voice_name#*-}" # lessac-medium (everything after the first hyphen)
119
+
120
+ LANG="${lang_locale%%_*}" # en
121
+ LOCALE="${lang_locale#*_}" # US
122
+ SPEAKER="${speaker_quality%%-*}" # lessac
123
+ QUALITY="${speaker_quality#*-}" # medium (everything after the speaker's hyphen)
124
+ }
125
+
126
+ # @function download_voice
127
+ # @intent Download Piper voice model from HuggingFace
128
+ # @why Provide free offline TTS voices
129
+ # @param $1 {string} voice_name - Voice model name
130
+ # @param $2 {string} lang_code - Language code (optional, currently unused; components are parsed from voice_name)
131
+ # @returns None
132
+ # @exitcode 0=success, 1=download failed
133
+ # @sideeffects Downloads .onnx and .onnx.json files
134
+ # @edgecases Handles network failures and HTTP errors (curl --fail), rejects empty files, removes partial downloads
135
+ download_voice() {
136
+ local voice_name="$1"
137
+ local lang_code="${2:-}"
138
+
139
+ local voice_dir
140
+ voice_dir=$(get_voice_storage_dir)
141
+
142
+ # Check if already downloaded
143
+ if verify_voice "$voice_name"; then
144
+ echo "✅ Voice already downloaded: $voice_name"
145
+ return 0
146
+ fi
147
+
148
+ # Parse voice components
149
+ parse_voice_components "$voice_name"
150
+
151
+ # Construct download URLs
152
+ # Path format: {language}/{language}_{locale}/{speaker}/{quality}/{voice_name}.onnx
153
+ local model_path="${LANG}/${LANG}_${LOCALE}/${SPEAKER}/${QUALITY}/${voice_name}"
154
+ local onnx_url="${PIPER_VOICES_BASE_URL}/${model_path}.onnx"
155
+ local json_url="${PIPER_VOICES_BASE_URL}/${model_path}.onnx.json"
156
+
157
+ echo "📥 Downloading Piper voice: $voice_name"
158
+ echo " Source: HuggingFace (rhasspy/piper-voices)"
159
+ echo " Size: ~25MB"
160
+ echo ""
161
+
162
+ # Download ONNX model (--fail: an HTTP error page such as a 404 must not be saved as the model)
163
+ echo " Downloading model file..."
164
+ if ! curl -L --fail --progress-bar -o "$voice_dir/${voice_name}.onnx" "$onnx_url"; then
165
+ echo "❌ Failed to download voice model"
166
+ rm -f "$voice_dir/${voice_name}.onnx"
167
+ return 1
168
+ fi
169
+
170
+ # Download JSON config (--fail for the same reason as above)
171
+ echo " Downloading config file..."
172
+ if ! curl -L --fail -s -o "$voice_dir/${voice_name}.onnx.json" "$json_url"; then
173
+ echo "❌ Failed to download voice config"
174
+ rm -f "$voice_dir/${voice_name}.onnx" "$voice_dir/${voice_name}.onnx.json"
175
+ return 1
176
+ fi
177
+
178
+ # Verify file integrity (basic check - both files exist and are non-empty)
179
+ if [[ ! -s "$voice_dir/${voice_name}.onnx" ]] || [[ ! -s "$voice_dir/${voice_name}.onnx.json" ]]; then
180
+ echo "❌ Downloaded file is empty or corrupt"
181
+ rm -f "$voice_dir/${voice_name}.onnx" "$voice_dir/${voice_name}.onnx.json"
182
+ return 1
183
+ fi
184
+
185
+ echo "✅ Voice downloaded successfully: $voice_name"
186
+ echo " Location: $voice_dir/${voice_name}.onnx"
187
+ }
188
+
189
+ # @function list_downloaded_voices
190
+ # @intent Show all locally cached voice models
191
+ # @why Help users see what voices they have available
192
+ # @returns Prints a header, one "name (size)" bullet line per *.onnx file in the storage directory, and a total count
193
+ # @exitcode 0=success
194
+ # @sideeffects Turns nullglob on for the loop and off afterwards (it stays off regardless of the caller's prior setting); get_voice_storage_dir may create the directory
195
+ list_downloaded_voices() {
196
+ local voice_dir
197
+ voice_dir=$(get_voice_storage_dir)
198
+
199
+ echo "📦 Downloaded Piper Voices:"
200
+ echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
201
+
202
+ local count=0
203
+ shopt -s nullglob # with no matches the glob expands to nothing instead of the literal pattern
204
+ for onnx_file in "$voice_dir"/*.onnx; do
205
+ if [[ -f "$onnx_file" ]]; then
206
+ local voice_name
207
+ voice_name=$(basename "$onnx_file" .onnx)
208
+ local file_size
209
+ file_size=$(du -h "$onnx_file" | cut -f1) # first du column is the human-readable size
210
+ echo " • $voice_name ($file_size)"
211
+ ((count++))
212
+ fi
213
+ done
214
+ shopt -u nullglob
215
+
216
+ if [[ $count -eq 0 ]]; then
217
+ echo " (No voices downloaded yet)"
218
+ fi
219
+
220
+ echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
221
+ echo "Total: $count voices"
222
+ }
223
+
224
+ # AI NOTE: This file manages the lifecycle of Piper voice models
225
+ # Voice models are ONNX files (~20-30MB each) downloaded from HuggingFace
226
+ # Files are cached locally to avoid repeated downloads
227
+ # A project-local piper-voices-dir.txt overrides the global one; with no override, models are stored globally in ~/.claude/piper-voices
@@ -0,0 +1,201 @@
1
+ #!/bin/bash
2
+ #
3
+ # @fileoverview ElevenLabs TTS Provider Implementation
4
+ # @context Provider-specific implementation for ElevenLabs API integration
5
+ # @architecture Part of multi-provider TTS system - implements provider interface
6
+ # @dependencies Requires ELEVENLABS_API_KEY, curl, ffmpeg, paplay/aplay/mpg123, jq
7
+ # @entrypoints Called by play-tts.sh router with ($1=text, $2=voice_name)
8
+ # @patterns Follows provider contract: accept text/voice, output audio file path
9
+ # @related play-tts.sh, provider-manager.sh, GitHub Issue #25
10
+ #
11
+
12
+ # Fix locale warnings
13
+ export LC_ALL=C
14
+
15
+ TEXT="$1"
16
+ VOICE_OVERRIDE="$2" # Optional: voice name or direct voice ID
17
+ API_KEY="${ELEVENLABS_API_KEY}"
18
+
19
+ # Check for project-local pretext configuration (prepended only to non-empty text so the missing-text usage check below still fires)
20
+ CONFIG_DIR="${CLAUDE_PROJECT_DIR:-.}/.claude/config"
21
+ CONFIG_FILE="$CONFIG_DIR/agentvibes.json"
22
+
23
+ if [[ -f "$CONFIG_FILE" ]] && command -v jq &> /dev/null; then
24
+ PRETEXT=$(jq -r '.pretext // empty' "$CONFIG_FILE" 2>/dev/null)
25
+ if [[ -n "$PRETEXT" && -n "$TEXT" ]]; then
26
+ TEXT="$PRETEXT: $TEXT"
27
+ fi
28
+ fi
29
+
30
+ # Limit text length to prevent API issues (max 500 chars for safety)
31
+ if [ ${#TEXT} -gt 500 ]; then
32
+ TEXT="${TEXT:0:497}..."
33
+ echo "⚠️ Text truncated to 500 characters for API safety"
34
+ fi
35
+
36
+ # Source the single voice configuration file
37
+ SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
38
+ source "$SCRIPT_DIR/voices-config.sh"
39
+ source "$SCRIPT_DIR/language-manager.sh"
40
+
41
+ # @function determine_voice_and_language
42
+ # @intent Resolve voice name/ID and language for multilingual support
43
+ # @why Supports both voice names and direct IDs, plus language-specific voices
44
+ # @param $VOICE_OVERRIDE {string} Voice name or ID (optional)
45
+ # @returns Sets $VOICE_ID, $VOICE_NAME and $LANGUAGE_CODE global variables
46
+ # @sideeffects Prints the selected voice to stdout; may run voice-manager.sh
47
+ # @edgecases Handles unknown voices, falls back to default; VOICE_NAME is set on every path so the final summary never prints an empty name
48
+ VOICE_ID=""
49
+ LANGUAGE_CODE="en" # Default to English
50
+
51
+ # Get current language setting
52
+ CURRENT_LANGUAGE=$(get_current_language)
53
+
54
+ # Get language code for API
55
+ LANGUAGE_CODE=$(get_language_code_for_name "$CURRENT_LANGUAGE")
56
+ [[ -z "$LANGUAGE_CODE" ]] && LANGUAGE_CODE="en"
57
+
58
+ if [[ -n "$VOICE_OVERRIDE" ]]; then
59
+ # Check if override is a voice name (lookup in mapping)
60
+ if [[ -n "${VOICES[$VOICE_OVERRIDE]}" ]]; then
61
+ VOICE_ID="${VOICES[$VOICE_OVERRIDE]}" VOICE_NAME="$VOICE_OVERRIDE"
62
+ echo "🎤 Using voice: $VOICE_OVERRIDE (session-specific)"
63
+ # Check if override looks like a voice ID (alphanumeric string ~20 chars)
64
+ elif [[ "$VOICE_OVERRIDE" =~ ^[a-zA-Z0-9]{15,30}$ ]]; then
65
+ VOICE_ID="$VOICE_OVERRIDE" VOICE_NAME="custom"
66
+ echo "🎤 Using custom voice ID (session-specific)"
67
+ else
68
+ echo "⚠️ Unknown voice '$VOICE_OVERRIDE', trying language-specific voice"
69
+ fi
70
+ fi
71
+
72
+ # If no override or invalid override, use language-specific voice
73
+ if [[ -z "$VOICE_ID" ]]; then
74
+ # Try to get voice for current language
75
+ LANG_VOICE=$(get_voice_for_language "$CURRENT_LANGUAGE" "elevenlabs" 2>/dev/null)
76
+
77
+ if [[ -n "$LANG_VOICE" ]] && [[ -n "${VOICES[$LANG_VOICE]}" ]]; then
78
+ VOICE_ID="${VOICES[$LANG_VOICE]}" VOICE_NAME="$LANG_VOICE"
79
+ echo "🌍 Using $CURRENT_LANGUAGE voice: $LANG_VOICE"
80
+ else
81
+ # Fall back to voice manager
82
+ VOICE_MANAGER_SCRIPT="$(dirname "$0")/voice-manager.sh"
83
+ if [[ -f "$VOICE_MANAGER_SCRIPT" ]]; then
84
+ VOICE_NAME=$("$VOICE_MANAGER_SCRIPT" get)
85
+ [[ -n "$VOICE_NAME" ]] && VOICE_ID="${VOICES[$VOICE_NAME]}" # an empty key would be a bad array subscript
86
+ fi
87
+
88
+ # Final fallback to default
89
+ if [[ -z "$VOICE_ID" ]]; then
90
+ echo "⚠️ No voice configured, using default"
91
+ VOICE_ID="${VOICES[Aria]}" VOICE_NAME="Aria"
92
+ fi
93
+ fi
94
+ fi
95
+
96
+ # @function validate_inputs
97
+ # @intent Check required parameters and API key
98
+ # @why Fail fast with clear errors if inputs missing
99
+ # @exitcode 1=missing text, 2=missing API key
100
+ if [ -z "$TEXT" ]; then
101
+ echo "Usage: $0 \"text to speak\" [voice_name_or_id]"
102
+ exit 1
103
+ fi
104
+
105
+ if [ -z "$API_KEY" ]; then
106
+ echo "Error: ELEVENLABS_API_KEY not set"
107
+ echo "Set your API key: export ELEVENLABS_API_KEY=your_key_here"
108
+ exit 2
109
+ fi
110
+
111
+ # @function determine_audio_directory
112
+ # @intent Find appropriate directory for audio file storage
113
+ # @why Supports project-local and global storage
114
+ # @returns Sets $AUDIO_DIR global variable
115
+ # @sideeffects None
116
+ # @edgecases Handles missing directories, creates if needed
117
+ # AI NOTE: Check project dir first, then search up tree, finally fall back to global
118
+ if [[ -n "$CLAUDE_PROJECT_DIR" ]]; then
119
+ AUDIO_DIR="$CLAUDE_PROJECT_DIR/.claude/audio"
120
+ else
121
+ # Fallback: try to find .claude directory in current path
122
+ CURRENT_DIR="$PWD"
123
+ while [[ "$CURRENT_DIR" != "/" ]]; do
124
+ if [[ -d "$CURRENT_DIR/.claude" ]]; then
125
+ AUDIO_DIR="$CURRENT_DIR/.claude/audio"
126
+ break
127
+ fi
128
+ CURRENT_DIR=$(dirname "$CURRENT_DIR")
129
+ done
130
+ # Final fallback to global if no project .claude found
131
+ if [[ -z "$AUDIO_DIR" ]]; then
132
+ AUDIO_DIR="$HOME/.claude/audio"
133
+ fi
134
+ fi
135
+
136
+ mkdir -p "$AUDIO_DIR"
137
+ TEMP_FILE="$AUDIO_DIR/tts-$(date +%s).mp3"
138
+
139
+ # @function synthesize_with_elevenlabs
140
+ # @intent Call ElevenLabs API to generate speech
141
+ # @why Encapsulates API call with error handling
142
+ # @param Uses globals: $TEXT, $VOICE_ID, $API_KEY, $LANGUAGE_CODE
143
+ # @returns Creates audio file at $TEMP_FILE (removed again if the request fails)
144
+ # @exitcode 0=success, 3=API error
145
+ # @sideeffects Creates MP3 file in audio directory
146
+ # @edgecases curl --fail turns HTTP errors into a non-zero exit so an API error body is never kept as audio
147
+ # Choose model based on language
148
+ MODEL_ID="eleven_multilingual_v2"
149
+ [[ "$LANGUAGE_CODE" == "en" ]] && MODEL_ID="eleven_monolingual_v1"
150
+ # JSON-escape the text so quotes, backslashes or control characters cannot break the request body
151
+ JSON_TEXT=${TEXT//\\/\\\\}
152
+ JSON_TEXT=${JSON_TEXT//\"/\\\"}
153
+ JSON_TEXT=${JSON_TEXT//$'\n'/\\n}; JSON_TEXT=${JSON_TEXT//$'\r'/\\r}; JSON_TEXT=${JSON_TEXT//$'\t'/\\t}
154
+ curl -s --fail -X POST "https://api.elevenlabs.io/v1/text-to-speech/${VOICE_ID}" \
155
+ -H "xi-api-key: ${API_KEY}" \
156
+ -H "Content-Type: application/json" \
157
+ -d "{\"text\":\"${JSON_TEXT}\",\"model_id\":\"${MODEL_ID}\",\"language_code\":\"${LANGUAGE_CODE}\",\"voice_settings\":{\"stability\":0.5,\"similarity_boost\":0.75}}" \
158
+ -o "${TEMP_FILE}" || rm -f "${TEMP_FILE}"
159
+
160
+ # @function add_silence_padding
161
+ # @intent Add silence to beginning of audio to prevent WSL static
162
+ # @why WSL audio subsystem cuts off first ~200ms, causing static/clipping
163
+ # @param Uses global: $TEMP_FILE
164
+ # @returns Updates $TEMP_FILE to padded version
165
+ # @sideeffects Modifies audio file, removes original
166
+ # @edgecases Gracefully falls back to unpadded if ffmpeg unavailable
167
+ # Add silence padding to prevent WSL audio static
168
+ if [ -f "${TEMP_FILE}" ]; then
169
+ # Check if ffmpeg is available for adding padding
170
+ if command -v ffmpeg &> /dev/null; then
171
+ PADDED_FILE="$AUDIO_DIR/tts-padded-$(date +%s).mp3"
172
+ # Add 200ms of silence at the beginning to prevent static
173
+ ffmpeg -f lavfi -i anullsrc=r=44100:cl=stereo:d=0.2 -i "${TEMP_FILE}" \
174
+ -filter_complex "[0:a][1:a]concat=n=2:v=0:a=1[out]" \
175
+ -map "[out]" -y "${PADDED_FILE}" 2>/dev/null
176
+
177
+ if [ -f "${PADDED_FILE}" ]; then
178
+ # Use padded file and clean up original
179
+ rm -f "${TEMP_FILE}"
180
+ TEMP_FILE="${PADDED_FILE}"
181
+ fi
182
+ # If padding failed, just use original file
183
+ fi
184
+
185
+ # @function play_audio
186
+ # @intent Play generated audio file using available player
187
+ # @why Support multiple audio players (paplay, aplay, mpg123)
188
+ # @param Uses global: $TEMP_FILE
189
+ # @sideeffects Plays audio in background
190
+ # @edgecases Falls through players until one works
191
+ # Play audio (WSL/Linux) in background to avoid blocking
192
+ (paplay "${TEMP_FILE}" 2>/dev/null || aplay "${TEMP_FILE}" 2>/dev/null || mpg123 "${TEMP_FILE}" 2>/dev/null) &
193
+
194
+ # Keep temp files for later review - cleaned up weekly by cron
195
+ echo "🎵 Saved to: ${TEMP_FILE}"
196
+ echo "🎤 Voice used: ${VOICE_NAME} (${VOICE_ID})"
197
+ else
198
+ echo "❌ Failed to generate audio - API may be unavailable"
199
+ echo "Check your API key and network connection"
200
+ exit 3
201
+ fi