agentvibes 5.1.3 → 5.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (34)
  1. package/.agentvibes/config.json +23 -13
  2. package/.claude/commands/agent-vibes/verbosity.md +98 -89
  3. package/.claude/config/audio-effects.cfg +6 -1
  4. package/.claude/hooks/bmad-speak.sh +2 -2
  5. package/.claude/hooks/piper-download-voices.sh +233 -225
  6. package/.claude/hooks/piper-installer.sh +1 -1
  7. package/.claude/hooks/piper-voice-manager.sh +125 -0
  8. package/.claude/hooks/play-tts-agentvibes-receiver-for-voiceless-connections.sh +97 -90
  9. package/.claude/hooks/play-tts-enhanced.sh +1 -1
  10. package/.claude/hooks/play-tts-piper.sh +16 -5
  11. package/.claude/hooks/play-tts-ssh-remote.sh +168 -167
  12. package/.claude/hooks/play-tts.sh +31 -9
  13. package/.claude/hooks/session-start-tts.sh +4 -1
  14. package/.claude/hooks/stop-tts.sh +1 -1
  15. package/.claude/hooks/verbosity-manager.sh +185 -178
  16. package/.claude/hooks-windows/download-extra-voices.ps1 +243 -185
  17. package/.claude/hooks-windows/play-tts-piper.ps1 +7 -2
  18. package/.claude/hooks-windows/play-tts.ps1 +219 -65
  19. package/.claude/hooks-windows/session-start-tts.ps1 +2 -1
  20. package/.claude/hooks-windows/verbosity-manager.ps1 +126 -119
  21. package/README.md +24 -1
  22. package/RELEASE_NOTES.md +113 -0
  23. package/bin/agentvibes-voice-browser.js +1939 -1840
  24. package/mcp-server/server.py +75 -25
  25. package/package.json +1 -1
  26. package/src/console/tabs/receiver-tab.js +1527 -1483
  27. package/src/console/tabs/settings-tab.js +2 -2
  28. package/src/console/tabs/setup-tab.js +122 -20
  29. package/src/console/tabs/voices-tab.js +130 -13
  30. package/src/i18n/en.js +202 -202
  31. package/src/installer.js +29 -25
  32. package/src/services/llm-provider-service.js +114 -11
  33. package/src/services/verbosity-service.js +159 -157
  34. package/templates/agentvibes-receiver.sh +3 -2
@@ -1,225 +1,233 @@
1
- #!/usr/bin/env bash
2
- #
3
- # File: .claude/hooks/piper-download-voices.sh
4
- #
5
- # AgentVibes - Finally, your AI Agents can Talk Back! Text-to-Speech WITH personality for AI Assistants!
6
- # Website: https://agentvibes.org
7
- # Repository: https://github.com/paulpreibisch/AgentVibes
8
- #
9
- # Co-created by Paul Preibisch with Claude AI
10
- # Copyright (c) 2025 Paul Preibisch
11
- #
12
- # Licensed under the Apache License, Version 2.0 (the "License");
13
- # you may not use this file except in compliance with the License.
14
- # You may obtain a copy of the License at
15
- #
16
- # http://www.apache.org/licenses/LICENSE-2.0
17
- #
18
- # Unless required by applicable law or agreed to in writing, software
19
- # distributed under the License is distributed on an "AS IS" BASIS,
20
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
21
- # See the License for the specific language governing permissions and
22
- # limitations under the License.
23
- #
24
- # DISCLAIMER: This software is provided "AS IS", WITHOUT WARRANTY OF ANY KIND,
25
- # express or implied, including but not limited to the warranties of
26
- # merchantability, fitness for a particular purpose and noninfringement.
27
- # In no event shall the authors or copyright holders be liable for any claim,
28
- # damages or other liability, whether in an action of contract, tort or
29
- # otherwise, arising from, out of or in connection with the software or the
30
- # use or other dealings in the software.
31
- #
32
- # ---
33
- #
34
- # @fileoverview Piper Voice Model Downloader - Batch downloads popular Piper TTS voices from HuggingFace
35
- # @context Post-installation utility to download commonly used voices (~25MB each)
36
- # @architecture Wrapper around piper-voice-manager.sh download functions with progress tracking
37
- # @dependencies piper-voice-manager.sh (download logic), piper binary (for validation)
38
- # @entrypoints Called by piper-installer.sh or manually via ./piper-download-voices.sh [--yes|-y]
39
- # @patterns Batch operations, skip-existing logic, auto-yes flag for non-interactive use
40
- # @related piper-voice-manager.sh, piper-installer.sh
41
- #
42
-
43
- # REQUIRED: Bash strict mode for security and reliability (CLAUDE.md)
44
- set -euo pipefail
45
-
46
- SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
47
- source "$SCRIPT_DIR/piper-voice-manager.sh"
48
-
49
- # Parse command line arguments
50
- AUTO_YES=false
51
- if [[ "$1" == "--yes" ]] || [[ "$1" == "-y" ]]; then
52
- AUTO_YES=true
53
- fi
54
-
55
- # Common voice models to download
56
- COMMON_VOICES=(
57
- "en_US-ryan-high" # Default, expressive male (30MB) - BMAD: John (pm)
58
- "en_US-amy-medium" # Warm female (13MB) - BMAD: Mary (analyst)
59
- "en_US-hfc_female-medium" # Professional female (13MB) - BMAD: Amelia (dev)
60
- "en_US-lessac-medium" # Clear female (13MB) - BMAD: Murat (tea) - NOTE: Female voice
61
- "en_US-danny-low" # Calm male (13MB) - BMAD: Winston (architect)
62
- "en_US-bryce-medium" # Professional male (13MB) - BMAD: Bob (sm)
63
- "en_US-kathleen-low" # Clear female (13MB) - BMAD: Paige (tech-writer)
64
- "en_US-kusal-medium" # Male voice (13MB) - BMAD: Saif (frame-expert)
65
- "en_US-kristin-medium" # Female voice (13MB) - BMAD: Sally (ux-designer)
66
- "en_US-libritts_r-medium" # Premium male (57MB) - BMAD: BMad Master (NOTE: Changed from -high to -medium, -high doesn't exist)
67
- "en_US-libritts-high" # Premium quality (57MB)
68
- )
69
-
70
- echo "🎙️ Piper Voice Model Downloader"
71
- echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
72
- echo ""
73
- echo "This will download the most commonly used Piper voice models."
74
- echo "Each voice is approximately 25MB."
75
- echo ""
76
-
77
- # Check if piper is installed
78
- if ! command -v piper &> /dev/null; then
79
- echo "❌ Error: Piper TTS not installed" >&2
80
- echo "Install with: pipx install piper-tts" >&2
81
- exit 1
82
- fi
83
-
84
- # Get storage directory
85
- VOICE_DIR=$(get_voice_storage_dir)
86
-
87
- echo "📂 Storage location: \"$VOICE_DIR\""
88
- echo ""
89
-
90
- # Count already downloaded
91
- ALREADY_DOWNLOADED=0
92
- ALREADY_DOWNLOADED_LIST=()
93
- NEED_DOWNLOAD=()
94
-
95
- for voice in "${COMMON_VOICES[@]}"; do
96
- if verify_voice "$voice" 2>/dev/null; then
97
- ((ALREADY_DOWNLOADED++))
98
- ALREADY_DOWNLOADED_LIST+=("$voice")
99
- else
100
- NEED_DOWNLOAD+=("$voice")
101
- fi
102
- done
103
-
104
- echo "📊 Status:"
105
- echo " Already downloaded: \"$ALREADY_DOWNLOADED\" voice(s)"
106
- echo " Need to download: \"${#NEED_DOWNLOAD[@]}\" voice(s)"
107
- echo ""
108
-
109
- # Show already downloaded voices
110
- if [[ $ALREADY_DOWNLOADED -gt 0 ]]; then
111
- echo "✅ Already downloaded (skipped):"
112
- for voice in "${ALREADY_DOWNLOADED_LIST[@]}"; do
113
- echo " ✓ $voice"
114
- done
115
- echo ""
116
- fi
117
-
118
- if [[ ${#NEED_DOWNLOAD[@]} -eq 0 ]]; then
119
- echo "🎉 All common voices ready to use!"
120
- exit 0
121
- fi
122
-
123
- echo "Voices to download:"
124
- for voice in "${NEED_DOWNLOAD[@]}"; do
125
- echo " • $voice (~25MB)"
126
- done
127
- echo ""
128
-
129
- # Ask for confirmation (skip if --yes flag provided)
130
- if [[ "$AUTO_YES" == "false" ]]; then
131
- read -p "Download ${#NEED_DOWNLOAD[@]} voice model(s)? [Y/n]: " -n 1 -r
132
- echo
133
-
134
- # Validate input is Y, y, N, n, or empty (default to Y)
135
- if [[ ! $REPLY =~ ^[YyNn]?$ ]]; then
136
- echo "❌ Invalid input. Please enter Y or N." >&2
137
- exit 1
138
- fi
139
-
140
- if [[ $REPLY =~ ^[Nn]$ ]]; then
141
- echo "❌ Download cancelled" >&2
142
- exit 0
143
- fi
144
- else
145
- echo "Auto-downloading ${#NEED_DOWNLOAD[@]} voice model(s)..."
146
- echo ""
147
- fi
148
-
149
- # Download each voice
150
- DOWNLOADED=0
151
- FAILED=0
152
-
153
- for voice in "${NEED_DOWNLOAD[@]}"; do
154
- echo ""
155
- echo "📥 Downloading: $voice..."
156
-
157
- if download_voice "$voice"; then
158
- ((DOWNLOADED++))
159
- voice_path="$VOICE_DIR/${voice}.onnx"
160
- file_size=$(du -h "$voice_path" 2>/dev/null | cut -f1)
161
- echo " ✓ Downloaded: $voice"
162
- echo " 📁 Path: $voice_path"
163
- echo " 📦 Size: $file_size"
164
- else
165
- ((FAILED++))
166
- echo " ✗ Failed: $voice"
167
- fi
168
- done
169
-
170
- echo ""
171
- echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
172
- echo "📊 Download Summary:"
173
- echo ""
174
- echo "Installed voices:"
175
- for voice in "${ALREADY_DOWNLOADED_LIST[@]}"; do
176
- voice_path="$VOICE_DIR/${voice}.onnx"
177
- file_size=$(du -h "$voice_path" 2>/dev/null | cut -f1)
178
- echo " ✓ $voice ($file_size)"
179
- echo " $voice_path"
180
- done
181
-
182
- if [[ $DOWNLOADED -gt 0 ]]; then
183
- echo ""
184
- echo "Just downloaded:"
185
- for voice in "${NEED_DOWNLOAD[@]}"; do
186
- voice_path="$VOICE_DIR/${voice}.onnx"
187
- if [[ -f "$voice_path" ]]; then
188
- file_size=$(du -h "$voice_path" 2>/dev/null | cut -f1)
189
- echo " ✓ $voice ($file_size)"
190
- echo " $voice_path"
191
- fi
192
- done
193
- fi
194
-
195
- if [[ $FAILED -gt 0 ]]; then
196
- echo ""
197
- echo "Failed downloads:"
198
- for voice in "${NEED_DOWNLOAD[@]}"; do
199
- voice_path="$VOICE_DIR/${voice}.onnx"
200
- if [[ ! -f "$voice_path" ]]; then
201
- echo " ✗ $voice"
202
- fi
203
- done
204
- fi
205
-
206
- echo ""
207
- echo "Total: $((ALREADY_DOWNLOADED + DOWNLOADED)) voices available"
208
- echo ""
209
-
210
- if [[ $DOWNLOADED -gt 0 ]]; then
211
- echo "✨ Ready to use Piper TTS with downloaded voices!"
212
- echo ""
213
- echo "Try it:"
214
- echo " /agent-vibes:provider switch piper"
215
- echo " /agent-vibes:preview"
216
- fi
217
-
218
- # Exit with error code if any downloads failed (Unix convention)
219
- if [[ $FAILED -gt 0 ]]; then
220
- echo "" >&2
221
- echo "⚠️ Warning: $FAILED download(s) failed. Some voices may not be available." >&2
222
- exit 1
223
- fi
224
-
225
- exit 0
1
+ #!/usr/bin/env bash
2
+ #
3
+ # File: .claude/hooks/piper-download-voices.sh
4
+ #
5
+ # AgentVibes - Finally, your AI Agents can Talk Back! Text-to-Speech WITH personality for AI Assistants!
6
+ # Website: https://agentvibes.org
7
+ # Repository: https://github.com/paulpreibisch/AgentVibes
8
+ #
9
+ # Co-created by Paul Preibisch with Claude AI
10
+ # Copyright (c) 2025 Paul Preibisch
11
+ #
12
+ # Licensed under the Apache License, Version 2.0 (the "License");
13
+ # you may not use this file except in compliance with the License.
14
+ # You may obtain a copy of the License at
15
+ #
16
+ # http://www.apache.org/licenses/LICENSE-2.0
17
+ #
18
+ # Unless required by applicable law or agreed to in writing, software
19
+ # distributed under the License is distributed on an "AS IS" BASIS,
20
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
21
+ # See the License for the specific language governing permissions and
22
+ # limitations under the License.
23
+ #
24
+ # DISCLAIMER: This software is provided "AS IS", WITHOUT WARRANTY OF ANY KIND,
25
+ # express or implied, including but not limited to the warranties of
26
+ # merchantability, fitness for a particular purpose and noninfringement.
27
+ # In no event shall the authors or copyright holders be liable for any claim,
28
+ # damages or other liability, whether in an action of contract, tort or
29
+ # otherwise, arising from, out of or in connection with the software or the
30
+ # use or other dealings in the software.
31
+ #
32
+ # ---
33
+ #
34
+ # @fileoverview Piper Voice Model Downloader - Batch downloads popular Piper TTS voices from HuggingFace
35
+ # @context Post-installation utility to download commonly used voices (~25MB each)
36
+ # @architecture Wrapper around piper-voice-manager.sh download functions with progress tracking
37
+ # @dependencies piper-voice-manager.sh (download logic), piper binary (for validation)
38
+ # @entrypoints Called by piper-installer.sh or manually via ./piper-download-voices.sh [--yes|-y]
39
+ # @patterns Batch operations, skip-existing logic, auto-yes flag for non-interactive use
40
+ # @related piper-voice-manager.sh, piper-installer.sh
41
+ #
42
+
43
+ # REQUIRED: Bash strict mode for security and reliability (CLAUDE.md)
44
+ set -euo pipefail
45
+
46
+ SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
47
+ source "$SCRIPT_DIR/piper-voice-manager.sh"
48
+
49
+ # Parse command line arguments ("${1:-}" avoids an unbound-variable abort under 'set -u' when no flag is passed)
50
+ AUTO_YES=false
51
+ if [[ "${1:-}" == "--yes" ]] || [[ "${1:-}" == "-y" ]]; then
52
+ AUTO_YES=true
53
+ fi
54
+
55
+ # Common voice models to download
56
+ COMMON_VOICES=(
57
+ "en_US-ryan-high" # Default, expressive male (30MB) - BMAD: John (pm)
58
+ "en_US-amy-medium" # Warm female (13MB) - BMAD: Mary (analyst)
59
+ "en_US-hfc_female-medium" # Professional female (13MB) - BMAD: Amelia (dev)
60
+ "en_US-lessac-medium" # Clear female (13MB) - BMAD: Murat (tea) - NOTE: Female voice
61
+ "en_US-danny-low" # Calm male (13MB) - BMAD: Winston (architect)
62
+ "en_US-bryce-medium" # Professional male (13MB) - BMAD: Bob (sm)
63
+ "en_US-kathleen-low" # Clear female (13MB) - BMAD: Paige (tech-writer)
64
+ "en_US-kusal-medium" # Male voice (13MB) - BMAD: Saif (frame-expert)
65
+ "en_US-kristin-medium" # Female voice (13MB) - BMAD: Sally (ux-designer)
66
+ "en_US-libritts_r-medium" # Premium male (57MB) - BMAD: BMad Master (NOTE: Changed from -high to -medium, -high doesn't exist)
67
+ "en_US-libritts-high" # Premium quality (57MB)
68
+ )
69
+
70
+ echo "🎙️ Piper Voice Model Downloader"
71
+ echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
72
+ echo ""
73
+ echo "This will download the most commonly used Piper voice models."
74
+ echo "Each voice is approximately 25MB."
75
+ echo ""
76
+
77
+ # Check if piper is installed
78
+ if ! command -v piper &> /dev/null; then
79
+ echo "❌ Error: Piper TTS not installed" >&2
80
+ echo "Install with: pipx install piper-tts" >&2
81
+ exit 1
82
+ fi
83
+
84
+ # Get storage directory
85
+ VOICE_DIR=$(get_voice_storage_dir)
86
+
87
+ echo "📂 Storage location: \"$VOICE_DIR\""
88
+ echo ""
89
+
90
+ # Count already downloaded voices (plain assignment: '((n++))' returns status 1 when n is 0, which aborts under 'set -e')
91
+ ALREADY_DOWNLOADED=0
92
+ ALREADY_DOWNLOADED_LIST=()
93
+ NEED_DOWNLOAD=()
94
+
95
+ for voice in "${COMMON_VOICES[@]}"; do
96
+ if verify_voice "$voice" 2>/dev/null; then
97
+ ALREADY_DOWNLOADED=$((ALREADY_DOWNLOADED + 1))
98
+ ALREADY_DOWNLOADED_LIST+=("$voice")
99
+ else
100
+ NEED_DOWNLOAD+=("$voice")
101
+ fi
102
+ done
103
+
104
+ echo "📊 Status:"
105
+ echo " Already downloaded: \"$ALREADY_DOWNLOADED\" voice(s)"
106
+ echo " Need to download: \"${#NEED_DOWNLOAD[@]}\" voice(s)"
107
+ echo ""
108
+
109
+ # Show already downloaded voices
110
+ if [[ $ALREADY_DOWNLOADED -gt 0 ]]; then
111
+ echo "✅ Already downloaded (skipped):"
112
+ for voice in "${ALREADY_DOWNLOADED_LIST[@]}"; do
113
+ echo " ✓ $voice"
114
+ done
115
+ echo ""
116
+ fi
117
+
118
+ if [[ ${#NEED_DOWNLOAD[@]} -eq 0 ]]; then
119
+ echo "🎉 All common voices ready to use!"
120
+ exit 0
121
+ fi
122
+
123
+ echo "Voices to download:"
124
+ for voice in "${NEED_DOWNLOAD[@]}"; do
125
+ echo " • $voice (~25MB)"
126
+ done
127
+ echo ""
128
+
129
+ # Ask for confirmation (skip if --yes flag provided)
130
+ if [[ "$AUTO_YES" == "false" ]]; then
131
+ read -p "Download ${#NEED_DOWNLOAD[@]} voice model(s)? [Y/n]: " -n 1 -r
132
+ echo
133
+
134
+ # Validate input is Y, y, N, n, or empty (default to Y)
135
+ if [[ ! $REPLY =~ ^[YyNn]?$ ]]; then
136
+ echo "❌ Invalid input. Please enter Y or N." >&2
137
+ exit 1
138
+ fi
139
+
140
+ if [[ $REPLY =~ ^[Nn]$ ]]; then
141
+ echo "❌ Download cancelled" >&2
142
+ exit 0
143
+ fi
144
+ else
145
+ echo "Auto-downloading ${#NEED_DOWNLOAD[@]} voice model(s)..."
146
+ echo ""
147
+ fi
148
+
149
+ # Download each voice (counters use plain assignment: '((n++))' returns status 1 when n is 0, which aborts under 'set -e')
150
+ DOWNLOADED=0
151
+ FAILED=0
152
+
153
+ for voice in "${NEED_DOWNLOAD[@]}"; do
154
+ echo ""
155
+ echo "📥 Downloading: $voice..."
156
+
157
+ if download_voice "$voice"; then
158
+ DOWNLOADED=$((DOWNLOADED + 1))
159
+ voice_path="$VOICE_DIR/${voice}.onnx"
160
+ file_size=$(du -h "$voice_path" 2>/dev/null | cut -f1)
161
+ echo " ✓ Downloaded: $voice"
162
+ echo " 📁 Path: $voice_path"
163
+ echo " 📦 Size: $file_size"
164
+ else
165
+ FAILED=$((FAILED + 1))
166
+ echo " ✗ Failed: $voice"
167
+ fi
168
+ done
169
+
170
+ # Patch LibriTTS speaker names for any libritts models (existing or just downloaded)
171
+ VOICE_DIR=$(get_voice_storage_dir)
172
+ for voice in "${COMMON_VOICES[@]}"; do
173
+ if [[ "$voice" == *libritts* ]] && [[ -f "$VOICE_DIR/${voice}.onnx.json" ]]; then
174
+ patch_libritts_speaker_names "$VOICE_DIR" "$voice"
175
+ fi
176
+ done
177
+
178
+ echo ""
179
+ echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
180
+ echo "📊 Download Summary:"
181
+ echo ""
182
+ echo "Installed voices:"
183
+ for voice in ${ALREADY_DOWNLOADED_LIST[@]+"${ALREADY_DOWNLOADED_LIST[@]}"}; do # '+' expansion: an empty array is an 'unbound variable' under set -u on bash < 4.4
184
+ voice_path="$VOICE_DIR/${voice}.onnx"
185
+ file_size=$(du -h "$voice_path" 2>/dev/null | cut -f1)
186
+ echo "$voice ($file_size)"
187
+ echo " $voice_path"
188
+ done
189
+
190
+ if [[ $DOWNLOADED -gt 0 ]]; then
191
+ echo ""
192
+ echo "Just downloaded:"
193
+ for voice in "${NEED_DOWNLOAD[@]}"; do
194
+ voice_path="$VOICE_DIR/${voice}.onnx"
195
+ if [[ -f "$voice_path" ]]; then
196
+ file_size=$(du -h "$voice_path" 2>/dev/null | cut -f1)
197
+ echo " $voice ($file_size)"
198
+ echo " $voice_path"
199
+ fi
200
+ done
201
+ fi
202
+
203
+ if [[ $FAILED -gt 0 ]]; then
204
+ echo ""
205
+ echo "Failed downloads:"
206
+ for voice in "${NEED_DOWNLOAD[@]}"; do
207
+ voice_path="$VOICE_DIR/${voice}.onnx"
208
+ if [[ ! -f "$voice_path" ]]; then
209
+ echo " ✗ $voice"
210
+ fi
211
+ done
212
+ fi
213
+
214
+ echo ""
215
+ echo "Total: $((ALREADY_DOWNLOADED + DOWNLOADED)) voices available"
216
+ echo ""
217
+
218
+ if [[ $DOWNLOADED -gt 0 ]]; then
219
+ echo "✨ Ready to use Piper TTS with downloaded voices!"
220
+ echo ""
221
+ echo "Try it:"
222
+ echo " /agent-vibes:provider switch piper"
223
+ echo " /agent-vibes:preview"
224
+ fi
225
+
226
+ # Exit with error code if any downloads failed (Unix convention)
227
+ if [[ $FAILED -gt 0 ]]; then
228
+ echo "" >&2
229
+ echo "⚠️ Warning: $FAILED download(s) failed. Some voices may not be available." >&2
230
+ exit 1
231
+ fi
232
+
233
+ exit 0
@@ -67,7 +67,7 @@ if [[ -d "/data/data/com.termux" ]]; then
67
67
  echo ""
68
68
  SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
69
69
  if [[ -f "$SCRIPT_DIR/termux-installer.sh" ]]; then
70
- exec "$SCRIPT_DIR/termux-installer.sh" "$@"
70
+ exec bash "$SCRIPT_DIR/termux-installer.sh" "$@"
71
71
  else
72
72
  echo "❌ Error: termux-installer.sh not found"
73
73
  echo " Please download it from the AgentVibes repository"
@@ -265,10 +265,135 @@ download_voice() {
265
265
  return 1
266
266
  fi
267
267
 
268
+ # Patch LibriTTS speaker names if this is a libritts model
269
+ if [[ "$voice_name" == *libritts* ]]; then
270
+ patch_libritts_speaker_names "$voice_dir" "$voice_name"
271
+ fi
272
+
268
273
  echo "✅ Voice downloaded successfully: $voice_name"
269
274
  echo " Location: $voice_dir/${voice_name}.onnx"
270
275
  }
271
276
 
277
+ # @function patch_libritts_speaker_names
278
+ # @intent Replace raw corpus IDs (p3922, p8699) with friendly names (Anna, Bella) in LibriTTS .onnx.json
279
+ # @why Users see cryptic "p100Bell" names instead of friendly names without this patch
280
+ # @param $1 {string} voice_dir - Directory containing the .onnx.json file
281
+ # @param $2 {string} voice_name - Voice model name (e.g., en_US-libritts-high)
282
+ # @returns None
283
+ # @exitcode Always 0 (non-fatal)
284
+ # @sideeffects Rewrites speaker_id_map in .onnx.json (as UTF-8) with friendly names from voice-assignments.json
285
+ # @calledby download_voice (for libritts models), piper-download-voices.sh (post-download)
286
+ # @calls python3/node (for JSON manipulation)
287
+ patch_libritts_speaker_names() {
288
+ local voice_dir="$1"
289
+ local voice_name="$2"
290
+ local json_file="$voice_dir/${voice_name}.onnx.json"
291
+
292
+ if [[ ! -f "$json_file" ]]; then
293
+ return 0
294
+ fi
295
+
296
+ # Find voice-assignments.json relative to this script (SCRIPT_DIR/../.. = project root)
297
+ local script_dir
298
+ script_dir="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
299
+ local project_root
300
+ project_root="$(cd "$script_dir/../.." 2>/dev/null && pwd)"
301
+ local catalog="$project_root/voice-assignments.json"
302
+
303
+ # Also check npm global install location
304
+ if [[ ! -f "$catalog" ]]; then
305
+ # Try npm root
306
+ local npm_root
307
+ npm_root="$(npm root -g 2>/dev/null)/agentvibes" || true
308
+ if [[ -f "$npm_root/voice-assignments.json" ]]; then
309
+ catalog="$npm_root/voice-assignments.json"
310
+ fi
311
+ fi
312
+
313
+ if [[ ! -f "$catalog" ]]; then
314
+ return 0
315
+ fi
316
+
317
+ # Patch with python3 when available, otherwise node; each snippet exits early when the first key is not a raw 'p<digits>' ID (already patched)
318
+ if command -v python3 &>/dev/null; then
319
+ python3 -c "
320
+ import json, sys
321
+
322
+ json_path = sys.argv[1]
323
+ catalog_path = sys.argv[2]
324
+
325
+ with open(json_path, 'r', encoding='utf-8') as f:
326
+ data = json.load(f)
327
+
328
+ sid_map = data.get('speaker_id_map', {})
329
+ if not sid_map or data.get('num_speakers', 0) <= 1:
330
+ sys.exit(0)
331
+
332
+ # Check if already patched
333
+ import re
334
+ first_key = next(iter(sid_map))
335
+ if not re.match(r'^p\d+$', first_key):
336
+ sys.exit(0)
337
+
338
+ # Load catalog
339
+ with open(catalog_path, 'r', encoding='utf-8') as f:
340
+ catalog = json.load(f)
341
+
342
+ speakers = catalog.get('libritts_speakers', {})
343
+
344
+ # Build reverse map: index -> p-name
345
+ index_to_p = {v: k for k, v in sid_map.items()}
346
+
347
+ # Rebuild with friendly names; keep the corpus ID when no name exists or the name is already taken
348
+ new_map = {}
349
+ for idx, pname in index_to_p.items():
350
+ friendly = speakers.get(str(idx), {}).get('voice_name')
351
+ new_map[friendly if friendly and friendly not in new_map else pname] = idx
352
+
353
+ data['speaker_id_map'] = new_map
354
+
355
+ with open(json_path, 'w', encoding='utf-8') as f:
356
+ json.dump(data, f, indent=2, ensure_ascii=False)
357
+
358
+ print(' Patched LibriTTS speaker names to friendly names')
359
+ " "$json_file" "$catalog" 2>/dev/null || true
360
+ elif command -v node &>/dev/null; then
361
+ node -e "
362
+ const fs = require('fs');
363
+ // node -e has no script path entry, so process.argv[1] is the first extra argument
364
+
365
+ const jsonPath = process.argv[1];
366
+ const catalogPath = process.argv[2];
367
+
368
+ const data = JSON.parse(fs.readFileSync(jsonPath, 'utf8'));
369
+ const sidMap = data.speaker_id_map || {};
370
+ if (!Object.keys(sidMap).length || (data.num_speakers || 0) <= 1) process.exit(0);
371
+
372
+ // Check if already patched
373
+ const firstKey = Object.keys(sidMap)[0];
374
+ if (!/^p\d+$/.test(firstKey)) process.exit(0);
375
+
376
+ const catalog = JSON.parse(fs.readFileSync(catalogPath, 'utf8'));
377
+ const speakers = catalog.libritts_speakers || {};
378
+
379
+ // Build reverse map
380
+ const indexToP = {};
381
+ for (const [pname, idx] of Object.entries(sidMap)) indexToP[idx] = pname;
382
+
383
+ // Rebuild with friendly names; keep the corpus ID when no name exists or the name is already taken
384
+ const newMap = {};
385
+ for (const [idx, pname] of Object.entries(indexToP)) {
386
+ const friendly = speakers[String(idx)]?.voice_name;
387
+ newMap[friendly && newMap[friendly] === undefined ? friendly : pname] = parseInt(idx, 10);
388
+ }
389
+
390
+ data.speaker_id_map = newMap;
391
+ fs.writeFileSync(jsonPath, JSON.stringify(data, null, 2), 'utf8');
392
+ console.log(' Patched LibriTTS speaker names to friendly names');
393
+ " "$json_file" "$catalog" 2>/dev/null || true
394
+ fi
395
+ }
396
+
272
397
  # @function list_downloaded_voices
273
398
  # @intent Display all locally cached voice models with file sizes
274
399
  # @why Help users see what voices they have available and storage usage