agentvibes 5.2.1 → 5.4.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (222) hide show
  1. package/.agentvibes/LITE-MODE.md +236 -0
  2. package/.agentvibes/README.md +136 -0
  3. package/.agentvibes/backup/session-start-tts.sh.20251210_212814 +141 -0
  4. package/.agentvibes/backups/agents/analyst_20260204_144958.md +78 -0
  5. package/.agentvibes/backups/agents/architect_20260204_144958.md +72 -0
  6. package/.agentvibes/backups/agents/dev_20260204_144958.md +74 -0
  7. package/.agentvibes/backups/agents/pm_20260204_144958.md +72 -0
  8. package/.agentvibes/backups/agents/quick-flow-solo-dev_20260204_144958.md +64 -0
  9. package/.agentvibes/backups/agents/sm_20260204_144958.md +87 -0
  10. package/.agentvibes/backups/agents/tea_20260204_144958.md +79 -0
  11. package/.agentvibes/backups/agents/tech-writer_20260204_144958.md +82 -0
  12. package/.agentvibes/backups/agents/ux-designer_20260204_144958.md +80 -0
  13. package/.agentvibes/bmad/bmad-voices.md +69 -69
  14. package/.agentvibes/config/README-personality-defaults.md +162 -0
  15. package/.agentvibes/config/mode.txt +1 -0
  16. package/.agentvibes/config/personality-voice-defaults.default.json +21 -0
  17. package/.agentvibes/config/save-audio.txt +1 -0
  18. package/.agentvibes/config/voice-metadata.json +160 -0
  19. package/.agentvibes/config.json +24 -15
  20. package/.agentvibes/hooks/help.sh +191 -0
  21. package/.agentvibes/hooks/post-tool-use-lite.sh +111 -0
  22. package/.agentvibes/hooks/save-audio-manager.sh +162 -0
  23. package/.agentvibes/hooks/session-start-full-optimized.sh +102 -0
  24. package/.agentvibes/hooks/session-start-full.sh +142 -0
  25. package/.agentvibes/hooks/session-start-lite-v2.sh +34 -0
  26. package/.agentvibes/hooks/session-start-lite.sh +29 -0
  27. package/.agentvibes/hooks/stop-lite.sh +115 -0
  28. package/.agentvibes/hooks/switch-mode.sh +215 -0
  29. package/.agentvibes/output-styles/audio-summary.md +30 -0
  30. package/.claude/activation-instructions +54 -54
  31. package/.claude/audio/voice-samples/piper/alan.wav +0 -0
  32. package/.claude/audio/voice-samples/piper/amy.wav +0 -0
  33. package/.claude/audio/voice-samples/piper/charlotte.wav +0 -0
  34. package/.claude/audio/voice-samples/piper/joe.wav +0 -0
  35. package/.claude/audio/voice-samples/piper/john.wav +0 -0
  36. package/.claude/audio/voice-samples/piper/katherine.wav +0 -0
  37. package/.claude/audio/voice-samples/piper/kristin.wav +0 -0
  38. package/.claude/audio/voice-samples/piper/linda.wav +0 -0
  39. package/.claude/audio/voice-samples/piper/marcus.wav +0 -0
  40. package/.claude/audio/voice-samples/piper/ryan.wav +0 -0
  41. package/.claude/commands/agent-vibes/add.md +21 -21
  42. package/.claude/commands/agent-vibes/agent-vibes.md +101 -101
  43. package/.claude/commands/agent-vibes/agent.md +79 -79
  44. package/.claude/commands/agent-vibes/background-music.md +111 -111
  45. package/.claude/commands/agent-vibes/bmad.md +198 -198
  46. package/.claude/commands/agent-vibes/clean.md +18 -18
  47. package/.claude/commands/agent-vibes/cleanup.md +18 -18
  48. package/.claude/commands/agent-vibes/commands.json +145 -145
  49. package/.claude/commands/agent-vibes/effects.md +97 -97
  50. package/.claude/commands/agent-vibes/get.md +9 -9
  51. package/.claude/commands/agent-vibes/hide.md +91 -91
  52. package/.claude/commands/agent-vibes/language.md +23 -23
  53. package/.claude/commands/agent-vibes/learn.md +67 -67
  54. package/.claude/commands/agent-vibes/list.md +13 -13
  55. package/.claude/commands/agent-vibes/mute.md +37 -37
  56. package/.claude/commands/agent-vibes/preview.md +17 -17
  57. package/.claude/commands/agent-vibes/provider.md +68 -68
  58. package/.claude/commands/agent-vibes/replay-target.md +14 -14
  59. package/.claude/commands/agent-vibes/sample.md +12 -12
  60. package/.claude/commands/agent-vibes/set-favorite-voice.md +84 -84
  61. package/.claude/commands/agent-vibes/set-pretext.md +65 -65
  62. package/.claude/commands/agent-vibes/set-speed.md +41 -41
  63. package/.claude/commands/agent-vibes/show.md +84 -84
  64. package/.claude/commands/agent-vibes/switch.md +87 -87
  65. package/.claude/commands/agent-vibes/target-voice.md +26 -26
  66. package/.claude/commands/agent-vibes/target.md +30 -30
  67. package/.claude/commands/agent-vibes/translate.md +68 -68
  68. package/.claude/commands/agent-vibes/unmute.md +45 -45
  69. package/.claude/commands/agent-vibes/whoami.md +7 -7
  70. package/.claude/commands/agent-vibes-bmad-voices.md +117 -117
  71. package/.claude/commands/agent-vibes-rdp.md +24 -24
  72. package/.claude/config/audio-effects.cfg +4 -11
  73. package/.claude/config/audio-effects.cfg.sample +52 -52
  74. package/.claude/config/background-music-position.txt +27 -0
  75. package/.claude/config/background-music-volume.txt +1 -1
  76. package/.claude/config/background-music.cfg +1 -0
  77. package/.claude/config/background-music.txt +1 -0
  78. package/.claude/config/tts-speech-rate.txt +1 -4
  79. package/.claude/config/tts-verbosity.txt +1 -0
  80. package/.claude/docs/TERMUX_SETUP.md +408 -408
  81. package/.claude/github-star-reminder.txt +1 -1
  82. package/.claude/hooks/README-TTS-QUEUE.md +135 -135
  83. package/.claude/hooks/audio-cache-utils.sh +0 -0
  84. package/.claude/hooks/audio-processor.sh +60 -14
  85. package/.claude/hooks/background-music-manager.sh +0 -0
  86. package/.claude/hooks/bmad-party-manager.sh +225 -0
  87. package/.claude/hooks/bmad-speak-enhanced.sh +0 -0
  88. package/.claude/hooks/bmad-speak.sh +6 -13
  89. package/.claude/hooks/bmad-tts-injector.sh +0 -0
  90. package/.claude/hooks/bmad-voice-manager.sh +0 -0
  91. package/.claude/hooks/clawdbot-receiver-SECURE.sh +25 -23
  92. package/.claude/hooks/clawdbot-receiver.sh +4 -28
  93. package/.claude/hooks/clean-audio-cache.sh +0 -0
  94. package/.claude/hooks/cleanup-cache.sh +0 -0
  95. package/.claude/hooks/configure-rdp-mode.sh +0 -0
  96. package/.claude/hooks/download-extra-voices.sh +0 -0
  97. package/.claude/hooks/effects-manager.sh +0 -0
  98. package/.claude/hooks/github-star-reminder.sh +0 -0
  99. package/.claude/hooks/language-manager.sh +0 -0
  100. package/.claude/hooks/learn-manager.sh +0 -0
  101. package/.claude/hooks/macos-voice-manager.sh +0 -0
  102. package/.claude/hooks/migrate-background-music.sh +0 -0
  103. package/.claude/hooks/migrate-to-agentvibes.sh +0 -0
  104. package/.claude/hooks/optimize-background-music.sh +0 -0
  105. package/.claude/hooks/personality-manager.sh +0 -0
  106. package/.claude/hooks/piper-download-voices.sh +0 -0
  107. package/.claude/hooks/piper-installer.sh +1 -1
  108. package/.claude/hooks/piper-multispeaker-registry.sh +0 -0
  109. package/.claude/hooks/piper-voice-manager.sh +0 -0
  110. package/.claude/hooks/play-tts-enhanced.sh +0 -0
  111. package/.claude/hooks/play-tts-macos.sh +6 -12
  112. package/.claude/hooks/play-tts-piper.sh +50 -79
  113. package/.claude/hooks/play-tts-soprano.sh +9 -43
  114. package/.claude/hooks/play-tts-ssh-remote.sh +42 -120
  115. package/.claude/hooks/play-tts-termux-ssh.sh +0 -0
  116. package/.claude/hooks/play-tts.sh +48 -37
  117. package/.claude/hooks/post-response.sh +41 -0
  118. package/.claude/hooks/prepare-release.sh +0 -0
  119. package/.claude/hooks/provider-commands.sh +0 -0
  120. package/.claude/hooks/provider-manager.sh +0 -0
  121. package/.claude/hooks/replay-target-audio.sh +0 -0
  122. package/.claude/hooks/requirements.txt +6 -6
  123. package/.claude/hooks/sentiment-manager.sh +0 -0
  124. package/.claude/hooks/session-start-tts.sh +56 -39
  125. package/.claude/hooks/soprano-gradio-synth.py +139 -139
  126. package/.claude/hooks/speed-manager.sh +0 -0
  127. package/.claude/hooks/stop.sh +63 -0
  128. package/.claude/hooks/termux-installer.sh +0 -0
  129. package/.claude/hooks/translate-manager.sh +0 -0
  130. package/.claude/hooks/translator.py +237 -237
  131. package/.claude/hooks/tts-queue-worker.sh +0 -0
  132. package/.claude/hooks/tts-queue.sh +0 -0
  133. package/.claude/hooks/verbosity-manager.sh +0 -0
  134. package/.claude/hooks/voice-manager.sh +26 -4
  135. package/.claude/hooks-windows/audio-cache-utils.ps1 +119 -119
  136. package/.claude/hooks-windows/bmad-party-speak.ps1 +278 -274
  137. package/.claude/hooks-windows/bmad-speak.ps1 +264 -264
  138. package/.claude/hooks-windows/clean-audio-cache.ps1 +53 -53
  139. package/.claude/hooks-windows/effects-manager.ps1 +294 -294
  140. package/.claude/hooks-windows/language-manager.ps1 +193 -193
  141. package/.claude/hooks-windows/learn-manager.ps1 +241 -241
  142. package/.claude/hooks-windows/personality-manager.ps1 +266 -266
  143. package/.claude/hooks-windows/play-tts-soprano.ps1 +5 -5
  144. package/.claude/hooks-windows/play-tts-termux-ssh.ps1 +138 -138
  145. package/.claude/hooks-windows/play-tts-windows-piper.ps1 +164 -0
  146. package/.claude/hooks-windows/play-tts-windows-sapi.ps1 +108 -0
  147. package/.claude/hooks-windows/play-tts.ps1 +104 -481
  148. package/.claude/hooks-windows/provider-manager.ps1 +158 -192
  149. package/.claude/hooks-windows/session-start-tts.ps1 +55 -46
  150. package/.claude/hooks-windows/soprano-gradio-synth.py +153 -153
  151. package/.claude/hooks-windows/speed-manager.ps1 +166 -166
  152. package/.claude/hooks-windows/voice-manager-windows.ps1 +176 -260
  153. package/.claude/output-styles/agent-vibes.md +202 -202
  154. package/.claude/personalities/angry.md +14 -14
  155. package/.claude/personalities/annoying.md +14 -14
  156. package/.claude/personalities/crass.md +14 -14
  157. package/.claude/personalities/dramatic.md +14 -14
  158. package/.claude/personalities/dry-humor.md +50 -50
  159. package/.claude/personalities/flirty.md +20 -20
  160. package/.claude/personalities/funny.md +14 -14
  161. package/.claude/personalities/grandpa.md +32 -32
  162. package/.claude/personalities/millennial.md +14 -14
  163. package/.claude/personalities/moody.md +14 -14
  164. package/.claude/personalities/normal.md +16 -16
  165. package/.claude/personalities/pirate.md +14 -14
  166. package/.claude/personalities/poetic.md +14 -14
  167. package/.claude/personalities/professional.md +14 -14
  168. package/.claude/personalities/rapper.md +55 -55
  169. package/.claude/personalities/robot.md +14 -14
  170. package/.claude/personalities/sarcastic.md +38 -38
  171. package/.claude/personalities/sassy.md +14 -14
  172. package/.claude/personalities/surfer-dude.md +14 -14
  173. package/.claude/personalities/zen.md +14 -14
  174. package/.claude/piper-voices-dir.txt +1 -0
  175. package/.claude/settings.json +25 -15
  176. package/.claude/verbosity.txt +1 -1
  177. package/.clawdbot/README.md +105 -105
  178. package/.clawdbot/skill/SKILL.md +149 -145
  179. package/.mcp.json +30 -11
  180. package/CLAUDE.md +170 -215
  181. package/README.md +206 -515
  182. package/RELEASE_NOTES.md +1132 -1884
  183. package/WINDOWS-SETUP.md +208 -208
  184. package/bin/agent-vibes +0 -0
  185. package/bin/agentvibes-voice-browser.js +64 -1289
  186. package/bin/agentvibes.js +0 -0
  187. package/bin/ensure-soprano-running.sh +43 -0
  188. package/bin/mcp-server.js +121 -121
  189. package/bin/mcp-server.sh +0 -0
  190. package/bin/test-bmad-pr +78 -78
  191. package/mcp-server/QUICK_START.md +203 -203
  192. package/mcp-server/README.md +345 -345
  193. package/mcp-server/WINDOWS_SETUP.md +260 -260
  194. package/mcp-server/docs/troubleshooting-audio.md +313 -313
  195. package/mcp-server/examples/claude_desktop_config.json +11 -11
  196. package/mcp-server/examples/claude_desktop_config_piper.json +9 -9
  197. package/mcp-server/examples/custom_instructions.md +169 -169
  198. package/mcp-server/install-deps.js +130 -130
  199. package/mcp-server/pyproject.toml +52 -52
  200. package/mcp-server/requirements.txt +2 -2
  201. package/mcp-server/server.py +1451 -1578
  202. package/mcp-server/test_server.py +395 -395
  203. package/package.json +1 -3
  204. package/setup-windows.ps1 +815 -815
  205. package/src/console/tabs/setup-tab.js +9 -6
  206. package/src/console/tabs/voices-tab.js +9 -3
  207. package/src/installer.js +42 -5
  208. package/src/services/llm-provider-service.js +13 -0
  209. package/templates/agentvibes-receiver.sh +158 -483
  210. package/templates/audio/welcome-music.mp3 +0 -0
  211. package/.agentvibes/bmad-voice-map.json +0 -104
  212. package/.agentvibes/copilot-sessions.log +0 -4
  213. package/.claude/config/audio-effects-bmad.cfg +0 -50
  214. package/.claude/config/background-music-enabled.txt +0 -1
  215. package/.claude/config/intro-text.txt +0 -1
  216. package/.claude/config/personality.txt +0 -1
  217. package/.claude/config/piper-speech-rate.txt +0 -4
  218. package/.claude/config/piper-target-speech-rate.txt +0 -1
  219. package/.claude/config/reverb-level.txt +0 -1
  220. package/.claude/config/tts-target-speech-rate.txt +0 -1
  221. package/voice-assignments.json +0 -8245
  222. /package/{.claude → .agentvibes}/config/agentvibes.json +0 -0
@@ -1,153 +1,153 @@
1
- #!/usr/bin/env python3
2
- #
3
- # File: .claude/hooks-windows/soprano-gradio-synth.py
4
- #
5
- # AgentVibes - Finally, your AI Agents can Talk Back!
6
- # Website: https://agentvibes.org
7
- # Repository: https://github.com/paulpreibisch/AgentVibes
8
- #
9
- # Co-created by Paul Preibisch with Claude AI
10
- # Copyright (c) 2025 Paul Preibisch
11
- #
12
- # Licensed under the Apache License, Version 2.0 (the "License");
13
- # you may not use this file except in compliance with the License.
14
- # You may obtain a copy of the License at
15
- #
16
- # http://www.apache.org/licenses/LICENSE-2.0
17
- #
18
- # Unless required by applicable law or agreed to in writing, software
19
- # distributed under the License is distributed on an "AS IS" BASIS,
20
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
21
- # See the License for the specific language governing permissions and
22
- # limitations under the License.
23
- #
24
- # ---
25
- #
26
- # Soprano Gradio WebUI synthesizer helper.
27
- # Calls the Soprano WebUI's Gradio API and saves the result as a WAV file.
28
- # Uses only Python stdlib (json, sys, urllib) — no extra dependencies.
29
- #
30
- # Usage: python3 soprano-gradio-synth.py "text to speak" output.wav [port]
31
- #
32
- """
33
- Soprano Gradio WebUI synthesizer helper for AgentVibes.
34
-
35
- Calls the Soprano WebUI's Gradio API via the Server-Sent Events (SSE) protocol
36
- and downloads the generated audio as a WAV file.
37
-
38
- Flow:
39
- 1. Submit generation request -> get event_id
40
- 2. Poll SSE stream for audio file URL
41
- 3. Download WAV file to output path
42
-
43
- See: https://github.com/ekwek1/soprano
44
- """
45
- import json
46
- import sys
47
- import urllib.request
48
- import urllib.error
49
-
50
-
51
- def synth(text: str, output_path: str, port: int = 7860) -> None:
52
- base = f"http://127.0.0.1:{port}"
53
-
54
- # Step 1: Submit generation request
55
- # Args: text, temperature, top_p, repetition_penalty, chunk_size, streaming
56
- payload = json.dumps({
57
- "data": [text, 0.0, 0.95, 1.2, 1, False]
58
- }).encode()
59
-
60
- event_id = submit_request(base, payload)
61
-
62
- # Step 2: Poll SSE stream for audio file URL
63
- audio_url = poll_for_result(base, event_id)
64
-
65
- # Step 3: Download the audio file (validate localhost to prevent SSRF)
66
- download_file(audio_url, output_path, port)
67
-
68
-
69
- def submit_request(base: str, payload: bytes) -> str:
70
- """Submit generation request to Gradio API, return event_id."""
71
- for api_base in ["/gradio_api/call", "/call"]:
72
- url = f"{base}{api_base}/generate_speech"
73
- req = urllib.request.Request(
74
- url,
75
- data=payload,
76
- headers={"Content-Type": "application/json"},
77
- )
78
- try:
79
- with urllib.request.urlopen(req, timeout=30) as resp:
80
- return json.loads(resp.read())["event_id"]
81
- except urllib.error.URLError:
82
- continue
83
-
84
- raise RuntimeError("Could not reach Soprano WebUI API")
85
-
86
-
87
- def poll_for_result(base: str, event_id: str) -> str:
88
- """Poll SSE endpoint until audio file URL is returned."""
89
- for api_base in ["/gradio_api/call", "/call"]:
90
- url = f"{base}{api_base}/generate_speech/{event_id}"
91
- req = urllib.request.Request(url)
92
- try:
93
- with urllib.request.urlopen(req, timeout=120) as resp:
94
- for raw_line in resp:
95
- line = raw_line.decode("utf-8", errors="replace").strip()
96
- if not line.startswith("data: "):
97
- continue
98
- try:
99
- parsed = json.loads(line[6:])
100
- except json.JSONDecodeError:
101
- continue
102
- # Response format: [{"path": "...", "url": "...", ...}, "status string"]
103
- if isinstance(parsed, list) and len(parsed) >= 1:
104
- audio = parsed[0]
105
- if isinstance(audio, dict) and "url" in audio:
106
- return audio["url"]
107
- break
108
- except urllib.error.URLError:
109
- continue
110
-
111
- raise RuntimeError("No audio URL in Soprano response")
112
-
113
-
114
- def download_file(url: str, output_path: str, port: int = 7860) -> None:
115
- """Download audio file from Gradio file server.
116
-
117
- Security: Validates URL points to localhost to prevent SSRF.
118
- """
119
- # Validate URL is localhost to prevent SSRF via crafted Gradio responses
120
- allowed_prefixes = [
121
- f"http://127.0.0.1:{port}/",
122
- f"http://localhost:{port}/",
123
- ]
124
- if not any(url.startswith(prefix) for prefix in allowed_prefixes):
125
- raise RuntimeError(f"Refused download from non-localhost URL: {url[:80]}")
126
-
127
- req = urllib.request.Request(url)
128
- with urllib.request.urlopen(req, timeout=30) as resp:
129
- with open(output_path, "wb") as f:
130
- while True:
131
- chunk = resp.read(8192)
132
- if not chunk:
133
- break
134
- f.write(chunk)
135
-
136
-
137
- if __name__ == "__main__":
138
- if len(sys.argv) < 3:
139
- print(f"Usage: {sys.argv[0]} \"text\" output.wav [port]", file=sys.stderr)
140
- sys.exit(1)
141
-
142
- text = sys.argv[1]
143
- output = sys.argv[2]
144
- port = int(sys.argv[3]) if len(sys.argv) > 3 else 7860
145
- if not (1 <= port <= 65535):
146
- print(f"Error: Invalid port number: {port}", file=sys.stderr)
147
- sys.exit(1)
148
-
149
- try:
150
- synth(text, output, port)
151
- except Exception as e:
152
- print(f"Error: {e}", file=sys.stderr)
153
- sys.exit(1)
1
+ #!/usr/bin/env python3
2
+ #
3
+ # File: .claude/hooks-windows/soprano-gradio-synth.py
4
+ #
5
+ # AgentVibes - Finally, your AI Agents can Talk Back!
6
+ # Website: https://agentvibes.org
7
+ # Repository: https://github.com/paulpreibisch/AgentVibes
8
+ #
9
+ # Co-created by Paul Preibisch with Claude AI
10
+ # Copyright (c) 2025 Paul Preibisch
11
+ #
12
+ # Licensed under the Apache License, Version 2.0 (the "License");
13
+ # you may not use this file except in compliance with the License.
14
+ # You may obtain a copy of the License at
15
+ #
16
+ # http://www.apache.org/licenses/LICENSE-2.0
17
+ #
18
+ # Unless required by applicable law or agreed to in writing, software
19
+ # distributed under the License is distributed on an "AS IS" BASIS,
20
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
21
+ # See the License for the specific language governing permissions and
22
+ # limitations under the License.
23
+ #
24
+ # ---
25
+ #
26
+ # Soprano Gradio WebUI synthesizer helper.
27
+ # Calls the Soprano WebUI's Gradio API and saves the result as a WAV file.
28
+ # Uses only Python stdlib (json, sys, urllib) — no extra dependencies.
29
+ #
30
+ # Usage: python3 soprano-gradio-synth.py "text to speak" output.wav [port]
31
+ #
32
+ """
33
+ Soprano Gradio WebUI synthesizer helper for AgentVibes.
34
+
35
+ Calls the Soprano WebUI's Gradio API via the Server-Sent Events (SSE) protocol
36
+ and downloads the generated audio as a WAV file.
37
+
38
+ Flow:
39
+ 1. Submit generation request -> get event_id
40
+ 2. Poll SSE stream for audio file URL
41
+ 3. Download WAV file to output path
42
+
43
+ See: https://github.com/ekwek1/soprano
44
+ """
45
+ import json
46
+ import sys
47
+ import urllib.request
48
+ import urllib.error
49
+
50
+
51
+ def synth(text: str, output_path: str, port: int = 7860) -> None:
52
+ base = f"http://127.0.0.1:{port}"
53
+
54
+ # Step 1: Submit generation request
55
+ # Args: text, temperature, top_p, repetition_penalty, chunk_size, streaming
56
+ payload = json.dumps({
57
+ "data": [text, 0.0, 0.95, 1.2, 1, False]
58
+ }).encode()
59
+
60
+ event_id = submit_request(base, payload)
61
+
62
+ # Step 2: Poll SSE stream for audio file URL
63
+ audio_url = poll_for_result(base, event_id)
64
+
65
+ # Step 3: Download the audio file (validate localhost to prevent SSRF)
66
+ download_file(audio_url, output_path, port)
67
+
68
+
69
+ def submit_request(base: str, payload: bytes) -> str:
70
+ """Submit generation request to Gradio API, return event_id."""
71
+ for api_base in ["/gradio_api/call", "/call"]:
72
+ url = f"{base}{api_base}/generate_speech"
73
+ req = urllib.request.Request(
74
+ url,
75
+ data=payload,
76
+ headers={"Content-Type": "application/json"},
77
+ )
78
+ try:
79
+ with urllib.request.urlopen(req, timeout=30) as resp:
80
+ return json.loads(resp.read())["event_id"]
81
+ except urllib.error.URLError:
82
+ continue
83
+
84
+ raise RuntimeError("Could not reach Soprano WebUI API")
85
+
86
+
87
+ def poll_for_result(base: str, event_id: str) -> str:
88
+ """Poll SSE endpoint until audio file URL is returned."""
89
+ for api_base in ["/gradio_api/call", "/call"]:
90
+ url = f"{base}{api_base}/generate_speech/{event_id}"
91
+ req = urllib.request.Request(url)
92
+ try:
93
+ with urllib.request.urlopen(req, timeout=120) as resp:
94
+ for raw_line in resp:
95
+ line = raw_line.decode("utf-8", errors="replace").strip()
96
+ if not line.startswith("data: "):
97
+ continue
98
+ try:
99
+ parsed = json.loads(line[6:])
100
+ except json.JSONDecodeError:
101
+ continue
102
+ # Response format: [{"path": "...", "url": "...", ...}, "status string"]
103
+ if isinstance(parsed, list) and len(parsed) >= 1:
104
+ audio = parsed[0]
105
+ if isinstance(audio, dict) and "url" in audio:
106
+ return audio["url"]
107
+ break
108
+ except urllib.error.URLError:
109
+ continue
110
+
111
+ raise RuntimeError("No audio URL in Soprano response")
112
+
113
+
114
+ def download_file(url: str, output_path: str, port: int = 7860) -> None:
115
+ """Download audio file from Gradio file server.
116
+
117
+ Security: Validates URL points to localhost to prevent SSRF.
118
+ """
119
+ # Validate URL is localhost to prevent SSRF via crafted Gradio responses
120
+ allowed_prefixes = [
121
+ f"http://127.0.0.1:{port}/",
122
+ f"http://localhost:{port}/",
123
+ ]
124
+ if not any(url.startswith(prefix) for prefix in allowed_prefixes):
125
+ raise RuntimeError(f"Refused download from non-localhost URL: {url[:80]}")
126
+
127
+ req = urllib.request.Request(url)
128
+ with urllib.request.urlopen(req, timeout=30) as resp:
129
+ with open(output_path, "wb") as f:
130
+ while True:
131
+ chunk = resp.read(8192)
132
+ if not chunk:
133
+ break
134
+ f.write(chunk)
135
+
136
+
137
+ if __name__ == "__main__":
138
+ if len(sys.argv) < 3:
139
+ print(f"Usage: {sys.argv[0]} \"text\" output.wav [port]", file=sys.stderr)
140
+ sys.exit(1)
141
+
142
+ text = sys.argv[1]
143
+ output = sys.argv[2]
144
+ port = int(sys.argv[3]) if len(sys.argv) > 3 else 7860
145
+ if not (1 <= port <= 65535):
146
+ print(f"Error: Invalid port number: {port}", file=sys.stderr)
147
+ sys.exit(1)
148
+
149
+ try:
150
+ synth(text, output, port)
151
+ except Exception as e:
152
+ print(f"Error: {e}", file=sys.stderr)
153
+ sys.exit(1)
@@ -1,166 +1,166 @@
1
- #
2
- # File: .claude/hooks-windows/speed-manager.ps1
3
- #
4
- # AgentVibes - Finally, your AI Agents can Talk Back!
5
- # Website: https://agentvibes.org
6
- # Copyright (c) 2025 Paul Preibisch
7
- # Licensed under the Apache License, Version 2.0
8
-
9
- param(
10
- [Parameter(Position=0)]
11
- [string]$Command = "help",
12
- [Parameter(Position=1)]
13
- [string]$Arg1 = ""
14
- )
15
-
16
- $ScriptDir = Split-Path -Parent $MyInvocation.MyCommand.Path
17
- $ClaudeDir = Split-Path -Parent $ScriptDir
18
-
19
- # Determine config directory
20
- if ($env:CLAUDE_PROJECT_DIR -and (Test-Path "$env:CLAUDE_PROJECT_DIR\.claude")) {
21
- $ConfigDir = Join-Path $env:CLAUDE_PROJECT_DIR ".claude" "config"
22
- } else {
23
- $ConfigDir = Join-Path $ClaudeDir "config"
24
- }
25
-
26
- if (-not (Test-Path $ConfigDir)) { New-Item -ItemType Directory -Path $ConfigDir -Force | Out-Null }
27
-
28
- $MainSpeedFile = Join-Path $ConfigDir "tts-speech-rate.txt"
29
- $TargetSpeedFile = Join-Path $ConfigDir "tts-target-speech-rate.txt"
30
-
31
- # Legacy migration
32
- $LegacyMain = Join-Path $ConfigDir "piper-speech-rate.txt"
33
- $LegacyTarget = Join-Path $ConfigDir "piper-target-speech-rate.txt"
34
- if ((Test-Path $LegacyMain) -and -not (Test-Path $MainSpeedFile)) {
35
- Copy-Item $LegacyMain $MainSpeedFile
36
- }
37
- if ((Test-Path $LegacyTarget) -and -not (Test-Path $TargetSpeedFile)) {
38
- Copy-Item $LegacyTarget $TargetSpeedFile
39
- }
40
-
41
- function Parse-SpeedValue {
42
- param([string]$Input)
43
-
44
- switch -Regex ($Input) {
45
- '^(normal|1x|1\.0)$' { return "1.0" }
46
- '^(slow|slower|0\.5x)$' { return "0.5" }
47
- '^(fast|2x|2\.0)$' { return "2.0" }
48
- '^(faster|3x|3\.0)$' { return "3.0" }
49
- }
50
-
51
- $val = $Input -replace '^[+-]', '' -replace 'x$', ''
52
- if ($val -match '^\d+\.?\d*$') { return $val }
53
- return "ERROR"
54
- }
55
-
56
- function Set-Speed {
57
- param([bool]$IsTarget = $false, [string]$SpeedInput)
58
-
59
- if (-not $SpeedInput) {
60
- Write-Output "Error: Speed value required"
61
- Write-Output "Usage: speed-manager.ps1 [target] <speed>"
62
- exit 1
63
- }
64
-
65
- $speedValue = Parse-SpeedValue $SpeedInput
66
- if ($speedValue -eq "ERROR") {
67
- Write-Output "Invalid speed value: $SpeedInput"
68
- Write-Output "Valid values: normal, 0.5x, 1x, 2x, 3x"
69
- exit 1
70
- }
71
-
72
- if ($IsTarget) {
73
- $configFile = $TargetSpeedFile
74
- $voiceType = "target language"
75
- } else {
76
- $configFile = $MainSpeedFile
77
- $voiceType = "main voice"
78
- }
79
-
80
- Set-Content -Path $configFile -Value $speedValue -NoNewline
81
-
82
- Write-Output "Speech speed set for $voiceType"
83
- Write-Output ""
84
- Write-Output "Speed: ${speedValue}x"
85
-
86
- switch ($speedValue) {
87
- "0.5" { Write-Output "Effect: Half speed (slower)" }
88
- "1.0" { Write-Output "Effect: Normal speed" }
89
- "2.0" { Write-Output "Effect: Double speed (faster)" }
90
- "3.0" { Write-Output "Effect: Triple speed (very fast)" }
91
- default {
92
- if ([double]$speedValue -gt 1.0) {
93
- Write-Output "Effect: Faster speech"
94
- } else {
95
- Write-Output "Effect: Slower speech"
96
- }
97
- }
98
- }
99
- }
100
-
101
- function Get-Speed {
102
- Write-Output "---------------------------------------"
103
- Write-Output " Current Speech Speed Settings"
104
- Write-Output "---------------------------------------"
105
- Write-Output ""
106
-
107
- if (Test-Path $MainSpeedFile) {
108
- $mainSpeed = (Get-Content $MainSpeedFile | Where-Object { $_ -notmatch '^\s*#' -and $_.Trim() -ne '' } | Select-Object -Last 1).Trim()
109
- Write-Output "Main voice: ${mainSpeed}x"
110
- } else {
111
- Write-Output "Main voice: 1.0x (default, normal speed)"
112
- }
113
-
114
- if (Test-Path $TargetSpeedFile) {
115
- $targetSpeed = (Get-Content $TargetSpeedFile | Where-Object { $_ -notmatch '^\s*#' -and $_.Trim() -ne '' } | Select-Object -Last 1).Trim()
116
- Write-Output "Target language: ${targetSpeed}x"
117
- } else {
118
- Write-Output "Target language: 0.5x (default, slower for learning)"
119
- }
120
-
121
- Write-Output ""
122
- Write-Output "Scale: 0.5x=slower, 1.0x=normal, 2.0x=faster, 3.0x=very fast"
123
- Write-Output "---------------------------------------"
124
- }
125
-
126
- switch -Regex ($Command) {
127
- "^target$" {
128
- Set-Speed -IsTarget $true -SpeedInput $Arg1
129
- }
130
- "^(get|status)$" {
131
- Get-Speed
132
- }
133
- "^(normal|fast|slow|slower)$" {
134
- Set-Speed -SpeedInput $Command
135
- }
136
- "^.*x$" {
137
- Set-Speed -SpeedInput $Command
138
- }
139
- "^\d+\.?\d*$" {
140
- Set-Speed -SpeedInput $Command
141
- }
142
- "^[+-]" {
143
- Set-Speed -SpeedInput $Command
144
- }
145
- "^help$" {
146
- Write-Output "Speech Speed Manager"
147
- Write-Output ""
148
- Write-Output "Usage:"
149
- Write-Output " speed-manager.ps1 <speed> Set main voice speed"
150
- Write-Output " speed-manager.ps1 target <speed> Set target language speed"
151
- Write-Output " speed-manager.ps1 get Show current speeds"
152
- Write-Output ""
153
- Write-Output "Speed values: 0.5x, 1x, 2x, 3x, normal, slow, fast, faster"
154
- }
155
- default {
156
- # Try as speed value
157
- $parsed = Parse-SpeedValue $Command
158
- if ($parsed -ne "ERROR") {
159
- Set-Speed -SpeedInput $Command
160
- } else {
161
- Write-Output "Unknown command: $Command"
162
- Write-Output "Usage: speed-manager.ps1 {get|target|<speed>}"
163
- exit 1
164
- }
165
- }
166
- }
1
+ #
2
+ # File: .claude/hooks-windows/speed-manager.ps1
3
+ #
4
+ # AgentVibes - Finally, your AI Agents can Talk Back!
5
+ # Website: https://agentvibes.org
6
+ # Copyright (c) 2025 Paul Preibisch
7
+ # Licensed under the Apache License, Version 2.0
8
+
9
+ param(
10
+ [Parameter(Position=0)]
11
+ [string]$Command = "help",
12
+ [Parameter(Position=1)]
13
+ [string]$Arg1 = ""
14
+ )
15
+
16
+ $ScriptDir = Split-Path -Parent $MyInvocation.MyCommand.Path
17
+ $ClaudeDir = Split-Path -Parent $ScriptDir
18
+
19
+ # Determine config directory
20
+ if ($env:CLAUDE_PROJECT_DIR -and (Test-Path "$env:CLAUDE_PROJECT_DIR\.claude")) {
21
+ $ConfigDir = Join-Path $env:CLAUDE_PROJECT_DIR ".claude" "config"
22
+ } else {
23
+ $ConfigDir = Join-Path $ClaudeDir "config"
24
+ }
25
+
26
+ if (-not (Test-Path $ConfigDir)) { New-Item -ItemType Directory -Path $ConfigDir -Force | Out-Null }
27
+
28
+ $MainSpeedFile = Join-Path $ConfigDir "tts-speech-rate.txt"
29
+ $TargetSpeedFile = Join-Path $ConfigDir "tts-target-speech-rate.txt"
30
+
31
+ # Legacy migration
32
+ $LegacyMain = Join-Path $ConfigDir "piper-speech-rate.txt"
33
+ $LegacyTarget = Join-Path $ConfigDir "piper-target-speech-rate.txt"
34
+ if ((Test-Path $LegacyMain) -and -not (Test-Path $MainSpeedFile)) {
35
+ Copy-Item $LegacyMain $MainSpeedFile
36
+ }
37
+ if ((Test-Path $LegacyTarget) -and -not (Test-Path $TargetSpeedFile)) {
38
+ Copy-Item $LegacyTarget $TargetSpeedFile
39
+ }
40
+
41
+ function Parse-SpeedValue {
42
+ param([string]$Input)
43
+
44
+ switch -Regex ($Input) {
45
+ '^(normal|1x|1\.0)$' { return "1.0" }
46
+ '^(slow|slower|0\.5x)$' { return "0.5" }
47
+ '^(fast|2x|2\.0)$' { return "2.0" }
48
+ '^(faster|3x|3\.0)$' { return "3.0" }
49
+ }
50
+
51
+ $val = $Input -replace '^[+-]', '' -replace 'x$', ''
52
+ if ($val -match '^\d+\.?\d*$') { return $val }
53
+ return "ERROR"
54
+ }
55
+
56
+ function Set-Speed {
57
+ param([bool]$IsTarget = $false, [string]$SpeedInput)
58
+
59
+ if (-not $SpeedInput) {
60
+ Write-Output "Error: Speed value required"
61
+ Write-Output "Usage: speed-manager.ps1 [target] <speed>"
62
+ exit 1
63
+ }
64
+
65
+ $speedValue = Parse-SpeedValue $SpeedInput
66
+ if ($speedValue -eq "ERROR") {
67
+ Write-Output "Invalid speed value: $SpeedInput"
68
+ Write-Output "Valid values: normal, 0.5x, 1x, 2x, 3x"
69
+ exit 1
70
+ }
71
+
72
+ if ($IsTarget) {
73
+ $configFile = $TargetSpeedFile
74
+ $voiceType = "target language"
75
+ } else {
76
+ $configFile = $MainSpeedFile
77
+ $voiceType = "main voice"
78
+ }
79
+
80
+ Set-Content -Path $configFile -Value $speedValue -NoNewline
81
+
82
+ Write-Output "Speech speed set for $voiceType"
83
+ Write-Output ""
84
+ Write-Output "Speed: ${speedValue}x"
85
+
86
+ switch ($speedValue) {
87
+ "0.5" { Write-Output "Effect: Half speed (slower)" }
88
+ "1.0" { Write-Output "Effect: Normal speed" }
89
+ "2.0" { Write-Output "Effect: Double speed (faster)" }
90
+ "3.0" { Write-Output "Effect: Triple speed (very fast)" }
91
+ default {
92
+ if ([double]$speedValue -gt 1.0) {
93
+ Write-Output "Effect: Faster speech"
94
+ } else {
95
+ Write-Output "Effect: Slower speech"
96
+ }
97
+ }
98
+ }
99
+ }
100
+
101
+ function Get-Speed {
102
+ Write-Output "---------------------------------------"
103
+ Write-Output " Current Speech Speed Settings"
104
+ Write-Output "---------------------------------------"
105
+ Write-Output ""
106
+
107
+ if (Test-Path $MainSpeedFile) {
108
+ $mainSpeed = (Get-Content $MainSpeedFile | Where-Object { $_ -notmatch '^\s*#' -and $_.Trim() -ne '' } | Select-Object -Last 1).Trim()
109
+ Write-Output "Main voice: ${mainSpeed}x"
110
+ } else {
111
+ Write-Output "Main voice: 1.0x (default, normal speed)"
112
+ }
113
+
114
+ if (Test-Path $TargetSpeedFile) {
115
+ $targetSpeed = (Get-Content $TargetSpeedFile | Where-Object { $_ -notmatch '^\s*#' -and $_.Trim() -ne '' } | Select-Object -Last 1).Trim()
116
+ Write-Output "Target language: ${targetSpeed}x"
117
+ } else {
118
+ Write-Output "Target language: 0.5x (default, slower for learning)"
119
+ }
120
+
121
+ Write-Output ""
122
+ Write-Output "Scale: 0.5x=slower, 1.0x=normal, 2.0x=faster, 3.0x=very fast"
123
+ Write-Output "---------------------------------------"
124
+ }
125
+
126
+ switch -Regex ($Command) {
127
+ "^target$" {
128
+ Set-Speed -IsTarget $true -SpeedInput $Arg1
129
+ }
130
+ "^(get|status)$" {
131
+ Get-Speed
132
+ }
133
+ "^(normal|fast|slow|slower)$" {
134
+ Set-Speed -SpeedInput $Command
135
+ }
136
+ "^.*x$" {
137
+ Set-Speed -SpeedInput $Command
138
+ }
139
+ "^\d+\.?\d*$" {
140
+ Set-Speed -SpeedInput $Command
141
+ }
142
+ "^[+-]" {
143
+ Set-Speed -SpeedInput $Command
144
+ }
145
+ "^help$" {
146
+ Write-Output "Speech Speed Manager"
147
+ Write-Output ""
148
+ Write-Output "Usage:"
149
+ Write-Output " speed-manager.ps1 <speed> Set main voice speed"
150
+ Write-Output " speed-manager.ps1 target <speed> Set target language speed"
151
+ Write-Output " speed-manager.ps1 get Show current speeds"
152
+ Write-Output ""
153
+ Write-Output "Speed values: 0.5x, 1x, 2x, 3x, normal, slow, fast, faster"
154
+ }
155
+ default {
156
+ # Try as speed value
157
+ $parsed = Parse-SpeedValue $Command
158
+ if ($parsed -ne "ERROR") {
159
+ Set-Speed -SpeedInput $Command
160
+ } else {
161
+ Write-Output "Unknown command: $Command"
162
+ Write-Output "Usage: speed-manager.ps1 {get|target|<speed>}"
163
+ exit 1
164
+ }
165
+ }
166
+ }