agentvibes 5.3.0 → 5.5.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (222) hide show
  1. package/.agentvibes/LITE-MODE.md +236 -0
  2. package/.agentvibes/README.md +136 -0
  3. package/.agentvibes/backup/session-start-tts.sh.20251210_212814 +141 -0
  4. package/.agentvibes/backups/agents/analyst_20260204_144958.md +78 -0
  5. package/.agentvibes/backups/agents/architect_20260204_144958.md +72 -0
  6. package/.agentvibes/backups/agents/dev_20260204_144958.md +74 -0
  7. package/.agentvibes/backups/agents/pm_20260204_144958.md +72 -0
  8. package/.agentvibes/backups/agents/quick-flow-solo-dev_20260204_144958.md +64 -0
  9. package/.agentvibes/backups/agents/sm_20260204_144958.md +87 -0
  10. package/.agentvibes/backups/agents/tea_20260204_144958.md +79 -0
  11. package/.agentvibes/backups/agents/tech-writer_20260204_144958.md +82 -0
  12. package/.agentvibes/backups/agents/ux-designer_20260204_144958.md +80 -0
  13. package/.agentvibes/bmad/bmad-voices.md +69 -69
  14. package/.agentvibes/config/README-personality-defaults.md +162 -0
  15. package/.agentvibes/config/mode.txt +1 -0
  16. package/.agentvibes/config/personality-voice-defaults.default.json +21 -0
  17. package/.agentvibes/config/save-audio.txt +1 -0
  18. package/.agentvibes/config/voice-metadata.json +160 -0
  19. package/.agentvibes/config.json +24 -15
  20. package/.agentvibes/hooks/help.sh +191 -0
  21. package/.agentvibes/hooks/post-tool-use-lite.sh +111 -0
  22. package/.agentvibes/hooks/save-audio-manager.sh +162 -0
  23. package/.agentvibes/hooks/session-start-full-optimized.sh +102 -0
  24. package/.agentvibes/hooks/session-start-full.sh +142 -0
  25. package/.agentvibes/hooks/session-start-lite-v2.sh +34 -0
  26. package/.agentvibes/hooks/session-start-lite.sh +29 -0
  27. package/.agentvibes/hooks/stop-lite.sh +115 -0
  28. package/.agentvibes/hooks/switch-mode.sh +215 -0
  29. package/.agentvibes/output-styles/audio-summary.md +30 -0
  30. package/.claude/activation-instructions +54 -54
  31. package/.claude/audio/voice-samples/piper/alan.wav +0 -0
  32. package/.claude/audio/voice-samples/piper/amy.wav +0 -0
  33. package/.claude/audio/voice-samples/piper/charlotte.wav +0 -0
  34. package/.claude/audio/voice-samples/piper/joe.wav +0 -0
  35. package/.claude/audio/voice-samples/piper/john.wav +0 -0
  36. package/.claude/audio/voice-samples/piper/katherine.wav +0 -0
  37. package/.claude/audio/voice-samples/piper/kristin.wav +0 -0
  38. package/.claude/audio/voice-samples/piper/linda.wav +0 -0
  39. package/.claude/audio/voice-samples/piper/marcus.wav +0 -0
  40. package/.claude/audio/voice-samples/piper/ryan.wav +0 -0
  41. package/.claude/commands/agent-vibes/add.md +21 -21
  42. package/.claude/commands/agent-vibes/agent-vibes.md +101 -101
  43. package/.claude/commands/agent-vibes/agent.md +79 -79
  44. package/.claude/commands/agent-vibes/background-music.md +111 -111
  45. package/.claude/commands/agent-vibes/bmad.md +198 -198
  46. package/.claude/commands/agent-vibes/clean.md +18 -18
  47. package/.claude/commands/agent-vibes/cleanup.md +18 -18
  48. package/.claude/commands/agent-vibes/commands.json +145 -145
  49. package/.claude/commands/agent-vibes/effects.md +97 -97
  50. package/.claude/commands/agent-vibes/get.md +9 -9
  51. package/.claude/commands/agent-vibes/hide.md +91 -91
  52. package/.claude/commands/agent-vibes/language.md +23 -23
  53. package/.claude/commands/agent-vibes/learn.md +67 -67
  54. package/.claude/commands/agent-vibes/list.md +13 -13
  55. package/.claude/commands/agent-vibes/mute.md +37 -37
  56. package/.claude/commands/agent-vibes/preview.md +17 -17
  57. package/.claude/commands/agent-vibes/provider.md +68 -68
  58. package/.claude/commands/agent-vibes/replay-target.md +14 -14
  59. package/.claude/commands/agent-vibes/sample.md +12 -12
  60. package/.claude/commands/agent-vibes/set-favorite-voice.md +84 -84
  61. package/.claude/commands/agent-vibes/set-pretext.md +65 -65
  62. package/.claude/commands/agent-vibes/set-speed.md +41 -41
  63. package/.claude/commands/agent-vibes/show.md +84 -84
  64. package/.claude/commands/agent-vibes/switch.md +87 -87
  65. package/.claude/commands/agent-vibes/target-voice.md +26 -26
  66. package/.claude/commands/agent-vibes/target.md +30 -30
  67. package/.claude/commands/agent-vibes/translate.md +68 -68
  68. package/.claude/commands/agent-vibes/unmute.md +45 -45
  69. package/.claude/commands/agent-vibes/whoami.md +7 -7
  70. package/.claude/commands/agent-vibes-bmad-voices.md +117 -117
  71. package/.claude/commands/agent-vibes-rdp.md +24 -24
  72. package/.claude/config/audio-effects.cfg +16 -11
  73. package/.claude/config/audio-effects.cfg.sample +52 -52
  74. package/.claude/config/background-music-position.txt +27 -0
  75. package/.claude/config/background-music-volume.txt +1 -1
  76. package/.claude/config/background-music.cfg +1 -0
  77. package/.claude/config/background-music.txt +1 -0
  78. package/.claude/config/tts-speech-rate.txt +1 -4
  79. package/.claude/config/tts-verbosity.txt +1 -0
  80. package/.claude/docs/TERMUX_SETUP.md +408 -408
  81. package/.claude/github-star-reminder.txt +1 -1
  82. package/.claude/hooks/README-TTS-QUEUE.md +135 -135
  83. package/.claude/hooks/audio-cache-utils.sh +0 -0
  84. package/.claude/hooks/audio-processor.sh +60 -14
  85. package/.claude/hooks/background-music-manager.sh +0 -0
  86. package/.claude/hooks/bmad-party-manager.sh +225 -0
  87. package/.claude/hooks/bmad-party-speak.sh +0 -0
  88. package/.claude/hooks/bmad-speak-enhanced.sh +0 -0
  89. package/.claude/hooks/bmad-speak.sh +12 -15
  90. package/.claude/hooks/bmad-tts-injector.sh +0 -0
  91. package/.claude/hooks/bmad-voice-manager.sh +0 -0
  92. package/.claude/hooks/clawdbot-receiver-SECURE.sh +25 -23
  93. package/.claude/hooks/clawdbot-receiver.sh +4 -28
  94. package/.claude/hooks/clean-audio-cache.sh +0 -0
  95. package/.claude/hooks/cleanup-cache.sh +0 -0
  96. package/.claude/hooks/configure-rdp-mode.sh +0 -0
  97. package/.claude/hooks/download-extra-voices.sh +0 -0
  98. package/.claude/hooks/effects-manager.sh +0 -0
  99. package/.claude/hooks/github-star-reminder.sh +0 -0
  100. package/.claude/hooks/language-manager.sh +0 -0
  101. package/.claude/hooks/learn-manager.sh +0 -0
  102. package/.claude/hooks/macos-voice-manager.sh +0 -0
  103. package/.claude/hooks/migrate-background-music.sh +0 -0
  104. package/.claude/hooks/migrate-to-agentvibes.sh +0 -0
  105. package/.claude/hooks/optimize-background-music.sh +0 -0
  106. package/.claude/hooks/personality-manager.sh +0 -0
  107. package/.claude/hooks/piper-download-voices.sh +0 -0
  108. package/.claude/hooks/piper-installer.sh +1 -1
  109. package/.claude/hooks/piper-multispeaker-registry.sh +0 -0
  110. package/.claude/hooks/piper-voice-manager.sh +0 -0
  111. package/.claude/hooks/play-tts-enhanced.sh +0 -0
  112. package/.claude/hooks/play-tts-macos.sh +6 -12
  113. package/.claude/hooks/play-tts-piper.sh +52 -81
  114. package/.claude/hooks/play-tts-soprano.sh +9 -43
  115. package/.claude/hooks/play-tts-ssh-remote.sh +43 -215
  116. package/.claude/hooks/play-tts-termux-ssh.sh +0 -0
  117. package/.claude/hooks/play-tts.sh +41 -20
  118. package/.claude/hooks/post-response.sh +41 -0
  119. package/.claude/hooks/prepare-release.sh +0 -0
  120. package/.claude/hooks/provider-commands.sh +0 -0
  121. package/.claude/hooks/provider-manager.sh +0 -0
  122. package/.claude/hooks/replay-target-audio.sh +0 -0
  123. package/.claude/hooks/requirements.txt +6 -6
  124. package/.claude/hooks/sentiment-manager.sh +0 -0
  125. package/.claude/hooks/session-start-tts.sh +56 -39
  126. package/.claude/hooks/soprano-gradio-synth.py +139 -139
  127. package/.claude/hooks/speed-manager.sh +0 -0
  128. package/.claude/hooks/stop.sh +63 -0
  129. package/.claude/hooks/termux-installer.sh +0 -0
  130. package/.claude/hooks/translate-manager.sh +0 -0
  131. package/.claude/hooks/translator.py +237 -237
  132. package/.claude/hooks/tts-queue-worker.sh +0 -0
  133. package/.claude/hooks/tts-queue.sh +0 -0
  134. package/.claude/hooks/verbosity-manager.sh +0 -0
  135. package/.claude/hooks/voice-manager.sh +26 -4
  136. package/.claude/hooks-windows/audio-cache-utils.ps1 +119 -119
  137. package/.claude/hooks-windows/bmad-party-speak.ps1 +278 -278
  138. package/.claude/hooks-windows/bmad-speak.ps1 +264 -264
  139. package/.claude/hooks-windows/clean-audio-cache.ps1 +53 -53
  140. package/.claude/hooks-windows/effects-manager.ps1 +294 -294
  141. package/.claude/hooks-windows/language-manager.ps1 +193 -193
  142. package/.claude/hooks-windows/learn-manager.ps1 +241 -241
  143. package/.claude/hooks-windows/personality-manager.ps1 +266 -266
  144. package/.claude/hooks-windows/play-tts-soprano.ps1 +5 -5
  145. package/.claude/hooks-windows/play-tts-termux-ssh.ps1 +138 -138
  146. package/.claude/hooks-windows/play-tts-windows-piper.ps1 +178 -0
  147. package/.claude/hooks-windows/play-tts-windows-sapi.ps1 +108 -0
  148. package/.claude/hooks-windows/play-tts.ps1 +265 -507
  149. package/.claude/hooks-windows/provider-manager.ps1 +158 -192
  150. package/.claude/hooks-windows/session-start-tts.ps1 +55 -46
  151. package/.claude/hooks-windows/soprano-gradio-synth.py +153 -153
  152. package/.claude/hooks-windows/speed-manager.ps1 +166 -166
  153. package/.claude/hooks-windows/voice-manager-windows.ps1 +176 -260
  154. package/.claude/output-styles/agent-vibes.md +202 -202
  155. package/.claude/personalities/angry.md +14 -14
  156. package/.claude/personalities/annoying.md +14 -14
  157. package/.claude/personalities/crass.md +14 -14
  158. package/.claude/personalities/dramatic.md +14 -14
  159. package/.claude/personalities/dry-humor.md +50 -50
  160. package/.claude/personalities/flirty.md +20 -20
  161. package/.claude/personalities/funny.md +14 -14
  162. package/.claude/personalities/grandpa.md +32 -32
  163. package/.claude/personalities/millennial.md +14 -14
  164. package/.claude/personalities/moody.md +14 -14
  165. package/.claude/personalities/normal.md +16 -16
  166. package/.claude/personalities/pirate.md +14 -14
  167. package/.claude/personalities/poetic.md +14 -14
  168. package/.claude/personalities/professional.md +14 -14
  169. package/.claude/personalities/rapper.md +55 -55
  170. package/.claude/personalities/robot.md +14 -14
  171. package/.claude/personalities/sarcastic.md +38 -38
  172. package/.claude/personalities/sassy.md +14 -14
  173. package/.claude/personalities/surfer-dude.md +14 -14
  174. package/.claude/personalities/zen.md +14 -14
  175. package/.claude/piper-voices-dir.txt +1 -0
  176. package/.claude/settings.json +25 -15
  177. package/.claude/verbosity.txt +1 -1
  178. package/.clawdbot/README.md +105 -105
  179. package/.clawdbot/skill/SKILL.md +149 -145
  180. package/.mcp.json +30 -11
  181. package/CLAUDE.md +170 -215
  182. package/README.md +207 -521
  183. package/RELEASE_NOTES.md +1172 -1976
  184. package/WINDOWS-SETUP.md +208 -208
  185. package/bin/agent-vibes +0 -0
  186. package/bin/agentvibes-voice-browser.js +64 -1289
  187. package/bin/agentvibes.js +28 -0
  188. package/bin/ensure-soprano-running.sh +43 -0
  189. package/bin/mcp-server.js +121 -121
  190. package/bin/mcp-server.sh +0 -0
  191. package/bin/test-bmad-pr +78 -78
  192. package/mcp-server/QUICK_START.md +203 -203
  193. package/mcp-server/README.md +345 -345
  194. package/mcp-server/WINDOWS_SETUP.md +260 -260
  195. package/mcp-server/docs/troubleshooting-audio.md +313 -313
  196. package/mcp-server/examples/claude_desktop_config.json +11 -11
  197. package/mcp-server/examples/claude_desktop_config_piper.json +9 -9
  198. package/mcp-server/examples/custom_instructions.md +169 -169
  199. package/mcp-server/install-deps.js +130 -130
  200. package/mcp-server/pyproject.toml +52 -52
  201. package/mcp-server/requirements.txt +2 -2
  202. package/mcp-server/server.py +1467 -1578
  203. package/mcp-server/test_server.py +395 -395
  204. package/package.json +1 -3
  205. package/setup-windows.ps1 +815 -815
  206. package/src/console/tabs/music-tab.js +5 -2
  207. package/src/console/tabs/voices-tab.js +71 -37
  208. package/src/installer.js +52 -5
  209. package/src/services/llm-provider-service.js +1 -1
  210. package/templates/agentvibes-receiver.sh +158 -483
  211. package/templates/audio/welcome-music.mp3 +0 -0
  212. package/.agentvibes/bmad-voice-map.json +0 -104
  213. package/.agentvibes/copilot-sessions.log +0 -4
  214. package/.claude/config/audio-effects-bmad.cfg +0 -50
  215. package/.claude/config/intro-text.txt +0 -1
  216. package/.claude/config/personality.txt +0 -1
  217. package/.claude/config/piper-speech-rate.txt +0 -4
  218. package/.claude/config/piper-target-speech-rate.txt +0 -1
  219. package/.claude/config/reverb-level.txt +0 -1
  220. package/.claude/config/tts-target-speech-rate.txt +0 -1
  221. package/voice-assignments.json +0 -8245
  222. /package/{.claude → .agentvibes}/config/agentvibes.json +0 -0
@@ -1,153 +1,153 @@
1
- #!/usr/bin/env python3
2
- #
3
- # File: .claude/hooks-windows/soprano-gradio-synth.py
4
- #
5
- # AgentVibes - Finally, your AI Agents can Talk Back!
6
- # Website: https://agentvibes.org
7
- # Repository: https://github.com/paulpreibisch/AgentVibes
8
- #
9
- # Co-created by Paul Preibisch with Claude AI
10
- # Copyright (c) 2025 Paul Preibisch
11
- #
12
- # Licensed under the Apache License, Version 2.0 (the "License");
13
- # you may not use this file except in compliance with the License.
14
- # You may obtain a copy of the License at
15
- #
16
- # http://www.apache.org/licenses/LICENSE-2.0
17
- #
18
- # Unless required by applicable law or agreed to in writing, software
19
- # distributed under the License is distributed on an "AS IS" BASIS,
20
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
21
- # See the License for the specific language governing permissions and
22
- # limitations under the License.
23
- #
24
- # ---
25
- #
26
- # Soprano Gradio WebUI synthesizer helper.
27
- # Calls the Soprano WebUI's Gradio API and saves the result as a WAV file.
28
- # Uses only Python stdlib (json, sys, urllib) — no extra dependencies.
29
- #
30
- # Usage: python3 soprano-gradio-synth.py "text to speak" output.wav [port]
31
- #
32
- """
33
- Soprano Gradio WebUI synthesizer helper for AgentVibes.
34
-
35
- Calls the Soprano WebUI's Gradio API via the Server-Sent Events (SSE) protocol
36
- and downloads the generated audio as a WAV file.
37
-
38
- Flow:
39
- 1. Submit generation request -> get event_id
40
- 2. Poll SSE stream for audio file URL
41
- 3. Download WAV file to output path
42
-
43
- See: https://github.com/ekwek1/soprano
44
- """
45
- import json
46
- import sys
47
- import urllib.request
48
- import urllib.error
49
-
50
-
51
- def synth(text: str, output_path: str, port: int = 7860) -> None:
52
- base = f"http://127.0.0.1:{port}"
53
-
54
- # Step 1: Submit generation request
55
- # Args: text, temperature, top_p, repetition_penalty, chunk_size, streaming
56
- payload = json.dumps({
57
- "data": [text, 0.0, 0.95, 1.2, 1, False]
58
- }).encode()
59
-
60
- event_id = submit_request(base, payload)
61
-
62
- # Step 2: Poll SSE stream for audio file URL
63
- audio_url = poll_for_result(base, event_id)
64
-
65
- # Step 3: Download the audio file (validate localhost to prevent SSRF)
66
- download_file(audio_url, output_path, port)
67
-
68
-
69
- def submit_request(base: str, payload: bytes) -> str:
70
- """Submit generation request to Gradio API, return event_id."""
71
- for api_base in ["/gradio_api/call", "/call"]:
72
- url = f"{base}{api_base}/generate_speech"
73
- req = urllib.request.Request(
74
- url,
75
- data=payload,
76
- headers={"Content-Type": "application/json"},
77
- )
78
- try:
79
- with urllib.request.urlopen(req, timeout=30) as resp:
80
- return json.loads(resp.read())["event_id"]
81
- except urllib.error.URLError:
82
- continue
83
-
84
- raise RuntimeError("Could not reach Soprano WebUI API")
85
-
86
-
87
- def poll_for_result(base: str, event_id: str) -> str:
88
- """Poll SSE endpoint until audio file URL is returned."""
89
- for api_base in ["/gradio_api/call", "/call"]:
90
- url = f"{base}{api_base}/generate_speech/{event_id}"
91
- req = urllib.request.Request(url)
92
- try:
93
- with urllib.request.urlopen(req, timeout=120) as resp:
94
- for raw_line in resp:
95
- line = raw_line.decode("utf-8", errors="replace").strip()
96
- if not line.startswith("data: "):
97
- continue
98
- try:
99
- parsed = json.loads(line[6:])
100
- except json.JSONDecodeError:
101
- continue
102
- # Response format: [{"path": "...", "url": "...", ...}, "status string"]
103
- if isinstance(parsed, list) and len(parsed) >= 1:
104
- audio = parsed[0]
105
- if isinstance(audio, dict) and "url" in audio:
106
- return audio["url"]
107
- break
108
- except urllib.error.URLError:
109
- continue
110
-
111
- raise RuntimeError("No audio URL in Soprano response")
112
-
113
-
114
- def download_file(url: str, output_path: str, port: int = 7860) -> None:
115
- """Download audio file from Gradio file server.
116
-
117
- Security: Validates URL points to localhost to prevent SSRF.
118
- """
119
- # Validate URL is localhost to prevent SSRF via crafted Gradio responses
120
- allowed_prefixes = [
121
- f"http://127.0.0.1:{port}/",
122
- f"http://localhost:{port}/",
123
- ]
124
- if not any(url.startswith(prefix) for prefix in allowed_prefixes):
125
- raise RuntimeError(f"Refused download from non-localhost URL: {url[:80]}")
126
-
127
- req = urllib.request.Request(url)
128
- with urllib.request.urlopen(req, timeout=30) as resp:
129
- with open(output_path, "wb") as f:
130
- while True:
131
- chunk = resp.read(8192)
132
- if not chunk:
133
- break
134
- f.write(chunk)
135
-
136
-
137
- if __name__ == "__main__":
138
- if len(sys.argv) < 3:
139
- print(f"Usage: {sys.argv[0]} \"text\" output.wav [port]", file=sys.stderr)
140
- sys.exit(1)
141
-
142
- text = sys.argv[1]
143
- output = sys.argv[2]
144
- port = int(sys.argv[3]) if len(sys.argv) > 3 else 7860
145
- if not (1 <= port <= 65535):
146
- print(f"Error: Invalid port number: {port}", file=sys.stderr)
147
- sys.exit(1)
148
-
149
- try:
150
- synth(text, output, port)
151
- except Exception as e:
152
- print(f"Error: {e}", file=sys.stderr)
153
- sys.exit(1)
1
+ #!/usr/bin/env python3
2
+ #
3
+ # File: .claude/hooks-windows/soprano-gradio-synth.py
4
+ #
5
+ # AgentVibes - Finally, your AI Agents can Talk Back!
6
+ # Website: https://agentvibes.org
7
+ # Repository: https://github.com/paulpreibisch/AgentVibes
8
+ #
9
+ # Co-created by Paul Preibisch with Claude AI
10
+ # Copyright (c) 2025 Paul Preibisch
11
+ #
12
+ # Licensed under the Apache License, Version 2.0 (the "License");
13
+ # you may not use this file except in compliance with the License.
14
+ # You may obtain a copy of the License at
15
+ #
16
+ # http://www.apache.org/licenses/LICENSE-2.0
17
+ #
18
+ # Unless required by applicable law or agreed to in writing, software
19
+ # distributed under the License is distributed on an "AS IS" BASIS,
20
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
21
+ # See the License for the specific language governing permissions and
22
+ # limitations under the License.
23
+ #
24
+ # ---
25
+ #
26
+ # Soprano Gradio WebUI synthesizer helper.
27
+ # Calls the Soprano WebUI's Gradio API and saves the result as a WAV file.
28
+ # Uses only Python stdlib (json, sys, urllib) — no extra dependencies.
29
+ #
30
+ # Usage: python3 soprano-gradio-synth.py "text to speak" output.wav [port]
31
+ #
32
+ """
33
+ Soprano Gradio WebUI synthesizer helper for AgentVibes.
34
+
35
+ Calls the Soprano WebUI's Gradio API via the Server-Sent Events (SSE) protocol
36
+ and downloads the generated audio as a WAV file.
37
+
38
+ Flow:
39
+ 1. Submit generation request -> get event_id
40
+ 2. Poll SSE stream for audio file URL
41
+ 3. Download WAV file to output path
42
+
43
+ See: https://github.com/ekwek1/soprano
44
+ """
45
+ import json
46
+ import sys
47
+ import urllib.request
48
+ import urllib.error
49
+
50
+
51
+ def synth(text: str, output_path: str, port: int = 7860) -> None:
52
+ base = f"http://127.0.0.1:{port}"
53
+
54
+ # Step 1: Submit generation request
55
+ # Args: text, temperature, top_p, repetition_penalty, chunk_size, streaming
56
+ payload = json.dumps({
57
+ "data": [text, 0.0, 0.95, 1.2, 1, False]
58
+ }).encode()
59
+
60
+ event_id = submit_request(base, payload)
61
+
62
+ # Step 2: Poll SSE stream for audio file URL
63
+ audio_url = poll_for_result(base, event_id)
64
+
65
+ # Step 3: Download the audio file (validate localhost to prevent SSRF)
66
+ download_file(audio_url, output_path, port)
67
+
68
+
69
+ def submit_request(base: str, payload: bytes) -> str:
70
+ """Submit generation request to Gradio API, return event_id."""
71
+ for api_base in ["/gradio_api/call", "/call"]:
72
+ url = f"{base}{api_base}/generate_speech"
73
+ req = urllib.request.Request(
74
+ url,
75
+ data=payload,
76
+ headers={"Content-Type": "application/json"},
77
+ )
78
+ try:
79
+ with urllib.request.urlopen(req, timeout=30) as resp:
80
+ return json.loads(resp.read())["event_id"]
81
+ except urllib.error.URLError:
82
+ continue
83
+
84
+ raise RuntimeError("Could not reach Soprano WebUI API")
85
+
86
+
87
+ def poll_for_result(base: str, event_id: str) -> str:
88
+ """Poll SSE endpoint until audio file URL is returned."""
89
+ for api_base in ["/gradio_api/call", "/call"]:
90
+ url = f"{base}{api_base}/generate_speech/{event_id}"
91
+ req = urllib.request.Request(url)
92
+ try:
93
+ with urllib.request.urlopen(req, timeout=120) as resp:
94
+ for raw_line in resp:
95
+ line = raw_line.decode("utf-8", errors="replace").strip()
96
+ if not line.startswith("data: "):
97
+ continue
98
+ try:
99
+ parsed = json.loads(line[6:])
100
+ except json.JSONDecodeError:
101
+ continue
102
+ # Response format: [{"path": "...", "url": "...", ...}, "status string"]
103
+ if isinstance(parsed, list) and len(parsed) >= 1:
104
+ audio = parsed[0]
105
+ if isinstance(audio, dict) and "url" in audio:
106
+ return audio["url"]
107
+ break
108
+ except urllib.error.URLError:
109
+ continue
110
+
111
+ raise RuntimeError("No audio URL in Soprano response")
112
+
113
+
114
+ def download_file(url: str, output_path: str, port: int = 7860) -> None:
115
+ """Download audio file from Gradio file server.
116
+
117
+ Security: Validates URL points to localhost to prevent SSRF.
118
+ """
119
+ # Validate URL is localhost to prevent SSRF via crafted Gradio responses
120
+ allowed_prefixes = [
121
+ f"http://127.0.0.1:{port}/",
122
+ f"http://localhost:{port}/",
123
+ ]
124
+ if not any(url.startswith(prefix) for prefix in allowed_prefixes):
125
+ raise RuntimeError(f"Refused download from non-localhost URL: {url[:80]}")
126
+
127
+ req = urllib.request.Request(url)
128
+ with urllib.request.urlopen(req, timeout=30) as resp:
129
+ with open(output_path, "wb") as f:
130
+ while True:
131
+ chunk = resp.read(8192)
132
+ if not chunk:
133
+ break
134
+ f.write(chunk)
135
+
136
+
137
+ if __name__ == "__main__":
138
+ if len(sys.argv) < 3:
139
+ print(f"Usage: {sys.argv[0]} \"text\" output.wav [port]", file=sys.stderr)
140
+ sys.exit(1)
141
+
142
+ text = sys.argv[1]
143
+ output = sys.argv[2]
144
+ port = int(sys.argv[3]) if len(sys.argv) > 3 else 7860
145
+ if not (1 <= port <= 65535):
146
+ print(f"Error: Invalid port number: {port}", file=sys.stderr)
147
+ sys.exit(1)
148
+
149
+ try:
150
+ synth(text, output, port)
151
+ except Exception as e:
152
+ print(f"Error: {e}", file=sys.stderr)
153
+ sys.exit(1)
@@ -1,166 +1,166 @@
1
- #
2
- # File: .claude/hooks-windows/speed-manager.ps1
3
- #
4
- # AgentVibes - Finally, your AI Agents can Talk Back!
5
- # Website: https://agentvibes.org
6
- # Copyright (c) 2025 Paul Preibisch
7
- # Licensed under the Apache License, Version 2.0
8
-
9
- param(
10
- [Parameter(Position=0)]
11
- [string]$Command = "help",
12
- [Parameter(Position=1)]
13
- [string]$Arg1 = ""
14
- )
15
-
16
- $ScriptDir = Split-Path -Parent $MyInvocation.MyCommand.Path
17
- $ClaudeDir = Split-Path -Parent $ScriptDir
18
-
19
- # Determine config directory
20
- if ($env:CLAUDE_PROJECT_DIR -and (Test-Path "$env:CLAUDE_PROJECT_DIR\.claude")) {
21
- $ConfigDir = Join-Path $env:CLAUDE_PROJECT_DIR ".claude" "config"
22
- } else {
23
- $ConfigDir = Join-Path $ClaudeDir "config"
24
- }
25
-
26
- if (-not (Test-Path $ConfigDir)) { New-Item -ItemType Directory -Path $ConfigDir -Force | Out-Null }
27
-
28
- $MainSpeedFile = Join-Path $ConfigDir "tts-speech-rate.txt"
29
- $TargetSpeedFile = Join-Path $ConfigDir "tts-target-speech-rate.txt"
30
-
31
- # Legacy migration
32
- $LegacyMain = Join-Path $ConfigDir "piper-speech-rate.txt"
33
- $LegacyTarget = Join-Path $ConfigDir "piper-target-speech-rate.txt"
34
- if ((Test-Path $LegacyMain) -and -not (Test-Path $MainSpeedFile)) {
35
- Copy-Item $LegacyMain $MainSpeedFile
36
- }
37
- if ((Test-Path $LegacyTarget) -and -not (Test-Path $TargetSpeedFile)) {
38
- Copy-Item $LegacyTarget $TargetSpeedFile
39
- }
40
-
41
- function Parse-SpeedValue {
42
- param([string]$Input)
43
-
44
- switch -Regex ($Input) {
45
- '^(normal|1x|1\.0)$' { return "1.0" }
46
- '^(slow|slower|0\.5x)$' { return "0.5" }
47
- '^(fast|2x|2\.0)$' { return "2.0" }
48
- '^(faster|3x|3\.0)$' { return "3.0" }
49
- }
50
-
51
- $val = $Input -replace '^[+-]', '' -replace 'x$', ''
52
- if ($val -match '^\d+\.?\d*$') { return $val }
53
- return "ERROR"
54
- }
55
-
56
- function Set-Speed {
57
- param([bool]$IsTarget = $false, [string]$SpeedInput)
58
-
59
- if (-not $SpeedInput) {
60
- Write-Output "Error: Speed value required"
61
- Write-Output "Usage: speed-manager.ps1 [target] <speed>"
62
- exit 1
63
- }
64
-
65
- $speedValue = Parse-SpeedValue $SpeedInput
66
- if ($speedValue -eq "ERROR") {
67
- Write-Output "Invalid speed value: $SpeedInput"
68
- Write-Output "Valid values: normal, 0.5x, 1x, 2x, 3x"
69
- exit 1
70
- }
71
-
72
- if ($IsTarget) {
73
- $configFile = $TargetSpeedFile
74
- $voiceType = "target language"
75
- } else {
76
- $configFile = $MainSpeedFile
77
- $voiceType = "main voice"
78
- }
79
-
80
- Set-Content -Path $configFile -Value $speedValue -NoNewline
81
-
82
- Write-Output "Speech speed set for $voiceType"
83
- Write-Output ""
84
- Write-Output "Speed: ${speedValue}x"
85
-
86
- switch ($speedValue) {
87
- "0.5" { Write-Output "Effect: Half speed (slower)" }
88
- "1.0" { Write-Output "Effect: Normal speed" }
89
- "2.0" { Write-Output "Effect: Double speed (faster)" }
90
- "3.0" { Write-Output "Effect: Triple speed (very fast)" }
91
- default {
92
- if ([double]$speedValue -gt 1.0) {
93
- Write-Output "Effect: Faster speech"
94
- } else {
95
- Write-Output "Effect: Slower speech"
96
- }
97
- }
98
- }
99
- }
100
-
101
- function Get-Speed {
102
- Write-Output "---------------------------------------"
103
- Write-Output " Current Speech Speed Settings"
104
- Write-Output "---------------------------------------"
105
- Write-Output ""
106
-
107
- if (Test-Path $MainSpeedFile) {
108
- $mainSpeed = (Get-Content $MainSpeedFile | Where-Object { $_ -notmatch '^\s*#' -and $_.Trim() -ne '' } | Select-Object -Last 1).Trim()
109
- Write-Output "Main voice: ${mainSpeed}x"
110
- } else {
111
- Write-Output "Main voice: 1.0x (default, normal speed)"
112
- }
113
-
114
- if (Test-Path $TargetSpeedFile) {
115
- $targetSpeed = (Get-Content $TargetSpeedFile | Where-Object { $_ -notmatch '^\s*#' -and $_.Trim() -ne '' } | Select-Object -Last 1).Trim()
116
- Write-Output "Target language: ${targetSpeed}x"
117
- } else {
118
- Write-Output "Target language: 0.5x (default, slower for learning)"
119
- }
120
-
121
- Write-Output ""
122
- Write-Output "Scale: 0.5x=slower, 1.0x=normal, 2.0x=faster, 3.0x=very fast"
123
- Write-Output "---------------------------------------"
124
- }
125
-
126
- switch -Regex ($Command) {
127
- "^target$" {
128
- Set-Speed -IsTarget $true -SpeedInput $Arg1
129
- }
130
- "^(get|status)$" {
131
- Get-Speed
132
- }
133
- "^(normal|fast|slow|slower)$" {
134
- Set-Speed -SpeedInput $Command
135
- }
136
- "^.*x$" {
137
- Set-Speed -SpeedInput $Command
138
- }
139
- "^\d+\.?\d*$" {
140
- Set-Speed -SpeedInput $Command
141
- }
142
- "^[+-]" {
143
- Set-Speed -SpeedInput $Command
144
- }
145
- "^help$" {
146
- Write-Output "Speech Speed Manager"
147
- Write-Output ""
148
- Write-Output "Usage:"
149
- Write-Output " speed-manager.ps1 <speed> Set main voice speed"
150
- Write-Output " speed-manager.ps1 target <speed> Set target language speed"
151
- Write-Output " speed-manager.ps1 get Show current speeds"
152
- Write-Output ""
153
- Write-Output "Speed values: 0.5x, 1x, 2x, 3x, normal, slow, fast, faster"
154
- }
155
- default {
156
- # Try as speed value
157
- $parsed = Parse-SpeedValue $Command
158
- if ($parsed -ne "ERROR") {
159
- Set-Speed -SpeedInput $Command
160
- } else {
161
- Write-Output "Unknown command: $Command"
162
- Write-Output "Usage: speed-manager.ps1 {get|target|<speed>}"
163
- exit 1
164
- }
165
- }
166
- }
1
+ #
2
+ # File: .claude/hooks-windows/speed-manager.ps1
3
+ #
4
+ # AgentVibes - Finally, your AI Agents can Talk Back!
5
+ # Website: https://agentvibes.org
6
+ # Copyright (c) 2025 Paul Preibisch
7
+ # Licensed under the Apache License, Version 2.0
8
+
9
+ param(
10
+ [Parameter(Position=0)]
11
+ [string]$Command = "help",
12
+ [Parameter(Position=1)]
13
+ [string]$Arg1 = ""
14
+ )
15
+
16
+ $ScriptDir = Split-Path -Parent $MyInvocation.MyCommand.Path
17
+ $ClaudeDir = Split-Path -Parent $ScriptDir
18
+
19
+ # Determine config directory
20
+ if ($env:CLAUDE_PROJECT_DIR -and (Test-Path "$env:CLAUDE_PROJECT_DIR\.claude")) {
21
+ $ConfigDir = Join-Path $env:CLAUDE_PROJECT_DIR ".claude" "config"
22
+ } else {
23
+ $ConfigDir = Join-Path $ClaudeDir "config"
24
+ }
25
+
26
+ if (-not (Test-Path $ConfigDir)) { New-Item -ItemType Directory -Path $ConfigDir -Force | Out-Null }
27
+
28
+ $MainSpeedFile = Join-Path $ConfigDir "tts-speech-rate.txt"
29
+ $TargetSpeedFile = Join-Path $ConfigDir "tts-target-speech-rate.txt"
30
+
31
+ # Legacy migration
32
+ $LegacyMain = Join-Path $ConfigDir "piper-speech-rate.txt"
33
+ $LegacyTarget = Join-Path $ConfigDir "piper-target-speech-rate.txt"
34
+ if ((Test-Path $LegacyMain) -and -not (Test-Path $MainSpeedFile)) {
35
+ Copy-Item $LegacyMain $MainSpeedFile
36
+ }
37
+ if ((Test-Path $LegacyTarget) -and -not (Test-Path $TargetSpeedFile)) {
38
+ Copy-Item $LegacyTarget $TargetSpeedFile
39
+ }
40
+
41
+ function Parse-SpeedValue {
42
+ param([string]$Input)
43
+
44
+ switch -Regex ($Input) {
45
+ '^(normal|1x|1\.0)$' { return "1.0" }
46
+ '^(slow|slower|0\.5x)$' { return "0.5" }
47
+ '^(fast|2x|2\.0)$' { return "2.0" }
48
+ '^(faster|3x|3\.0)$' { return "3.0" }
49
+ }
50
+
51
+ $val = $Input -replace '^[+-]', '' -replace 'x$', ''
52
+ if ($val -match '^\d+\.?\d*$') { return $val }
53
+ return "ERROR"
54
+ }
55
+
56
+ function Set-Speed {
57
+ param([bool]$IsTarget = $false, [string]$SpeedInput)
58
+
59
+ if (-not $SpeedInput) {
60
+ Write-Output "Error: Speed value required"
61
+ Write-Output "Usage: speed-manager.ps1 [target] <speed>"
62
+ exit 1
63
+ }
64
+
65
+ $speedValue = Parse-SpeedValue $SpeedInput
66
+ if ($speedValue -eq "ERROR") {
67
+ Write-Output "Invalid speed value: $SpeedInput"
68
+ Write-Output "Valid values: normal, 0.5x, 1x, 2x, 3x"
69
+ exit 1
70
+ }
71
+
72
+ if ($IsTarget) {
73
+ $configFile = $TargetSpeedFile
74
+ $voiceType = "target language"
75
+ } else {
76
+ $configFile = $MainSpeedFile
77
+ $voiceType = "main voice"
78
+ }
79
+
80
+ Set-Content -Path $configFile -Value $speedValue -NoNewline
81
+
82
+ Write-Output "Speech speed set for $voiceType"
83
+ Write-Output ""
84
+ Write-Output "Speed: ${speedValue}x"
85
+
86
+ switch ($speedValue) {
87
+ "0.5" { Write-Output "Effect: Half speed (slower)" }
88
+ "1.0" { Write-Output "Effect: Normal speed" }
89
+ "2.0" { Write-Output "Effect: Double speed (faster)" }
90
+ "3.0" { Write-Output "Effect: Triple speed (very fast)" }
91
+ default {
92
+ if ([double]$speedValue -gt 1.0) {
93
+ Write-Output "Effect: Faster speech"
94
+ } else {
95
+ Write-Output "Effect: Slower speech"
96
+ }
97
+ }
98
+ }
99
+ }
100
+
101
+ function Get-Speed {
102
+ Write-Output "---------------------------------------"
103
+ Write-Output " Current Speech Speed Settings"
104
+ Write-Output "---------------------------------------"
105
+ Write-Output ""
106
+
107
+ if (Test-Path $MainSpeedFile) {
108
+ $mainSpeed = (Get-Content $MainSpeedFile | Where-Object { $_ -notmatch '^\s*#' -and $_.Trim() -ne '' } | Select-Object -Last 1).Trim()
109
+ Write-Output "Main voice: ${mainSpeed}x"
110
+ } else {
111
+ Write-Output "Main voice: 1.0x (default, normal speed)"
112
+ }
113
+
114
+ if (Test-Path $TargetSpeedFile) {
115
+ $targetSpeed = (Get-Content $TargetSpeedFile | Where-Object { $_ -notmatch '^\s*#' -and $_.Trim() -ne '' } | Select-Object -Last 1).Trim()
116
+ Write-Output "Target language: ${targetSpeed}x"
117
+ } else {
118
+ Write-Output "Target language: 0.5x (default, slower for learning)"
119
+ }
120
+
121
+ Write-Output ""
122
+ Write-Output "Scale: 0.5x=slower, 1.0x=normal, 2.0x=faster, 3.0x=very fast"
123
+ Write-Output "---------------------------------------"
124
+ }
125
+
126
+ switch -Regex ($Command) {
127
+ "^target$" {
128
+ Set-Speed -IsTarget $true -SpeedInput $Arg1
129
+ }
130
+ "^(get|status)$" {
131
+ Get-Speed
132
+ }
133
+ "^(normal|fast|slow|slower)$" {
134
+ Set-Speed -SpeedInput $Command
135
+ }
136
+ "^.*x$" {
137
+ Set-Speed -SpeedInput $Command
138
+ }
139
+ "^\d+\.?\d*$" {
140
+ Set-Speed -SpeedInput $Command
141
+ }
142
+ "^[+-]" {
143
+ Set-Speed -SpeedInput $Command
144
+ }
145
+ "^help$" {
146
+ Write-Output "Speech Speed Manager"
147
+ Write-Output ""
148
+ Write-Output "Usage:"
149
+ Write-Output " speed-manager.ps1 <speed> Set main voice speed"
150
+ Write-Output " speed-manager.ps1 target <speed> Set target language speed"
151
+ Write-Output " speed-manager.ps1 get Show current speeds"
152
+ Write-Output ""
153
+ Write-Output "Speed values: 0.5x, 1x, 2x, 3x, normal, slow, fast, faster"
154
+ }
155
+ default {
156
+ # Try as speed value
157
+ $parsed = Parse-SpeedValue $Command
158
+ if ($parsed -ne "ERROR") {
159
+ Set-Speed -SpeedInput $Command
160
+ } else {
161
+ Write-Output "Unknown command: $Command"
162
+ Write-Output "Usage: speed-manager.ps1 {get|target|<speed>}"
163
+ exit 1
164
+ }
165
+ }
166
+ }