voice-mcp-server 0.1.7 → 0.1.8
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +2 -2
- package/package.json +1 -1
- package/src/daemon/audio_server.py +1 -1
- package/src/mcp_server.py +3 -3
package/README.md
CHANGED
|
@@ -112,14 +112,14 @@ You can now add the server to your favorite client. Using `npx -y` ensures it wo
|
|
|
112
112
|
|
|
113
113
|
**For Gemini CLI:**
|
|
114
114
|
```bash
|
|
115
|
-
gemini mcp add voice-mcp-server npx -y voice-mcp-server
|
|
115
|
+
gemini mcp add voice-mcp-server --scope user npx -y voice-mcp-server
|
|
116
116
|
```
|
|
117
117
|
|
|
118
118
|
**For Cursor / Claude Desktop:**
|
|
119
119
|
Simply use `npx` and `-y` as the command in your configuration.
|
|
120
120
|
|
|
121
121
|
> [!NOTE]
|
|
122
|
-
> **First Run Performance:** The very first time you invoke the voice tool, it will take a few minutes to initialize the Python environment and download the heavy ML weights (~4GB).
|
|
122
|
+
> **First Run Performance:** The very first time you invoke the voice tool, it will take a few minutes to initialize the Python environment and download the heavy ML weights (~4GB). **The tools will not be available until this background setup completes.** You can monitor progress in your terminal logs.
|
|
123
123
|
|
|
124
124
|
---
|
|
125
125
|
|
package/package.json
CHANGED
|
@@ -348,7 +348,7 @@ if __name__ == "__main__":
|
|
|
348
348
|
import os
|
|
349
349
|
|
|
350
350
|
# Isolate socket to user directory to prevent /tmp hijacking and permission issues
|
|
351
|
-
app_support_dir = os.path.expanduser("~/Library/Application Support/
|
|
351
|
+
app_support_dir = os.path.expanduser("~/Library/Application Support/VoiceMCP")
|
|
352
352
|
os.makedirs(app_support_dir, exist_ok=True)
|
|
353
353
|
socket_path = os.path.join(app_support_dir, "daemon.sock")
|
|
354
354
|
|
package/src/mcp_server.py
CHANGED
|
@@ -41,7 +41,7 @@ SESSION_ID = str(uuid.uuid4())
|
|
|
41
41
|
|
|
42
42
|
# We use Unix Domain Sockets to bypass macOS firewall popups
|
|
43
43
|
# Isolate socket to user directory to prevent /tmp hijacking
|
|
44
|
-
app_support_dir = os.path.expanduser("~/Library/Application Support/
|
|
44
|
+
app_support_dir = os.path.expanduser("~/Library/Application Support/VoiceMCP")
|
|
45
45
|
os.makedirs(app_support_dir, exist_ok=True)
|
|
46
46
|
SOCKET_PATH = os.path.join(app_support_dir, "daemon.sock")
|
|
47
47
|
|
|
@@ -188,7 +188,7 @@ async def voice_converse(text_to_speak: str, expect_reply: bool = True, ctx: Con
|
|
|
188
188
|
# Handle the initialization (download) state automatically with native progress
|
|
189
189
|
if response_data and response_data.get("status") == "system_busy" and "initializing" in response_data.get("message", "").lower():
|
|
190
190
|
if ctx:
|
|
191
|
-
await ctx.info("
|
|
191
|
+
await ctx.info("Voice MCP: Initializing Local AI Models. This may take a few minutes...")
|
|
192
192
|
|
|
193
193
|
while True:
|
|
194
194
|
try:
|
|
@@ -205,7 +205,7 @@ async def voice_converse(text_to_speak: str, expect_reply: bool = True, ctx: Con
|
|
|
205
205
|
|
|
206
206
|
if d_status == "READY":
|
|
207
207
|
if ctx:
|
|
208
|
-
await ctx.info("
|
|
208
|
+
await ctx.info("Voice MCP: Setup Complete!")
|
|
209
209
|
|
|
210
210
|
# After setup, the models are ready! Now perform the ACTUAL converse call with visualizer.
|
|
211
211
|
vis_task2 = asyncio.create_task(render_visualizer(ctx)) if ctx else None
|