npm - agentgui - Versions diffs - 1.0.753 → 1.0.754 - Mend

agentgui 1.0.753 → 1.0.754

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (3) hide show

package/lib/speech-manager.js ADDED Viewed

@@ -0,0 +1,203 @@
+import fs from 'fs';
+import path from 'path';
+import os from 'os';
+import { createRequire } from 'module';
+// Lazily-loaded './speech.js' module namespace; populated by the first getSpeech() call.
+let speechModule = null;
+// Collaborators injected by initSpeechManager(); each stays null until it is called.
+let _broadcastSync = null;
+let _syncClients = null;
+let _queries = null;
+export function initSpeechManager({ broadcastSync, syncClients, queries }) {
+  _broadcastSync = broadcastSync;
+  _syncClients = syncClients;
+  _queries = queries;
+}
+export async function ensurePocketTtsSetup(onProgress) {
+  const r = createRequire(import.meta.url);
+  const serverTTS = r('webtalk/server-tts');
+  return serverTTS.ensureInstalled(onProgress);
+}
+export async function getSpeech() {
+  if (!speechModule) speechModule = await import('./speech.js');
+  return speechModule;
+}
+// Pending TTS text keyed by `${conversationId}:${sessionId}`; each value is { text, timer } (see eagerTTS).
+const ttsTextAccumulators = new Map();
+export const voiceCacheManager = {
+  generating: new Map(),
+  maxCacheSize: 10 * 1024 * 1024,
+  async getOrGenerateCache(conversationId, text) {
+    const cacheKey = `${conversationId}:${text}`;
+    if (this.generating.has(cacheKey)) {
+      return new Promise((resolve) => {
+        const checkInterval = setInterval(() => {
+          const cached = _queries.getVoiceCache(conversationId, text);
+          if (cached) { clearInterval(checkInterval); resolve(cached); }
+        }, 50);
+      });
+    }
+    const cached = _queries.getVoiceCache(conversationId, text);
+    if (cached) return cached;
+    this.generating.set(cacheKey, true);
+    try {
+      const speech = await getSpeech();
+      const audioBlob = await speech.synthesize(text, 'default');
+      const saved = _queries.saveVoiceCache(conversationId, text, audioBlob);
+      const totalSize = _queries.getVoiceCacheSize(conversationId);
+      if (totalSize > this.maxCacheSize) {
+        const needed = totalSize - this.maxCacheSize;
+        _queries.deleteOldestVoiceCache(conversationId, needed);
+      }
+      return saved;
+    } finally {
+      this.generating.delete(cacheKey);
+    }
+  }
+};
+// Shared, mutable status of the model download run driven by ensureModelsDownloaded().
+export const modelDownloadState = {
+  downloading: false, // true while ensureModelsDownloaded() is running
+  progress: null, // last payload passed to broadcastModelProgress()
+  error: null, // message of the latest download failure; reset to null when a new run starts
+  complete: false, // set to true once both model downloads have finished
+  startTime: null, // not written anywhere in this module
+  downloadMetrics: new Map() // not written anywhere in this module
+};
+export function broadcastModelProgress(progress) {
+  modelDownloadState.progress = progress;
+  const broadcastData = {
+    type: 'model_download_progress',
+    modelId: progress.type || 'unknown',
+    bytesDownloaded: progress.bytesDownloaded || 0,
+    bytesRemaining: progress.bytesRemaining || 0,
+    totalBytes: progress.totalBytes || 0,
+    downloadSpeed: progress.downloadSpeed || 0,
+    eta: progress.eta || 0,
+    retryCount: progress.retryCount || 0,
+    currentGateway: progress.currentGateway || '',
+    status: progress.status || (progress.done ? 'completed' : progress.downloading ? 'downloading' : 'paused'),
+    percentComplete: progress.percentComplete || 0,
+    completedFiles: progress.completedFiles || 0,
+    totalFiles: progress.totalFiles || 0,
+    timestamp: Date.now(),
+    ...progress
+  };
+  _broadcastSync(broadcastData);
+}
+async function validateAndCleanupModels(modelsDir) {
+  try {
+    const manifestPath = path.join(modelsDir, '.manifests.json');
+    if (fs.existsSync(manifestPath)) {
+      try {
+        const content = fs.readFileSync(manifestPath, 'utf8');
+        JSON.parse(content);
+      } catch (e) {
+        console.error('[MODELS] Manifest corrupted, removing:', e.message);
+        fs.unlinkSync(manifestPath);
+      }
+    }
+    const files = fs.readdirSync(modelsDir);
+    for (const file of files) {
+      if (file.endsWith('.tmp')) {
+        try { fs.unlinkSync(path.join(modelsDir, file)); console.log('[MODELS] Cleaned up temp file:', file); }
+        catch (e) { console.warn('[MODELS] Failed to clean:', file); }
+      }
+    }
+  } catch (e) {
+    console.warn('[MODELS] Cleanup check failed:', e.message);
+  }
+}
+export async function ensureModelsDownloaded() {
+  if (modelDownloadState.downloading) {
+    while (modelDownloadState.downloading) { await new Promise(r => setTimeout(r, 100)); }
+    return modelDownloadState.complete;
+  }
+  modelDownloadState.downloading = true;
+  modelDownloadState.error = null;
+  try {
+    const r = createRequire(import.meta.url);
+    const { createConfig } = r('webtalk/config');
+    const { ensureModel } = r('webtalk/whisper-models');
+    const { ensureTTSModels } = r('webtalk/tts-models');
+    const gmguiModels = path.join(os.homedir(), '.gmgui', 'models');
+    const modelsBase = process.env.PORTABLE_EXE_DIR
+      ? (fs.existsSync(path.join(process.env.PORTABLE_EXE_DIR, 'models', 'onnx-community')) ? path.join(process.env.PORTABLE_EXE_DIR, 'models') : gmguiModels)
+      : gmguiModels;
+    await validateAndCleanupModels(modelsBase);
+    const config = createConfig({ modelsDir: modelsBase, ttsModelsDir: path.join(modelsBase, 'tts') });
+    const onProgress = (progress) => { broadcastModelProgress({ ...progress, started: true, done: false, downloading: true }); };
+    broadcastModelProgress({ started: true, done: false, downloading: true, type: 'whisper', status: 'starting' });
+    await ensureModel('onnx-community/whisper-base', config, onProgress);
+    broadcastModelProgress({ started: true, done: false, downloading: true, type: 'tts', status: 'starting' });
+    await ensureTTSModels(config, onProgress);
+    modelDownloadState.complete = true;
+    broadcastModelProgress({ started: true, done: true, complete: true, downloading: false });
+    return true;
+  } catch (err) {
+    console.error('[MODELS] Download error:', err.message);
+    modelDownloadState.error = err.message;
+    broadcastModelProgress({ done: true, error: err.message });
+    return false;
+  } finally {
+    modelDownloadState.downloading = false;
+  }
+}
+export function eagerTTS(text, conversationId, sessionId) {
+  const key = `${conversationId}:${sessionId}`;
+  let acc = ttsTextAccumulators.get(key);
+  if (!acc) { acc = { text: '', timer: null }; ttsTextAccumulators.set(key, acc); }
+  acc.text += text;
+  if (acc.timer) clearTimeout(acc.timer);
+  acc.timer = setTimeout(() => flushTTSaccumulator(key, conversationId, sessionId), 600);
+}
+function flushTTSaccumulator(key, conversationId, sessionId) {
+  const acc = ttsTextAccumulators.get(key);
+  if (!acc || !acc.text) return;
+  const text = acc.text.trim();
+  acc.text = '';
+  ttsTextAccumulators.delete(key);
+  getSpeech().then(speech => {
+    const status = speech.getStatus();
+    if (!status.ttsReady || status.ttsError) return;
+    const voices = new Set();
+    for (const ws of _syncClients) {
+      const vid = ws.ttsVoiceId || 'default';
+      const convKey = `conv-${conversationId}`;
+      if (ws.subscriptions && (ws.subscriptions.has(sessionId) || ws.subscriptions.has(convKey))) {
+        voices.add(vid);
+      }
+    }
+    if (voices.size === 0) return;
+    for (const vid of voices) {
+      const cacheKey = speech.ttsCacheKey(text, vid);
+      const cached = speech.ttsCacheGet(cacheKey);
+      if (cached) { pushTTSAudio(cacheKey, cached, conversationId, sessionId, vid); continue; }
+      speech.synthesize(text, vid).then(wav => {
+        if (speech.ttsCacheSet) speech.ttsCacheSet(cacheKey, wav);
+        pushTTSAudio(cacheKey, wav, conversationId, sessionId, vid);
+      }).catch(() => {});
+    }
+  }).catch(() => {});
+}
+function pushTTSAudio(cacheKey, wav, conversationId, sessionId, voiceId) {
+  const b64 = wav.toString('base64');
+  _broadcastSync({
+    type: 'tts_audio',
+    cacheKey,
+    audio: b64,
+    voiceId,
+    conversationId,
+    sessionId,
+    timestamp: Date.now()
+  });
+}

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "agentgui",
-  "version": "1.0.753",
+  "version": "1.0.754",
   "description": "Multi-agent ACP client with real-time communication",
   "type": "module",
   "main": "electron/main.js",

package/server.js CHANGED Viewed

@@ -18,6 +18,7 @@ import { runClaudeWithStreaming } from './lib/claude-runner.js';
 import { initializeDescriptors, getAgentDescriptor } from './lib/agent-descriptors.js';
 import { findCommand, queryACPServerAgents, discoverAgents, discoverExternalACPServers, initializeAgentDiscovery } from './lib/agent-discovery.js';
 import { getGeminiOAuthCreds, startGeminiOAuth, exchangeGeminiOAuthCode, handleGeminiOAuthCallback, getGeminiOAuthStatus, getGeminiOAuthState } from './lib/oauth-gemini.js';
+import { initSpeechManager, getSpeech, ensurePocketTtsSetup, voiceCacheManager, modelDownloadState, broadcastModelProgress, ensureModelsDownloaded, eagerTTS } from './lib/speech-manager.js';
 import { startCodexOAuth, exchangeCodexOAuthCode, handleCodexOAuthCallback, getCodexOAuthStatus, getCodexOAuthState, CODEX_HOME, CODEX_AUTH_FILE } from './lib/oauth-codex.js';
 import { WSOptimizer } from './lib/ws-optimizer.js';
 import { WsRouter } from './lib/ws-protocol.js';
@@ -69,232 +70,6 @@ process.on('SIGHUP', () => { console.log('[SIGNAL] SIGHUP received (ignored - un
 process.on('beforeExit', (code) => { console.log('[PROCESS] beforeExit with code:', code); });
 process.on('exit', (code) => { console.log('[PROCESS] exit with code:', code); });
-const ttsTextAccumulators = new Map();
-const voiceCacheManager = {
-  generating: new Map(),
-  maxCacheSize: 10 * 1024 * 1024,
-  async getOrGenerateCache(conversationId, text) {
-    const cacheKey = `${conversationId}:${text}`;
-    if (this.generating.has(cacheKey)) {
-      return new Promise((resolve) => {
-        const checkInterval = setInterval(() => {
-          const cached = queries.getVoiceCache(conversationId, text);
-          if (cached) {
-            clearInterval(checkInterval);
-            resolve(cached);
-          }
-        }, 50);
-      });
-    }
-    const cached = queries.getVoiceCache(conversationId, text);
-    if (cached) return cached;
-    this.generating.set(cacheKey, true);
-    try {
-      const speech = await getSpeech();
-      const audioBlob = await speech.synthesize(text, 'default');
-      const saved = queries.saveVoiceCache(conversationId, text, audioBlob);
-      const totalSize = queries.getVoiceCacheSize(conversationId);
-      if (totalSize > this.maxCacheSize) {
-        const needed = totalSize - this.maxCacheSize;
-        queries.deleteOldestVoiceCache(conversationId, needed);
-      }
-      return saved;
-    } finally {
-      this.generating.delete(cacheKey);
-    }
-  }
-};
-let speechModule = null;
-async function getSpeech() {
-  if (!speechModule) speechModule = await import('./lib/speech.js');
-  return speechModule;
-}
-async function ensurePocketTtsSetup(onProgress) {
-  const { createRequire: cr } = await import('module');
-  const r = cr(import.meta.url);
-  const serverTTS = r('webtalk/server-tts');
-  return serverTTS.ensureInstalled(onProgress);
-}
-// Model download manager
-const modelDownloadState = {
-  downloading: false,
-  progress: null,
-  error: null,
-  complete: false,
-  startTime: null,
-  downloadMetrics: new Map()
-};
-function broadcastModelProgress(progress) {
-  modelDownloadState.progress = progress;
-  const broadcastData = {
-    type: 'model_download_progress',
-    modelId: progress.type || 'unknown',
-    bytesDownloaded: progress.bytesDownloaded || 0,
-    bytesRemaining: progress.bytesRemaining || 0,
-    totalBytes: progress.totalBytes || 0,
-    downloadSpeed: progress.downloadSpeed || 0,
-    eta: progress.eta || 0,
-    retryCount: progress.retryCount || 0,
-    currentGateway: progress.currentGateway || '',
-    status: progress.status || (progress.done ? 'completed' : progress.downloading ? 'downloading' : 'paused'),
-    percentComplete: progress.percentComplete || 0,
-    completedFiles: progress.completedFiles || 0,
-    totalFiles: progress.totalFiles || 0,
-    timestamp: Date.now(),
-    ...progress
-  };
-  broadcastSync(broadcastData);
-}
-async function validateAndCleanupModels(modelsDir) {
-  try {
-    const manifestPath = path.join(modelsDir, '.manifests.json');
-    if (fs.existsSync(manifestPath)) {
-      try {
-        const content = fs.readFileSync(manifestPath, 'utf8');
-        JSON.parse(content);
-      } catch (e) {
-        console.error('[MODELS] Manifest corrupted, removing:', e.message);
-        fs.unlinkSync(manifestPath);
-      }
-    }
-    const files = fs.readdirSync(modelsDir);
-    for (const file of files) {
-      if (file.endsWith('.tmp')) {
-        try {
-          fs.unlinkSync(path.join(modelsDir, file));
-          console.log('[MODELS] Cleaned up temp file:', file);
-        } catch (e) {
-          console.warn('[MODELS] Failed to clean:', file);
-        }
-      }
-    }
-  } catch (e) {
-    console.warn('[MODELS] Cleanup check failed:', e.message);
-  }
-}
-async function ensureModelsDownloaded() {
-  if (modelDownloadState.downloading) {
-    while (modelDownloadState.downloading) {
-      await new Promise(r => setTimeout(r, 100));
-    }
-    return modelDownloadState.complete;
-  }
-  modelDownloadState.downloading = true;
-  modelDownloadState.error = null;
-  try {
-    const r = createRequire(import.meta.url);
-    const { createConfig } = r('webtalk/config');
-    const { ensureModel } = r('webtalk/whisper-models');
-    const { ensureTTSModels } = r('webtalk/tts-models');
-    const gmguiModels = path.join(os.homedir(), '.gmgui', 'models');
-    const modelsBase = process.env.PORTABLE_EXE_DIR
-      ? (fs.existsSync(path.join(process.env.PORTABLE_EXE_DIR, 'models', 'onnx-community')) ? path.join(process.env.PORTABLE_EXE_DIR, 'models') : gmguiModels)
-      : gmguiModels;
-    await validateAndCleanupModels(modelsBase);
-    const config = createConfig({
-      modelsDir: modelsBase,
-      ttsModelsDir: path.join(modelsBase, 'tts'),
-    });
-    // Progress callback for broadcasting download progress
-    const onProgress = (progress) => {
-      broadcastModelProgress({
-        ...progress,
-        started: true,
-        done: false,
-        downloading: true
-      });
-    };
-    broadcastModelProgress({ started: true, done: false, downloading: true, type: 'whisper', status: 'starting' });
-    await ensureModel('onnx-community/whisper-base', config, onProgress);
-    broadcastModelProgress({ started: true, done: false, downloading: true, type: 'tts', status: 'starting' });
-    await ensureTTSModels(config, onProgress);
-    modelDownloadState.complete = true;
-    broadcastModelProgress({ started: true, done: true, complete: true, downloading: false });
-    return true;
-  } catch (err) {
-    console.error('[MODELS] Download error:', err.message);
-    modelDownloadState.error = err.message;
-    broadcastModelProgress({ done: true, error: err.message });
-    return false;
-  } finally {
-    modelDownloadState.downloading = false;
-  }
-}
-function eagerTTS(text, conversationId, sessionId) {
-  const key = `${conversationId}:${sessionId}`;
-  let acc = ttsTextAccumulators.get(key);
-  if (!acc) {
-    acc = { text: '', timer: null };
-    ttsTextAccumulators.set(key, acc);
-  }
-  acc.text += text;
-  if (acc.timer) clearTimeout(acc.timer);
-  acc.timer = setTimeout(() => flushTTSaccumulator(key, conversationId, sessionId), 600);
-}
-function flushTTSaccumulator(key, conversationId, sessionId) {
-  const acc = ttsTextAccumulators.get(key);
-  if (!acc || !acc.text) return;
-  const text = acc.text.trim();
-  acc.text = '';
-  ttsTextAccumulators.delete(key);
-  getSpeech().then(speech => {
-    const status = speech.getStatus();
-    if (!status.ttsReady || status.ttsError) return;
-    const voices = new Set();
-    for (const ws of syncClients) {
-      const vid = ws.ttsVoiceId || 'default';
-      const convKey = `conv-${conversationId}`;
-      if (ws.subscriptions && (ws.subscriptions.has(sessionId) || ws.subscriptions.has(convKey))) {
-        voices.add(vid);
-      }
-    }
-    if (voices.size === 0) return;
-    for (const vid of voices) {
-      const cacheKey = speech.ttsCacheKey(text, vid);
-      const cached = speech.ttsCacheGet(cacheKey);
-      if (cached) {
-        pushTTSAudio(cacheKey, cached, conversationId, sessionId, vid);
-        continue;
-      }
-      speech.synthesize(text, vid).then(wav => {
-        if (speech.ttsCacheSet) speech.ttsCacheSet(cacheKey, wav);
-        pushTTSAudio(cacheKey, wav, conversationId, sessionId, vid);
-      }).catch(() => {});
-    }
-  }).catch(() => {});
-}
-function pushTTSAudio(cacheKey, wav, conversationId, sessionId, voiceId) {
-  const b64 = wav.toString('base64');
-  broadcastSync({
-    type: 'tts_audio',
-    cacheKey,
-    audio: b64,
-    voiceId,
-    conversationId,
-    sessionId,
-    timestamp: Date.now()
-  });
-}
 function buildSystemPrompt(agentId, model, subAgent) {
   const parts = [];
@@ -3943,6 +3718,8 @@ function broadcastSync(event) {
 // WebSocket protocol router
 const wsRouter = new WsRouter();
+initSpeechManager({ broadcastSync, syncClients, queries });
 registerConvHandlers(wsRouter, {
   queries, activeExecutions, rateLimitState,
   broadcastSync, processMessageWithStreaming, cleanupExecution,