npm - @agentprojectcontext/apx - Versions diffs - 1.33.1 → 1.35.0 - Mend

@agentprojectcontext/apx 1.33.1 → 1.35.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (208)

package/package.json +1 -1
package/skills/apx/SKILL.md +49 -61
package/src/core/agent/a2a/reply.js +48 -0
package/src/core/agent/build-agent-system.js +136 -59
package/src/core/agent/channels/voice-context.js +98 -0
package/src/core/agent/memory.js +2 -1
package/src/core/agent/prompt-builder.js +178 -124
package/src/core/agent/prompts/channels/code.md +12 -10
package/src/core/agent/prompts/channels/desktop.md +5 -32
package/src/core/agent/prompts/channels/telegram.md +4 -15
package/src/core/agent/prompts/channels/web_code.md +11 -11
package/src/core/agent/prompts/core/agent-base.md +24 -0
package/src/core/agent/prompts/core/project-agent.md +11 -0
package/src/core/agent/prompts/core/super-agent.md +21 -0
package/src/core/agent/prompts/discipline/action.md +10 -0
package/src/core/agent/prompts/discipline/single-segment.md +6 -0
package/src/core/agent/prompts/discipline/two-segment.md +11 -0
package/src/core/agent/prompts/modes/code-build.md +1 -0
package/src/core/agent/prompts/modes/code-plan.md +1 -0
package/src/core/agent/prompts/modes/index.js +28 -0
package/src/core/agent/self-memory.js +43 -1
package/src/core/agent/skills/index-store.js +307 -0
package/src/core/agent/skills/index.js +15 -1
package/src/core/agent/skills/inspector.js +317 -0
package/src/core/agent/skills/loader.js +22 -18
package/src/core/agent/stream/turn-accumulator.js +73 -0
package/src/core/agent/suggestions.js +37 -0
package/src/core/agent/super-agent.js +7 -1
package/src/core/agent/tools/handlers/_git.js +50 -0
package/src/core/agent/tools/handlers/add-project.js +5 -2
package/src/core/agent/tools/handlers/call-runtime.js +3 -2
package/src/core/agent/tools/handlers/git-diff.js +44 -0
package/src/core/agent/tools/handlers/git-log.js +38 -0
package/src/core/agent/tools/handlers/git-show.js +34 -0
package/src/core/agent/tools/handlers/git-status.js +61 -0
package/src/core/agent/tools/handlers/transcribe-audio.js +1 -1
package/src/core/agent/tools/helpers.js +2 -2
package/src/core/agent/tools/names.js +169 -0
package/src/core/agent/tools/registry-bridge.js +6 -14
package/src/core/agent/tools/registry.js +103 -69
package/src/core/apc/context-copy.js +27 -0
package/src/core/apc/notes.js +19 -0
package/src/core/apc/parser.js +12 -5
package/src/core/apc/paths.js +87 -0
package/src/core/apc/scaffold.js +82 -76
package/src/core/apc/skill-sync.js +10 -0
package/src/{host/daemon/plugins → core/channels}/telegram/dispatch.js +38 -16
package/src/core/config/index.js +24 -2
package/src/core/config/redact.js +95 -0
package/src/core/constants/channels.js +2 -0
package/src/core/constants/code-modes.js +10 -0
package/src/core/constants/index.js +1 -0
package/src/core/deck/manifest.js +186 -0
package/src/core/engines/catalog.js +83 -0
package/src/core/{tools → http-tools}/browser.js +0 -1
package/src/core/{tools → http-tools}/fetch.js +0 -1
package/src/core/{tools → http-tools}/glob.js +0 -1
package/src/core/{tools → http-tools}/grep.js +0 -1
package/src/core/{tools → http-tools}/registry.js +0 -1
package/src/core/{tools → http-tools}/search.js +0 -1
package/src/core/i18n/en.js +9 -0
package/src/core/i18n/es.js +12 -0
package/src/core/i18n/index.js +54 -0
package/src/core/i18n/pt.js +9 -0
package/src/core/identity/telegram.js +2 -1
package/src/core/mcp/runner.js +272 -14
package/src/core/mcp/sources.js +3 -2
package/src/core/routines/index.js +16 -0
package/src/{host/daemon/routines.js → core/routines/runner.js} +36 -103
package/src/core/runtime-skills/apc-context/SKILL.md +159 -0
package/src/core/runtime-skills/apx/SKILL.md +83 -0
package/src/core/runtime-skills/apx-agency-agents/SKILL.md +125 -0
package/src/core/runtime-skills/apx-agent/SKILL.md +97 -0
package/src/core/runtime-skills/apx-mcp/SKILL.md +111 -0
package/src/core/runtime-skills/apx-mcp-builder/SKILL.md +169 -0
package/{skills → src/core/runtime-skills}/apx-project/SKILL.md +20 -29
package/src/core/runtime-skills/apx-routine/SKILL.md +127 -0
package/src/core/runtime-skills/apx-runtime/SKILL.md +99 -0
package/src/core/runtime-skills/apx-sessions/SKILL.md +232 -0
package/src/core/runtime-skills/apx-skill-builder/SKILL.md +129 -0
package/{skills → src/core/runtime-skills}/apx-task/SKILL.md +18 -21
package/src/core/runtime-skills/apx-telegram/SKILL.md +120 -0
package/src/core/runtime-skills/apx-voice/SKILL.md +117 -0
package/src/core/runtime-skills/{claude-code.md → claude-code/SKILL.md} +1 -0
package/src/core/runtime-skills/{codex-cli.md → codex-cli/SKILL.md} +1 -0
package/src/core/runtime-skills/{opencode-cli.md → opencode-cli/SKILL.md} +1 -0
package/src/core/runtime-skills/{openrouter.md → openrouter/SKILL.md} +1 -0
package/src/{host/daemon/env-detect.js → core/runtimes/detect.js} +1 -1
package/src/core/stores/code-sessions.js +50 -2
package/src/core/stores/routine-memory.js +1 -1
package/src/core/stores/sessions-search.js +121 -0
package/src/core/stores/sessions.js +38 -0
package/src/core/vars/index.js +14 -0
package/src/core/vars/interpolate.js +86 -0
package/src/core/vars/sources.js +151 -0
package/src/core/voice/audio-decode.js +38 -0
package/src/core/voice/transcription.js +225 -0
package/src/host/daemon/api/admin-config.js +5 -82
package/src/host/daemon/api/agents.js +5 -5
package/src/host/daemon/api/code.js +17 -169
package/src/host/daemon/api/config.js +3 -4
package/src/host/daemon/api/conversations.js +8 -29
package/src/host/daemon/api/deck.js +37 -404
package/src/host/daemon/api/engines.js +1 -80
package/src/host/daemon/api/exec.js +1 -1
package/src/host/daemon/api/mcps.js +32 -0
package/src/host/daemon/api/routines.js +1 -1
package/src/host/daemon/api/runtimes.js +4 -3
package/src/host/daemon/api/sessions-search.js +24 -140
package/src/host/daemon/api/sessions.js +12 -30
package/src/host/daemon/api/shared.js +2 -1
package/src/host/daemon/api/skills.js +140 -6
package/src/host/daemon/api/super-agent.js +56 -1
package/src/host/daemon/api/telegram.js +1 -11
package/src/host/daemon/api/tools.js +6 -6
package/src/host/daemon/api/transcribe.js +2 -2
package/src/host/daemon/api/vars.js +137 -0
package/src/host/daemon/api/voice.js +13 -290
package/src/host/daemon/api.js +2 -0
package/src/host/daemon/db.js +6 -6
package/src/host/daemon/deck-exec.js +148 -0
package/src/host/daemon/index.js +20 -3
package/src/host/daemon/plugins/telegram/index.js +9 -9
package/src/host/daemon/routines-scheduler.js +64 -0
package/src/host/daemon/smoke.js +3 -2
package/src/host/daemon/whisper-server.js +225 -0
package/src/interfaces/cli/branding.js +53 -0
package/src/interfaces/cli/commands/agent.js +3 -2
package/src/interfaces/cli/commands/command.js +2 -3
package/src/interfaces/cli/commands/messages.js +6 -2
package/src/interfaces/cli/commands/pair.js +5 -4
package/src/interfaces/cli/commands/search.js +1 -1
package/src/interfaces/cli/commands/sessions.js +3 -2
package/src/interfaces/cli/commands/skills.js +290 -55
package/src/interfaces/cli/index.js +84 -2
package/src/interfaces/web/dist/assets/index-C0fm31dY.js +618 -0
package/src/interfaces/web/dist/assets/index-C0fm31dY.js.map +1 -0
package/src/interfaces/web/dist/assets/index-UcAqlBO6.css +1 -0
package/src/interfaces/web/dist/index.html +2 -2
package/src/interfaces/web/package-lock.json +182 -182
package/src/interfaces/web/src/components/ModelCombobox.tsx +2 -1
package/src/interfaces/web/src/components/TelegramChannelDialog.tsx +1 -1
package/src/interfaces/web/src/components/chat/AskAnswersCard.tsx +76 -0
package/src/interfaces/web/src/components/chat/MessageBubble.tsx +37 -4
package/src/interfaces/web/src/components/chat/MessageList.tsx +23 -1
package/src/interfaces/web/src/components/chat/ModelPicker.tsx +3 -1
package/src/interfaces/web/src/components/code/CodeArtifactsTab.tsx +4 -4
package/src/interfaces/web/src/components/code/CodeChangesTab.tsx +1 -1
package/src/interfaces/web/src/components/code/CodeFileTree.tsx +3 -2
package/src/interfaces/web/src/components/code/CodeFileViewer.tsx +3 -2
package/src/interfaces/web/src/components/code/CodeTerminal.tsx +3 -2
package/src/interfaces/web/src/components/config/GlobalConfigEditor.tsx +2 -1
package/src/interfaces/web/src/components/deck/WidgetRow.tsx +2 -1
package/src/interfaces/web/src/components/inputs/KeyValueList.tsx +93 -0
package/src/interfaces/web/src/components/inputs/VarTokenInput.tsx +449 -0
package/src/interfaces/web/src/components/settings/DefaultRouterCard.tsx +2 -1
package/src/interfaces/web/src/components/settings/EnginesPanel.tsx +2 -2
package/src/interfaces/web/src/components/settings/MemoryPanel.tsx +73 -4
package/src/interfaces/web/src/components/settings/SkillsInspectorPanel.tsx +222 -0
package/src/interfaces/web/src/components/settings/providers/ProviderCard.tsx +3 -2
package/src/interfaces/web/src/components/settings/providers/ProviderModal.tsx +3 -2
package/src/interfaces/web/src/components/ui/chat-input.tsx +5 -4
package/src/interfaces/web/src/components/ui/sidebar.tsx +3 -2
package/src/interfaces/web/src/components/voice/VoiceProviderModal.tsx +2 -1
package/src/interfaces/web/src/constants/index.ts +1 -1
package/src/interfaces/web/src/hooks/useChat.ts +19 -0
package/src/interfaces/web/src/i18n/en.ts +175 -7
package/src/interfaces/web/src/i18n/es.ts +180 -15
package/src/interfaces/web/src/lib/api/mcps.ts +25 -0
package/src/interfaces/web/src/lib/api/skills.ts +70 -0
package/src/interfaces/web/src/lib/api/vars.ts +38 -0
package/src/interfaces/web/src/lib/api.ts +1 -0
package/src/interfaces/web/src/screens/ProjectScreen.tsx +8 -31
package/src/interfaces/web/src/screens/SettingsScreen.tsx +6 -2
package/src/interfaces/web/src/screens/modules/CodeScreen.tsx +1 -1
package/src/interfaces/web/src/screens/modules/DeckScreen.tsx +4 -3
package/src/interfaces/web/src/screens/modules/DesktopScreen.tsx +7 -6
package/src/interfaces/web/src/screens/modules/VoiceScreen.tsx +4 -3
package/src/interfaces/web/src/screens/project/AgentDetailScreen.tsx +1 -1
package/src/interfaces/web/src/screens/project/ConfigTab.tsx +132 -1
package/src/interfaces/web/src/screens/project/McpsTab.tsx +549 -104
package/src/interfaces/web/src/screens/project/RoutinesTab.tsx +1 -1
package/src/interfaces/web/src/screens/project/VarsTab.tsx +300 -0
package/src/interfaces/web/src/types/daemon.ts +15 -0
package/skills/apx-agency-agents/SKILL.md +0 -141
package/skills/apx-agent/SKILL.md +0 -100
package/skills/apx-mcp-builder/SKILL.md +0 -183
package/skills/apx-routine/SKILL.md +0 -140
package/skills/apx-runtime/SKILL.md +0 -117
package/skills/apx-sessions/SKILL.md +0 -281
package/skills/apx-skill-builder/SKILL.md +0 -153
package/skills/apx-telegram/SKILL.md +0 -131
package/skills/apx-voice/SKILL.md +0 -137
package/src/core/agent/prompts/action-discipline.md +0 -24
package/src/core/agent/prompts/super-agent-base.md +0 -42
package/src/host/daemon/transcription.js +0 -538
package/src/host/daemon/whisper-transcribe.py +0 -73
package/src/interfaces/web/dist/assets/index-Aaiw8BZN.css +0 -1
package/src/interfaces/web/dist/assets/index-DPqtjDjh.js +0 -602
package/src/interfaces/web/dist/assets/index-DPqtjDjh.js.map +0 -1
/package/src/{host/daemon → core/apc}/projects-helpers.js +0 -0
/package/src/{host/daemon/plugins → core/channels}/telegram/ask.js +0 -0
/package/src/{host/daemon/plugins → core/channels}/telegram/helpers.js +0 -0
/package/src/{host/daemon/plugins → core/channels}/telegram/media.js +0 -0
/package/src/core/{tools → http-tools}/index.js +0 -0
/package/src/{host/daemon/compact.js → core/stores/conversations-compactor.js} +0 -0
/package/src/{host/daemon → core/stores}/conversations.js +0 -0
/package/src/{host/daemon → core/util}/thinking.js +0 -0

package/src/host/daemon/transcription.js DELETED

@@ -1,538 +0,0 @@
-// daemon/transcription.js
-// Audio transcription dispatcher. Two backends:
-//
-//   - LOCAL (faster-whisper via persistent Python server) — the server loads
-//     the model once on first use and keeps it in RAM. It auto-shuts down after
-//     idle_minutes (default 10) of inactivity, then restarts lazily on the
-//     next request. Requires `pip3 install faster-whisper` on the host.
-//
-//   - OPENAI (Whisper-1 cloud API) — needs OPENAI_API_KEY or
-//     engines.openai.api_key in config.
-//
-// Provider selection in ~/.apx/config.json:
-//   "transcription": {
-//     "provider": "auto" | "local" | "openai",   // default "auto"
-//     "local": {
-//       "model": "small",           // tiny | base | small | medium | large | large-v2 | large-v3
-//       "device": "cpu",            // cpu | cuda
-//       "compute_type": "int8",     // int8 | int8_float16 | float16 | float32
-//       "language": "auto",         // ISO 639-1 code (e.g. "es") or "auto"
-//       "beam_size": 5,
-//       "idle_minutes": 10          // auto-shutdown after N minutes idle
-//     }
-//   }
-//
-// "auto" tries local first; on failure falls back to openai.
-//
-// Spanish tip: set language: "es" for better accuracy with the small model.
-import fs from "node:fs";
-import path from "node:path";
-import { spawn, exec } from "node:child_process";
-import { fileURLToPath } from "node:url";
-import { logInfo, logWarn, logError } from "#core/logging.js";
-const __filename = fileURLToPath(import.meta.url);
-const __dirname = path.dirname(__filename);
-const WHISPER_SERVER = path.join(__dirname, "whisper-server.py");
-const WHISPER_PORT = 18765;
-const DEFAULT_LOCAL = {
-  model: "small",
-  device: "cpu",
-  compute_type: "int8",
-  language: "auto",
-  beam_size: 5,
-  idle_minutes: 10,
-  // Max time we wait for /transcribe to return. Long audio files (Telegram
-  // voice notes > 10 min) can take several minutes on CPU; the previous
-  // hard-coded 5-minute cap silently truncated them. 20 minutes covers a
-  // ~60-minute voice note on a small int8 model. Override with
-  // transcription.local.timeout_ms in ~/.apx/config.json if needed.
-  timeout_ms: 20 * 60_000,
-};
-// ---------------------------------------------------------------------------
-// Config helpers (pure — exported for tests)
-// ---------------------------------------------------------------------------
-/**
- * Resolve the effective transcription language.
- * Priority: explicit local config → config.user.language → "auto" (whisper detects).
- *
- * @param {object} localCfg   merged transcription.local config
- * @param {string} userLang   config.user.language ISO code (e.g. "es"), or ""
- * @returns {string}          ISO code or "auto"
- */
-export function resolveTranscriptionLanguage(localCfg, userLang) {
-  if (localCfg.language && localCfg.language !== "auto") return localCfg.language;
-  if (userLang) return userLang;
-  return "auto";
-}
-// ---------------------------------------------------------------------------
-// Config
-// ---------------------------------------------------------------------------
-async function getConfig() {
-  try {
-    const { readConfig } = await import("#core/config/index.js");
-    const cfg = readConfig() || {};
-    const t = cfg.transcription || {};
-    const openaiKey = cfg.engines?.openai?.api_key || process.env.OPENAI_API_KEY || "";
-    // Use user.language as default for transcription language if not explicitly set.
-    // Explicit transcription.local.language always wins; "auto" means fall back to user.language.
-    const userLang = cfg.user?.language || "";
-    const localBase = { ...DEFAULT_LOCAL, ...(t.local || {}) };
-    localBase.language = resolveTranscriptionLanguage(localBase, userLang);
-    return {
-      provider: t.provider || "auto",
-      local: localBase,
-      openaiKey,
-    };
-  } catch {
-    return {
-      provider: "auto",
-      local: { ...DEFAULT_LOCAL },
-      openaiKey: process.env.OPENAI_API_KEY || "",
-    };
-  }
-}
-// ---------------------------------------------------------------------------
-// Persistent server management
-// ---------------------------------------------------------------------------
-let _serverProcess = null;
-let _serverModel = null;   // model the running server was started with
-function _sleep(ms) {
-  return new Promise((r) => setTimeout(r, ms));
-}
-async function _isServerHealthy() {
-  try {
-    const res = await fetch(`http://127.0.0.1:${WHISPER_PORT}/health`, {
-      signal: AbortSignal.timeout(800),
-    });
-    return res.ok;
-  } catch {
-    return false;
-  }
-}
-// Check if the running whisper-server is using a specific model.
-// Returns the model name string, or null if not reachable.
-async function _serverModelName() {
-  try {
-    const res = await fetch(`http://127.0.0.1:${WHISPER_PORT}/health`, {
-      signal: AbortSignal.timeout(800),
-    });
-    if (!res.ok) return null;
-    const j = await res.json();
-    return j?.model || null;
-  } catch {
-    return null;
-  }
-}
-async function _waitForServer(maxMs = 15_000) {
-  const deadline = Date.now() + maxMs;
-  while (Date.now() < deadline) {
-    if (await _isServerHealthy()) return;
-    await _sleep(250);
-  }
-  throw new Error(`whisper-server did not start within ${maxMs}ms`);
-}
-// Find the PID of the process LISTENing on the whisper port (server only,
-// not clients). Filtering by -sTCP:LISTEN is critical — without it, lsof
-// also returns clients with an open connection (including this daemon).
-async function _findListenerPid() {
-  return new Promise((resolve) => {
-    exec(`lsof -ti tcp:${WHISPER_PORT} -sTCP:LISTEN`, (err, stdout) => {
-      if (err || !stdout) return resolve(null);
-      const candidates = stdout.trim().split("\n")
-        .map(s => parseInt(s, 10))
-        .filter(n => Number.isFinite(n) && n !== process.pid);
-      resolve(candidates[0] || null);
-    });
-  });
-}
-async function _killOrphanWhisper() {
-  // First try graceful /shutdown on the whisper server.
-  try {
-    await fetch(`http://127.0.0.1:${WHISPER_PORT}/shutdown`, {
-      method: "POST", signal: AbortSignal.timeout(1000),
-    });
-    await _sleep(600);
-  } catch {}
-  // If still bound, force-kill the LISTENER pid only (never our own pid).
-  const pid = await _findListenerPid();
-  if (pid && pid !== process.pid) {
-    try { process.kill(pid, "SIGTERM"); } catch {}
-    await _sleep(400);
-    try { process.kill(pid, 0); try { process.kill(pid, "SIGKILL"); } catch {} } catch {}
-    await _sleep(300);
-  }
-}
-async function ensureWhisperServer(opts) {
-  const model = opts.model || DEFAULT_LOCAL.model;
-  // Already running with the right model — health-check to confirm still alive.
-  if (_serverProcess && _serverModel === model) {
-    if (await _isServerHealthy()) return;
-    _serverProcess = null;
-    _serverModel = null;
-  }
-  // Adopt an externally-running whisper-server (e.g. left over from prior daemon).
-  if (!_serverProcess) {
-    const existing = await _serverModelName();
-    if (existing === model) {
-      _serverModel = model;
-      return;
-    }
-    if (existing) {
-      // Wrong model: kick out the orphan so we can start the right one.
-      await _killOrphanWhisper();
-    }
-  }
-  if (_serverProcess) {
-    try { _serverProcess.kill(); } catch {}
-    _serverProcess = null;
-    _serverModel = null;
-    await _sleep(300);
-  }
-  await _spawnWhisper(opts, model, /* retried */ false);
-}
-async function _spawnWhisper(opts, model, retried) {
-  const args = [
-    WHISPER_SERVER,
-    "--port", String(WHISPER_PORT),
-    "--model", model,
-    "--device", String(opts.device || DEFAULT_LOCAL.device),
-    "--compute-type", String(opts.compute_type || DEFAULT_LOCAL.compute_type),
-    "--idle-minutes", String(opts.idle_minutes ?? DEFAULT_LOCAL.idle_minutes),
-  ];
-  const proc = spawn("python3", args, {
-    stdio: ["ignore", "pipe", "inherit"],
-    detached: false,
-  });
-  _serverProcess = proc;
-  _serverModel = model;
-  proc.on("exit", () => {
-    if (_serverProcess === proc) {
-      _serverProcess = null;
-      _serverModel = null;
-    }
-  });
-  // Wait for the "ready" line on stdout, then wait for HTTP to respond.
-  try {
-    await new Promise((resolve, reject) => {
-      const timeout = setTimeout(
-        () => reject(new Error("whisper-server startup timed out (15s)")),
-        15_000
-      );
-      let buf = "";
-      proc.stdout.on("data", (chunk) => {
-        buf += chunk.toString();
-        const nl = buf.indexOf("\n");
-        if (nl === -1) return;
-        const line = buf.slice(0, nl).trim();
-        buf = buf.slice(nl + 1);
-        clearTimeout(timeout);
-        try {
-          const msg = JSON.parse(line);
-          if (msg.status === "error") return reject(new Error(msg.error || "whisper-server error"));
-          resolve(); // "ready"
-        } catch {
-          resolve(); // unexpected line but server is up
-        }
-      });
-      proc.on("exit", (code) => {
-        clearTimeout(timeout);
-        reject(new Error(`whisper-server exited (code ${code}) before becoming ready`));
-      });
-    });
-  } catch (e) {
-    // Self-heal: if the port was already in use, kill the orphan and retry once.
-    const msg = e.message || "";
-    if (!retried && /address already in use|errno 48|eaddrinuse/i.test(msg)) {
-      _serverProcess = null;
-      _serverModel = null;
-      await _killOrphanWhisper();
-      return _spawnWhisper(opts, model, /* retried */ true);
-    }
-    throw e;
-  }
-}
-// ---------------------------------------------------------------------------
-// Local backend (persistent whisper-server.py via HTTP)
-// ---------------------------------------------------------------------------
-async function transcribeLocal(filePath, opts) {
-  await ensureWhisperServer(opts);
-  const language = (opts.language || DEFAULT_LOCAL.language) === "auto"
-    ? null
-    : (opts.language || null);
-  const timeoutMs = Number(opts.timeout_ms) > 0
-    ? Number(opts.timeout_ms)
-    : DEFAULT_LOCAL.timeout_ms;
-  const body = JSON.stringify({
-    audio_path: filePath,
-    language,
-    beam_size: opts.beam_size || DEFAULT_LOCAL.beam_size,
-  });
-  // Long transcriptions on CPU (small int8, 1-minute voice note) can take
-  // 30-45s. Under undici (Node fetch) we occasionally see "fetch failed"
-  // from the inbound Telegram path even though the whisper-server completes
-  // the request successfully — a keep-alive socket gets reset somewhere
-  // between the long whisper-server response and the daemon's other
-  // concurrent traffic. We retry once on a generic "fetch failed" so the
-  // user actually gets a reply.
-  const maxAttempts = 2;
-  let lastErr = null;
-  for (let attempt = 1; attempt <= maxAttempts; attempt++) {
-    const t0 = Date.now();
-    try {
-      logInfo("whisper", `transcribeLocal attempt ${attempt}/${maxAttempts}`, {
-        file: path.basename(filePath),
-        language: language || "auto",
-        timeout_ms: timeoutMs,
-      });
-      const res = await fetch(`http://127.0.0.1:${WHISPER_PORT}/transcribe`, {
-        method: "POST",
-        headers: { "content-type": "application/json", "connection": "close" },
-        body,
-        signal: AbortSignal.timeout(timeoutMs),
-      });
-      const json = await res.json();
-      if (!json.ok) throw new Error(json.error || "transcription failed");
-      logInfo("whisper", `transcribeLocal ok in ${Date.now() - t0}ms`, {
-        chars: (json.text || "").length,
-        language: json.language,
-        duration: json.duration,
-      });
-      return {
-        ok: true,
-        backend: "local",
-        text: json.text || "",
-        language: json.language || null,
-        language_probability: json.language_probability ?? null,
-        duration: json.duration ?? null,
-        model: json.model,
-        compute_type: json.compute_type,
-      };
-    } catch (e) {
-      lastErr = e;
-      const isRetriable =
-        /fetch failed|ECONNRESET|socket hang up|terminated/i.test(e.message || "");
-      const dt = Date.now() - t0;
-      logWarn("whisper", `transcribeLocal attempt ${attempt} failed in ${dt}ms`, {
-        error: e.message,
-        retriable: isRetriable,
-        will_retry: isRetriable && attempt < maxAttempts,
-      });
-      if (!isRetriable || attempt >= maxAttempts) break;
-      // Brief backoff before retry — gives the whisper-server.py thread time
-      // to flush its pending response and release the model lock.
-      await _sleep(500);
-    }
-  }
-  logError("whisper", `transcribeLocal exhausted retries`, { error: lastErr?.message });
-  throw lastErr || new Error("local transcription failed");
-}
-// ---------------------------------------------------------------------------
-// OpenAI backend (Whisper-1 cloud)
-// ---------------------------------------------------------------------------
-async function transcribeOpenAI(filePath, apiKey) {
-  if (!apiKey) throw new Error("OPENAI_API_KEY not set (env or engines.openai.api_key)");
-  const fileBuf = fs.readFileSync(filePath);
-  const ext = path.extname(filePath).slice(1).toLowerCase() || "ogg";
-  const mimeMap = {
-    oga: "audio/ogg", ogg: "audio/ogg", opus: "audio/ogg",
-    mp3: "audio/mpeg", m4a: "audio/mp4", mp4: "audio/mp4",
-    wav: "audio/wav", webm: "audio/webm",
-  };
-  const blob = new Blob([fileBuf], { type: mimeMap[ext] || "audio/ogg" });
-  const form = new FormData();
-  form.append("file", blob, `audio.${ext}`);
-  form.append("model", "whisper-1");
-  const res = await fetch("https://api.openai.com/v1/audio/transcriptions", {
-    method: "POST",
-    headers: { Authorization: `Bearer ${apiKey}` },
-    body: form,
-  });
-  if (!res.ok) {
-    const err = await res.text().catch(() => "");
-    throw new Error(`Whisper API ${res.status}: ${err.slice(0, 200)}`);
-  }
-  const json = await res.json();
-  return {
-    ok: true,
-    backend: "openai",
-    text: String(json.text || "").trim(),
-    language: null,
-    language_probability: null,
-    duration: null,
-    model: "whisper-1",
-  };
-}
-// ---------------------------------------------------------------------------
-// Public API
-// ---------------------------------------------------------------------------
-/**
- * Transcribe an audio file using the configured backend.
- * Returns { ok, backend, text, language?, language_probability?, duration?, model? }.
- *
- * @param {string} filePath   absolute path to audio file
- * @param {object} overrides  optional: { provider, model, language, idle_minutes, ... }
- */
-export async function transcribe(filePath, overrides = {}) {
-  if (!filePath || !fs.existsSync(filePath)) {
-    throw new Error(`transcribe: file not found: ${filePath}`);
-  }
-  const cfg = await getConfig();
-  const provider = overrides.provider || cfg.provider;
-  const localOpts = { ...cfg.local, ...overrides };
-  if (provider === "openai") {
-    return transcribeOpenAI(filePath, cfg.openaiKey);
-  }
-  if (provider === "local") {
-    // Explicit local-only: bubble up the real error, do not mention OpenAI.
-    return transcribeLocal(filePath, localOpts);
-  }
-  // auto: local first, fall back to openai only if a key is configured
-  try {
-    return await transcribeLocal(filePath, localOpts);
-  } catch (localErr) {
-    if (cfg.openaiKey) {
-      return transcribeOpenAI(filePath, cfg.openaiKey);
-    }
-    // No OpenAI configured — surface the real local error verbatim.
-    throw new Error(`local transcription failed: ${localErr.message}`);
-  }
-}
-/**
- * Transcribe raw audio bytes (e.g. from a mic chunk or Telegram voice blob).
- * Saves to a temp file, transcribes, cleans up.
- *
- * @param {Buffer} buf        raw audio data
- * @param {string} format     file extension hint: "webm" | "ogg" | "wav" | "mp3" (default "webm")
- * @param {object} overrides  same as transcribe() overrides
- */
-export async function transcribeBuffer(buf, format = "webm", overrides = {}) {
-  if (!buf || !buf.length) throw new Error("transcribeBuffer: empty buffer");
-  const ext = format.replace(/^\./, "") || "webm";
-  const tmpFile = path.join(
-    (await import("node:os")).default.tmpdir(),
-    `apx-audio-${Date.now()}-${Math.random().toString(36).slice(2)}.${ext}`
-  );
-  try {
-    fs.writeFileSync(tmpFile, buf);
-    return await transcribe(tmpFile, overrides);
-  } finally {
-    try { fs.unlinkSync(tmpFile); } catch {}
-  }
-}
-// ---------------------------------------------------------------------------
-// Lifecycle (preload on daemon start, shutdown on daemon stop)
-// ---------------------------------------------------------------------------
-/**
- * Eagerly start the whisper server so the first transcription is fast.
- * Safe to call multiple times. Never throws — logs and continues on failure.
- */
-export async function preloadWhisperServer(log = console.log) {
-  try {
-    const cfg = await getConfig();
-    if (cfg.provider === "openai") return; // local backend not used
-    log(`whisper: preloading model "${cfg.local.model}" on port ${WHISPER_PORT}…`);
-    await ensureWhisperServer(cfg.local);
-    log(`whisper: ready on port ${WHISPER_PORT} (model: ${_serverModel})`);
-  } catch (e) {
-    log(`whisper: preload failed — ${e.message} (will retry lazily on first request)`);
-  }
-}
-/**
- * Keep the local whisper server warm. Ensures it's loaded and pings /health,
- * which resets the server's idle watchdog so a live session (e.g. the desktop
- * window held open) never pays the cold-load cost on the next utterance.
- * Cheap and safe to call repeatedly. Never throws.
- * Returns { ok, model?, loaded?, provider } for the caller to surface.
- */
-export async function warmupWhisper() {
-  try {
-    const cfg = await getConfig();
-    if (cfg.provider === "openai") return { ok: true, provider: "openai", loaded: false };
-    await ensureWhisperServer(cfg.local);
-    // /warmup loads the model into RAM (lazy otherwise) AND touches _last_used,
-    // resetting the idle timer. First call may block ~15-30s on a cold model;
-    // instant once warm. Generous timeout so the cold load can finish.
-    let loaded = false;
-    try {
-      const r = await fetch(`http://127.0.0.1:${WHISPER_PORT}/warmup`, {
-        signal: AbortSignal.timeout(40_000),
-      });
-      const j = await r.json().catch(() => ({}));
-      loaded = !!j.loaded;
-    } catch {}
-    return { ok: true, provider: "local", model: _serverModel, loaded };
-  } catch (e) {
-    return { ok: false, error: e.message };
-  }
-}
-/**
- * Stop the whisper server we own (no-op if we adopted an external one).
- */
-export async function shutdownWhisperServer() {
-  if (_serverProcess) {
-    try { _serverProcess.kill(); } catch {}
-    _serverProcess = null;
-    _serverModel = null;
-  } else {
-    // Try graceful shutdown of an adopted server
-    try {
-      await fetch(`http://127.0.0.1:${WHISPER_PORT}/shutdown`, {
-        method: "POST", signal: AbortSignal.timeout(500),
-      });
-    } catch {}
-  }
-}
-// ---------------------------------------------------------------------------
-// Diagnostics
-// ---------------------------------------------------------------------------
-export const TRANSCRIPTION_PATHS = {
-  whisper_server: WHISPER_SERVER,
-  port: WHISPER_PORT,
-};

package/src/host/daemon/whisper-transcribe.py DELETED

@@ -1,73 +0,0 @@
-#!/usr/bin/env python3
-"""
-Local audio transcription via faster-whisper. Mirrors the implementation in
-the Panda project (transcription_service.py): same default model "medium",
-device cpu, compute_type int8, beam_size 5. Lazy singleton model cache.
-Invoked by APX daemon (Node) as a subprocess. Args:
-  whisper-transcribe.py <audio_path> [--model medium] [--language auto] [--device cpu] [--compute-type int8] [--beam-size 5]
-Outputs JSON on stdout:
-  { "ok": true,  "text": "...", "language": "es", "language_probability": 0.98, "duration": 12.4 }
-  { "ok": false, "error": "..." }
-"""
-import argparse
-import json
-import os
-import sys
-def main() -> int:
-    parser = argparse.ArgumentParser()
-    parser.add_argument("audio_path")
-    parser.add_argument("--model", default="medium")
-    parser.add_argument("--language", default="auto")
-    parser.add_argument("--device", default="cpu")
-    parser.add_argument("--compute-type", dest="compute_type", default="int8")
-    parser.add_argument("--beam-size", dest="beam_size", type=int, default=5)
-    args = parser.parse_args()
-    if not os.path.exists(args.audio_path):
-        print(json.dumps({"ok": False, "error": f"file not found: {args.audio_path}"}))
-        return 1
-    try:
-        from faster_whisper import WhisperModel
-    except ImportError as e:
-        print(json.dumps({
-            "ok": False,
-            "error": "faster-whisper not installed. Run: pip3 install faster-whisper",
-            "import_error": str(e),
-        }))
-        return 1
-    try:
-        import multiprocessing
-        threads = os.cpu_count() or 4
-        model = WhisperModel(args.model, device=args.device, compute_type=args.compute_type, cpu_threads=threads)
-    except Exception as e:
-        print(json.dumps({"ok": False, "error": f"failed to load model '{args.model}': {e}"}))
-        return 1
-    language = None if args.language == "auto" else args.language
-    try:
-        segments, info = model.transcribe(args.audio_path, beam_size=args.beam_size, language=language)
-        text = " ".join(seg.text.strip() for seg in segments).strip()
-        print(json.dumps({
-            "ok": True,
-            "text": text,
-            "language": info.language,
-            "language_probability": round(info.language_probability, 4),
-            "duration": round(info.duration, 2),
-            "model": args.model,
-            "compute_type": args.compute_type,
-        }))
-        return 0
-    except Exception as e:
-        print(json.dumps({"ok": False, "error": f"transcription failed: {e}"}))
-        return 1
-if __name__ == "__main__":
-    sys.exit(main())