npm - discoclaw - Versions diffs - 1.3.0 → 2.0.0 - Mend

discoclaw 1.3.0 → 2.0.0

This diff shows the changes between two publicly available versions of the package, as released to one of the supported registries. It is provided for informational purposes only and reflects the package contents as they appear in their respective public registries.

Files changed (56)

package/.env.example +4 -6
package/.env.example.full +13 -32
package/README.md +1 -1
package/dist/cli/dashboard.test.js +0 -4
package/dist/cli/init-wizard.js +4 -8
package/dist/cli/init-wizard.test.js +4 -10
package/dist/config.js +2 -42
package/dist/config.test.js +8 -72
package/dist/dashboard/server.js +1 -5
package/dist/dashboard/server.test.js +3 -6
package/dist/discord/actions.js +112 -6
package/dist/discord/actions.test.js +117 -1
package/dist/discord/help-command.js +1 -1
package/dist/discord/message-coordinator.js +3 -8
package/dist/discord/models-command.js +1 -1
package/dist/discord/reaction-handler.js +2 -2
package/dist/discord/reaction-handler.test.js +55 -0
package/dist/discord/verify-push.js +31 -36
package/dist/discord/verify-push.test.js +34 -6
package/dist/discord/voice-command.js +1 -31
package/dist/discord/voice-command.test.js +21 -259
package/dist/discord/voice-status-command.js +3 -22
package/dist/discord/voice-status-command.test.js +16 -124
package/dist/discord-followup.test.js +133 -0
package/dist/health/config-doctor.js +5 -27
package/dist/health/config-doctor.test.js +1 -4
package/dist/index.js +1 -28
package/dist/runtime-overrides.js +2 -3
package/dist/runtime-overrides.test.js +27 -193
package/dist/tasks/store.js +10 -6
package/dist/tasks/store.test.js +44 -0
package/dist/tasks/task-action-executor.test.js +162 -50
package/dist/tasks/task-action-mutations.js +22 -2
package/dist/tasks/task-action-read-ops.js +7 -1
package/dist/tasks/task-action-runner-types.js +19 -1
package/dist/voice/audio-pipeline.js +145 -298
package/docs/configuration.md +4 -9
package/docs/official-docs.md +6 -9
package/docs/runtime-switching.md +1 -1
package/package.json +1 -1
package/dist/voice/audio-pipeline.test.js +0 -1100
package/dist/voice/stt-deepgram.js +0 -154
package/dist/voice/stt-deepgram.test.js +0 -275
package/dist/voice/stt-factory.js +0 -42
package/dist/voice/stt-factory.test.js +0 -45
package/dist/voice/stt-openai.js +0 -156
package/dist/voice/stt-openai.test.js +0 -281
package/dist/voice/tts-cartesia.js +0 -169
package/dist/voice/tts-cartesia.test.js +0 -228
package/dist/voice/tts-deepgram.js +0 -84
package/dist/voice/tts-deepgram.test.js +0 -220
package/dist/voice/tts-factory.js +0 -52
package/dist/voice/tts-factory.test.js +0 -53
package/dist/voice/tts-openai.js +0 -70
package/dist/voice/tts-openai.test.js +0 -138
package/dist/voice/types.test.js +0 -90

package/.env.example CHANGED Viewed

@@ -90,7 +90,7 @@ DISCORD_GUILD_ID=
 # - PRIMARY_RUNTIME sets the default adapter the instance boots with.
 # - `!models set chat <runtime>` can live-switch the main runtime in memory, but chat runtime swaps do not persist.
 # - Persistent model-role defaults live in data/models.json.
-# - Persistent runtime-only overlays live in data/runtime-overrides.json (`voiceRuntime`, `fastRuntime`, `ttsVoice`).
+# - Persistent runtime-only overlays live in data/runtime-overrides.json (`voiceRuntime`, `fastRuntime`).
 # - `!models reset` writes startup-default model strings back into models.json and clears fast/voice runtime overlays;
 #   it does not rewrite PRIMARY_RUNTIME in .env.
 # Supported runtime-path notes:
@@ -191,11 +191,9 @@ DISCORD_GUILD_ID=
 # Voice — configure via `pnpm setup` or `discoclaw init`
 # ----------------------------------------------------------
 # Run `pnpm setup` or `discoclaw init` to enable voice interactively,
-# or set these vars manually to enable voice chat (STT/TTS via Deepgram).
+# or set these vars manually to enable Gemini Live voice chat.
 #DISCOCLAW_VOICE_ENABLED=0
-# Voice pipeline provider: pipeline (default, Deepgram STT/TTS) or gemini-live
-# (Gemini Live WebSocket — requires GEMINI_API_KEY).
-#DISCOCLAW_VOICE_PIPELINE_PROVIDER=pipeline
+# Gemini Live requires GEMINI_API_KEY.
 # Gemini Live session rotation threshold (ms). The provider proactively reconnects
 # before Gemini's ~15 min session limit to minimize audio gap. Default: 780000 (13 min).
 #DISCOCLAW_GEMINI_SESSION_ROTATION_MS=780000
@@ -206,7 +204,7 @@ DISCORD_GUILD_ID=
 # (the bot creates a "voice-log" text channel and stores its ID in system-scaffold.json).
 # Only set this to override the auto-discovered channel.
 #DISCOCLAW_VOICE_LOG_CHANNEL=
-#DEEPGRAM_API_KEY=
+#GEMINI_API_KEY=
 # Optional voice-only Anthropic runtime for voice responses.
 # `claude-api` is not a valid PRIMARY_RUNTIME and does not persist in models.json.
 # Use `!models set voice claude-api` to persist the voice runtime path in runtime-overrides.json.

package/.env.example.full CHANGED Viewed

@@ -703,32 +703,22 @@ DISCOCLAW_DISCORD_ACTIONS_IMAGEGEN=0
 # IMAGEGEN_GEMINI_API_KEY is set.
 # ----------------------------------------------------------
-# Voice (STT/TTS) — join voice channels, listen and respond
+# Voice — Gemini Live voice chat
 # ----------------------------------------------------------
-# Master switch — enables voice channel interaction (default: off).
-# When enabled, the bot can join Discord voice channels, transcribe speech via STT,
-# and respond with synthesized speech via TTS.
+# Master switch — enables Discord voice interaction (default: off).
+# Gemini Live handles speech recognition, reasoning, and speech synthesis in one session.
 #DISCOCLAW_VOICE_ENABLED=0
 # Enable voice Discord action category (voiceJoin, voiceLeave, voiceStatus, voiceMute, voiceDeafen).
 # Requires DISCOCLAW_VOICE_ENABLED=1 to take effect (default: off).
 #DISCOCLAW_DISCORD_ACTIONS_VOICE=0
 # Auto-join voice channels when a non-bot user joins, and auto-leave when the last
-# non-bot user leaves. Starts/tears down the audio pipeline (STT receiver) automatically.
-# Requires DISCOCLAW_VOICE_ENABLED=1 (default: off).
+# non-bot user leaves. Requires DISCOCLAW_VOICE_ENABLED=1 (default: off).
 #DISCOCLAW_VOICE_AUTO_JOIN=0
-# Speech-to-text provider: deepgram (Deepgram Nova-3 API) or whisper (whisper.cpp local).
-# deepgram requires DEEPGRAM_API_KEY; whisper runs locally with no API key.
-#DISCOCLAW_STT_PROVIDER=deepgram
-# Text-to-speech provider: cartesia | deepgram | kokoro | openai.
-# cartesia requires CARTESIA_API_KEY; deepgram reuses DEEPGRAM_API_KEY;
-# openai requires OPENAI_API_KEY; kokoro runs locally with no API key.
-#DISCOCLAW_TTS_PROVIDER=cartesia
-# Voice audio channel name or ID — the channel the bot joins for voice interaction.
-# Used as the prompt context source (root policy, PA files, channel context, durable memory).
+# Voice text channel name or ID — used for prompt context and voice-triggered actions.
 # The old env var DISCOCLAW_VOICE_TRANSCRIPT_CHANNEL is still accepted as a fallback.
 # Leave unset to skip voice channel context in prompts.
 #DISCOCLAW_VOICE_HOME_CHANNEL=  # e.g. "voice" if using the default scaffold
-# Text channel name or ID for posting voice transcripts (user STT and bot TTS responses).
+# Text channel name or ID for posting voice transcripts.
 # Optional — auto-discovered via bootstrap (the bot creates "voice-log" and stores its ID
 # in system-scaffold.json). Only set this to override the auto-discovered channel.
 # Leave unset to disable transcript mirroring.
@@ -741,20 +731,11 @@ DISCOCLAW_DISCORD_ACTIONS_IMAGEGEN=0
 # Custom system prompt prepended to voice AI invocations. Max 4000 chars.
 # Use this to set a conversational tone, brevity instructions, or persona for voice responses.
 #DISCOCLAW_VOICE_SYSTEM_PROMPT=
-# Anthropic API key for direct Messages API access (bypasses Claude CLI cold-start).
-# When set and voice is enabled, voice invocations use the Anthropic REST adapter
-# instead of the CLI subprocess, eliminating ~2-5s cold-start latency per response.
+# Gemini Live session rotation threshold (ms). The provider proactively reconnects
+# before Gemini's ~15 min session limit to minimize audio gap. Default: 780000 (13 min).
+#DISCOCLAW_GEMINI_SESSION_ROTATION_MS=780000
+# Google Gemini API key. Required when voice is enabled.
+#GEMINI_API_KEY=
+# Anthropic API key for the optional direct Messages API voice runtime.
+# When set, `!models set voice claude-api` can bypass CLI cold-start for voice responses.
 #ANTHROPIC_API_KEY=
-# API key for Deepgram Nova-3 STT. Required when DISCOCLAW_STT_PROVIDER=deepgram.
-#DEEPGRAM_API_KEY=
-# Deepgram STT model for voice transcription (default: nova-3-conversationalai).
-# See https://developers.deepgram.com/docs/models-languages-overview for available models.
-#DEEPGRAM_STT_MODEL=nova-3-conversationalai
-# Deepgram TTS voice for speech synthesis (default: aura-2-asteria-en).
-# See https://developers.deepgram.com/docs/tts-models for available voices.
-#DEEPGRAM_TTS_VOICE=aura-2-asteria-en
-# Deepgram TTS playback speed (range: 0.5–1.5, default: 1.3).
-# Values below 1.0 slow down speech; values above 1.0 speed it up.
-#DEEPGRAM_TTS_SPEED=1.3
-# API key for Cartesia Sonic-3 TTS. Required when DISCOCLAW_TTS_PROVIDER=cartesia.
-#CARTESIA_API_KEY=

package/README.md CHANGED Viewed

@@ -39,7 +39,7 @@ No gateways, no proxies, no web UI. Discord *is* the interface.
 ## Voice — the bot talks back
-Real-time voice with STT (Deepgram), TTS (Cartesia), barge-in, and transcript mirroring. Off by default. [Setup guide →](docs/voice.md)
+Real-time voice with Gemini Live, barge-in, tool calls, and transcript mirroring. Off by default. [Setup guide →](docs/voice.md)
 ## Self-management

package/dist/cli/dashboard.test.js CHANGED Viewed

@@ -591,7 +591,6 @@ describe('runDashboard', () => {
             runtimeOverrides: {
                 fastRuntime: 'openrouter',
                 voiceRuntime: 'anthropic',
-                ttsVoice: 'alloy',
             },
             envDefaults: {
                 ...makeDoctorContext().envDefaults,
@@ -628,7 +627,6 @@ describe('runDashboard', () => {
         expect(saveModelConfigMock).toHaveBeenCalledWith('/repo/data/models.json', {});
         expect(saveOverridesMock).toHaveBeenCalledWith('/repo/data/runtime-overrides.json', {
             voiceRuntime: 'anthropic',
-            ttsVoice: 'alloy',
         });
         expect(frames.some((frame) => frame.includes('Reset fast to default: capable. Cleared fastRuntime override. Changes take effect on next service restart.'))).toBe(true);
     });
@@ -638,7 +636,6 @@ describe('runDashboard', () => {
             runtimeOverrides: {
                 fastRuntime: 'openrouter',
                 voiceRuntime: 'anthropic',
-                ttsVoice: 'alloy',
             },
             envDefaults: {
                 ...makeDoctorContext().envDefaults,
@@ -675,7 +672,6 @@ describe('runDashboard', () => {
         expect(saveModelConfigMock).toHaveBeenCalledWith('/repo/data/models.json', {});
         expect(saveOverridesMock).toHaveBeenCalledWith('/repo/data/runtime-overrides.json', {
             fastRuntime: 'openrouter',
-            ttsVoice: 'alloy',
         });
         expect(frames.some((frame) => frame.includes('Reset voice to default: capable. Cleared voiceRuntime override. Changes take effect on next service restart.'))).toBe(true);
     });

package/dist/cli/init-wizard.js CHANGED Viewed

@@ -88,10 +88,8 @@ export function buildEnvContent(vals, now = new Date()) {
     // Voice
     const voiceKeys = [
         'DISCOCLAW_VOICE_ENABLED',
-        'DEEPGRAM_API_KEY',
+        'GEMINI_API_KEY',
         'DISCOCLAW_DISCORD_ACTIONS_VOICE',
-        'DISCOCLAW_STT_PROVIDER',
-        'DISCOCLAW_TTS_PROVIDER',
     ];
     const hasVoice = voiceKeys.some((k) => vals[k]);
     if (hasVoice) {
@@ -347,14 +345,12 @@ export async function runInitWizard() {
     }
     values.DISCOCLAW_DISCORD_ACTIONS = '1';
     // ── Voice setup ───────────────────────────────────────────────────────────
-    const enableVoice = await ask('\nEnable voice chat? (requires a Deepgram API key — you can skip this and enable later) [y/N] ');
+    const enableVoice = await ask('\nEnable voice chat? (requires a Gemini API key — you can skip this and enable later) [y/N] ');
     if (enableVoice.toLowerCase() === 'y') {
-        const deepgramKey = await askValidated('Deepgram API key: ', (val) => (val ? null : 'Deepgram API key is required'));
+        const geminiKey = await askValidated('Gemini API key: ', (val) => (val ? null : 'Gemini API key is required'));
         values.DISCOCLAW_VOICE_ENABLED = '1';
-        values.DEEPGRAM_API_KEY = deepgramKey;
+        values.GEMINI_API_KEY = geminiKey;
         values.DISCOCLAW_DISCORD_ACTIONS_VOICE = '1';
-        values.DISCOCLAW_STT_PROVIDER = 'deepgram';
-        values.DISCOCLAW_TTS_PROVIDER = 'deepgram';
     }
     // ── Write .env ────────────────────────────────────────────────────────────
     const envContent = buildEnvContent(values);

package/dist/cli/init-wizard.test.js CHANGED Viewed

@@ -155,16 +155,12 @@ describe('init wizard helpers', () => {
             DISCORD_TOKEN: 'a.b.c',
             DISCORD_ALLOW_USER_IDS: '1000000000000000001',
             DISCOCLAW_VOICE_ENABLED: '1',
-            DEEPGRAM_API_KEY: 'dg-key',
+            GEMINI_API_KEY: 'gm-key',
             DISCOCLAW_DISCORD_ACTIONS_VOICE: '1',
-            DISCOCLAW_STT_PROVIDER: 'deepgram',
-            DISCOCLAW_TTS_PROVIDER: 'deepgram',
         }, new Date('2026-02-26T00:00:00.000Z'));
         expect(content).toContain('# VOICE');
         expect(content).toContain('DISCOCLAW_VOICE_ENABLED=1');
-        expect(content).toContain('DEEPGRAM_API_KEY=dg-key');
-        expect(content).toContain('DISCOCLAW_STT_PROVIDER=deepgram');
-        expect(content).toContain('DISCOCLAW_TTS_PROVIDER=deepgram');
+        expect(content).toContain('GEMINI_API_KEY=gm-key');
     });
     it('omits voice section when no voice vars are provided', () => {
         const content = buildEnvContent({
@@ -555,7 +551,7 @@ describe('runInitWizard', () => {
             '5000000000000000001', // DISCORD_GUILD_ID
             '', // provider selection -> default (Claude)
             'y', // enable voice -> yes
-            'dg-test-key', // Deepgram API key
+            'gemini-test-key', // Gemini API key
         ];
         process.chdir(tmpDir);
         vi.mocked(createInterface).mockReturnValue(makeReadline(answers));
@@ -573,9 +569,7 @@ describe('runInitWizard', () => {
         const newEnv = fs.readFileSync(path.join(tmpDir, '.env'), 'utf8');
         expect(newEnv).toContain('# VOICE');
         expect(newEnv).toContain('DISCOCLAW_VOICE_ENABLED=1');
-        expect(newEnv).toContain('DEEPGRAM_API_KEY=dg-test-key');
-        expect(newEnv).toContain('DISCOCLAW_STT_PROVIDER=deepgram');
-        expect(newEnv).toContain('DISCOCLAW_TTS_PROVIDER=deepgram');
+        expect(newEnv).toContain('GEMINI_API_KEY=gemini-test-key');
         expect(newEnv).toContain('DISCOCLAW_DISCORD_ACTIONS_VOICE=1');
     });
 });

package/dist/config.js CHANGED Viewed

@@ -510,9 +510,6 @@ export function parseConfig(env) {
     const anthropicApiKey = parseTrimmedString(env, 'ANTHROPIC_API_KEY');
     const voiceEnabled = parseBoolean(env, 'DISCOCLAW_VOICE_ENABLED', false);
     const voiceAutoJoin = parseBoolean(env, 'DISCOCLAW_VOICE_AUTO_JOIN', false);
-    const voiceSttProvider = parseEnum(env, 'DISCOCLAW_STT_PROVIDER', ['deepgram', 'whisper', 'openai'], 'deepgram');
-    const voiceTtsProvider = parseEnum(env, 'DISCOCLAW_TTS_PROVIDER', ['cartesia', 'deepgram', 'kokoro', 'openai'], 'cartesia');
-    const voicePipelineProvider = parseEnum(env, 'DISCOCLAW_VOICE_PIPELINE_PROVIDER', ['pipeline', 'gemini-live'], 'pipeline');
     const geminiSessionRotationMs = parseNonNegativeInt(env, 'DISCOCLAW_GEMINI_SESSION_ROTATION_MS', 780_000);
     let voiceHomeChannel = parseTrimmedString(env, 'DISCOCLAW_VOICE_HOME_CHANNEL');
     if (!voiceHomeChannel) {
@@ -523,20 +520,6 @@ export function parseConfig(env) {
         }
     }
     const voiceLogChannel = parseTrimmedString(env, 'DISCOCLAW_VOICE_LOG_CHANNEL');
-    const deepgramApiKey = parseTrimmedString(env, 'DEEPGRAM_API_KEY');
-    const deepgramSttModel = parseTrimmedString(env, 'DEEPGRAM_STT_MODEL') ?? 'nova-3-general';
-    const deepgramTtsVoice = parseTrimmedString(env, 'DEEPGRAM_TTS_VOICE') ?? 'aura-2-asteria-en';
-    const deepgramTtsSpeed = (() => {
-        const raw = parseTrimmedString(env, 'DEEPGRAM_TTS_SPEED');
-        if (raw == null)
-            return 1.3;
-        const n = parseFloat(raw);
-        if (!Number.isFinite(n) || n < 0.5 || n > 1.5) {
-            throw new Error(`DEEPGRAM_TTS_SPEED must be a number between 0.5 and 1.5, got "${raw}"`);
-        }
-        return n;
-    })();
-    const cartesiaApiKey = parseTrimmedString(env, 'CARTESIA_API_KEY');
     const voiceModelRaw = parseTrimmedString(env, 'DISCOCLAW_VOICE_MODEL');
     const voiceSystemPrompt = (() => {
         const raw = parseTrimmedString(env, 'DISCOCLAW_VOICE_SYSTEM_PROMPT');
@@ -547,26 +530,11 @@ export function parseConfig(env) {
         }
         return raw;
     })();
-    if (voiceEnabled && voiceSttProvider === 'deepgram' && !deepgramApiKey) {
-        warnings.push('DISCOCLAW_VOICE_ENABLED=1 with STT provider "deepgram" but DEEPGRAM_API_KEY is not set; voice STT will fail at runtime.');
-    }
-    if (voiceEnabled && voiceSttProvider === 'openai' && !openaiApiKey) {
-        warnings.push('DISCOCLAW_VOICE_ENABLED=1 with STT provider "openai" but OPENAI_API_KEY is not set; voice STT will fail at runtime.');
-    }
-    if (voiceEnabled && voiceTtsProvider === 'cartesia' && !cartesiaApiKey) {
-        warnings.push('DISCOCLAW_VOICE_ENABLED=1 with TTS provider "cartesia" but CARTESIA_API_KEY is not set; voice TTS will fail at runtime.');
-    }
-    if (voiceEnabled && voiceTtsProvider === 'deepgram' && !deepgramApiKey) {
-        warnings.push('DISCOCLAW_VOICE_ENABLED=1 with TTS provider "deepgram" but DEEPGRAM_API_KEY is not set; voice TTS will fail at runtime.');
-    }
-    if (voiceEnabled && voiceTtsProvider === 'openai' && !openaiApiKey) {
-        warnings.push('DISCOCLAW_VOICE_ENABLED=1 with TTS provider "openai" but OPENAI_API_KEY is not set; voice TTS will fail at runtime.');
-    }
     if (voiceEnabled && !voiceHomeChannel) {
         warnings.push('DISCOCLAW_VOICE_ENABLED=1 but DISCOCLAW_VOICE_HOME_CHANNEL is not set; voice actions will be disabled (no target channel for action execution).');
     }
-    if (voiceEnabled && voicePipelineProvider === 'gemini-live' && !geminiApiKey) {
-        warnings.push('DISCOCLAW_VOICE_PIPELINE_PROVIDER=gemini-live but GEMINI_API_KEY is not set; voice pipeline will fail at runtime.');
+    if (voiceEnabled && !geminiApiKey) {
+        warnings.push('DISCOCLAW_VOICE_ENABLED=1 but GEMINI_API_KEY is not set; Gemini Live voice will fail at runtime.');
     }
     const coldStorageEnabled = parseBoolean(env, 'DISCOCLAW_COLD_STORAGE_ENABLED', false);
     const coldStorageApiKey = parseTrimmedString(env, 'COLD_STORAGE_API_KEY') ?? openaiApiKey;
@@ -746,17 +714,9 @@ export function parseConfig(env) {
             voiceAutoJoin,
             voiceModel,
             voiceSystemPrompt,
-            voiceSttProvider,
-            voiceTtsProvider,
-            voicePipelineProvider,
             geminiSessionRotationMs,
             voiceHomeChannel,
             voiceLogChannel,
-            deepgramApiKey,
-            deepgramSttModel,
-            deepgramTtsVoice,
-            deepgramTtsSpeed,
-            cartesiaApiKey,
             forgeDrafterRuntime,
             forgeAuditorRuntime,
             openrouterApiKey,

package/dist/config.test.js CHANGED Viewed

@@ -1021,41 +1021,9 @@ describe('parseConfig', () => {
         expect(config.voiceEnabled).toBe(false);
     });
     it('parses DISCOCLAW_VOICE_ENABLED=1 as true', () => {
-        const { config } = parseConfig(env({ DISCOCLAW_VOICE_ENABLED: '1', DEEPGRAM_API_KEY: 'dg-key', CARTESIA_API_KEY: 'ca-key' }));
+        const { config } = parseConfig(env({ DISCOCLAW_VOICE_ENABLED: '1', GEMINI_API_KEY: 'gm-key' }));
         expect(config.voiceEnabled).toBe(true);
     });
-    it('defaults voiceSttProvider to "deepgram"', () => {
-        const { config } = parseConfig(env());
-        expect(config.voiceSttProvider).toBe('deepgram');
-    });
-    it('parses DISCOCLAW_STT_PROVIDER=whisper', () => {
-        const { config } = parseConfig(env({ DISCOCLAW_STT_PROVIDER: 'whisper' }));
-        expect(config.voiceSttProvider).toBe('whisper');
-    });
-    it('parses STT provider case-insensitively', () => {
-        const { config } = parseConfig(env({ DISCOCLAW_STT_PROVIDER: 'Deepgram' }));
-        expect(config.voiceSttProvider).toBe('deepgram');
-    });
-    it('throws on invalid STT provider', () => {
-        expect(() => parseConfig(env({ DISCOCLAW_STT_PROVIDER: 'invalid' })))
-            .toThrow(/DISCOCLAW_STT_PROVIDER must be one of deepgram\|whisper/);
-    });
-    it('defaults voiceTtsProvider to "cartesia"', () => {
-        const { config } = parseConfig(env());
-        expect(config.voiceTtsProvider).toBe('cartesia');
-    });
-    it('parses DISCOCLAW_TTS_PROVIDER=kokoro', () => {
-        const { config } = parseConfig(env({ DISCOCLAW_TTS_PROVIDER: 'kokoro' }));
-        expect(config.voiceTtsProvider).toBe('kokoro');
-    });
-    it('parses TTS provider case-insensitively', () => {
-        const { config } = parseConfig(env({ DISCOCLAW_TTS_PROVIDER: 'Cartesia' }));
-        expect(config.voiceTtsProvider).toBe('cartesia');
-    });
-    it('throws on invalid TTS provider', () => {
-        expect(() => parseConfig(env({ DISCOCLAW_TTS_PROVIDER: 'elevenlabs' })))
-            .toThrow(/DISCOCLAW_TTS_PROVIDER must be one of cartesia\|deepgram\|kokoro\|openai/);
-    });
     it('parses DISCOCLAW_VOICE_HOME_CHANNEL when set', () => {
         const { config } = parseConfig(env({ DISCOCLAW_VOICE_HOME_CHANNEL: 'voice-log' }));
         expect(config.voiceHomeChannel).toBe('voice-log');
@@ -1085,33 +1053,13 @@ describe('parseConfig', () => {
         const { config } = parseConfig(env());
         expect(config.voiceLogChannel).toBeUndefined();
     });
-    it('parses DEEPGRAM_API_KEY when set', () => {
-        const { config } = parseConfig(env({ DEEPGRAM_API_KEY: 'dg-key' }));
-        expect(config.deepgramApiKey).toBe('dg-key');
+    it('warns when voice enabled but GEMINI_API_KEY is missing', () => {
+        const { warnings } = parseConfig(env({ DISCOCLAW_VOICE_ENABLED: '1' }));
+        expect(warnings.some((w) => w.includes('GEMINI_API_KEY'))).toBe(true);
     });
-    it('returns undefined for deepgramApiKey when unset', () => {
-        const { config } = parseConfig(env());
-        expect(config.deepgramApiKey).toBeUndefined();
-    });
-    it('parses CARTESIA_API_KEY when set', () => {
-        const { config } = parseConfig(env({ CARTESIA_API_KEY: 'ca-key' }));
-        expect(config.cartesiaApiKey).toBe('ca-key');
-    });
-    it('returns undefined for cartesiaApiKey when unset', () => {
-        const { config } = parseConfig(env());
-        expect(config.cartesiaApiKey).toBeUndefined();
-    });
-    it('warns when voice enabled with deepgram STT but DEEPGRAM_API_KEY missing', () => {
-        const { warnings } = parseConfig(env({ DISCOCLAW_VOICE_ENABLED: '1', CARTESIA_API_KEY: 'ca-key' }));
-        expect(warnings.some((w) => w.includes('DEEPGRAM_API_KEY'))).toBe(true);
-    });
-    it('does not warn about DEEPGRAM_API_KEY when voice disabled', () => {
+    it('does not warn about GEMINI_API_KEY when voice disabled', () => {
         const { warnings } = parseConfig(env({ DISCOCLAW_VOICE_ENABLED: '0' }));
-        expect(warnings.some((w) => w.includes('DEEPGRAM_API_KEY'))).toBe(false);
-    });
-    it('does not warn about DEEPGRAM_API_KEY when STT provider is whisper', () => {
-        const { warnings } = parseConfig(env({ DISCOCLAW_VOICE_ENABLED: '1', DISCOCLAW_STT_PROVIDER: 'whisper', CARTESIA_API_KEY: 'ca-key' }));
-        expect(warnings.some((w) => w.includes('DEEPGRAM_API_KEY'))).toBe(false);
+        expect(warnings.some((w) => w.includes('GEMINI_API_KEY'))).toBe(false);
     });
     // --- voiceAutoJoin ---
     it('defaults voiceAutoJoin to false', () => {
@@ -1130,24 +1078,12 @@ describe('parseConfig', () => {
         const { config } = parseConfig(env({ DISCOCLAW_VOICE_AUTO_JOIN: '0' }));
         expect(config.voiceAutoJoin).toBe(false);
     });
-    it('warns when voice enabled with cartesia TTS but CARTESIA_API_KEY missing', () => {
-        const { warnings } = parseConfig(env({ DISCOCLAW_VOICE_ENABLED: '1', DEEPGRAM_API_KEY: 'dg-key' }));
-        expect(warnings.some((w) => w.includes('CARTESIA_API_KEY'))).toBe(true);
-    });
-    it('does not warn about CARTESIA_API_KEY when voice disabled', () => {
-        const { warnings } = parseConfig(env({ DISCOCLAW_VOICE_ENABLED: '0' }));
-        expect(warnings.some((w) => w.includes('CARTESIA_API_KEY'))).toBe(false);
-    });
-    it('does not warn about CARTESIA_API_KEY when TTS provider is kokoro', () => {
-        const { warnings } = parseConfig(env({ DISCOCLAW_VOICE_ENABLED: '1', DISCOCLAW_TTS_PROVIDER: 'kokoro', DEEPGRAM_API_KEY: 'dg-key' }));
-        expect(warnings.some((w) => w.includes('CARTESIA_API_KEY'))).toBe(false);
-    });
     it('warns when voice enabled but DISCOCLAW_VOICE_HOME_CHANNEL is unset', () => {
-        const { warnings } = parseConfig(env({ DISCOCLAW_VOICE_ENABLED: '1', DEEPGRAM_API_KEY: 'dg-key', CARTESIA_API_KEY: 'ca-key' }));
+        const { warnings } = parseConfig(env({ DISCOCLAW_VOICE_ENABLED: '1', GEMINI_API_KEY: 'gm-key' }));
         expect(warnings.some((w) => w.includes('DISCOCLAW_VOICE_HOME_CHANNEL'))).toBe(true);
     });
     it('does not warn about DISCOCLAW_VOICE_HOME_CHANNEL when both voice and home channel are set', () => {
-        const { warnings } = parseConfig(env({ DISCOCLAW_VOICE_ENABLED: '1', DISCOCLAW_VOICE_HOME_CHANNEL: '1000000000000000003', DEEPGRAM_API_KEY: 'dg-key', CARTESIA_API_KEY: 'ca-key' }));
+        const { warnings } = parseConfig(env({ DISCOCLAW_VOICE_ENABLED: '1', DISCOCLAW_VOICE_HOME_CHANNEL: '1000000000000000003', GEMINI_API_KEY: 'gm-key' }));
         expect(warnings.some((w) => w.includes('DISCOCLAW_VOICE_HOME_CHANNEL'))).toBe(false);
     });
     // --- cold storage ---

package/dist/dashboard/server.js CHANGED Viewed

@@ -361,11 +361,7 @@ async function applyPreset(preset, inspectOpts, deps) {
     const ctx = await deps.loadDoctorContext(inspectOpts);
     const primaryRuntime = presetToPrimaryRuntime(preset);
     await deps.updateEnvKey(ctx.configPaths.env, 'PRIMARY_RUNTIME', primaryRuntime);
-    const preservedOverrides = {};
-    if (ctx.runtimeOverrides.ttsVoice) {
-        preservedOverrides.ttsVoice = ctx.runtimeOverrides.ttsVoice;
-    }
-    await deps.saveOverrides(ctx.configPaths.runtimeOverrides, preservedOverrides);
+    await deps.saveOverrides(ctx.configPaths.runtimeOverrides, {});
     await deps.saveModelConfig(ctx.configPaths.models, { ...MODEL_DEFAULTS });
     return {
         message: `Preset switched to ${preset}. Models reset to tier defaults. Restart the service to apply.`,

package/dist/dashboard/server.test.js CHANGED Viewed

@@ -762,7 +762,6 @@ describe('startDashboardServer', () => {
         const ctx = makeDoctorContext({
             runtimeOverrides: {
                 fastRuntime: 'openrouter',
-                ttsVoice: 'alloy',
             },
             runtimeOverridesFile: {
                 exists: true,
@@ -770,7 +769,6 @@ describe('startDashboardServer', () => {
                 raw: {},
                 values: {
                     fastRuntime: 'openrouter',
-                    ttsVoice: 'alloy',
                 },
             },
         });
@@ -802,7 +800,7 @@ describe('startDashboardServer', () => {
         expect(body.message).toContain('codex');
         expect(body.message).toContain('tier defaults');
         expect(updateEnvKeyMock).toHaveBeenCalledWith('/repo/.env', 'PRIMARY_RUNTIME', 'codex-cli');
-        expect(saveOverridesMock).toHaveBeenCalledWith('/repo/data/runtime-overrides.json', { ttsVoice: 'alloy' });
+        expect(saveOverridesMock).toHaveBeenCalledWith('/repo/data/runtime-overrides.json', {});
         expect(saveModelConfigMock).toHaveBeenCalledWith('/repo/data/models.json', expect.objectContaining({}));
         expect(body.snapshot).toBeDefined();
         expect(body.snapshot.primaryRuntime).toBe('codex');
@@ -829,12 +827,11 @@ describe('startDashboardServer', () => {
         expect(body.message).toContain('claude');
         expect(updateEnvKeyMock).toHaveBeenCalledWith('/repo/.env', 'PRIMARY_RUNTIME', 'claude-cli');
     });
-    it('preserves ttsVoice when clearing overrides via /api/preset', async () => {
+    it('clears legacy voice overrides when applying /api/preset', async () => {
         const ctx = makeDoctorContext({
             runtimeOverrides: {
                 fastRuntime: 'openrouter',
                 voiceRuntime: 'anthropic',
-                ttsVoice: 'shimmer',
             },
         });
         const saveOverridesMock = vi.fn(async () => undefined);
@@ -848,7 +845,7 @@ describe('startDashboardServer', () => {
             method: 'POST',
             body: JSON.stringify({ preset: 'codex' }),
         });
-        expect(saveOverridesMock).toHaveBeenCalledWith('/repo/data/runtime-overrides.json', { ttsVoice: 'shimmer' });
+        expect(saveOverridesMock).toHaveBeenCalledWith('/repo/data/runtime-overrides.json', {});
     });
     it('rejects GET requests on /api/model', async () => {
         const { port } = await startServer();

package/dist/discord/actions.js CHANGED Viewed

@@ -534,21 +534,127 @@ export function buildAllResultLines(results) {
     return results.map((r) => r.ok ? `Done: ${r.summary}` : `Failed: ${r.error}`);
 }
 /**
- * Cap a single result line to approximately `maxChars` characters.
+ * Cap a single result line to `maxChars` characters.
  * If truncated, appends a visible `...[truncated]` suffix.
  */
 export function capResultLine(line, maxChars = 1500) {
     if (line.length <= maxChars)
         return line;
-    return `${line.slice(0, maxChars)}...[truncated]`;
+    const suffix = '...[truncated]';
+    if (maxChars <= suffix.length)
+        return suffix.slice(0, maxChars);
+    return `${line.slice(0, maxChars - suffix.length)}${suffix}`;
+}
+const RESULT_LINE_PREFIX_RE = /^(Done|Failed):\s*/; // leading "Done:" / "Failed:" tag plus any whitespace after it
+const RESULT_LINE_IMPORTANT_FIELD_RE = /^(Status|Thread|Model|Next run|Last error|State):\s/i; // line starts with one of these named fields (case-insensitive)
+const RESULT_LINE_GENERIC_FIELD_RE = /^[A-Z][A-Za-z0-9 /_-]{1,24}:\s/; // line starts with a short capitalized "Label: " (2-25 chars before the colon)
+const RESULT_LINE_SECTION_HEADER_RE = /^\*\*[^*\n]+:\*\*$/; // whole line is a bold header of the form **Title:**
+const RESULT_LINE_ERROR_RE = /\b(error|failed|failure|missing|invalid|denied|not found|cannot|unable|exception|timeout|timed out)\b/i; // line mentions an error/failure keyword
+const RESULT_LINE_PATH_RE = /(?:^|[\s(])(?:\/[^\s)`]+|\.{1,2}\/[^\s)`]+|[A-Za-z]:\\\S+)/; // line contains something path-like: /abs, ./rel, ../rel, or a drive-letter path
+const RESULT_LINE_ID_RE = /\b(?:id[:=][^\s,)]+|[a-z]+-\d+\b|\d{8,})/i; // line contains "id:"/"id=" plus a value, a letters-hyphen-digits token, or a run of 8+ digits
+const RESULT_LINE_NEXT_ACTION_RE = /\b(?:retry|rerun|re-run|resume|check|open|use)\b/i; // line contains one of these follow-up verbs
+const RESULT_LINE_MICROCOMPACT_TRIGGER_LINES = 6; // microcompactResultLine compacts when the body has more non-blank lines than this
+const RESULT_LINE_MICROCOMPACT_TRIGGER_CHARS = 500; // ...or when the body is longer than min(maxChars, this)
+const RESULT_LINE_MAX_RETAINED_LINES = 8; // bodies with at most this many lines are kept whole; also passed as the selection cap
+const RESULT_LINE_ID_REPRESENTATIVE_COUNT = 4; // how many ID-bearing lines are sampled (head and tail) during selection
+const RESULT_LINE_REMAINDER_REPRESENTATIVE_COUNT = 2; // how many lines that are not generic fields, headers, or ID-bearing are sampled during selection
+/**
+ * Separate a leading `Done:` / `Failed:` tag from the rest of a result line.
+ *
+ * @param {string} line - Result line to split.
+ * @returns {{prefix: string, body: string}} `prefix` is the text matched by
+ *   RESULT_LINE_PREFIX_RE (tag plus trailing whitespace) or '' when the line
+ *   carries no tag; `body` is everything after the prefix.
+ */
+function splitResultLine(line) {
+    // A successful match is never empty, so '' doubles as the "no tag" marker.
+    const prefix = RESULT_LINE_PREFIX_RE.exec(line)?.[0] ?? '';
+    return { prefix, body: line.slice(prefix.length) };
+}
+/**
+ * Break a result body into its non-blank lines and classify each one.
+ *
+ * @param {string} body - Result text with the `Done:` / `Failed:` tag removed.
+ * @returns {Array<object>} One record per non-blank line, in order. `index`
+ *   is the line's position among the kept (non-blank) lines, `text` is the
+ *   line with trailing whitespace removed, and the boolean flags report which
+ *   RESULT_LINE_* patterns the text matches.
+ */
+function parseResultLineBody(body) {
+    const records = [];
+    for (const rawLine of body.split(/\r?\n/)) {
+        const text = rawLine.trimEnd();
+        // Blank and whitespace-only lines are dropped before indexes are assigned.
+        if (text.trim().length === 0)
+            continue;
+        records.push({
+            index: records.length,
+            text,
+            isImportantField: RESULT_LINE_IMPORTANT_FIELD_RE.test(text),
+            isGenericField: RESULT_LINE_GENERIC_FIELD_RE.test(text),
+            isSectionHeader: RESULT_LINE_SECTION_HEADER_RE.test(text),
+            hasErrorText: RESULT_LINE_ERROR_RE.test(text),
+            hasPath: RESULT_LINE_PATH_RE.test(text),
+            hasId: RESULT_LINE_ID_RE.test(text),
+            hasNextAction: RESULT_LINE_NEXT_ACTION_RE.test(text),
+        });
+    }
+    return records;
+}
+/**
+ * Pick at most `count` entries from `indexes`, taken from the head and the
+ * tail (the head gets the extra entry when `count` is odd).
+ *
+ * @param {number[]} indexes - Candidate indexes in ascending order.
+ * @param {number} count - Maximum number of entries to return.
+ * @returns {number[]} `indexes` itself when it already fits within `count`;
+ *   otherwise a new array with the first ceil(count / 2) and the last
+ *   floor(count / 2) entries.
+ */
+function takeRepresentativeIndexes(indexes, count) {
+    if (indexes.length <= count)
+        return indexes;
+    if (count <= 0)
+        return [];
+    const headCount = Math.ceil(count / 2);
+    const tailCount = count - headCount;
+    // slice(-0) is slice(0) and would return the whole array, so an empty
+    // tail has to be handled explicitly (this happens when count === 1).
+    const tail = tailCount > 0 ? indexes.slice(-tailCount) : [];
+    return [...indexes.slice(0, headCount), ...tail];
+}
+/**
+ * Append entries of `indexes` to `target` in order, skipping values already
+ * present, and never growing `target` beyond `maxCount` entries.
+ *
+ * @param {number[]} target - Array to extend; mutated in place.
+ * @param {number[]} indexes - Candidate values, in priority order.
+ * @param {number} maxCount - Upper bound on `target.length`.
+ * @returns {void}
+ */
+function appendUniqueIndexes(target, indexes, maxCount) {
+    for (const index of indexes) {
+        // Check the cap before pushing so a target that is already full
+        // (or a non-positive cap) does not gain an extra entry.
+        if (target.length >= maxCount)
+            return;
+        if (target.includes(index))
+            continue;
+        target.push(index);
+    }
+}
+/**
+ * Collect the `index` of every line that directly follows a section header.
+ *
+ * @param {Array<{index: number, isSectionHeader: boolean}>} lines - Parsed
+ *   body lines in order.
+ * @returns {number[]} Indexes of the lines immediately after each header; a
+ *   header in the last position contributes nothing.
+ */
+function collectSectionValueIndexes(lines) {
+    return lines
+        .slice(1)
+        // `position` in the sliced array is the predecessor's position in `lines`.
+        .filter((_follower, position) => lines[position]?.isSectionHeader)
+        .map((follower) => follower.index);
+}
+/**
+ * Format the marker line that reports how many body lines were dropped.
+ *
+ * @param {number} omittedCount - Number of omitted lines.
+ * @returns {string} `...[omitted N line]` when N is 1, otherwise
+ *   `...[omitted N lines]`.
+ */
+function buildResultLineOmissionMarker(omittedCount) {
+    const noun = omittedCount === 1 ? 'line' : 'lines';
+    return `...[omitted ${omittedCount} ${noun}]`;
+}
+/**
+ * Choose which parsed body lines to keep when a result is compacted.
+ *
+ * Bodies with at most RESULT_LINE_MAX_RETAINED_LINES lines are kept whole.
+ * Otherwise candidates are offered to appendUniqueIndexes in priority order,
+ * with RESULT_LINE_MAX_RETAINED_LINES passed as the cap: first line,
+ * important fields, error/path/next-action lines, section headers, the line
+ * after each header, a sample of ID-bearing lines, the last line, and a
+ * sample of lines that are not generic fields, headers, or ID-bearing.
+ *
+ * @param {Array<object>} lines - Records produced by parseResultLineBody.
+ * @returns {number[]} Selected line indexes in ascending order.
+ */
+function selectInformativeResultBodyIndexes(lines) {
+    const toIndex = (line) => line.index;
+    const totalLines = lines.length;
+    if (totalLines <= RESULT_LINE_MAX_RETAINED_LINES)
+        return lines.map(toIndex);
+    const limit = Math.min(RESULT_LINE_MAX_RETAINED_LINES, totalLines);
+    const pick = (predicate) => lines.filter(predicate).map(toIndex);
+    // Order matters: earlier groups claim slots before later ones.
+    const candidateGroups = [
+        [0],
+        pick((line) => line.isImportantField),
+        pick((line) => line.hasErrorText || line.hasPath || line.hasNextAction),
+        pick((line) => line.isSectionHeader),
+        collectSectionValueIndexes(lines),
+        takeRepresentativeIndexes(pick((line) => line.hasId), RESULT_LINE_ID_REPRESENTATIVE_COUNT),
+        [totalLines - 1],
+        takeRepresentativeIndexes(pick((line) => !line.isGenericField && !line.isSectionHeader && !line.hasId), RESULT_LINE_REMAINDER_REPRESENTATIVE_COUNT),
+    ];
+    const chosen = [];
+    for (const group of candidateGroups) {
+        appendUniqueIndexes(chosen, group, limit);
+    }
+    return chosen.sort((a, b) => a - b);
+}
+/**
+ * Shrink a multi-line result to its most informative lines, then apply the
+ * hard character cap.
+ *
+ * The line is only hard-capped (no compaction) when its body has at most one
+ * non-blank line, when neither the line-count nor the character trigger is
+ * exceeded, or when selection would keep every line anyway. Otherwise the
+ * retained lines are followed by an `...[omitted N lines]` marker before the
+ * cap is applied.
+ *
+ * @param {string} line - Full result line, optionally tagged `Done:` / `Failed:`.
+ * @param {number} maxChars - Hard character cap handed to capResultLine.
+ * @returns {string} The compacted and/or capped line.
+ */
+function microcompactResultLine(line, maxChars) {
+    const hardCapOnly = () => capResultLine(line, maxChars);
+    const { prefix, body } = splitResultLine(line);
+    const entries = parseResultLineBody(body);
+    const lineCount = entries.length;
+    if (lineCount <= 1)
+        return hardCapOnly();
+    const charTrigger = Math.min(maxChars, RESULT_LINE_MICROCOMPACT_TRIGGER_CHARS);
+    const exceedsTrigger = lineCount > RESULT_LINE_MICROCOMPACT_TRIGGER_LINES
+        || body.length > charTrigger;
+    if (!exceedsTrigger)
+        return hardCapOnly();
+    const keptIndexes = selectInformativeResultBodyIndexes(entries);
+    if (keptIndexes.length >= lineCount)
+        return hardCapOnly();
+    const keptLookup = new Set(keptIndexes);
+    const keptTexts = [];
+    for (const entry of entries) {
+        if (keptLookup.has(entry.index))
+            keptTexts.push(entry.text);
+    }
+    const marker = buildResultLineOmissionMarker(lineCount - keptTexts.length);
+    return capResultLine(`${prefix}${keptTexts.join('\n')}\n${marker}`, maxChars);
 }
 /**
- * Build result lines for follow-up prompts with per-line length capping.
- * Each line is capped at `maxChars` characters to prevent oversized payloads
- * from crowding out reasoning and action blocks in follow-up prompts.
+ * Build result lines for follow-up prompts with microcompaction before
+ * the final hard cap so oversized payloads preserve continuation-critical
+ * details without crowding out reasoning and action blocks.
  */
 export function buildCappedResultLines(results, maxChars = 1500) {
-    return buildAllResultLines(results).map((line) => capResultLine(line, maxChars));
+    return buildAllResultLines(results).map((line) => microcompactResultLine(line, maxChars));
 }
 /**
  * Append display result lines to body text, automatically closing any