npm - crawd - Versions diffs - 0.8.7 → 0.9.0 - Mend

crawd 0.8.7 → 0.9.0

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (11)

package/dist/types.d.ts +5 -23
package/openclaw.plugin.json +8 -40
package/package.json +4 -2
package/skills/crawd/SKILL.md +37 -0
package/src/backend/coordinator.test.ts +393 -0
package/src/backend/coordinator.ts +267 -16
package/src/backend/index.ts +29 -208
package/src/backend/server.ts +67 -219
package/src/plugin.ts +122 -33
package/src/types.ts +4 -23
package/src/lib/tts/tiktok.ts +0 -91

package/src/backend/index.ts CHANGED Viewed

@@ -1,31 +1,28 @@
 import 'dotenv/config';
 import { randomUUID } from "crypto";
-import { writeFile, mkdir } from "fs/promises";
 import { watch } from "fs";
-import { join } from "path";
 import Fastify from "fastify";
-import fastifyStatic from "@fastify/static";
 import cors from "@fastify/cors";
 import { Server } from "socket.io";
-import OpenAI from "openai";
 import { pumpfun } from "../lib/pumpfun/v2";
 import { ChatManager } from "../lib/chat/manager";
 import { PumpFunChatClient } from "../lib/chat/pumpfun/client";
 import { YouTubeChatClient } from "../lib/chat/youtube/client";
 import { GatewayClient, Coordinator, type CoordinatorConfig, type CoordinatorEvent, type InvokeRequestPayload } from "./coordinator";
 import { generateShortId } from "../lib/chat/types";
-import { configureTikTokTTS, generateTikTokTTS } from "../lib/tts/tiktok";
 import type { ChatMessage } from "../lib/chat/types";
-import { loadEnv, loadConfig } from "../config/store.js";
+import { loadEnv } from "../config/store.js";
 import { ENV_PATH, CONFIG_PATH } from "../utils/paths.js";
-import type { TtsProvider, ReplyTurnEvent, TalkEvent } from "../types";
 // Parse coordinator config from env vars
 function parseCoordinatorConfig(): Partial<CoordinatorConfig> {
   const config: Partial<CoordinatorConfig> = {};
-  if (process.env.VIBE_ENABLED !== undefined) {
-    config.vibeEnabled = process.env.VIBE_ENABLED === 'true';
+  if (process.env.AUTONOMY_MODE) {
+    const mode = process.env.AUTONOMY_MODE
+    if (mode === 'vibe' || mode === 'plan' || mode === 'none') {
+      config.autonomyMode = mode
+    }
   }
   if (process.env.VIBE_INTERVAL_MS) {
     config.vibeIntervalMs = Number(process.env.VIBE_INTERVAL_MS);
@@ -44,44 +41,18 @@ function parseCoordinatorConfig(): Partial<CoordinatorConfig> {
 }
 const port = Number(process.env.PORT || 4000);
-const BACKEND_URL = process.env.BACKEND_URL || `http://localhost:${port}`;
 const TOKEN_MINT = process.env.NEXT_PUBLIC_TOKEN_MINT;
 const MCAP_POLL_MS = 10_000;
-const TTS_DIR = join(process.cwd(), "tmp", "tts");
-// TTS provider selection — mutable, updated by file watcher
-let CHAT_PROVIDER = (process.env.TTS_CHAT_PROVIDER || 'tiktok') as TtsProvider;
-let CHAT_VOICE = process.env.TTS_CHAT_VOICE;
-let BOT_PROVIDER = (process.env.TTS_BOT_PROVIDER || 'elevenlabs') as TtsProvider;
-let BOT_VOICE = process.env.TTS_BOT_VOICE;
 // Unique version ID generated at startup - changes on each deploy/restart
 const BUILD_VERSION = randomUUID();
 const fastify = Fastify({ logger: true });
-const openai = new OpenAI();
-// Dynamic import for optional ElevenLabs dependency
-let elevenlabs: any = null;
-if (process.env.ELEVENLABS_API_KEY) {
-  try {
-    const { ElevenLabsClient } = await import("@elevenlabs/elevenlabs-js");
-    elevenlabs = new ElevenLabsClient({ apiKey: process.env.ELEVENLABS_API_KEY });
-  } catch {
-    fastify.log.warn("@elevenlabs/elevenlabs-js not installed, ElevenLabs TTS disabled");
-  }
-}
-// Configure TikTok TTS if session ID is available
-if (process.env.TIKTOK_SESSION_ID) {
-  configureTikTokTTS(process.env.TIKTOK_SESSION_ID);
-}
 // --- Auto-reload ~/.crawd/.env and config.json on change ---
 async function reloadConfig() {
   const env = loadEnv();
-  const config = loadConfig();
   const changes: string[] = [];
   // Update secrets in process.env
@@ -92,30 +63,6 @@ async function reloadConfig() {
     }
   }
-  // Update TTS provider/voice from config
-  const newChatProvider = (config.tts.chatProvider || 'tiktok') as TtsProvider;
-  const newChatVoice = config.tts.chatVoice;
-  const newBotProvider = (config.tts.botProvider || 'elevenlabs') as TtsProvider;
-  const newBotVoice = config.tts.botVoice;
-  if (newChatProvider !== CHAT_PROVIDER) { changes.push('tts.chatProvider'); CHAT_PROVIDER = newChatProvider; }
-  if (newChatVoice !== CHAT_VOICE) { changes.push('tts.chatVoice'); CHAT_VOICE = newChatVoice; }
-  if (newBotProvider !== BOT_PROVIDER) { changes.push('tts.botProvider'); BOT_PROVIDER = newBotProvider; }
-  if (newBotVoice !== BOT_VOICE) { changes.push('tts.botVoice'); BOT_VOICE = newBotVoice; }
-  // Reinitialize ElevenLabs client if key changed
-  if (changes.includes('ELEVENLABS_API_KEY') && process.env.ELEVENLABS_API_KEY) {
-    try {
-      const { ElevenLabsClient } = await import("@elevenlabs/elevenlabs-js");
-      elevenlabs = new ElevenLabsClient({ apiKey: process.env.ELEVENLABS_API_KEY });
-    } catch { /* already warned at startup */ }
-  }
-  // Reconfigure TikTok TTS if session ID changed
-  if (changes.includes('TIKTOK_SESSION_ID') && process.env.TIKTOK_SESSION_ID) {
-    configureTikTokTTS(process.env.TIKTOK_SESSION_ID);
-  }
   if (changes.length > 0) {
     fastify.log.info({ changes }, 'Config reloaded');
   }
@@ -133,96 +80,6 @@ for (const file of [ENV_PATH, CONFIG_PATH]) {
   } catch { /* file may not exist yet */ }
 }
-// --- TTS provider functions ---
-async function generateOpenAITTS(text: string, voice?: string): Promise<string> {
-  const response = await openai.audio.speech.create({
-    model: "tts-1-hd",
-    voice: (voice || "onyx") as "onyx",
-    input: text,
-  });
-  const buffer = Buffer.from(await response.arrayBuffer());
-  const filename = `${randomUUID()}.mp3`;
-  await mkdir(TTS_DIR, { recursive: true });
-  await writeFile(join(TTS_DIR, filename), buffer);
-  return `${BACKEND_URL}/tts/${filename}`;
-}
-async function generateElevenLabsTTS(text: string, voice?: string): Promise<string> {
-  if (!elevenlabs) throw new Error("ELEVENLABS_API_KEY not configured");
-  const audio = await elevenlabs.textToSpeech.convert(voice || "TX3LPaxmHKxFdv7VOQHJ", {
-    modelId: "eleven_multilingual_v2",
-    text,
-    outputFormat: "mp3_44100_128",
-    voiceSettings: {
-      stability: 0,
-      similarityBoost: 1.0,
-      useSpeakerBoost: true,
-      speed: 1.0,
-    },
-  });
-  // Convert stream to buffer - works with Bun and Node.js
-  const response = new Response(audio as any);
-  const arrayBuffer = await response.arrayBuffer();
-  const buffer = Buffer.from(arrayBuffer);
-  // Check if response is valid MP3 (starts with ID3 or FF FB/FA/F3/F2)
-  const isMP3 = (buffer[0] === 0x49 && buffer[1] === 0x44 && buffer[2] === 0x33) || // ID3
-                (buffer[0] === 0xFF && (buffer[1] & 0xE0) === 0xE0); // MP3 frame sync
-  if (!isMP3) {
-    const preview = buffer.subarray(0, 200).toString("utf-8");
-    console.error(`ElevenLabs returned non-audio response: ${preview}`);
-    throw new Error("ElevenLabs returned invalid audio (possibly error page)");
-  }
-  const filename = `${randomUUID()}.mp3`;
-  await mkdir(TTS_DIR, { recursive: true });
-  await writeFile(join(TTS_DIR, filename), buffer);
-  console.log(`TTS file written: ${filename}, size: ${buffer.length} bytes`);
-  return `${BACKEND_URL}/tts/${filename}`;
-}
-async function generateTikTokTTSFile(text: string, voice?: string): Promise<string> {
-  const buffer = await generateTikTokTTS(text, voice);
-  const filename = `${randomUUID()}.mp3`;
-  await mkdir(TTS_DIR, { recursive: true });
-  await writeFile(join(TTS_DIR, filename), buffer);
-  console.log(`TikTok TTS file written: ${filename}, size: ${buffer.length} bytes`);
-  return `${BACKEND_URL}/tts/${filename}`;
-}
-/** Generate TTS using the specified provider and voice, falling back to OpenAI on failure */
-async function tts(text: string, provider: TtsProvider, voice?: string): Promise<string> {
-  const providers: Record<TtsProvider, () => Promise<string>> = {
-    openai: () => generateOpenAITTS(text, voice),
-    elevenlabs: () => generateElevenLabsTTS(text, voice),
-    tiktok: () => generateTikTokTTSFile(text, voice),
-  };
-  try {
-    return await providers[provider]();
-  } catch (e) {
-    if (provider !== 'openai') {
-      fastify.log.warn(e, `${provider} TTS failed, falling back to OpenAI`);
-      return await generateOpenAITTS(text);
-    }
-    throw e;
-  }
-}
-/** Generate TTS for a chat message (uses CHAT_PROVIDER) */
-function chatTTS(text: string) { return tts(text, CHAT_PROVIDER, CHAT_VOICE); }
-/** Generate TTS for a bot message (uses BOT_PROVIDER) */
-function botTTS(text: string) { return tts(text, BOT_PROVIDER, BOT_VOICE); }
 // --- Non-TTS helpers ---
 async function fetchMarketCap(): Promise<number | null> {
@@ -238,15 +95,7 @@ async function fetchMarketCap(): Promise<number | null> {
 }
 async function main() {
-  fastify.log.info({ chatProvider: CHAT_PROVIDER, botProvider: BOT_PROVIDER }, 'TTS providers configured');
   await fastify.register(cors, { origin: true });
-  await mkdir(TTS_DIR, { recursive: true });
-  await fastify.register(fastifyStatic, {
-    root: TTS_DIR,
-    prefix: "/tts/",
-    decorateReply: false,
-  });
   const io = new Server(fastify.server, {
     cors: { origin: "*" },
@@ -339,35 +188,27 @@ async function main() {
         } else if (event.type === 'vibeExecuted' && !event.skipped) {
           io.emit('crawd:status', { status: 'vibing' });
         }
-        // Note: chatProcessed no longer emits status — we only wake/emit
-        // when the agent actually replies (via talk tool or text fallback).
       });
       /**
-       * Generate TTS and emit atomic talk event, wait for overlay ack.
-       * If replyTo is provided, also generates chat TTS — overlay plays chat first, then bot.
+       * Emit text-only talk event, wait for overlay ack.
+       * If replyTo is provided, emits reply-turn instead of talk.
        */
       async function handleTalkInvoke(text: string, replyTo?: ChatMessage): Promise<void> {
         const talkId = randomUUID();
         fastify.log.info({ talkId, text: text.slice(0, 80), replyTo: replyTo?.shortId }, 'Handling talk invoke');
-        // Generate TTS in parallel when there's a chat message to reply to
-        const [ttsUrl, chatTtsUrl] = await Promise.all([
-          botTTS(text),
-          replyTo ? chatTTS(`Chat says: ${replyTo.message}`) : Promise.resolve(undefined),
-        ]);
-        const event: TalkEvent = { id: talkId, message: text, ttsUrl };
-        if (replyTo && chatTtsUrl) {
-          event.chat = {
-            message: replyTo.message,
-            username: replyTo.username,
-            ttsUrl: chatTtsUrl,
-          };
+        if (replyTo) {
+          io.emit('crawd:reply-turn', {
+            id: talkId,
+            chat: { username: replyTo.username, message: replyTo.message },
+            botMessage: text,
+          });
+        } else {
+          io.emit('crawd:talk', { id: talkId, message: text });
         }
-        io.emit('crawd:talk', event);
-        fastify.log.info({ talkId, hasChat: !!event.chat }, 'Emitted crawd:talk, waiting for ack');
+        fastify.log.info({ talkId, hasChat: !!replyTo }, 'Emitted event, waiting for ack');
         await waitForTalkAck(talkId);
         fastify.log.info({ talkId }, 'Talk complete');
@@ -415,7 +256,7 @@ async function main() {
               fastify.log.error(err, 'Talk invoke failed');
               await gateway.sendInvokeResult(payload.id, payload.nodeId, {
                 ok: false,
-                error: { code: 'TTS_FAILED', message: String(err) },
+                error: { code: 'INVOKE_FAILED', message: String(err) },
               });
             }
           } else {
@@ -467,16 +308,9 @@ async function main() {
         return reply.status(400).send({ error: "message is required" });
       }
-      try {
-        const talkId = randomUUID();
-        const ttsUrl = await botTTS(message);
-        const event: TalkEvent = { id: talkId, message, ttsUrl };
-        io.emit("crawd:talk", event);
-        return { ok: true, id: talkId };
-      } catch (e) {
-        fastify.log.error(e, "failed to generate TTS");
-        return reply.status(500).send({ error: "Failed to generate TTS" });
-      }
+      const talkId = randomUUID();
+      io.emit("crawd:talk", { id: talkId, message });
+      return { ok: true, id: talkId };
     }
   );
@@ -533,7 +367,7 @@ async function main() {
     }
   );
-  // Mock turn endpoint for debug UI — generates real TTS
+  // Mock turn endpoint for debug UI — text-only
   fastify.post<{ Body: { username: string; message: string; response: string } }>(
     "/mock/turn",
     async (request, reply) => {
@@ -544,27 +378,14 @@ async function main() {
       fastify.log.info({ username, message, response }, "mock turn");
-      try {
-        const [chatTtsUrl, botTtsUrl] = await Promise.all([
-          chatTTS(`Chat says: ${message}`),
-          botTTS(response),
-        ]);
-        const event: ReplyTurnEvent = {
-          id: randomUUID(),
-          chat: { username, message },
-          botMessage: response,
-          chatTtsUrl,
-          botTtsUrl,
-        };
-        io.emit('crawd:reply-turn', event);
+      const id = randomUUID();
+      io.emit('crawd:reply-turn', {
+        id,
+        chat: { username, message },
+        botMessage: response,
+      });
-        return { ok: true };
-      } catch (e) {
-        fastify.log.error(e, "failed to generate mock turn TTS");
-        return reply.status(500).send({ error: "Failed to generate TTS" });
-      }
+      return { ok: true, id };
     }
   );