npm - tuna-agent - Versions diffs - 0.1.153 → 0.1.155 - Mend

tuna-agent 0.1.153 → 0.1.155

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package contents as they appear in their respective public registries.

Files changed (3) hide show

package/dist/daemon/analyze-video-handler.js +10 -8
package/dist/daemon/extension-handlers.js +13 -8
package/package.json +1 -1

package/dist/daemon/analyze-video-handler.js CHANGED Viewed

@@ -247,8 +247,10 @@ Voiceover during this scene: "${voiceoverText || '(none)'}"`;
         { text: promptText },
         ...frames.map(b64 => ({ inlineData: { mimeType: 'image/jpeg', data: b64 } })),
     ];
-    const { text, usage } = await geminiGenerate(parts, 512);
-    cost?.geminiVision('vision', usage);
+    // Gemini 2.5 Flash (cheapest). geminiGenerate disables thinking for
+    // 2.5-flash so the 512 budget isn't starved → non-empty descriptions.
+    const { text, usage } = await geminiGenerate(parts, 512, 'gemini-2.5-flash');
+    cost?.geminiVision('vision', usage, 'gemini-2.5-flash');
     return text;
 }
 // Phase 1 (the strong part of AI_Video_Clone, ported): ONE gpt-4o call over
@@ -291,18 +293,18 @@ Rules:
 - NO GROUP ENTRIES (CRITICAL): NEVER output a collective/crowd label as a single entry — forbidden: "VILLAGERS", "LADIES GROUP", "KNITTING GROUP", "CROWD", "GROUP OF ...", any "*_GROUP". If 2+ similar secondary people RECUR across scenes, list them as SEPARATE numbered individuals (e.g. WOMAN_1, WOMAN_2, WOMAN_3), each with its OWN distinct face/hair/body/age. Only a truly anonymous one-off background that never recurs may be omitted entirely.
 - characters.description: ENGLISH only, factual, no camera/action words.
 - DISTINCT FACES (CRITICAL): every character MUST have a HIGHLY UNIQUE facial structure, a distinct hairstyle, a specific body type and a clearly different age. NEVER reuse the same or a similar facial description for two characters — they must look completely different from one another.`;
-        // Phase-1 on Gemini 3 Flash (strong multimodal, far cheaper image tokens
-        // than gpt-4o) with a dense 30-frame seed. 1 call/video; final cast
-        // recall is double-covered by the reconcile pass. Generous output budget
-        // so any model-side thinking can't starve the JSON answer.
+        // Phase-1 on Gemini 2.5 Flash (cheapest) with a dense 30-frame seed. 1
+        // call/video; final cast recall is double-covered by the reconcile pass.
+        // geminiGenerate disables thinking for 2.5-flash + generous 3000 output
+        // budget so the JSON answer is never starved (was empty without this).
         const parts = [
             { text: promptText },
             ...frames.map(b64 => ({ inlineData: { mimeType: 'image/jpeg', data: b64 } })),
         ];
-        const { text: rawTxt, usage } = await geminiGenerate(parts, 3000, 'gemini-3-flash-preview');
+        const { text: rawTxt, usage } = await geminiGenerate(parts, 3000, 'gemini-2.5-flash');
         if (!rawTxt)
             return empty;
-        cost?.geminiVision('phase1', usage, 'gemini-3-flash-preview');
+        cost?.geminiVision('phase1', usage, 'gemini-2.5-flash');
         let parsed = {};
         try {
             const m = rawTxt.match(/\{[\s\S]*\}/);

package/dist/daemon/extension-handlers.js CHANGED Viewed

@@ -118,21 +118,26 @@ export async function handleClaudePrompt(ws, code, taskId, prompt, systemPrompt,
     }
 }
 // ─── Handler: claude_prompt_stream (prompt → streamed text + JSON result) ────
-// Track active stream tasks by code so we can abort previous ones
+// Track active stream tasks by taskId (UNIQUE per request). Was keyed by
+// `code` (the shared pair code) which made concurrent claude_prompt_stream
+// calls abort each other — fatal for the batched clone pool (5 parallel
+// chunks → siblings killed → batches hang at 0). taskId is unique so streams
+// run independently; a superseded request gets a fresh taskId anyway.
 const _activeStreamTasks = new Map();
 export async function handleClaudePromptStream(ws, code, taskId, prompt, systemPrompt) {
     console.log(`[claude_prompt_stream] Received: ${prompt.substring(0, 100)}...`);
-    // Kill previous stream task for same code (e.g. user clicked Regenerate again)
-    const prev = _activeStreamTasks.get(code);
+    // Per-taskId (unique): never aborts a concurrent sibling. (Re-clicked
+    // Regenerate arrives with a new taskId; the old one finishes on its own.)
+    const prev = _activeStreamTasks.get(taskId);
     if (prev) {
-        console.log(`[claude_prompt_stream] Aborting previous task for code=${code}`);
+        console.log(`[claude_prompt_stream] Aborting previous task for taskId=${taskId}`);
         prev.abort();
     }
     const abortController = new AbortController();
-    _activeStreamTasks.set(code, abortController);
+    _activeStreamTasks.set(taskId, abortController);
     if (!hasContentCreator()) {
         const error = 'content-creator agent not found on this machine';
-        _activeStreamTasks.delete(code);
+        _activeStreamTasks.delete(taskId);
         ws.sendExtensionDone(code, taskId, { error });
         return;
     }
@@ -190,11 +195,11 @@ export async function handleClaudePromptStream(ws, code, taskId, prompt, systemP
                 }
                 catch { }
         }
-        _activeStreamTasks.delete(code);
+        _activeStreamTasks.delete(taskId);
         ws.sendExtensionDone(code, taskId, { result: parsed, raw: text });
     }
     catch (err) {
-        _activeStreamTasks.delete(code);
+        _activeStreamTasks.delete(taskId);
         if (abortController.signal.aborted) {
             console.log(`[claude_prompt_stream] Aborted (replaced by new task)`);
             return; // Don't send error — new task is already running

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "tuna-agent",
-  "version": "0.1.153",
+  "version": "0.1.155",
   "description": "Tuna Agent - Run AI coding tasks on your machine",
   "bin": {
     "tuna-agent": "dist/cli/index.js"