npm - tuna-agent - Versions diffs - 0.1.123 → 0.1.125 - Mend

tuna-agent 0.1.123 → 0.1.125

This diff shows the differences between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (2) hide show

package/dist/daemon/analyze-video-handler.js +10 -2
package/package.json +1 -1

package/dist/daemon/analyze-video-handler.js CHANGED Viewed

@@ -82,11 +82,19 @@ async function visionDescribe(frameB64, voiceoverText) {
         headers: { 'Content-Type': 'application/json', Authorization: `Bearer ${OPENAI_KEY}` },
         body: JSON.stringify({
             model: 'gpt-4o-mini',
-            max_tokens: 150,
+            max_tokens: 300,
             messages: [{
                     role: 'user',
                     content: [
-                        { type: 'text', text: `Mô tả ngắn gọn (1-2 câu tiếng Việt) khung hình này: nhân vật, bối cảnh, góc quay, tâm trạng. Voiceover đang nói: "${voiceoverText || '(không có)'}"` },
+                        { type: 'text', text: `Describe this frame in detail (4-6 sentences, English). Include:
+- Characters: appearance (shape, color, size), facial expression, what they're doing
+- Physical connections: Are characters physically joined/attached/fused together (e.g. organs connected at a junction, body parts linked)? Or are they separate/independent? Be VERY specific — "physically attached at Y-junction" is different from "standing next to each other"
+- Spatial positions: exact position of each character (left/right/above/below/center), distance between them
+- Environment: setting, lighting, color palette, atmosphere
+- Camera: angle, framing (close-up, wide, etc.)
+- Action: what is happening in this moment, movement direction
+Voiceover at this moment: "${voiceoverText || '(none)'}"` },
                         { type: 'image_url', image_url: { url: `data:image/jpeg;base64,${frameB64}` } },
                     ],
                 }],

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "tuna-agent",
-  "version": "0.1.123",
+  "version": "0.1.125",
   "description": "Tuna Agent - Run AI coding tasks on your machine",
   "bin": {
     "tuna-agent": "dist/cli/index.js"