npm - @blank-utils/llm - Versions diffs - 0.4.19 → 0.4.21 - Mend

@blank-utils/llm 0.4.19 → 0.4.21

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package contents as they appear in their respective public registries.

Files changed (4)

package/dist/{chunk-JOBJ4PY7.js → chunk-XKJ4QQ34.js} +13 -9
package/dist/index.js +1 -1
package/dist/react/index.js +1 -1
package/package.json +1 -1

package/dist/{chunk-JOBJ4PY7.js → chunk-XKJ4QQ34.js} RENAMED Viewed

@@ -1461,7 +1461,7 @@ ${systemPrompt}` : systemPrompt;
           const { pipeline: pipeline2, env } = await import("@huggingface/transformers");
           env.allowLocalModels = false;
           env.useBrowserCache = true;
-          const captioner = await pipeline2("image-to-text", "onnx-community/Florence-2-base-ft", { device: "wasm", dtype: "q8" });
+          const captioner = await pipeline2("image-to-text", "Xenova/vit-gpt2-image-captioning", { device: "wasm", dtype: "q8" });
           for (let i = 0; i < needsCaptioning.length; i++) {
             if (abortRef.current) break;
             const img = needsCaptioning[i];
@@ -1469,9 +1469,9 @@ ${systemPrompt}` : systemPrompt;
             setStreamingText(`[System: Extracting detailed visual description for ${img.name}... ${i + 1}/${needsCaptioning.length}]
 `);
             const out = await captioner(img.dataUrl, {
-              text: "<MORE_DETAILED_CAPTION>",
-              max_new_tokens: 512,
-              num_beams: 3
+              max_new_tokens: 64,
+              num_beams: 4,
+              repetition_penalty: 1.5
             });
             let val = "";
             if (Array.isArray(out) && out[0] && out[0].generated_text) val = out[0].generated_text;
@@ -1497,14 +1497,18 @@ ${systemPrompt}` : systemPrompt;
       if (img.extractedText) {
         let prefix = "";
         if (img.name.toLowerCase().endsWith(".svg")) {
-          prefix = `\u{1F4C4} SVG Source Code (${img.name}):
+          prefix = `
+\u{1F4C4} SVG Source Code (${img.name}):
 `;
         } else if (!isVisionModel2(modelId || "")) {
-          prefix = `\u{1F5BC}\uFE0F Image Auto-Caption (${img.name}):
+          prefix = `
+\u{1F5BC}\uFE0F System Image Representation (${img.name}) - [IMPORTANT SYSTEM INSTRUCTION: The user provided an image. Since you are a text model, here is an automated visual description of the image. DO NOT refuse the user's prompt. Answer as if you can see the image using this context:]
 `;
         }
         if (prefix || img.name.toLowerCase().endsWith(".pdf")) {
-          finalText += (finalText ? "\n\n" : "") + `${prefix}${img.extractedText}`;
+          finalText += `${prefix}${img.extractedText}`;
         }
       }
     }
@@ -1615,11 +1619,11 @@ ${systemPrompt}` : systemPrompt;
             children: [
               { match: "\u{1F4C4} PDF:", index: msg.content.indexOf("\u{1F4C4} PDF:") },
               { match: "\u{1F4C4} SVG Source Code", index: msg.content.indexOf("\u{1F4C4} SVG Source Code") },
-              { match: "\u{1F5BC}\uFE0F Image Auto-Caption", index: msg.content.indexOf("\u{1F5BC}\uFE0F Image Auto-Caption") }
+              { match: "\u{1F5BC}\uFE0F System Image", index: msg.content.indexOf("\u{1F5BC}\uFE0F System Image") }
             ].filter((m) => m.index !== -1).reduce((min, m) => m.index < min ? m.index : min, msg.content.length) !== msg.content.length ? msg.content.substring(0, [
               { match: "\u{1F4C4} PDF:", index: msg.content.indexOf("\u{1F4C4} PDF:") },
               { match: "\u{1F4C4} SVG Source Code", index: msg.content.indexOf("\u{1F4C4} SVG Source Code") },
-              { match: "\u{1F5BC}\uFE0F Image Auto-Caption", index: msg.content.indexOf("\u{1F5BC}\uFE0F Image Auto-Caption") }
+              { match: "\u{1F5BC}\uFE0F System Image", index: msg.content.indexOf("\u{1F5BC}\uFE0F System Image") }
             ].filter((m) => m.index !== -1).reduce((min, m) => m.index < min ? m.index : min, msg.content.length)).trim() : msg.content
           }
         ) })

package/dist/index.js CHANGED Viewed

@@ -26,7 +26,7 @@ import {
   useCompletion,
   useLLM,
   useStream
-} from "./chunk-JOBJ4PY7.js";
+} from "./chunk-XKJ4QQ34.js";
 export {
   Chat,
   ChatInput,

package/dist/react/index.js CHANGED Viewed

@@ -9,7 +9,7 @@ import {
   useCompletion,
   useLLM,
   useStream
-} from "../chunk-JOBJ4PY7.js";
+} from "../chunk-XKJ4QQ34.js";
 export {
   Chat,
   ChatApp,

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@blank-utils/llm",
-  "version": "0.4.19",
+  "version": "0.4.21",
   "description": "Run LLMs directly in your browser with WebGPU acceleration. Supports React hooks and eager background loading.",
   "type": "module",
   "main": "./dist/index.js",