npm - nothumanallowed - Versions diffs - 13.2.76 → 13.2.77 - Mend

nothumanallowed 13.2.76 → 13.2.77

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (3) hide show

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "nothumanallowed",
-  "version": "13.2.76",
+  "version": "13.2.77",
   "description": "NotHumanAllowed — 38 AI agents, 80 tools, Studio (visual agentic workflows). Email, calendar, browser automation, screen capture, canvas, cron/heartbeat, Alexandria E2E messaging, GitHub, Notion, Slack, voice chat, free AI (Liara), 28 languages. Zero-dependency CLI.",
   "type": "module",
   "bin": {

package/src/commands/ui.mjs CHANGED Viewed

@@ -2852,24 +2852,24 @@ export async function cmdUI(args) {
           // ── Fetch REAL data for each agent type ──────────────────────
           if (agent === 'DocumentReaderAgent') {
-            // Extract text from attached PDF, then ask the LLM to structure it cleanly.
-            // The structured output becomes context for all subsequent steps.
-            sendToken('[Reading attached document...] ');
+            // Always use vision for PDF reading — text extraction loses table structure,
+            // column alignment, and layout-dependent data for the vast majority of
+            // technical PDFs (datasheets, catalogs, forms, scanned docs).
+            // Vision reads exactly what a human sees on the page.
+            sendToken('[Reading document with vision...] ');
             let rawText = '';
             if (stepPdfBase64) {
               try {
-                const b64 = stepPdfBase64.includes(',') ? stepPdfBase64.split(',')[1] : stepPdfBase64;
-                const pdfBuffer = Buffer.from(b64, 'base64');
-                rawText = extractTextFromPdf(pdfBuffer) || '';
-                if (!rawText || rawText.length < 20) {
-                  // Scanned PDF — use vision OCR
-                  sendToken('[No text layer — using vision OCR...] ');
-                  try {
-                    rawText = await callLLMVision(config, stepPdfBase64, 'application/pdf',
-                      'Extract ALL text from this document exactly as printed, preserving all numbers, codes, and values.');
-                  } catch (ve) { rawText = ''; }
-                }
-              } catch (e) { rawText = ''; }
+                rawText = await callLLMVision(config, stepPdfBase64, 'application/pdf',
+                  'Extract ALL content from this document exactly as it appears: all text, tables (preserve rows and columns), codes, numbers, units, notes, headers, and any other information visible on the page. Do not summarize — transcribe everything.');
+              } catch (ve) {
+                // Vision failed — fall back to text extraction
+                sendToken('[Vision unavailable — falling back to text extraction...] ');
+                try {
+                  const b64 = stepPdfBase64.includes(',') ? stepPdfBase64.split(',')[1] : stepPdfBase64;
+                  rawText = extractTextFromPdf(Buffer.from(b64, 'base64')) || '';
+                } catch (e) { rawText = ''; }
+              }
             }
             if (!rawText) {
               sendToken('Could not extract text from the attached document.');

package/src/constants.mjs CHANGED Viewed

@@ -5,7 +5,7 @@ import { fileURLToPath } from 'url';
 const __filename = fileURLToPath(import.meta.url);
 const __dirname = path.dirname(__filename);
-export const VERSION = '13.2.76';
+export const VERSION = '13.2.77';
 export const BASE_URL = 'https://nothumanallowed.com/cli';
 export const API_BASE = 'https://nothumanallowed.com/api/v1';