npm - @manfred-kunze-dev/backbone-mcp-server - Versions diffs - 2.8.0-dev.2 → 2.8.0-dev.3 - Mend

@manfred-kunze-dev/backbone-mcp-server 2.8.0-dev.2 → 2.8.0-dev.3

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (2)

package/dist/tools/conversion.js +45 -11
package/package.json +1 -1

package/dist/tools/conversion.js CHANGED Viewed

@@ -32,7 +32,7 @@ function formatExportDocument(doc) {
 }
 export function register(server, client) {
     // ── convert_document ────────────────────────────────────────────────────
-    server.tool("backbone_convert_document", "Convert documents (PDF, DOCX, XLSX, images, etc.) to Markdown, text, HTML, or JSON. Accepts URLs, base64 data, or local file paths. Local files are automatically read and base64-encoded. Use this to convert binary files before passing them to backbone_create_extraction. Pipeline options: 'standard' (default, OCR-based) or 'vlm' (vision model, better for image-heavy/complex layouts). Use async mode for large documents.", {
+    server.tool("backbone_convert_document", "Convert documents (PDF, DOCX, XLSX, images, etc.) to Markdown, text, HTML, or JSON. Accepts URLs, base64 data, or local file paths. Local files are automatically read and base64-encoded. Use this to convert binary files before passing them to backbone_create_extraction. Pipeline options: 'fast' (default, fast text extraction), 'ocr' (OCR with layout analysis), or 'vlm' (vision language model for image-heavy/complex layouts). Use async mode for large documents.", {
         sources: z
             .array(z.object({
             type: z.enum(["url", "base64", "file"]).describe("Source type: 'url' for HTTP URLs, 'base64' for base64-encoded data, 'file' for local file paths"),
@@ -42,20 +42,30 @@ export function register(server, client) {
             path: z.string().optional().describe("Local file path (when type='file')"),
         }))
             .describe("List of document sources to convert"),
-        outputFormats: z
-            .array(z.string())
-            .optional()
-            .describe("Output formats, e.g. ['markdown', 'text', 'html', 'json']"),
         pipeline: z
             .string()
             .optional()
-            .describe("Processing pipeline: 'standard' (default) or 'vlm' (vision language model for image-heavy documents)"),
+            .describe("Processing pipeline: 'fast' (default, fast text extraction), 'ocr' (OCR with layout analysis), or 'vlm' (vision language model for image-heavy documents)"),
+        options: z
+            .object({
+            outputFormats: z.array(z.string()).optional().describe("Output formats, e.g. ['md', 'text', 'html', 'json']. Only relevant for ocr/vlm pipelines."),
+            ocrEngine: z.string().optional().describe("OCR engine (e.g. 'easyocr', 'tesseract')"),
+            ocrLanguages: z.array(z.string()).optional().describe("OCR languages (e.g. ['en', 'de'])"),
+            pdfBackend: z.string().optional().describe("PDF backend (e.g. 'dlparser', 'pypdfium2')"),
+            tableStructure: z.boolean().optional().describe("Enable table structure detection"),
+            maxPages: z.number().optional().describe("Maximum number of pages to process"),
+            imageExportMode: z.string().optional().describe("Image export mode (e.g. 'placeholder', 'embedded')"),
+            imagesScale: z.number().optional().describe("Scale factor for exported images"),
+            pictureClassification: z.boolean().optional().describe("Enable picture classification"),
+        })
+            .optional()
+            .describe("Options for ocr/vlm pipelines. Ignored when pipeline is 'fast'."),
         async: z
             .boolean()
             .optional()
             .default(false)
             .describe("If true, submit as async task and return task ID for polling"),
-    }, async ({ sources, outputFormats, pipeline, async: isAsync }) => {
+    }, async ({ sources, pipeline, options: pipelineOptions, async: isAsync }) => {
         try {
             const apiSources = [];
             for (const src of sources) {
@@ -79,12 +89,36 @@ export function register(server, client) {
                     apiSources.push({ kind: "base64", content: b64, filename: name, mimeType: getMimeType(name) });
                 }
             }
+            // Build nested options matching new API shape
+            const opts = {};
+            if (pipeline)
+                opts.pipeline = pipeline;
+            if (pipelineOptions) {
+                const nested = {};
+                if (pipelineOptions.outputFormats)
+                    nested.outputFormats = pipelineOptions.outputFormats.map(mapOutputFormat);
+                if (pipelineOptions.ocrEngine)
+                    nested.ocrEngine = pipelineOptions.ocrEngine;
+                if (pipelineOptions.ocrLanguages)
+                    nested.ocrLanguages = pipelineOptions.ocrLanguages;
+                if (pipelineOptions.pdfBackend)
+                    nested.pdfBackend = pipelineOptions.pdfBackend;
+                if (pipelineOptions.tableStructure !== undefined)
+                    nested.tableStructure = pipelineOptions.tableStructure;
+                if (pipelineOptions.maxPages !== undefined)
+                    nested.maxPages = pipelineOptions.maxPages;
+                if (pipelineOptions.imageExportMode)
+                    nested.imageExportMode = pipelineOptions.imageExportMode;
+                if (pipelineOptions.imagesScale !== undefined)
+                    nested.imagesScale = pipelineOptions.imagesScale;
+                if (pipelineOptions.pictureClassification !== undefined)
+                    nested.pictureClassification = pipelineOptions.pictureClassification;
+                if (Object.keys(nested).length > 0)
+                    opts.options = nested;
+            }
             const body = {
                 sources: apiSources,
-                options: {
-                    ...(outputFormats ? { toFormats: outputFormats.map(mapOutputFormat) } : {}),
-                    ...(pipeline ? { pipeline } : {}),
-                },
+                options: Object.keys(opts).length > 0 ? opts : undefined,
             };
             if (isAsync) {
                 const { data } = await client.POST("/v1/convert/source/async", { body });

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@manfred-kunze-dev/backbone-mcp-server",
-  "version": "2.8.0-dev.2",
+  "version": "2.8.0-dev.3",
   "description": "MCP server for the Backbone AI platform",
   "type": "module",
   "main": "dist/index.js",