npm - @wonderwhy-er/desktop-commander - Versions diffs - 0.2.23 → 0.2.24 - Mend

@wonderwhy-er/desktop-commander 0.2.23 → 0.2.24

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (59)

package/README.md +14 -55
package/dist/custom-stdio.d.ts +1 -0
package/dist/custom-stdio.js +19 -0
package/dist/handlers/filesystem-handlers.d.ts +4 -0
package/dist/handlers/filesystem-handlers.js +120 -14
package/dist/handlers/node-handlers.d.ts +6 -0
package/dist/handlers/node-handlers.js +73 -0
package/dist/index.js +5 -3
package/dist/search-manager.d.ts +25 -0
package/dist/search-manager.js +212 -0
package/dist/server.js +160 -73
package/dist/terminal-manager.d.ts +56 -2
package/dist/terminal-manager.js +169 -13
package/dist/tools/edit.d.ts +28 -4
package/dist/tools/edit.js +87 -4
package/dist/tools/filesystem.d.ts +23 -12
package/dist/tools/filesystem.js +201 -416
package/dist/tools/improved-process-tools.d.ts +2 -2
package/dist/tools/improved-process-tools.js +244 -214
package/dist/tools/mime-types.d.ts +1 -0
package/dist/tools/mime-types.js +7 -0
package/dist/tools/pdf/extract-images.d.ts +34 -0
package/dist/tools/pdf/extract-images.js +132 -0
package/dist/tools/pdf/index.d.ts +6 -0
package/dist/tools/pdf/index.js +3 -0
package/dist/tools/pdf/lib/pdf2md.d.ts +36 -0
package/dist/tools/pdf/lib/pdf2md.js +76 -0
package/dist/tools/pdf/manipulations.d.ts +13 -0
package/dist/tools/pdf/manipulations.js +96 -0
package/dist/tools/pdf/markdown.d.ts +7 -0
package/dist/tools/pdf/markdown.js +37 -0
package/dist/tools/pdf/utils.d.ts +12 -0
package/dist/tools/pdf/utils.js +34 -0
package/dist/tools/schemas.d.ts +167 -12
package/dist/tools/schemas.js +54 -5
package/dist/types.d.ts +2 -1
package/dist/utils/feature-flags.js +7 -4
package/dist/utils/files/base.d.ts +167 -0
package/dist/utils/files/base.js +5 -0
package/dist/utils/files/binary.d.ts +21 -0
package/dist/utils/files/binary.js +65 -0
package/dist/utils/files/excel.d.ts +24 -0
package/dist/utils/files/excel.js +416 -0
package/dist/utils/files/factory.d.ts +40 -0
package/dist/utils/files/factory.js +101 -0
package/dist/utils/files/image.d.ts +21 -0
package/dist/utils/files/image.js +78 -0
package/dist/utils/files/index.d.ts +10 -0
package/dist/utils/files/index.js +13 -0
package/dist/utils/files/pdf.d.ts +32 -0
package/dist/utils/files/pdf.js +142 -0
package/dist/utils/files/text.d.ts +63 -0
package/dist/utils/files/text.js +357 -0
package/dist/utils/ripgrep-resolver.js +3 -2
package/dist/utils/system-info.d.ts +5 -0
package/dist/utils/system-info.js +71 -3
package/dist/version.d.ts +1 -1
package/dist/version.js +1 -1
package/package.json +14 -3

package/dist/tools/filesystem.js CHANGED

@@ -2,66 +2,33 @@ import fs from "fs/promises";
 import path from "path";
 import os from 'os';
 import fetch from 'cross-fetch';
-import { createReadStream } from 'fs';
-import { createInterface } from 'readline';
-import { isBinaryFile } from 'isbinaryfile';
 import { capture } from '../utils/capture.js';
 import { withTimeout } from '../utils/withTimeout.js';
 import { configManager } from '../config-manager.js';
+import { getFileHandler, TextFileHandler } from '../utils/files/index.js';
+import { isPdfFile } from "./mime-types.js";
+import { parsePdfToMarkdown, editPdf, parseMarkdownToPdf } from './pdf/index.js';
 // CONSTANTS SECTION - Consolidate all timeouts and thresholds
 const FILE_OPERATION_TIMEOUTS = {
     PATH_VALIDATION: 10000, // 10 seconds
-    URL_FETCH: 30000, // 30 seconds
+    URL_FETCH: 30000, // 30 seconds
     FILE_READ: 30000, // 30 seconds
 };
 const FILE_SIZE_LIMITS = {
-    LARGE_FILE_THRESHOLD: 10 * 1024 * 1024, // 10MB
     LINE_COUNT_LIMIT: 10 * 1024 * 1024, // 10MB for line counting
 };
-const READ_PERFORMANCE_THRESHOLDS = {
-    SMALL_READ_THRESHOLD: 100, // For very small reads
-    DEEP_OFFSET_THRESHOLD: 1000, // For byte estimation
-    SAMPLE_SIZE: 10000, // Sample size for estimation
-    CHUNK_SIZE: 8192, // 8KB chunks for reverse reading
-};
 // UTILITY FUNCTIONS - Eliminate duplication
-/**
- * Count lines in text content efficiently
- * @param content Text content to count lines in
- * @returns Number of lines
- */
-function countLines(content) {
-    return content.split('\n').length;
-}
-/**
- * Count lines in a file efficiently (for files under size limit)
- * @param filePath Path to the file
- * @returns Line count or undefined if file too large/can't read
- */
-async function getFileLineCount(filePath) {
-    try {
-        const stats = await fs.stat(filePath);
-        // Only count lines for reasonably sized files to avoid performance issues
-        if (stats.size < FILE_SIZE_LIMITS.LINE_COUNT_LIMIT) {
-            const content = await fs.readFile(filePath, 'utf8');
-            return countLines(content);
-        }
-    }
-    catch (error) {
-        // If we can't read the file, just return undefined
-    }
-    return undefined;
-}
 /**
  * Get MIME type information for a file
  * @param filePath Path to the file
  * @returns Object with mimeType and isImage properties
  */
 async function getMimeTypeInfo(filePath) {
-    const { getMimeType, isImageFile } = await import('./mime-types.js');
+    const { getMimeType, isImageFile, isPdfFile } = await import('./mime-types.js');
     const mimeType = getMimeType(filePath);
     const isImage = isImageFile(mimeType);
-    return { mimeType, isImage };
+    const isPdf = isPdfFile(mimeType);
+    return { mimeType, isImage, isPdf };
 }
 /**
  * Get file extension for telemetry purposes
@@ -79,20 +46,6 @@ async function getDefaultReadLength() {
     const config = await configManager.getConfig();
     return config.fileReadLineLimit ?? 1000; // Default to 1000 lines if not set
 }
-/**
- * Generate instructions for handling binary files
- * @param filePath Path to the binary file
- * @param mimeType MIME type of the file
- * @returns Instruction message for the LLM
- */
-function getBinaryFileInstructions(filePath, mimeType) {
-    const fileName = path.basename(filePath);
-    return `Cannot read binary file as text: ${fileName} (${mimeType})
-Use start_process + interact_with_process to analyze binary files with appropriate tools (Node.js or Python libraries, command-line utilities, etc.).
-The read_file tool only handles text files and images.`;
-}
 // Initialize allowed directories from configuration
 async function getAllowedDirs() {
     try {
@@ -266,19 +219,37 @@ export async function readFileFromUrl(url) {
         if (!response.ok) {
             throw new Error(`HTTP error! Status: ${response.status}`);
         }
-        // Get MIME type from Content-Type header
+        // Get MIME type from Content-Type header or infer from URL
         const contentType = response.headers.get('content-type') || 'text/plain';
         const isImage = isImageFile(contentType);
-        if (isImage) {
+        const isPdf = isPdfFile(contentType) || url.toLowerCase().endsWith('.pdf');
+        // NEW: Add PDF handling before image check
+        if (isPdf) {
+            // Use URL directly - pdfreader handles URL downloads internally
+            const pdfResult = await parsePdfToMarkdown(url);
+            return {
+                content: "",
+                mimeType: 'text/plain',
+                metadata: {
+                    isImage: false,
+                    isPdf: true,
+                    author: pdfResult.metadata.author,
+                    title: pdfResult.metadata.title,
+                    totalPages: pdfResult.metadata.totalPages,
+                    pages: pdfResult.pages
+                }
+            };
+        }
+        else if (isImage) {
             // For images, convert to base64
             const buffer = await response.arrayBuffer();
             const content = Buffer.from(buffer).toString('base64');
-            return { content, mimeType: contentType, isImage };
+            return { content, mimeType: contentType, metadata: { isImage } };
         }
         else {
             // For text content
             const content = await response.text();
-            return { content, mimeType: contentType, isImage };
+            return { content, mimeType: contentType, metadata: { isImage } };
         }
     }
     catch (error) {
@@ -291,269 +262,15 @@ export async function readFileFromUrl(url) {
         throw new Error(errorMessage);
     }
 }
-/**
- * Generate enhanced status message with total and remaining line information
- * @param readLines Number of lines actually read
- * @param offset Starting offset (line number)
- * @param totalLines Total lines in the file (if available)
- * @param isNegativeOffset Whether this is a tail operation
- * @returns Enhanced status message string
- */
-function generateEnhancedStatusMessage(readLines, offset, totalLines, isNegativeOffset = false) {
-    if (isNegativeOffset) {
-        // For tail operations (negative offset)
-        if (totalLines !== undefined) {
-            return `[Reading last ${readLines} lines (total: ${totalLines} lines)]`;
-        }
-        else {
-            return `[Reading last ${readLines} lines]`;
-        }
-    }
-    else {
-        // For normal reads (positive offset)
-        if (totalLines !== undefined) {
-            const endLine = offset + readLines;
-            const remainingLines = Math.max(0, totalLines - endLine);
-            if (offset === 0) {
-                return `[Reading ${readLines} lines from start (total: ${totalLines} lines, ${remainingLines} remaining)]`;
-            }
-            else {
-                return `[Reading ${readLines} lines from line ${offset} (total: ${totalLines} lines, ${remainingLines} remaining)]`;
-            }
-        }
-        else {
-            // Fallback when total lines unknown
-            if (offset === 0) {
-                return `[Reading ${readLines} lines from start]`;
-            }
-            else {
-                return `[Reading ${readLines} lines from line ${offset}]`;
-            }
-        }
-    }
-}
-/**
- * Read file content using smart positioning for optimal performance
- * @param filePath Path to the file (already validated)
- * @param offset Starting line number (negative for tail behavior)
- * @param length Maximum number of lines to read
- * @param mimeType MIME type of the file
- * @param includeStatusMessage Whether to include status headers (default: true)
- * @returns File result with content
- */
-async function readFileWithSmartPositioning(filePath, offset, length, mimeType, includeStatusMessage = true) {
-    const stats = await fs.stat(filePath);
-    const fileSize = stats.size;
-    // Check if the file is binary (but allow images to pass through)
-    const { isImage } = await getMimeTypeInfo(filePath);
-    if (!isImage) {
-        const isBinary = await isBinaryFile(filePath);
-        if (isBinary) {
-            // Return instructions instead of trying to read binary content
-            const instructions = getBinaryFileInstructions(filePath, mimeType);
-            throw new Error(instructions);
-        }
-    }
-    // Get total line count for enhanced status messages (only for smaller files)
-    const totalLines = await getFileLineCount(filePath);
-    // For negative offsets (tail behavior), use reverse reading
-    if (offset < 0) {
-        const requestedLines = Math.abs(offset);
-        if (fileSize > FILE_SIZE_LIMITS.LARGE_FILE_THRESHOLD && requestedLines <= READ_PERFORMANCE_THRESHOLDS.SMALL_READ_THRESHOLD) {
-            // Use efficient reverse reading for large files with small tail requests
-            return await readLastNLinesReverse(filePath, requestedLines, mimeType, includeStatusMessage, totalLines);
-        }
-        else {
-            // Use readline circular buffer for other cases
-            return await readFromEndWithReadline(filePath, requestedLines, mimeType, includeStatusMessage, totalLines);
-        }
-    }
-    // For positive offsets
-    else {
-        // For small files or reading from start, use simple readline
-        if (fileSize < FILE_SIZE_LIMITS.LARGE_FILE_THRESHOLD || offset === 0) {
-            return await readFromStartWithReadline(filePath, offset, length, mimeType, includeStatusMessage, totalLines);
-        }
-        // For large files with middle/end reads, try to estimate position
-        else {
-            // If seeking deep into file, try byte estimation
-            if (offset > READ_PERFORMANCE_THRESHOLDS.DEEP_OFFSET_THRESHOLD) {
-                return await readFromEstimatedPosition(filePath, offset, length, mimeType, includeStatusMessage, totalLines);
-            }
-            else {
-                return await readFromStartWithReadline(filePath, offset, length, mimeType, includeStatusMessage, totalLines);
-            }
-        }
-    }
-}
-/**
- * Read last N lines efficiently by reading file backwards in chunks
- */
-async function readLastNLinesReverse(filePath, n, mimeType, includeStatusMessage = true, fileTotalLines) {
-    const fd = await fs.open(filePath, 'r');
-    try {
-        const stats = await fd.stat();
-        const fileSize = stats.size;
-        let position = fileSize;
-        let lines = [];
-        let partialLine = '';
-        while (position > 0 && lines.length < n) {
-            const readSize = Math.min(READ_PERFORMANCE_THRESHOLDS.CHUNK_SIZE, position);
-            position -= readSize;
-            const buffer = Buffer.alloc(readSize);
-            await fd.read(buffer, 0, readSize, position);
-            const chunk = buffer.toString('utf-8');
-            const text = chunk + partialLine;
-            const chunkLines = text.split('\n');
-            partialLine = chunkLines.shift() || '';
-            lines = chunkLines.concat(lines);
-        }
-        // Add the remaining partial line if we reached the beginning
-        if (position === 0 && partialLine) {
-            lines.unshift(partialLine);
-        }
-        const result = lines.slice(-n); // Get exactly n lines
-        const content = includeStatusMessage
-            ? `${generateEnhancedStatusMessage(result.length, -n, fileTotalLines, true)}\n\n${result.join('\n')}`
-            : result.join('\n');
-        return { content, mimeType, isImage: false };
-    }
-    finally {
-        await fd.close();
-    }
-}
-/**
- * Read from end using readline with circular buffer
- */
-async function readFromEndWithReadline(filePath, requestedLines, mimeType, includeStatusMessage = true, fileTotalLines) {
-    const rl = createInterface({
-        input: createReadStream(filePath),
-        crlfDelay: Infinity
-    });
-    const buffer = new Array(requestedLines);
-    let bufferIndex = 0;
-    let totalLines = 0;
-    for await (const line of rl) {
-        buffer[bufferIndex] = line;
-        bufferIndex = (bufferIndex + 1) % requestedLines;
-        totalLines++;
-    }
-    rl.close();
-    // Extract lines in correct order
-    let result;
-    if (totalLines >= requestedLines) {
-        result = [
-            ...buffer.slice(bufferIndex),
-            ...buffer.slice(0, bufferIndex)
-        ].filter(line => line !== undefined);
-    }
-    else {
-        result = buffer.slice(0, totalLines);
-    }
-    const content = includeStatusMessage
-        ? `${generateEnhancedStatusMessage(result.length, -requestedLines, fileTotalLines, true)}\n\n${result.join('\n')}`
-        : result.join('\n');
-    return { content, mimeType, isImage: false };
-}
-/**
- * Read from start/middle using readline
- */
-async function readFromStartWithReadline(filePath, offset, length, mimeType, includeStatusMessage = true, fileTotalLines) {
-    const rl = createInterface({
-        input: createReadStream(filePath),
-        crlfDelay: Infinity
-    });
-    const result = [];
-    let lineNumber = 0;
-    for await (const line of rl) {
-        if (lineNumber >= offset && result.length < length) {
-            result.push(line);
-        }
-        if (result.length >= length)
-            break; // Early exit optimization
-        lineNumber++;
-    }
-    rl.close();
-    if (includeStatusMessage) {
-        const statusMessage = generateEnhancedStatusMessage(result.length, offset, fileTotalLines, false);
-        const content = `${statusMessage}\n\n${result.join('\n')}`;
-        return { content, mimeType, isImage: false };
-    }
-    else {
-        const content = result.join('\n');
-        return { content, mimeType, isImage: false };
-    }
-}
-/**
- * Read from estimated byte position for very large files
- */
-async function readFromEstimatedPosition(filePath, offset, length, mimeType, includeStatusMessage = true, fileTotalLines) {
-    // First, do a quick scan to estimate lines per byte
-    const rl = createInterface({
-        input: createReadStream(filePath),
-        crlfDelay: Infinity
-    });
-    let sampleLines = 0;
-    let bytesRead = 0;
-    for await (const line of rl) {
-        bytesRead += Buffer.byteLength(line, 'utf-8') + 1; // +1 for newline
-        sampleLines++;
-        if (bytesRead >= READ_PERFORMANCE_THRESHOLDS.SAMPLE_SIZE)
-            break;
-    }
-    rl.close();
-    if (sampleLines === 0) {
-        // Fallback to simple read
-        return await readFromStartWithReadline(filePath, offset, length, mimeType, includeStatusMessage, fileTotalLines);
-    }
-    // Estimate average line length and seek position
-    const avgLineLength = bytesRead / sampleLines;
-    const estimatedBytePosition = Math.floor(offset * avgLineLength);
-    // Create a new stream starting from estimated position
-    const fd = await fs.open(filePath, 'r');
-    try {
-        const stats = await fd.stat();
-        const startPosition = Math.min(estimatedBytePosition, stats.size);
-        const stream = createReadStream(filePath, { start: startPosition });
-        const rl2 = createInterface({
-            input: stream,
-            crlfDelay: Infinity
-        });
-        const result = [];
-        let lineCount = 0;
-        let firstLineSkipped = false;
-        for await (const line of rl2) {
-            // Skip first potentially partial line if we didn't start at beginning
-            if (!firstLineSkipped && startPosition > 0) {
-                firstLineSkipped = true;
-                continue;
-            }
-            if (result.length < length) {
-                result.push(line);
-            }
-            else {
-                break;
-            }
-            lineCount++;
-        }
-        rl2.close();
-        const content = includeStatusMessage
-            ? `${generateEnhancedStatusMessage(result.length, offset, fileTotalLines, false)}\n\n${result.join('\n')}`
-            : result.join('\n');
-        return { content, mimeType, isImage: false };
-    }
-    finally {
-        await fd.close();
-    }
-}
 /**
  * Read file content from the local filesystem
  * @param filePath Path to the file
- * @param offset Starting line number to read from (default: 0)
- * @param length Maximum number of lines to read (default: from config or 1000)
+ * @param options Read options (offset, length, sheet, range)
  * @returns File content or file result with metadata
  */
-export async function readFileFromDisk(filePath, offset = 0, length) {
+export async function readFileFromDisk(filePath, options) {
+    const { offset = 0, sheet, range } = options ?? {};
+    let { length } = options ?? {};
     // Add validation for required parameters
     if (!filePath || typeof filePath !== 'string') {
         throw new Error('Invalid file path provided');
@@ -563,7 +280,7 @@ export async function readFileFromDisk(filePath, offset = 0, length) {
         length = await getDefaultReadLength();
     }
     const validPath = await validatePath(filePath);
-    // Get file extension for telemetry using path module consistently
+    // Get file extension for telemetry
     const fileExtension = getFileExtension(validPath);
     // Check file size before attempting to read
     try {
@@ -582,37 +299,37 @@ export async function readFileFromDisk(filePath, offset = 0, length) {
         capture('server_read_file_error', { error: errorMessage, fileExtension: fileExtension });
         // If we can't stat the file, continue anyway and let the read operation handle errors
     }
-    // Detect the MIME type based on file extension
-    const { mimeType, isImage } = await getMimeTypeInfo(validPath);
     // Use withTimeout to handle potential hangs
     const readOperation = async () => {
-        if (isImage) {
-            // For image files, read as Buffer and convert to base64
-            // Images are always read in full, ignoring offset and length
-            const buffer = await fs.readFile(validPath);
-            const content = buffer.toString('base64');
-            return { content, mimeType, isImage };
+        // Get appropriate handler for this file type (async - includes binary detection)
+        const handler = await getFileHandler(validPath);
+        // Use handler to read the file
+        const result = await handler.read(validPath, {
+            offset,
+            length,
+            sheet,
+            range,
+            includeStatusMessage: true
+        });
+        // Return with content as string
+        // For images: content is already base64-encoded string from handler
+        // For text: content may be string or Buffer, convert to UTF-8 string
+        let content;
+        if (typeof result.content === 'string') {
+            content = result.content;
+        }
+        else if (result.metadata?.isImage) {
+            // Image buffer should be base64 encoded, not UTF-8 converted
+            content = result.content.toString('base64');
         }
         else {
-            // For all other files, use smart positioning approach
-            try {
-                return await readFileWithSmartPositioning(validPath, offset, length, mimeType, true);
-            }
-            catch (error) {
-                // If it's our binary file instruction error, return it as content
-                if (error instanceof Error && error.message.includes('Cannot read binary file as text:')) {
-                    return { content: error.message, mimeType: 'text/plain', isImage: false };
-                }
-                // If UTF-8 reading fails for other reasons, also check if it's binary
-                const isBinary = await isBinaryFile(validPath);
-                if (isBinary) {
-                    const instructions = getBinaryFileInstructions(validPath, mimeType);
-                    return { content: instructions, mimeType: 'text/plain', isImage: false };
-                }
-                // Only if it's truly not binary, then we have a real UTF-8 reading error
-                throw error;
-            }
+            content = result.content.toString('utf8');
         }
+        return {
+            content,
+            mimeType: result.mimeType,
+            metadata: result.metadata
+        };
     };
     // Execute with timeout
     const result = await withTimeout(readOperation(), FILE_OPERATION_TIMEOUTS.FILE_READ, `Read file operation for ${filePath}`, null);
@@ -625,15 +342,14 @@ export async function readFileFromDisk(filePath, offset = 0, length) {
 /**
  * Read a file from either the local filesystem or a URL
  * @param filePath Path to the file or URL
- * @param isUrl Whether the path is a URL
- * @param offset Starting line number to read from (default: 0)
- * @param length Maximum number of lines to read (default: from config or 1000)
+ * @param options Read options (isUrl, offset, length, sheet, range)
  * @returns File content or file result with metadata
  */
-export async function readFile(filePath, isUrl, offset, length) {
+export async function readFile(filePath, options) {
+    const { isUrl, offset, length, sheet, range } = options ?? {};
     return isUrl
         ? readFileFromUrl(filePath)
-        : readFileFromDisk(filePath, offset, length);
+        : readFileFromDisk(filePath, { offset, length, sheet, range });
 }
 /**
  * Read file content without status messages for internal operations
@@ -667,56 +383,19 @@ export async function readFileInternal(filePath, offset = 0, length) {
         return content;
     }
     // Handle offset/length by splitting on line boundaries while preserving line endings
-    const lines = splitLinesPreservingEndings(content);
+    const lines = TextFileHandler.splitLinesPreservingEndings(content);
     // Apply offset and length
     const selectedLines = lines.slice(offset, offset + length);
     // Join back together (this preserves the original line endings)
     return selectedLines.join('');
 }
-/**
- * Split text into lines while preserving original line endings with each line
- * @param content The text content to split
- * @returns Array of lines, each including its original line ending
- */
-function splitLinesPreservingEndings(content) {
-    if (!content)
-        return [''];
-    const lines = [];
-    let currentLine = '';
-    for (let i = 0; i < content.length; i++) {
-        const char = content[i];
-        currentLine += char;
-        // Check for line ending patterns
-        if (char === '\n') {
-            // LF or end of CRLF
-            lines.push(currentLine);
-            currentLine = '';
-        }
-        else if (char === '\r') {
-            // Could be CR or start of CRLF
-            if (i + 1 < content.length && content[i + 1] === '\n') {
-                // It's CRLF, include the \n as well
-                currentLine += content[i + 1];
-                i++; // Skip the \n in next iteration
-            }
-            // Either way, we have a complete line
-            lines.push(currentLine);
-            currentLine = '';
-        }
-    }
-    // Handle any remaining content (file not ending with line ending)
-    if (currentLine) {
-        lines.push(currentLine);
-    }
-    return lines;
-}
 export async function writeFile(filePath, content, mode = 'rewrite') {
     const validPath = await validatePath(filePath);
     // Get file extension for telemetry
     const fileExtension = getFileExtension(validPath);
     // Calculate content metrics
     const contentBytes = Buffer.from(content).length;
-    const lineCount = countLines(content);
+    const lineCount = TextFileHandler.countLines(content);
     // Capture file extension and operation details in telemetry without capturing the file path
     capture('server_write_file', {
         fileExtension: fileExtension,
@@ -724,24 +403,41 @@ export async function writeFile(filePath, content, mode = 'rewrite') {
         contentBytes: contentBytes,
         lineCount: lineCount
     });
-    // Use different fs methods based on mode
-    if (mode === 'append') {
-        await fs.appendFile(validPath, content);
-    }
-    else {
-        await fs.writeFile(validPath, content);
-    }
+    // Get appropriate handler for this file type (async - includes binary detection)
+    const handler = await getFileHandler(validPath);
+    // Use handler to write the file
+    await handler.write(validPath, content, mode);
 }
 export async function readMultipleFiles(paths) {
     return Promise.all(paths.map(async (filePath) => {
         try {
             const validPath = await validatePath(filePath);
             const fileResult = await readFile(validPath);
+            // Handle content conversion properly for images vs text
+            let content;
+            if (typeof fileResult.content === 'string') {
+                content = fileResult.content;
+            }
+            else if (fileResult.metadata?.isImage) {
+                content = fileResult.content.toString('base64');
+            }
+            else {
+                content = fileResult.content.toString('utf8');
+            }
             return {
                 path: filePath,
-                content: typeof fileResult === 'string' ? fileResult : fileResult.content,
-                mimeType: typeof fileResult === 'string' ? "text/plain" : fileResult.mimeType,
-                isImage: typeof fileResult === 'string' ? false : fileResult.isImage
+                content,
+                mimeType: fileResult.mimeType,
+                isImage: fileResult.metadata?.isImage ?? false,
+                isPdf: fileResult.metadata?.isPdf ?? false,
+                payload: fileResult.metadata?.isPdf ? {
+                    metadata: {
+                        author: fileResult.metadata.author,
+                        title: fileResult.metadata.title,
+                        totalPages: fileResult.metadata.totalPages ?? 0
+                    },
+                    pages: fileResult.metadata.pages ?? []
+                } : undefined
             };
         }
         catch (error) {
@@ -923,9 +619,9 @@ async function searchFilesNodeJS(rootPath, pattern) {
 }
 export async function getFileInfo(filePath) {
     const validPath = await validatePath(filePath);
+    // Get fs.stat as a fallback for any missing fields
     const stats = await fs.stat(validPath);
-    // Basic file info
-    const info = {
+    const fallbackInfo = {
         size: stats.size,
         created: stats.birthtime,
         modified: stats.mtime,
@@ -933,25 +629,114 @@ export async function getFileInfo(filePath) {
         isDirectory: stats.isDirectory(),
         isFile: stats.isFile(),
         permissions: stats.mode.toString(8).slice(-3),
+        fileType: 'text',
+        metadata: undefined,
     };
-    // For text files that aren't too large, also count lines
-    if (stats.isFile() && stats.size < FILE_SIZE_LIMITS.LINE_COUNT_LIMIT) {
-        try {
-            // Get MIME type information
-            const { mimeType, isImage } = await getMimeTypeInfo(validPath);
-            // Only count lines for non-image, likely text files
-            if (!isImage) {
-                const content = await fs.readFile(validPath, 'utf8');
-                const lineCount = countLines(content);
-                info.lineCount = lineCount;
-                info.lastLine = lineCount - 1; // Zero-indexed last line
-                info.appendPosition = lineCount; // Position to append at end
-            }
-        }
-        catch (error) {
-            // If reading fails, just skip the line count
-            // This could happen for binary files or very large files
+    // Get appropriate handler for this file type (async - includes binary detection)
+    const handler = await getFileHandler(validPath);
+    // Use handler to get file info, with fallback
+    let fileInfo;
+    try {
+        fileInfo = await handler.getInfo(validPath);
+    }
+    catch (error) {
+        // If handler fails, use fallback stats
+        fileInfo = fallbackInfo;
+    }
+    // Convert to legacy format (for backward compatibility)
+    // Use handler values with fallback to fs.stat values for any missing fields
+    const info = {
+        size: fileInfo.size ?? fallbackInfo.size,
+        created: fileInfo.created ?? fallbackInfo.created,
+        modified: fileInfo.modified ?? fallbackInfo.modified,
+        accessed: fileInfo.accessed ?? fallbackInfo.accessed,
+        isDirectory: fileInfo.isDirectory ?? fallbackInfo.isDirectory,
+        isFile: fileInfo.isFile ?? fallbackInfo.isFile,
+        permissions: fileInfo.permissions ?? fallbackInfo.permissions,
+        fileType: fileInfo.fileType ?? fallbackInfo.fileType,
+    };
+    // Add type-specific metadata from file handler
+    if (fileInfo.metadata) {
+        // For text files
+        if (fileInfo.metadata.lineCount !== undefined) {
+            info.lineCount = fileInfo.metadata.lineCount;
+            info.lastLine = fileInfo.metadata.lineCount - 1;
+            info.appendPosition = fileInfo.metadata.lineCount;
+        }
+        // For Excel files
+        if (fileInfo.metadata.sheets) {
+            info.sheets = fileInfo.metadata.sheets;
+            info.isExcelFile = true;
+        }
+        // For images
+        if (fileInfo.metadata.isImage) {
+            info.isImage = true;
+        }
+        // For PDF files
+        if (fileInfo.metadata.isPdf) {
+            info.isPdf = true;
+            info.totalPages = fileInfo.metadata.totalPages;
+            if (fileInfo.metadata.title)
+                info.title = fileInfo.metadata.title;
+            if (fileInfo.metadata.author)
+                info.author = fileInfo.metadata.author;
+        }
+        // For binary files
+        if (fileInfo.metadata.isBinary) {
+            info.isBinary = true;
         }
     }
     return info;
 }
+/**
+ * Write content to a PDF file.
+ * Can create a new PDF from a Markdown string, or modify an existing PDF using operations.
+ * @param filePath Path to the PDF file; in modification mode this is the PDF that is edited
+ * @param content Markdown string (for creation) or array of operations (for modification)
+ * @param outputPath Optional path to write the result to; if not provided, filePath is overwritten
+ * @param options Options passed to parseMarkdownToPdf in creation mode; not used in modification mode
+ */
+export async function writePdf(filePath, content, outputPath, options = {}) {
+    const validPath = await validatePath(filePath);
+    const fileExtension = getFileExtension(validPath);
+    if (typeof content === 'string') {
+        // --- PDF CREATION MODE ---
+        capture('server_write_pdf', {
+            fileExtension: fileExtension,
+            contentLength: content.length,
+            mode: 'create'
+        });
+        const pdfBuffer = await parseMarkdownToPdf(content, options);
+        // Use outputPath if provided, otherwise overwrite input file
+        const targetPath = outputPath ? await validatePath(outputPath) : validPath;
+        await fs.writeFile(targetPath, pdfBuffer);
+    }
+    else if (Array.isArray(content)) {
+        // Use outputPath if provided, otherwise overwrite input file
+        const targetPath = outputPath ? await validatePath(outputPath) : validPath;
+        const operations = [];
+        // Validate paths in operations
+        for (const o of content) {
+            if (o.type === 'insert') {
+                if (o.sourcePdfPath) {
+                    o.sourcePdfPath = await validatePath(o.sourcePdfPath);
+                }
+            }
+            operations.push(o);
+        }
+        capture('server_write_pdf', {
+            fileExtension: fileExtension,
+            operationCount: operations.length,
+            mode: 'modify',
+            deleteCount: operations.filter(op => op.type === 'delete').length,
+            insertCount: operations.filter(op => op.type === 'insert').length
+        });
+        // Perform the PDF editing
+        const modifiedPdfBuffer = await editPdf(validPath, operations);
+        // Write the modified PDF to the output path
+        await fs.writeFile(targetPath, modifiedPdfBuffer);
+    }
+    else {
+        throw new Error('Invalid content type for writePdf. Expected string (markdown) or array of operations.');
+    }
+}