npm - docxmlater - Versions diffs - 10.3.5 → 10.4.0 - Mend

docxmlater 10.3.5 → 10.4.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (185) hide show

package/README.md +158 -7
package/dist/core/Document.d.ts +102 -3
package/dist/core/Document.d.ts.map +1 -1
package/dist/core/Document.js +775 -50
package/dist/core/Document.js.map +1 -1
package/dist/core/DocumentContent.d.ts.map +1 -1
package/dist/core/DocumentContent.js +0 -8
package/dist/core/DocumentContent.js.map +1 -1
package/dist/core/DocumentGenerator.d.ts.map +1 -1
package/dist/core/DocumentGenerator.js +9 -5
package/dist/core/DocumentGenerator.js.map +1 -1
package/dist/core/DocumentParser.d.ts.map +1 -1
package/dist/core/DocumentParser.js +588 -102
package/dist/core/DocumentParser.js.map +1 -1
package/dist/core/RelationshipManager.d.ts.map +1 -1
package/dist/core/RelationshipManager.js +4 -3
package/dist/core/RelationshipManager.js.map +1 -1
package/dist/elements/Bookmark.d.ts +7 -0
package/dist/elements/Bookmark.d.ts.map +1 -1
package/dist/elements/Bookmark.js +24 -4
package/dist/elements/Bookmark.js.map +1 -1
package/dist/elements/BookmarkManager.d.ts.map +1 -1
package/dist/elements/BookmarkManager.js +4 -3
package/dist/elements/BookmarkManager.js.map +1 -1
package/dist/elements/CommonTypes.d.ts +2 -2
package/dist/elements/CommonTypes.d.ts.map +1 -1
package/dist/elements/CommonTypes.js +14 -1
package/dist/elements/CommonTypes.js.map +1 -1
package/dist/elements/Field.d.ts +1 -1
package/dist/elements/Field.d.ts.map +1 -1
package/dist/elements/Field.js +1 -1
package/dist/elements/Field.js.map +1 -1
package/dist/elements/Footer.d.ts +2 -0
package/dist/elements/Footer.d.ts.map +1 -1
package/dist/elements/Footer.js +6 -0
package/dist/elements/Footer.js.map +1 -1
package/dist/elements/Header.d.ts +2 -0
package/dist/elements/Header.d.ts.map +1 -1
package/dist/elements/Header.js +6 -0
package/dist/elements/Header.js.map +1 -1
package/dist/elements/Image.d.ts +1 -0
package/dist/elements/Image.d.ts.map +1 -1
package/dist/elements/Image.js +17 -2
package/dist/elements/Image.js.map +1 -1
package/dist/elements/Paragraph.d.ts +81 -1
package/dist/elements/Paragraph.d.ts.map +1 -1
package/dist/elements/Paragraph.js +515 -21
package/dist/elements/Paragraph.js.map +1 -1
package/dist/elements/Revision.d.ts +0 -1
package/dist/elements/Revision.d.ts.map +1 -1
package/dist/elements/Revision.js +0 -12
package/dist/elements/Revision.js.map +1 -1
package/dist/elements/RevisionManager.d.ts +0 -1
package/dist/elements/RevisionManager.d.ts.map +1 -1
package/dist/elements/RevisionManager.js +0 -2
package/dist/elements/RevisionManager.js.map +1 -1
package/dist/elements/Run.d.ts +16 -4
package/dist/elements/Run.d.ts.map +1 -1
package/dist/elements/Run.js +114 -22
package/dist/elements/Run.js.map +1 -1
package/dist/elements/Section.d.ts +7 -1
package/dist/elements/Section.d.ts.map +1 -1
package/dist/elements/Section.js +185 -4
package/dist/elements/Section.js.map +1 -1
package/dist/elements/Shape.js.map +1 -1
package/dist/elements/Table.d.ts +30 -1
package/dist/elements/Table.d.ts.map +1 -1
package/dist/elements/Table.js +357 -40
package/dist/elements/Table.js.map +1 -1
package/dist/elements/TableCell.d.ts +3 -0
package/dist/elements/TableCell.d.ts.map +1 -1
package/dist/elements/TableCell.js +30 -3
package/dist/elements/TableCell.js.map +1 -1
package/dist/elements/TableGridChange.d.ts +0 -1
package/dist/elements/TableGridChange.d.ts.map +1 -1
package/dist/elements/TableGridChange.js +0 -10
package/dist/elements/TableGridChange.js.map +1 -1
package/dist/elements/TableRow.d.ts +4 -0
package/dist/elements/TableRow.d.ts.map +1 -1
package/dist/elements/TableRow.js +31 -3
package/dist/elements/TableRow.js.map +1 -1
package/dist/formatting/AbstractNumbering.d.ts +5 -0
package/dist/formatting/AbstractNumbering.d.ts.map +1 -1
package/dist/formatting/AbstractNumbering.js +22 -0
package/dist/formatting/AbstractNumbering.js.map +1 -1
package/dist/formatting/NumberingLevel.d.ts.map +1 -1
package/dist/formatting/NumberingLevel.js +3 -3
package/dist/formatting/NumberingLevel.js.map +1 -1
package/dist/formatting/Style.d.ts +1 -0
package/dist/formatting/Style.d.ts.map +1 -1
package/dist/formatting/Style.js +25 -59
package/dist/formatting/Style.js.map +1 -1
package/dist/formatting/StylesManager.d.ts +1 -0
package/dist/formatting/StylesManager.d.ts.map +1 -1
package/dist/formatting/StylesManager.js +12 -0
package/dist/formatting/StylesManager.js.map +1 -1
package/dist/helpers/CleanupHelper.js.map +1 -1
package/dist/images/ImageOptimizer.d.ts.map +1 -1
package/dist/images/ImageOptimizer.js +0 -1
package/dist/images/ImageOptimizer.js.map +1 -1
package/dist/index.d.ts +1 -1
package/dist/index.d.ts.map +1 -1
package/dist/index.js.map +1 -1
package/dist/managers/DrawingManager.d.ts.map +1 -1
package/dist/managers/DrawingManager.js +4 -2
package/dist/managers/DrawingManager.js.map +1 -1
package/dist/types/formatting.d.ts +2 -2
package/dist/types/formatting.d.ts.map +1 -1
package/dist/types/formatting.js.map +1 -1
package/dist/utils/ChangelogGenerator.d.ts +2 -2
package/dist/utils/ChangelogGenerator.d.ts.map +1 -1
package/dist/utils/ChangelogGenerator.js +4 -5
package/dist/utils/ChangelogGenerator.js.map +1 -1
package/dist/utils/InMemoryRevisionAcceptor.d.ts.map +1 -1
package/dist/utils/InMemoryRevisionAcceptor.js +0 -1
package/dist/utils/InMemoryRevisionAcceptor.js.map +1 -1
package/dist/utils/RevisionAwareProcessor.d.ts +2 -2
package/dist/utils/RevisionAwareProcessor.d.ts.map +1 -1
package/dist/utils/RevisionAwareProcessor.js +2 -2
package/dist/utils/RevisionAwareProcessor.js.map +1 -1
package/dist/utils/SelectiveRevisionAcceptor.d.ts +0 -2
package/dist/utils/SelectiveRevisionAcceptor.d.ts.map +1 -1
package/dist/utils/SelectiveRevisionAcceptor.js +0 -26
package/dist/utils/SelectiveRevisionAcceptor.js.map +1 -1
package/dist/utils/ShadingResolver.d.ts.map +1 -1
package/dist/utils/ShadingResolver.js.map +1 -1
package/dist/utils/acceptRevisions.js +1 -1
package/dist/utils/acceptRevisions.js.map +1 -1
package/dist/utils/stripTrackedChanges.js +1 -1
package/dist/utils/stripTrackedChanges.js.map +1 -1
package/dist/utils/units.d.ts.map +1 -1
package/dist/utils/units.js +1 -1
package/dist/utils/units.js.map +1 -1
package/dist/validation/RevisionAutoFixer.d.ts +2 -1
package/dist/validation/RevisionAutoFixer.d.ts.map +1 -1
package/dist/validation/RevisionAutoFixer.js.map +1 -1
package/package.json +10 -1
package/src/constants/CLAUDE.md +28 -0
package/src/core/CLAUDE.md +4 -0
package/src/core/Document.ts +1888 -137
package/src/core/DocumentContent.ts +0 -11
package/src/core/DocumentGenerator.ts +11 -12
package/src/core/DocumentParser.ts +620 -139
package/src/core/RelationshipManager.ts +6 -3
package/src/elements/Bookmark.ts +39 -4
package/src/elements/BookmarkManager.ts +4 -3
package/src/elements/CLAUDE.md +18 -2
package/src/elements/CommonTypes.ts +35 -8
package/src/elements/Field.ts +1 -1
package/src/elements/Footer.ts +23 -0
package/src/elements/Header.ts +25 -0
package/src/elements/Image.ts +28 -5
package/src/elements/Paragraph.ts +1069 -41
package/src/elements/Revision.ts +0 -19
package/src/elements/RevisionManager.ts +1 -3
package/src/elements/Run.ts +265 -35
package/src/elements/Section.ts +214 -8
package/src/elements/Shape.ts +1 -1
package/src/elements/Table.ts +850 -61
package/src/elements/TableCell.ts +84 -10
package/src/elements/TableGridChange.ts +2 -16
package/src/elements/TableRow.ts +94 -9
package/src/formatting/AbstractNumbering.ts +42 -1
package/src/formatting/CLAUDE.md +4 -0
package/src/formatting/NumberingLevel.ts +11 -7
package/src/formatting/Style.ts +39 -71
package/src/formatting/StylesManager.ts +36 -0
package/src/helpers/CleanupHelper.ts +1 -1
package/src/images/ImageOptimizer.ts +0 -3
package/src/index.ts +1 -1
package/src/managers/DrawingManager.ts +5 -3
package/src/tracking/CLAUDE.md +30 -0
package/src/types/CLAUDE.md +39 -0
package/src/types/formatting.ts +2 -2
package/src/utils/CLAUDE.md +15 -0
package/src/utils/ChangelogGenerator.ts +4 -5
package/src/utils/InMemoryRevisionAcceptor.ts +0 -9
package/src/utils/RevisionAwareProcessor.ts +2 -3
package/src/utils/SelectiveRevisionAcceptor.ts +0 -39
package/src/utils/ShadingResolver.ts +0 -1
package/src/utils/acceptRevisions.ts +1 -1
package/src/utils/stripTrackedChanges.ts +1 -1
package/src/utils/units.ts +2 -1
package/src/validation/CLAUDE.md +40 -0
package/src/validation/RevisionAutoFixer.ts +2 -1

package/src/core/Document.ts CHANGED Viewed

@@ -3,17 +3,14 @@
  * Provides a simple interface for creating DOCX files without managing ZIP and XML manually
  */
-import { AlternateContent } from '../elements/AlternateContent';
 import { Bookmark } from '../elements/Bookmark';
 import { BookmarkManager } from '../elements/BookmarkManager';
 import { Comment } from '../elements/Comment';
-import { CustomXmlBlock } from '../elements/CustomXml';
 import { PreservedElement } from '../elements/PreservedElement';
-import { MathParagraph } from '../elements/MathElement';
 import { CommentManager } from '../elements/CommentManager';
 import { Endnote } from '../elements/Endnote';
 import { EndnoteManager } from '../elements/EndnoteManager';
-import { Field } from '../elements/Field';
+import { Field, ComplexField } from '../elements/Field';
 import { Footnote } from '../elements/Footnote';
 import { FootnoteManager } from '../elements/FootnoteManager';
 import { Footer } from '../elements/Footer';
@@ -77,7 +74,7 @@ function getLogger(): ILogger {
 // cleanupRevisionMetadata - cleanup metadata files after in-memory acceptance
 import { acceptAllRevisions, cleanupRevisionMetadata } from '../utils/acceptRevisions';
 // In-memory revision acceptance - used AFTER parsing, allows subsequent modifications
-import { acceptRevisionsInMemory, AcceptRevisionsResult } from '../utils/InMemoryRevisionAcceptor';
+import { acceptRevisionsInMemory } from '../utils/InMemoryRevisionAcceptor';
 import { stripTrackedChanges } from '../utils/stripTrackedChanges';
 import { diffText, diffHasUnchangedParts } from '../utils/textDiff';
 import { XMLBuilder } from '../xml/XMLBuilder';
@@ -333,9 +330,6 @@ export class Document {
   // TOC auto-population setting
   private autoPopulateTOCs = false;
-  // TOC field instruction sync setting (default: OFF to preserve original instructions)
-  private autoSyncTOCStyles = false;
   // Flag to skip document.xml regeneration after stripping tracked changes
   // When true, save() and toBuffer() will preserve the manually cleaned XML
   private skipDocumentXmlRegeneration = false;
@@ -558,6 +552,211 @@ export class Document {
     return doc;
   }
+  /**
+   * Creates a Document from Markdown text
+   *
+   * Parses common Markdown syntax and builds a DOCX document. Supports:
+   * - Headings (`#` through `######`)
+   * - Bold (`**text**`), italic (`*text*`), bold+italic (`***text***`)
+   * - Strikethrough (`~~text~~`)
+   * - Inline code (`` `code` ``) rendered in Courier New
+   * - Links (`[text](url)`)
+   * - Bullet lists (`- ` or `* `)
+   * - Numbered lists (`1. `)
+   * - Tables (`| col | col |` with `| --- |` separator)
+   * - Horizontal rules (`---`, `***`, `___`)
+   * - Blank lines as paragraph separators
+   *
+   * @param markdown - Markdown text to convert
+   * @param options - Optional document options
+   * @returns New Document populated with the parsed content
+   *
+   * @example
+   * ```typescript
+   * const doc = Document.fromMarkdown(`
+   * # Report Title
+   *
+   * This is the **introduction** with *emphasis*.
+   *
+   * ## Data
+   *
+   * | Name | Value |
+   * | --- | --- |
+   * | Alpha | 100 |
+   *
+   * - First item
+   * - Second item
+   * `);
+   * await doc.save('output.docx');
+   * ```
+   */
+  static fromMarkdown(markdown: string, options?: DocumentOptions): Document {
+    const doc = Document.create(options);
+    const lines = markdown.split('\n');
+    let i = 0;
+    while (i < lines.length) {
+      const line = lines[i]!;
+      // Skip blank lines
+      if (line.trim() === '') {
+        i++;
+        continue;
+      }
+      // Horizontal rule: ---, ***, ___ (3+ of same char, optional spaces)
+      if (/^\s{0,3}([-]{3,}|[*]{3,}|[_]{3,})\s*$/.test(line)) {
+        doc.addHorizontalRule();
+        i++;
+        continue;
+      }
+      // Heading
+      const headingMatch = /^(#{1,6})\s+(.+)$/.exec(line);
+      if (headingMatch) {
+        const level = headingMatch[1]!.length as 1 | 2 | 3 | 4 | 5 | 6;
+        const text = headingMatch[2]!;
+        const para = doc.addHeading('', level);
+        Document.applyInlineMarkdown(para, text);
+        i++;
+        continue;
+      }
+      // Table (starts with |)
+      if (line.trimStart().startsWith('|')) {
+        const tableLines: string[] = [];
+        while (i < lines.length && lines[i]!.trimStart().startsWith('|')) {
+          tableLines.push(lines[i]!);
+          i++;
+        }
+        const table = Document.parseMarkdownTable(tableLines);
+        if (table) {
+          doc.addTable(table);
+        }
+        continue;
+      }
+      // Bullet list item
+      const bulletMatch = /^(\s*)[-*+]\s+(.+)$/.exec(line);
+      if (bulletMatch) {
+        const text = bulletMatch[2]!;
+        const para = doc.createParagraph();
+        Document.applyInlineMarkdown(para, text);
+        para.setStyle('ListBullet');
+        i++;
+        continue;
+      }
+      // Numbered list item
+      const numberMatch = /^(\s*)\d+[.)]\s+(.+)$/.exec(line);
+      if (numberMatch) {
+        const text = numberMatch[2]!;
+        const para = doc.createParagraph();
+        Document.applyInlineMarkdown(para, text);
+        para.setStyle('ListNumber');
+        i++;
+        continue;
+      }
+      // Regular paragraph (may span multiple non-blank lines)
+      const paraLines: string[] = [line];
+      i++;
+      while (
+        i < lines.length &&
+        lines[i]!.trim() !== '' &&
+        !lines[i]!.trim().startsWith('#') &&
+        !lines[i]!.trim().startsWith('|') &&
+        !/^\s{0,3}([-]{3,}|[*]{3,}|[_]{3,})\s*$/.test(lines[i]!) &&
+        !/^(\s*)[-*+]\s+/.test(lines[i]!) &&
+        !/^(\s*)\d+[.)]\s+/.test(lines[i]!)
+      ) {
+        paraLines.push(lines[i]!);
+        i++;
+      }
+      const para = doc.createParagraph();
+      Document.applyInlineMarkdown(para, paraLines.join(' '));
+    }
+    return doc;
+  }
+  /**
+   * Parses inline Markdown formatting and adds runs to a paragraph.
+   * Handles bold, italic, strikethrough, inline code, and links.
+   * @internal
+   */
+  private static applyInlineMarkdown(para: Paragraph, text: string): void {
+    // Regex to match inline elements in priority order
+    const inlinePattern =
+      /(\*\*\*(.+?)\*\*\*|\*\*(.+?)\*\*|\*(.+?)\*|~~(.+?)~~|`([^`]+)`|\[([^\]]+)\]\(([^)]+)\))/g;
+    let lastIndex = 0;
+    let match: RegExpExecArray | null;
+    while ((match = inlinePattern.exec(text)) !== null) {
+      // Add plain text before this match
+      if (match.index > lastIndex) {
+        para.addText(text.slice(lastIndex, match.index));
+      }
+      if (match[2] !== undefined) {
+        // ***bold+italic***
+        para.addText(match[2], { bold: true, italic: true });
+      } else if (match[3] !== undefined) {
+        // **bold**
+        para.addText(match[3], { bold: true });
+      } else if (match[4] !== undefined) {
+        // *italic*
+        para.addText(match[4], { italic: true });
+      } else if (match[5] !== undefined) {
+        // ~~strikethrough~~
+        para.addText(match[5], { strike: true });
+      } else if (match[6] !== undefined) {
+        // `inline code`
+        para.addText(match[6], { font: 'Courier New' });
+      } else if (match[7] !== undefined && match[8] !== undefined) {
+        // [text](url)
+        para.addHyperlink(new Hyperlink({ url: match[8], text: match[7] }));
+      }
+      lastIndex = match.index + match[0]!.length;
+    }
+    // Add remaining plain text
+    if (lastIndex < text.length) {
+      para.addText(text.slice(lastIndex));
+    }
+  }
+  /**
+   * Parses Markdown table lines into a Table.
+   * @internal
+   */
+  private static parseMarkdownTable(lines: string[]): Table | null {
+    if (lines.length < 2) return null;
+    const parseRow = (line: string): string[] =>
+      line
+        .replace(/^\|/, '')
+        .replace(/\|$/, '')
+        .split('|')
+        .map((cell) => cell.trim());
+    const rows: string[][] = [];
+    for (let i = 0; i < lines.length; i++) {
+      const cells = parseRow(lines[i]!);
+      // Skip separator row (| --- | --- |)
+      if (cells.every((c) => /^:?-+:?$/.test(c))) continue;
+      rows.push(cells);
+    }
+    if (rows.length === 0) return null;
+    return Table.fromArray(rows);
+  }
   /**
    * Loads an existing Word document from a file path
    *
@@ -1461,6 +1660,83 @@ export class Document {
     return para;
   }
+  /**
+   * Creates a heading paragraph and appends it to the document
+   *
+   * Convenience method that creates a paragraph with the given text and
+   * applies a heading style (Heading1–Heading9). Equivalent to:
+   * ```typescript
+   * doc.createParagraph(text).setStyle(`Heading${level}`);
+   * ```
+   *
+   * @param text - Heading text content
+   * @param level - Heading level 1–9 (default: 1)
+   * @returns The created Paragraph for further customization
+   *
+   * @example
+   * ```typescript
+   * doc.addHeading('Introduction', 1);
+   * doc.addHeading('Background', 2);
+   * doc.addHeading('Methods', 2);
+   * doc.addHeading('Data Collection', 3);
+   * ```
+   */
+  addHeading(text: string, level: 1 | 2 | 3 | 4 | 5 | 6 | 7 | 8 | 9 = 1): Paragraph {
+    return this.createParagraph(text).setStyle(`Heading${level}`);
+  }
+  /**
+   * Inserts a page break into the document
+   *
+   * Creates a paragraph containing a page break element and appends it
+   * to the document body. This is the standard way to force a new page
+   * in OOXML (a paragraph with `w:br w:type="page"`).
+   *
+   * @returns The created Paragraph (allows further content after the break)
+   *
+   * @example
+   * ```typescript
+   * doc.addHeading('Chapter 1', 1);
+   * doc.createParagraph('Chapter 1 content...');
+   * doc.addPageBreak();
+   * doc.addHeading('Chapter 2', 1);
+   * ```
+   */
+  addPageBreak(): Paragraph {
+    const para = this.createParagraph();
+    const run = new Run('');
+    run.addBreak('page');
+    para.addRun(run);
+    return para;
+  }
+  /**
+   * Inserts a horizontal rule into the document
+   *
+   * Creates an empty paragraph with a bottom border that renders as a
+   * horizontal line. Uses a thin single-line border, which is the standard
+   * OOXML approach for horizontal rules (no dedicated HR element exists).
+   *
+   * @param color - Border color in hex without # (default: 'auto')
+   * @param size - Border thickness in eighths of a point (default: 4, ~0.5pt)
+   * @returns The created Paragraph
+   *
+   * @example
+   * ```typescript
+   * doc.createParagraph('Above the line');
+   * doc.addHorizontalRule();
+   * doc.createParagraph('Below the line');
+   *
+   * // Custom color and thickness
+   * doc.addHorizontalRule('FF0000', 12);
+   * ```
+   */
+  addHorizontalRule(color = 'auto', size = 4): Paragraph {
+    const para = this.createParagraph();
+    para.setBorder({ bottom: { style: 'single', size, color, space: 1 } });
+    return para;
+  }
   /**
    * Adds an existing table to the document body
    *
@@ -1545,6 +1821,32 @@ export class Document {
     return table;
   }
+  /**
+   * Creates a table from CSV data and appends it to the document
+   *
+   * Parses the CSV string into a table using `Table.fromCSV()` and adds
+   * it to the document body. Handles quoted fields, commas in values,
+   * and other RFC 4180 features.
+   *
+   * @param csv - CSV string to parse
+   * @param delimiter - Field delimiter (default: ',')
+   * @returns The created Table
+   *
+   * @example
+   * ```typescript
+   * doc.createTableFromCSV('Name,Age\nAlice,30\nBob,25');
+   *
+   * // From a TSV string
+   * doc.createTableFromCSV(tsvData, '\t');
+   * ```
+   */
+  createTableFromCSV(csv: string, delimiter = ','): Table {
+    const table = Table.fromCSV(csv, delimiter);
+    table._setStylesManager(this.stylesManager);
+    this.bodyElements.push(table);
+    return table;
+  }
   /**
    * Populates all TOCs in document XML
    * Extracted from replaceTableOfContents for reuse
@@ -2194,6 +2496,19 @@ export class Document {
     this.updateContentTypesWithImagesHeadersFootersAndComments();
   }
+  /**
+   * Saves the document to a file. Uses atomic write (temp file + rename) for crash safety.
+   * Always call dispose() after saving when done with the document.
+   *
+   * @param filePath - Output file path
+   * @throws {FileOperationError} If the file cannot be written
+   *
+   * @example
+   * ```typescript
+   * await doc.save('output.docx');
+   * doc.dispose();
+   * ```
+   */
   async save(filePath: string): Promise<void> {
     const logger = getLogger();
     logger.info('Saving document', { path: filePath, paragraphs: this.getParagraphCount() });
@@ -2236,7 +2551,7 @@ export class Document {
         const { promises: fs } = await import('fs');
         await fs.unlink(tempPath);
       } catch (cleanupErr) {
-        logger.debug('Failed to clean up temp file', { tempPath, error: String(cleanupErr) });
+        logger.warn('Failed to clean up temp file', { tempPath, error: String(cleanupErr) });
       }
       throw error; // Re-throw original error
     } finally {
@@ -2320,6 +2635,123 @@ export class Document {
     }
   }
+  /**
+   * Generates the document as a base64-encoded string
+   *
+   * Produces the same DOCX content as `toBuffer()` but encoded as base64.
+   * Useful for embedding in JSON API responses, storing in databases as text,
+   * passing through systems that don't support binary data, or constructing
+   * data URIs (see `toDataUri()`).
+   *
+   * @returns Promise resolving to a base64-encoded string of the DOCX file
+   *
+   * @example
+   * ```typescript
+   * // JSON API response
+   * const base64 = await doc.toBase64();
+   * res.json({ filename: 'report.docx', content: base64 });
+   *
+   * // Store in text-based database field
+   * await db.insert({ docBase64: await doc.toBase64() });
+   * ```
+   */
+  async toBase64(): Promise<string> {
+    const buffer = await this.toBuffer();
+    return buffer.toString('base64');
+  }
+  /**
+   * Generates the document as a data URI string
+   *
+   * Returns a complete `data:` URI with the DOCX MIME type and base64-encoded
+   * content. Can be used directly as an `href` for download links, embedded
+   * in HTML, or passed to APIs expecting data URIs.
+   *
+   * @returns Promise resolving to a data URI string
+   *
+   * @example
+   * ```typescript
+   * // HTML download link
+   * const uri = await doc.toDataUri();
+   * const html = `<a href="${uri}" download="report.docx">Download</a>`;
+   *
+   * // Embed in email HTML
+   * const dataUri = await doc.toDataUri();
+   * ```
+   */
+  async toDataUri(): Promise<string> {
+    const base64 = await this.toBase64();
+    return `data:application/vnd.openxmlformats-officedocument.wordprocessingml.document;base64,${base64}`;
+  }
+  /**
+   * Loads a document from a base64-encoded string
+   *
+   * The inverse of `toBase64()`. Creates a Document from a base64 string,
+   * useful for receiving documents from JSON APIs or text-based storage.
+   *
+   * @param base64 - Base64-encoded DOCX content
+   * @param options - Optional document configuration
+   * @returns Promise resolving to a Document instance
+   *
+   * @example
+   * ```typescript
+   * // Receive from API
+   * const doc = await Document.loadFromBase64(apiResponse.content);
+   * console.log(doc.toPlainText());
+   * ```
+   */
+  static async loadFromBase64(base64: string, options?: DocumentOptions): Promise<Document> {
+    const buffer = Buffer.from(base64, 'base64');
+    return Document.loadFromBuffer(buffer, options);
+  }
+  /**
+   * Creates an independent deep copy of this document
+   *
+   * Serializes the document to a buffer and reloads it, producing a
+   * completely independent clone with its own body elements, styles,
+   * numbering, images, and ZIP state. Changes to the clone do not
+   * affect the original and vice versa.
+   *
+   * Essential for template-based batch generation: load a template
+   * once, clone it N times, and fill each with different data.
+   *
+   * @returns Promise resolving to a new Document with identical content
+   *
+   * @example
+   * ```typescript
+   * // Template-based batch generation
+   * const template = await Document.load('template.docx');
+   *
+   * for (const record of data) {
+   *   const doc = await template.clone();
+   *   doc.fillTemplate(record);
+   *   await doc.save(`output-${record.id}.docx`);
+   *   doc.dispose();
+   * }
+   *
+   * template.dispose();
+   * ```
+   *
+   * @example
+   * ```typescript
+   * // Fork a document for parallel modifications
+   * const original = Document.create();
+   * original.addHeading('Shared Title', 1);
+   *
+   * const version1 = await original.clone();
+   * version1.createParagraph('Version 1 content');
+   *
+   * const version2 = await original.clone();
+   * version2.createParagraph('Version 2 content');
+   * ```
+   */
+  async clone(): Promise<Document> {
+    const buffer = await this.toBuffer();
+    return Document.loadFromBuffer(buffer);
+  }
   /**
    * Updates the document.xml file with current paragraphs
    */
@@ -2940,10 +3372,12 @@ export class Document {
     return divCount;
   }
+  /** Gets the optimizeForBrowser web setting. */
   getOptimizeForBrowser(): boolean {
     return this._webSettings.optimizeForBrowser;
   }
+  /** Sets the optimizeForBrowser web setting. */
   setOptimizeForBrowser(value: boolean): this {
     this._webSettings.optimizeForBrowser = value;
     this._webSettingsModified = true;
@@ -2952,10 +3386,12 @@ export class Document {
     return this;
   }
+  /** Gets the allowPNG web setting. */
   getAllowPNG(): boolean {
     return this._webSettings.allowPNG;
   }
+  /** Sets the allowPNG web setting. */
   setAllowPNG(value: boolean): this {
     this._webSettings.allowPNG = value;
     this._webSettingsModified = true;
@@ -4475,7 +4911,7 @@ export class Document {
       left: options?.cellMargins?.left ?? 115, // 0.08 inches
       right: options?.cellMargins?.right ?? 115, // 0.08 inches
     };
-    const skipSingleCellTables = options?.skipSingleCellTables !== false && !singleCellShading;
+    // Note: skipSingleCellTables option is accepted but not yet implemented
     // Statistics
     let tablesProcessed = 0;
@@ -5069,7 +5505,7 @@ export class Document {
   validateNumberingReferences(): number {
     let fixed = 0;
     const existingNumIds = new Set<number>(
-      this.numberingManager.getAllInstances().map((i: any) => i.getNumId())
+      this.numberingManager.getAllInstances().map((i) => i.getNumId())
     );
     for (const para of this.getAllParagraphs()) {
@@ -5261,6 +5697,24 @@ export class Document {
     let docPrId = 1;
+    // Collect existing paraIds to avoid collisions when generating new ones
+    const existingParaIds = new Set<string>();
+    const paragraphsNeedingIds: Paragraph[] = [];
+    const generateUniqueParaId = (): string => {
+      let id: string;
+      do {
+        // Generate 8-char uppercase hex string matching Word's w14:paraId format
+        // Per ECMA-376, ST_LongHexNumber MaxExclusive is 80000000 (must be < 0x80000000)
+        id = Math.floor(Math.random() * 0x7fffffff + 1)
+          .toString(16)
+          .toUpperCase()
+          .padStart(8, '0');
+      } while (existingParaIds.has(id));
+      existingParaIds.add(id);
+      return id;
+    };
     const processParagraph = (para: Paragraph) => {
       // Assign unique IDs to unregistered revisions
       for (const rev of para.getRevisions()) {
@@ -5281,6 +5735,13 @@ export class Document {
           item.getImageElement().setDocPrId(docPrId++);
         }
       }
+      // Track existing paraIds and paragraphs that need new ones
+      if (para.formatting.paraId) {
+        existingParaIds.add(para.formatting.paraId);
+      } else {
+        paragraphsNeedingIds.push(para);
+      }
     };
     for (const element of this.bodyElements) {
@@ -5296,6 +5757,14 @@ export class Document {
         }
       }
     }
+    // Generate w14:paraId and w14:textId for paragraphs that lack them (Word 2010+ requirement)
+    for (const para of paragraphsNeedingIds) {
+      para.formatting.paraId = generateUniqueParaId();
+      if (!para.formatting.textId) {
+        para.formatting.textId = generateUniqueParaId();
+      }
+    }
   }
   /**
@@ -5741,6 +6210,103 @@ export class Document {
     return this.numberingManager.createMultiLevelList();
   }
+  /**
+   * Creates a bullet list from an array of text items and appends it to the document
+   *
+   * Handles all numbering plumbing internally: creates a bullet list definition,
+   * creates paragraphs, and applies numbering to each one. Supports nested items
+   * via `{ text, level }` objects.
+   *
+   * @param items - Array of strings or `{ text, level }` objects. Strings default to level 0.
+   * @param formatting - Optional run formatting applied to all items
+   * @returns Array of created Paragraphs
+   *
+   * @example
+   * ```typescript
+   * // Simple flat list
+   * doc.addBulletListFromArray(['First item', 'Second item', 'Third item']);
+   *
+   * // Nested list
+   * doc.addBulletListFromArray([
+   *   'Top level',
+   *   { text: 'Nested item', level: 1 },
+   *   { text: 'Deeper item', level: 2 },
+   *   'Back to top',
+   * ]);
+   *
+   * // With formatting
+   * doc.addBulletListFromArray(['Bold item'], { bold: true });
+   * ```
+   */
+  addBulletListFromArray(
+    items: (string | { text: string; level?: number })[],
+    formatting?: RunFormatting
+  ): Paragraph[] {
+    if (items.length === 0) return [];
+    const numId = this.createBulletList();
+    return this.addListItems(numId, items, formatting);
+  }
+  /**
+   * Creates a numbered list from an array of text items and appends it to the document
+   *
+   * Handles all numbering plumbing internally: creates a numbered list definition,
+   * creates paragraphs, and applies numbering to each one. Supports nested items
+   * via `{ text, level }` objects.
+   *
+   * @param items - Array of strings or `{ text, level }` objects. Strings default to level 0.
+   * @param formatting - Optional run formatting applied to all items
+   * @returns Array of created Paragraphs
+   *
+   * @example
+   * ```typescript
+   * // Simple numbered list
+   * doc.addNumberedListFromArray(['First', 'Second', 'Third']);
+   *
+   * // Nested numbered list
+   * doc.addNumberedListFromArray([
+   *   'Chapter 1',
+   *   { text: 'Section 1.1', level: 1 },
+   *   { text: 'Section 1.2', level: 1 },
+   *   'Chapter 2',
+   * ]);
+   * ```
+   */
+  addNumberedListFromArray(
+    items: (string | { text: string; level?: number })[],
+    formatting?: RunFormatting
+  ): Paragraph[] {
+    if (items.length === 0) return [];
+    const numId = this.createNumberedList();
+    return this.addListItems(numId, items, formatting);
+  }
+  /**
+   * Internal helper that creates list paragraphs from items.
+   * @internal
+   */
+  private addListItems(
+    numId: number,
+    items: (string | { text: string; level?: number })[],
+    formatting?: RunFormatting
+  ): Paragraph[] {
+    const paragraphs: Paragraph[] = [];
+    for (const item of items) {
+      const text = typeof item === 'string' ? item : item.text;
+      const level = typeof item === 'string' ? 0 : (item.level ?? 0);
+      const para = this.createParagraph();
+      para.addText(text, formatting);
+      para.setNumbering(numId, level);
+      paragraphs.push(para);
+    }
+    return paragraphs;
+  }
   /**
    * Creates a new numbering instance that restarts numbering for an existing list
    *
@@ -7334,7 +7900,7 @@ export class Document {
     const fillPattern = new RegExp(`(w:fill=["'])${normalizedOld}(["'])`, 'gi');
     // Replace all occurrences
-    stylesXml = stylesXml.replace(fillPattern, (match, prefix, suffix) => {
+    stylesXml = stylesXml.replace(fillPattern, (_match, prefix, suffix) => {
       updateCount++;
       return `${prefix}${normalizedNew}${suffix}`;
     });
@@ -7343,7 +7909,7 @@ export class Document {
     // Matches: w:color="A5A5A5" within shd elements
     const colorPattern = new RegExp(`(<w:shd[^>]*w:color=["'])${normalizedOld}(["'])`, 'gi');
-    stylesXml = stylesXml.replace(colorPattern, (match, prefix, suffix) => {
+    stylesXml = stylesXml.replace(colorPattern, (_match, prefix, suffix) => {
       updateCount++;
       return `${prefix}${normalizedNew}${suffix}`;
     });
@@ -7413,27 +7979,6 @@ export class Document {
    * Helper method to process consecutive blank paragraphs
    * @private
    */
-  private processConsecutiveBlanks(
-    blanks: Paragraph[],
-    keepOne: boolean,
-    toRemove: Paragraph[]
-  ): void {
-    if (blanks.length === 0) return;
-    if (keepOne && blanks.length > 1) {
-      // Keep the first one, remove the rest
-      for (let i = 1; i < blanks.length; i++) {
-        const blank = blanks[i];
-        if (blank) {
-          toRemove.push(blank);
-        }
-      }
-    } else if (!keepOne) {
-      // Remove all
-      toRemove.push(...blanks);
-    }
-    // If keepOne is true and there's only 1 blank, don't remove it
-  }
   /**
    * Standardizes all bullet list symbols formatting (font, size, bold, color)
@@ -8031,7 +8576,7 @@ export class Document {
   private parseTOCFieldInstruction(instrText: string): number[] {
     const levels = new Set<number>();
     let hasOutlineSwitch = false;
-    let hasTableSwitch = false;
+    // hasTableSwitch tracked via \t switch parsing below
     // Normalize whitespace and quotes: trim input and replace &quot; with " for consistent parsing
     const normalizedText = instrText.trim().replace(/&quot;/g, '"');
@@ -8065,7 +8610,7 @@ export class Document {
     const tMatches = [...normalizedText.matchAll(tSwitchRegex)];
     for (const match of tMatches) {
-      hasTableSwitch = true;
+      // \t switch found — heading levels extracted from table style mappings
       const content = (match[1] || '').trim();
       if (!content) continue;
@@ -8450,6 +8995,7 @@ export class Document {
       }
       // Helper function to extract heading info from a parsed paragraph object
+      // eslint-disable-next-line @typescript-eslint/no-explicit-any
       const extractHeading = (para: any): void => {
         const pPr = para['w:pPr'];
         if (!pPr?.['w:pStyle']) {
@@ -8584,52 +9130,6 @@ export class Document {
     return headings;
   }
-  /**
-   * Legacy method - searches only bodyElements (doesn't search inside tables)
-   * Kept for compatibility but not recommended
-   * @deprecated Use findHeadingsForTOCFromXML instead
-   */
-  private findHeadingsForTOC(
-    levels: number[]
-  ): { level: number; text: string; bookmark: string }[] {
-    const headings: { level: number; text: string; bookmark: string }[] = [];
-    const levelSet = new Set(levels);
-    // Iterate through body elements
-    for (const element of this.bodyElements) {
-      if (element instanceof Paragraph) {
-        const para = element;
-        const formatting = para.getFormatting();
-        // Check if paragraph has a heading style (handle both "Heading1" and "Heading 1")
-        if (formatting.style) {
-          const styleMatch = /Heading\s*(\d+)/i.exec(formatting.style);
-          if (styleMatch?.[1]) {
-            const headingLevel = parseInt(styleMatch[1], 10);
-            // Check if this level should be included in TOC
-            if (levelSet.has(headingLevel)) {
-              const text = para.getText().trim();
-              if (text) {
-                // Create or get bookmark for this heading
-                const bookmark = this.bookmarkManager.createHeadingBookmark(text);
-                headings.push({
-                  level: headingLevel,
-                  text: text,
-                  bookmark: bookmark.getName(),
-                });
-              }
-            }
-          }
-        }
-      }
-    }
-    return headings;
-  }
   /**
    * Generates TOC XML structure with populated entries
    *
@@ -10047,14 +10547,100 @@ export class Document {
   }
   /**
-   * Gets the RevisionManager for track changes operations
-   *
-   * Provides access to the RevisionManager for managing tracked changes
-   * (insertions, deletions, formatting changes, etc.) in the document.
-   *
-   * @returns The RevisionManager instance managing this document's revisions
+   * Ensures a "Top of the Document" hyperlink exists above every 1x1 table
+   * except the first one. Skips tables that already have a _top link in the
+   * paragraph immediately above them.
    *
-   * @example
+   * @param options Optional configuration
+   * @param options.text Display text for inserted links (default: 'Top of the Document')
+   * @param options.formatting Optional RunFormatting for the hyperlink
+   * @returns Number of links inserted
+   */
+  ensureTopLinksAbove1x1Tables(options?: { text?: string; formatting?: RunFormatting }): number {
+    const linkText = options?.text || 'Top of the Document';
+    const formatting = options?.formatting;
+    // The inserted links target the _top bookmark, so make sure it is there first.
+    this.addTopBookmark();
+    let inserted = 0;
+    let firstSingleCellSeen = false;
+    // bodyElements grows while we iterate, so the length is re-read on every pass.
+    for (let idx = 0; idx < this.bodyElements.length; idx++) {
+      const candidate = this.bodyElements[idx];
+      const isSingleCell =
+        candidate instanceof Table &&
+        candidate.getRowCount() === 1 &&
+        candidate.getColumnCount() === 1;
+      if (!isSingleCell) {
+        continue;
+      }
+      // The first 1x1 table never receives a link.
+      if (!firstSingleCellSeen) {
+        firstSingleCellSeen = true;
+        continue;
+      }
+      // Leave the table alone when the element directly above already links to _top.
+      const before = idx > 0 ? this.bodyElements[idx - 1] : undefined;
+      if (before instanceof Paragraph && this._paragraphHasTopLink(before)) {
+        continue;
+      }
+      const para = new Paragraph();
+      const link = Hyperlink.createInternal('_top', linkText, {
+        color: '0000FF',
+        underline: 'single',
+        ...formatting,
+      });
+      para.addHyperlink(link);
+      this.bodyElements.splice(idx, 0, para);
+      inserted++;
+      // The table moved to idx + 1; step onto it so the loop increment moves past it.
+      idx++;
+    }
+    return inserted;
+  }
+  /**
+   * Checks whether a paragraph contains a hyperlink targeting the `_top` anchor.
+   *
+   * Three content shapes are recognised:
+   * - `Hyperlink` items whose `getAnchor()` is `_top`
+   * - `ComplexField` items that report `isHyperlinkField()` and whose parsed
+   *   hyperlink has anchor `_top`
+   * - `PreservedElement` items (raw XML passthrough) whose XML carries a
+   *   `w:anchor` attribute equal to `_top`
+   *
+   * The raw-XML test accepts single- or double-quoted attribute values and
+   * optional whitespace around `=`, because both are legal XML and a plain
+   * substring test for `w:anchor="_top"` would miss them.
+   *
+   * @param paragraph - Paragraph whose content items are inspected
+   * @returns `true` as soon as one matching item is found, otherwise `false`
+   * @internal
+   */
+  private _paragraphHasTopLink(paragraph: Paragraph): boolean {
+    // Back-reference \1 forces the closing quote to match the opening one.
+    const topAnchorAttr = /w:anchor\s*=\s*(["'])_top\1/;
+    for (const item of paragraph.getContent()) {
+      if (item instanceof Hyperlink && item.getAnchor() === '_top') {
+        return true;
+      }
+      if (item instanceof ComplexField && item.isHyperlinkField()) {
+        const parsed = item.getParsedHyperlink();
+        if (parsed?.anchor === '_top') {
+          return true;
+        }
+      }
+      // Loaded docs may have hyperlinks as PreservedElement (raw XML passthrough)
+      if (item instanceof PreservedElement && topAnchorAttr.test(item.getRawXml())) {
+        return true;
+      }
+    }
+    return false;
+  }
+  /**
+   * Gets the RevisionManager for track changes operations
+   *
+   * Provides access to the RevisionManager for managing tracked changes
+   * (insertions, deletions, formatting changes, etc.) in the document.
+   *
+   * @returns The RevisionManager instance managing this document's revisions
+   *
+   * @example
    * ```typescript
    * const revManager = doc.getRevisionManager();
    * const stats = revManager.getStats();
@@ -10731,6 +11317,7 @@ export class Document {
    * @param element - Element to bind
    * @internal
    */
+  // eslint-disable-next-line @typescript-eslint/no-explicit-any
   private bindTrackingToElement(element: any): void {
     // Set tracking context on element if it supports it
     if (element && typeof element._setTrackingContext === 'function') {
@@ -10970,6 +11557,7 @@ export class Document {
     this._settingsModified = true;
   }
+  /**
+   * Gets whether even/odd page headers and footers are enabled (w:evenAndOddHeaders).
+   *
+   * @returns The stored flag, or `false` when it is null or undefined
+   */
   getEvenAndOddHeaders(): boolean {
     return this._evenAndOddHeaders ?? false;
   }
@@ -11063,6 +11651,72 @@ export class Document {
     this._modifiedBooleanSettings.add('defaultTabStop');
   }
+  /**
+   * Sets the document's default font through the `Normal` style.
+   *
+   * Looks up the style with id `Normal`; when it is missing, a default
+   * paragraph style with that id is created and registered. The font (and the
+   * size, if given) is merged into the style's existing run formatting, so
+   * other run properties already present on the style are kept.
+   *
+   * @param fontName - Font family name (e.g., 'Calibri', 'Times New Roman', 'Arial')
+   * @param sizeInPoints - Optional font size in points (e.g., 11, 12, 14)
+   * @returns This document for chaining
+   *
+   * @example
+   * ```typescript
+   * const doc = Document.create();
+   * doc.setDefaultFont('Times New Roman', 12);
+   * doc.createParagraph('This text will be in Times New Roman 12pt');
+   * ```
+   */
+  setDefaultFont(fontName: string, sizeInPoints?: number): this {
+    let base = this.stylesManager.getStyle('Normal');
+    if (!base) {
+      // No Normal style yet: register one so there is something to carry the font.
+      base = new Style({
+        styleId: 'Normal',
+        name: 'Normal',
+        type: 'paragraph',
+        isDefault: true,
+      });
+      this.stylesManager.addStyle(base);
+    }
+    const merged: RunFormatting = {
+      ...(base.getRunFormatting() ?? {}),
+      font: fontName,
+      // Only touch the size when the caller supplied one.
+      ...(sizeInPoints !== undefined ? { size: sizeInPoints } : {}),
+    };
+    base.setRunFormatting(merged);
+    return this;
+  }
+  /**
+   * Sets the document's default font size through the `Normal` style.
+   *
+   * Creates and registers a default `Normal` paragraph style when none exists,
+   * then merges the size into the style's existing run formatting.
+   *
+   * @param sizeInPoints - Font size in points (e.g., 10, 11, 12, 14)
+   * @returns This document for chaining
+   *
+   * @example
+   * ```typescript
+   * doc.setDefaultFontSize(14);
+   * ```
+   */
+  setDefaultFontSize(sizeInPoints: number): this {
+    let base = this.stylesManager.getStyle('Normal');
+    if (!base) {
+      base = new Style({
+        styleId: 'Normal',
+        name: 'Normal',
+        type: 'paragraph',
+        isDefault: true,
+      });
+      this.stylesManager.addStyle(base);
+    }
+    const current = base.getRunFormatting() ?? {};
+    const merged = { ...current, size: sizeInPoints };
+    base.setRunFormatting(merged);
+    return this;
+  }
   /**
    * Gets whether fields are updated on document open (w:updateFields)
    */
@@ -11546,19 +12200,31 @@ export class Document {
     return this.commentManager.getAllComments();
   }
+  /**
+   * Returns the footnote manager for advanced footnote operations.
+   *
+   * @returns The `FootnoteManager` instance held by this document (not a copy)
+   */
   getFootnoteManager(): FootnoteManager {
     return this.footnoteManager;
   }
+  /**
+   * Returns the endnote manager for advanced endnote operations.
+   *
+   * @returns The `EndnoteManager` instance held by this document (not a copy)
+   */
   getEndnoteManager(): EndnoteManager {
     return this.endnoteManager;
   }
+  /**
+   * Creates a new footnote with the given text via the footnote manager.
+   *
+   * Also sets the internal `_footnotesModified` flag before delegating.
+   * NOTE(review): this method only delegates to `FootnoteManager.createFootnote`;
+   * whether a reference run is inserted into the body is decided there — confirm.
+   *
+   * @param text - The footnote text content
+   * @returns The created Footnote object
+   */
   createFootnote(text: string): Footnote {
     this._footnotesModified = true;
     return this.footnoteManager.createFootnote(text);
   }
+  /**
+   * Creates a new endnote with the given text and adds a reference in the document.
+   * @param text - The endnote text content
+   * @returns The created Endnote object
+   */
   createEndnote(text: string): Endnote {
     this._endnotesModified = true;
     return this.endnoteManager.createEndnote(text);
@@ -12332,6 +12998,34 @@ export class Document {
     return count;
   }
+  /**
+   * Removes all body content from the document
+   *
+   * Clears all paragraphs, tables, and other body elements while
+   * preserving the document shell (styles, numbering, settings,
+   * properties, headers, footers). The document remains valid and
+   * new content can be added after clearing.
+   *
+   * Only the body element list is reset; no manager or setting is touched
+   * by this method.
+   *
+   * @returns This document for chaining
+   *
+   * @example
+   * ```typescript
+   * // Clear and rebuild content
+   * doc.clear();
+   * doc.addHeading('Fresh Start', 1);
+   * doc.createParagraph('New content here.');
+   *
+   * // Use as a template reset
+   * const template = await Document.load('template.docx');
+   * template.clear();
+   * // Styles and settings preserved, content gone
+   * ```
+   */
+  clear(): this {
+    // A fresh array is assigned rather than truncating in place, so any
+    // previously obtained reference to the old array keeps its elements.
+    this.bodyElements = [];
+    return this;
+  }
   /**
    * Cleans up resources and clears all managers
    * Call this after saving in long-running processes to free memory
@@ -13808,6 +14502,153 @@ export class Document {
     return trackChanges ? { count, revisions } : { count };
   }
+  /**
+   * Fills template placeholders with values using cross-run replacement
+   *
+   * For every key in `data`, builds the placeholder `open + key + close`
+   * (default `{{key}}`) and calls `replaceTextCrossRun` on each paragraph
+   * returned by `getAllParagraphs()`. Cross-run matching means a placeholder
+   * that Word has fragmented across several runs (e.g., `{{` in one run,
+   * `name` in another, `}}` in a third) is still found.
+   *
+   * Keys are processed one after another in `Object.entries` order. A value
+   * that itself contains a placeholder for a later key will therefore be
+   * substituted again when that later key is processed.
+   *
+   * A placeholder that would be the empty string (empty delimiters combined
+   * with an empty key) is skipped, since searching for an empty string has no
+   * meaningful result.
+   *
+   * @param data - Key-value pairs where keys match placeholder names
+   * @param options - Template options
+   * @param options.delimiters - Custom open/close delimiters (default: `['{{', '}}']`)
+   * @returns Total number of replacements reported by `replaceTextCrossRun`
+   *
+   * @example
+   * ```typescript
+   * // Document contains: "Dear {{name}}, your order {{orderId}} is ready."
+   * const count = doc.fillTemplate({
+   *   name: 'Alice',
+   *   orderId: 'ORD-12345',
+   * });
+   * // Result: "Dear Alice, your order ORD-12345 is ready."
+   * ```
+   *
+   * @example
+   * ```typescript
+   * // Custom delimiters
+   * doc.fillTemplate(
+   *   { title: 'Report', date: '2024-01-15' },
+   *   { delimiters: ['<<', '>>'] }
+   * );
+   * ```
+   */
+  fillTemplate(data: Record<string, string>, options?: { delimiters?: [string, string] }): number {
+    const [open, close] = options?.delimiters ?? ['{{', '}}'];
+    let totalCount = 0;
+    // Collected once; the same paragraph list is reused for every key.
+    const allParagraphs = this.getAllParagraphs();
+    for (const [key, value] of Object.entries(data)) {
+      const placeholder = `${open}${key}${close}`;
+      // Guard against an empty search string (empty delimiters + empty key).
+      if (placeholder.length === 0) {
+        continue;
+      }
+      for (const para of allParagraphs) {
+        totalCount += para.replaceTextCrossRun(placeholder, value);
+      }
+    }
+    return totalCount;
+  }
+  /**
+   * Highlights every occurrence of a piece of text
+   *
+   * Thin convenience wrapper around `findAndFormat()`: the chosen colour is
+   * passed as the `highlight` run-formatting property, and searching and
+   * range formatting are handled there.
+   *
+   * @param text - Text to search for
+   * @param color - Highlight color (default: 'yellow')
+   * @param options - Search options
+   * @param options.caseSensitive - Match case exactly (default: false)
+   * @returns Number of matches highlighted
+   *
+   * @example
+   * ```typescript
+   * // Highlight all occurrences of "important" in yellow
+   * doc.findAndHighlight('important');
+   *
+   * // Red highlight, case-sensitive
+   * doc.findAndHighlight('ERROR', 'red', { caseSensitive: true });
+   * ```
+   */
+  findAndHighlight(
+    text: string,
+    color:
+      | 'yellow'
+      | 'green'
+      | 'cyan'
+      | 'magenta'
+      | 'blue'
+      | 'red'
+      | 'darkBlue'
+      | 'darkCyan'
+      | 'darkGreen'
+      | 'darkMagenta'
+      | 'darkRed'
+      | 'darkYellow'
+      | 'darkGray'
+      | 'lightGray'
+      | 'black' = 'yellow',
+    options?: { caseSensitive?: boolean }
+  ): number {
+    const highlightOnly: Partial<RunFormatting> = { highlight: color };
+    return this.findAndFormat(text, highlightOnly, options);
+  }
+  /**
+   * Finds all occurrences of text and applies formatting
+   *
+   * For each paragraph from `getAllParagraphs()`, collects matches with
+   * `findTextCrossRun` (which searches across run boundaries) and applies the
+   * given run formatting to each matched range via `applyFormattingToRange`.
+   * This is the general-purpose version of `findAndHighlight()`.
+   *
+   * An empty search string matches nothing and returns 0 without touching
+   * the document.
+   *
+   * @param text - Text to search for
+   * @param formatting - RunFormatting to apply to matches
+   * @param options - Search options
+   * @param options.caseSensitive - Match case exactly (default: false)
+   * @returns Number of matches formatted
+   *
+   * @example
+   * ```typescript
+   * // Bold all occurrences of "warning"
+   * doc.findAndFormat('warning', { bold: true, color: 'FF0000' });
+   *
+   * // Strikethrough deprecated terms
+   * doc.findAndFormat('deprecated', { strike: true, color: '888888' });
+   *
+   * // Apply multiple styles to a term
+   * doc.findAndFormat('critical', {
+   *   bold: true,
+   *   highlight: 'red',
+   *   underline: 'single',
+   * });
+   * ```
+   */
+  findAndFormat(
+    text: string,
+    formatting: Partial<RunFormatting>,
+    options?: { caseSensitive?: boolean }
+  ): number {
+    // Searching for nothing is treated as "no matches".
+    if (text.length === 0) {
+      return 0;
+    }
+    let totalMatches = 0;
+    for (const para of this.getAllParagraphs()) {
+      const matches = para.findTextCrossRun(text, options);
+      // Walk the matches last-to-first so formatting a later range cannot
+      // disturb the offsets of the earlier ones still to be processed.
+      for (const match of [...matches].reverse()) {
+        para.applyFormattingToRange(match.offset, match.offset + match.text.length, formatting);
+      }
+      totalMatches += matches.length;
+    }
+    return totalMatches;
+  }
   /**
    * Gets the total word count in the document
    *
@@ -13930,73 +14771,867 @@ export class Document {
   }
   /**
-   * Removes a paragraph from the document
-   * @param paragraphOrIndex - The paragraph object or its index
-   * @returns True if the paragraph was removed, false otherwise
+   * Returns comprehensive document statistics in a single call
+   *
+   * Aggregates word count, character counts, element counts, and structural
+   * metrics. More efficient than calling individual methods since shared
+   * data (like the paragraph list) is computed once.
+   *
+   * @returns Object with all document metrics
+   *
+   * @example
+   * ```typescript
+   * const stats = doc.getStatistics();
+   * console.log(`Words: ${stats.words}, Paragraphs: ${stats.paragraphs}`);
+   * console.log(`Tables: ${stats.tables}, Images: ${stats.images}`);
+   * ```
    */
-  removeParagraph(paragraphOrIndex: Paragraph | number): boolean {
-    let index: number;
+  getStatistics(): {
+    words: number;
+    characters: number;
+    charactersNoSpaces: number;
+    paragraphs: number;
+    tables: number;
+    images: number;
+    headings: number;
+    lists: number;
+    hyperlinks: number;
+    bookmarks: number;
+    footnotes: number;
+    endnotes: number;
+    comments: number;
+    sections: number;
+  } {
+    const allParagraphs = this.getAllParagraphs();
+    const tables = this.getTables();
-    if (typeof paragraphOrIndex === 'number') {
-      index = paragraphOrIndex;
-    } else {
-      // Find the index of the paragraph
-      index = this.bodyElements.indexOf(paragraphOrIndex);
+    let words = 0;
+    let characters = 0;
+    let charactersNoSpaces = 0;
+    let headings = 0;
+    let lists = 0;
+    const counted = new Set<Paragraph>();
+    for (const para of allParagraphs) {
+      if (counted.has(para)) continue;
+      counted.add(para);
+      const text = para.getText();
+      characters += text.length;
+      charactersNoSpaces += text.replace(/\s/g, '').length;
+      const trimmed = text.trim();
+      if (trimmed) {
+        words += trimmed.split(/\s+/).filter((w) => w.length > 0).length;
+      }
+      if (para.detectHeadingLevel() !== null) headings++;
+      if (para.hasNumbering()) lists++;
     }
-    if (index >= 0 && index < this.bodyElements.length) {
-      const element = this.bodyElements[index];
-      if (element instanceof Paragraph) {
-        // When tracking enabled, wrap content in w:del instead of removing
-        if (this.trackChangesEnabled && this.trackingContext.isEnabled()) {
-          const runs = element.getRuns();
-          if (runs.length > 0) {
-            const author = this.trackingContext.getAuthor();
-            const deletion = Revision.createDeletion(author, runs);
-            this.trackingContext.getRevisionManager().register(deletion);
-            element.addRevision(deletion);
+    // Count table cell text too (for tables not traversed via getAllParagraphs)
+    for (const table of tables) {
+      for (const row of table.getRows()) {
+        for (const cell of row.getCells()) {
+          for (const para of cell.getParagraphs()) {
+            if (counted.has(para)) continue;
+            counted.add(para);
+            const text = para.getText();
+            characters += text.length;
+            charactersNoSpaces += text.replace(/\s/g, '').length;
+            const trimmed = text.trim();
+            if (trimmed) {
+              words += trimmed.split(/\s+/).filter((w) => w.length > 0).length;
+            }
           }
-          return true;
         }
-        this.bodyElements.splice(index, 1);
-        return true;
       }
     }
-    return false;
+    return {
+      words,
+      characters,
+      charactersNoSpaces,
+      paragraphs: allParagraphs.length,
+      tables: tables.length,
+      images: this.imageManager.getAllImages().length,
+      headings,
+      lists,
+      hyperlinks: this.getHyperlinks().length,
+      bookmarks: this.bookmarkManager.getAllBookmarks().length,
+      footnotes: this.footnoteManager.getAllFootnotes().length,
+      endnotes: this.endnoteManager.getAllEndnotes().length,
+      comments: this.commentManager.getAllComments().length,
+      sections: 1, // Base section; multi-section docs add via paragraph section properties
+    };
   }
   /**
-   * Removes a table from the document
-   * @param tableOrIndex - The table object or its index
-   * @returns True if the table was removed, false otherwise
+   * Iterates over top-level paragraphs in the document body (not inside tables)
+   *
+   * Calls the callback for each Paragraph that is a direct child of the body.
+   * Paragraphs inside table cells are NOT included — use `getAllParagraphs()`
+   * or `walkElements()` for those. Supports early termination by returning `false`.
+   *
+   * @param callback - Function called for each paragraph. Return `false` to stop.
+   * @returns Number of paragraphs visited
+   *
+   * @example
+   * ```typescript
+   * // Bold all top-level paragraphs
+   * doc.forEachParagraph((para) => {
+   *   para.getRuns().forEach(r => r.setBold(true));
+   * });
+   *
+   * // Find first paragraph matching criteria
+   * let found: Paragraph | undefined;
+   * doc.forEachParagraph((para) => {
+   *   if (para.getText().includes('Summary')) {
+   *     found = para;
+   *     return false;
+   *   }
+   * });
+   * ```
    */
-  removeTable(tableOrIndex: Table | number): boolean {
-    let index: number;
-    if (typeof tableOrIndex === 'number') {
-      // If number provided, find the nth table
-      const tables = this.getTables();
-      if (tableOrIndex >= 0 && tableOrIndex < tables.length) {
-        const table = tables[tableOrIndex];
-        if (!table) return false;
-        index = this.bodyElements.indexOf(table);
-      } else {
-        return false;
+  forEachParagraph(callback: (paragraph: Paragraph, index: number) => void | false): number {
+    let count = 0;
+    let paraIndex = 0;
+    for (const element of this.bodyElements) {
+      if (element instanceof Paragraph) {
+        const result = callback(element, paraIndex);
+        count++;
+        paraIndex++;
+        if (result === false) break;
       }
-    } else {
-      // Find the index of the table
-      index = this.bodyElements.indexOf(tableOrIndex);
     }
+    return count;
+  }
-    if (index >= 0 && index < this.bodyElements.length) {
-      const element = this.bodyElements[index];
+  /**
+   * Iterates over top-level tables in the document body
+   *
+   * Calls the callback for each Table that is a direct child of the body.
+   * Supports early termination by returning `false`.
+   *
+   * @param callback - Function called for each table. Return `false` to stop.
+   * @returns Number of tables visited
+   *
+   * @example
+   * ```typescript
+   * // Remove empty rows from all tables
+   * doc.forEachTable((table) => {
+   *   table.removeEmptyRows();
+   * });
+   *
+   * // Find first table with more than 5 rows
+   * let bigTable: Table | undefined;
+   * doc.forEachTable((table) => {
+   *   if (table.getRowCount() > 5) {
+   *     bigTable = table;
+   *     return false;
+   *   }
+   * });
+   * ```
+   */
+  forEachTable(callback: (table: Table, index: number) => void | false): number {
+    let count = 0;
+    let tableIndex = 0;
+    for (const element of this.bodyElements) {
       if (element instanceof Table) {
-        this.bodyElements.splice(index, 1);
-        return true;
+        const result = callback(element, tableIndex);
+        count++;
+        tableIndex++;
+        if (result === false) break;
       }
     }
+    return count;
+  }
+  /**
+   * Returns the document's text as one plain string.
+   *
+   * Takes the text of every paragraph returned by `getAllParagraphs()` and
+   * joins the pieces with `separator`.
+   *
+   * @param separator - String to insert between paragraphs (default: '\n')
+   * @returns Plain text content of the entire document
+   *
+   * @example
+   * ```typescript
+   * const text = doc.toPlainText();
+   * console.log(text);
+   *
+   * // With custom separator
+   * const singleLine = doc.toPlainText(' ');
+   * ```
+   */
+  toPlainText(separator = '\n'): string {
+    const chunks: string[] = [];
+    for (const paragraph of this.getAllParagraphs()) {
+      chunks.push(paragraph.getText());
+    }
+    return chunks.join(separator);
+  }
+  /**
+   * Converts the document to Markdown format
+   *
+   * Walks the top-level body elements in order. Paragraphs are rendered by
+   * `paragraphToMarkdown()` and tables by `tableToMarkdown()`; every rendered
+   * element is followed by one blank line, and trailing blank lines are
+   * stripped from the result. Other element types are skipped.
+   *
+   * The helpers produce:
+   * - Headings → `#` / `##` / `###` etc.
+   * - Bold/italic runs → `**bold**` / `*italic*`
+   * - Hyperlinks → `[text](url)`
+   * - Tables → pipe-delimited Markdown tables with a separator row
+   * - Numbered/bulleted lists → `1.` / `-` prefixes
+   * - Regular paragraphs → plain text
+   *
+   * @returns Markdown string representation of the document
+   *
+   * @example
+   * ```typescript
+   * const md = doc.toMarkdown();
+   * console.log(md);
+   * // # Document Title
+   * //
+   * // Opening paragraph text.
+   * //
+   * // ## Section 1
+   * //
+   * // | Name | Age |
+   * // | --- | --- |
+   * // | Alice | 30 |
+   * ```
+   */
+  toMarkdown(): string {
+    const output: string[] = [];
+    for (const node of this.bodyElements) {
+      if (node instanceof Table) {
+        output.push(...this.tableToMarkdown(node), '');
+        continue;
+      }
+      if (!(node instanceof Paragraph)) {
+        // SDT, AlternateContent, etc. have no Markdown rendering here.
+        continue;
+      }
+      const rendered = this.paragraphToMarkdown(node);
+      if (rendered !== null) {
+        output.push(rendered, '');
+      }
+    }
+    // Drop the blank separator line(s) left at the end.
+    let end = output.length;
+    while (end > 0 && output[end - 1] === '') {
+      end--;
+    }
+    return output.slice(0, end).join('\n');
+  }
+  /**
+   * Renders one paragraph as a single Markdown line.
+   *
+   * - Returns `null` for a paragraph with no rendered text and no numbering.
+   * - Heading levels 1-6 become `#`-prefixed lines.
+   * - Numbered paragraphs become `- text` when the style name contains
+   *   "bullet" (case-insensitive), otherwise `1. text`.
+   * - Anything else is returned as its inline Markdown text.
+   *
+   * @param para - Paragraph to render
+   * @returns The Markdown line, or `null` when the paragraph should be omitted
+   * @internal
+   */
+  private paragraphToMarkdown(para: Paragraph): string | null {
+    const body = this.paragraphContentToMarkdown(para);
+    if (!body && !para.hasNumbering()) {
+      return null;
+    }
+    // Headings take precedence over list rendering.
+    const level = para.detectHeadingLevel();
+    if (level !== null && level >= 1 && level <= 6) {
+      return '#'.repeat(level) + ' ' + body;
+    }
+    if (!para.hasNumbering()) {
+      return body;
+    }
+    // Bullet vs. number is decided from the style name alone.
+    const styleName = para.getStyle()?.toLowerCase();
+    const marker = styleName?.includes('bullet') ? '-' : '1.';
+    return `${marker} ${body}`;
+  }
+  /**
+   * Converts paragraph inline content to Markdown with formatting.
+   *
+   * Only `Run` and `Hyperlink` items are rendered; other content items are
+   * ignored.
+   *
+   * Runs:
+   * - Empty runs are skipped.
+   * - A run whose font name starts with a known monospace family is emitted
+   *   as inline code (`` `text` ``) with no other markers.
+   * - Otherwise bold/italic (`***`, `**`, `*`) and strikethrough (`~~`) markers
+   *   are wrapped around the run's text. Leading and trailing whitespace is
+   *   kept outside the markers, because Markdown does not recognise emphasis
+   *   whose delimiters touch whitespace on the inside (`**bold **`).
+   *   Whitespace-only runs are emitted unchanged.
+   *
+   * Hyperlinks:
+   * - Rendered as `[text](target)`. The target is the URL, or `#anchor` for
+   *   links that only have an internal anchor. The text falls back to the
+   *   target when the link has no text.
+   *
+   * @param para - Paragraph whose content is rendered
+   * @returns Concatenated inline Markdown (may be an empty string)
+   * @internal
+   */
+  private paragraphContentToMarkdown(para: Paragraph): string {
+    const monospaceFont =
+      /^(courier|consolas|monaco|menlo|source code|fira code|jetbrains mono)/i;
+    const parts: string[] = [];
+    for (const item of para.getContent()) {
+      if (item instanceof Run) {
+        const runText = item.getText();
+        if (!runText) continue;
+        const fmt = item.getFormatting();
+        // Inline code (monospace font detection) replaces all other markers.
+        if (fmt.font && monospaceFont.test(fmt.font)) {
+          parts.push(`\`${runText}\``);
+          continue;
+        }
+        const core = runText.trim();
+        if (!core) {
+          // Whitespace-only run: nothing to emphasise.
+          parts.push(runText);
+          continue;
+        }
+        // core starts at the first non-whitespace character, so its first
+        // occurrence in runText marks the end of the leading whitespace.
+        const leadLength = runText.indexOf(core);
+        const lead = runText.slice(0, leadLength);
+        const trail = runText.slice(leadLength + core.length);
+        let md = core;
+        // Apply inline formatting (bold + italic combined)
+        if (fmt.bold && fmt.italic) {
+          md = `***${md}***`;
+        } else if (fmt.bold) {
+          md = `**${md}**`;
+        } else if (fmt.italic) {
+          md = `*${md}*`;
+        }
+        if (fmt.strike) {
+          md = `~~${md}~~`;
+        }
+        parts.push(lead + md + trail);
+      } else if (item instanceof Hyperlink) {
+        // Internal links have no URL; point them at their anchor instead of
+        // emitting an empty `()` target.
+        const anchor = item.getAnchor();
+        const target = item.getUrl() || (anchor ? `#${anchor}` : '');
+        const linkText = item.getText() || target;
+        parts.push(`[${linkText}](${target})`);
+      }
+      // Revisions, fields, shapes, etc. are not rendered.
+    }
+    return parts.join('');
+  }
+  /**
+   * Renders a table as the lines of a pipe-delimited Markdown table.
+   *
+   * Uses `table.toArray()` as the cell text source. Rows are padded with empty
+   * cells to the widest row, pipes in cell text are escaped, newlines become
+   * spaces and each cell is trimmed. The first row is used as the header and
+   * is followed by a `---` separator row.
+   *
+   * @param table - Table to render
+   * @returns Markdown lines; an empty array when the table has no rows or no columns
+   * @internal
+   */
+  private tableToMarkdown(table: Table): string[] {
+    const rows = table.toArray();
+    if (rows.length === 0) return [];
+    const width = rows.reduce((widest, row) => Math.max(widest, row.length), 0);
+    if (width === 0) return [];
+    const formatRow = (cells: string[]): string => '| ' + cells.join(' | ') + ' |';
+    const cleaned = rows.map((row) =>
+      // Pad short rows, then escape pipes and flatten newlines in every cell.
+      [...row, ...new Array<string>(width - row.length).fill('')].map((cell) =>
+        cell.replace(/\|/g, '\\|').replace(/\n/g, ' ').trim()
+      )
+    );
+    const [header, ...rest] = cleaned;
+    // Unreachable given the length check above; keeps the types honest.
+    if (header === undefined) return [];
+    return [
+      formatRow(header),
+      formatRow(header.map(() => '---')),
+      ...rest.map((row) => formatRow(row)),
+    ];
+  }
+  /**
+   * Converts the document to an HTML string
+   *
+   * Iterates body elements and renders them as semantic HTML:
+   * - Headings → `<h1>` through `<h6>`
+   * - Bold → `<strong>`, italic → `<em>`, strikethrough → `<s>`
+   * - Inline code (monospace fonts) → `<code>`
+   * - Hyperlinks → `<a href="...">`
+   * - Tables → `<table>` with `<thead>` / `<tbody>`
+   * - Bullet lists → `<ul><li>`, numbered lists → `<ol><li>`
+   * - Regular paragraphs → `<p>`
+   *
+   * Useful for web display, email bodies, CMS import, and rich-text previews.
+   *
+   * @param options - Output options
+   * @param options.wrapInDocument - Wrap in `<!DOCTYPE html>` with head/body (default: false)
+   * @param options.title - Document title for the `<title>` tag (only when wrapInDocument is true)
+   * @returns HTML string
+   *
+   * @example
+   * ```typescript
+   * // Fragment for embedding
+   * const html = doc.toHTML();
+   *
+   * // Full HTML document
+   * const page = doc.toHTML({ wrapInDocument: true, title: 'My Report' });
+   * ```
+   */
+  toHTML(options?: { wrapInDocument?: boolean; title?: string }): string {
+    const chunks: string[] = [];
+    // Tag of the list currently open in the output, or null when none is open.
+    let openList: 'ul' | 'ol' | null = null;
+    const endOpenList = (): void => {
+      if (openList === null) return;
+      chunks.push(`</${openList}>`);
+      openList = null;
+    };
+    for (const element of this.bodyElements) {
+      if (!(element instanceof Paragraph)) {
+        // A table ends any open list; every other element kind is ignored.
+        if (element instanceof Table) {
+          endOpenList();
+          chunks.push(this.tableToHTML(element));
+        }
+        continue;
+      }
+      const headingLevel = element.detectHeadingLevel();
+      // List membership is inferred purely from the (case-insensitive) style name.
+      const styleName = element.getStyle()?.toLowerCase() ?? '';
+      const bulleted = styleName.includes('bullet');
+      const numbered = styleName.includes('listnumber') || styleName.includes('list number');
+      if (bulleted || numbered) {
+        // Bullet detection wins when a style name matches both patterns.
+        const tag = bulleted ? 'ul' : 'ol';
+        if (openList !== tag) {
+          endOpenList();
+          openList = tag;
+          chunks.push(`<${tag}>`);
+        }
+        chunks.push(`<li>${this.paragraphContentToHTML(element)}</li>`);
+        continue;
+      }
+      endOpenList();
+      const inner = this.paragraphContentToHTML(element);
+      if (headingLevel !== null && headingLevel >= 1 && headingLevel <= 6) {
+        // Headings are emitted even when they have no content.
+        chunks.push(`<h${headingLevel}>${inner}</h${headingLevel}>`);
+      } else if (inner) {
+        // Plain paragraphs that render to nothing are dropped.
+        chunks.push(`<p>${inner}</p>`);
+      }
+    }
+    endOpenList();
+    const fragment = chunks.join('\n');
+    if (!options?.wrapInDocument) return fragment;
+    // Full-document mode: wrap the fragment in a minimal HTML5 skeleton.
+    const safeTitle = options.title ? this.escapeHTML(options.title) : 'Document';
+    const opening = [
+      '<!DOCTYPE html>',
+      '<html>',
+      '<head>',
+      `<meta charset="utf-8">`,
+      `<title>${safeTitle}</title>`,
+      '</head>',
+      '<body>',
+    ];
+    return [...opening, fragment, '</body>', '</html>'].join('\n');
+  }
+  /**
+   * Converts paragraph inline content to HTML.
+   *
+   * Runs are HTML-escaped and wrapped according to their formatting: runs in a
+   * monospace font become `<code>` (no other formatting is applied to them);
+   * otherwise bold, italic, strikethrough and underline wrap the text in
+   * `<strong>`, `<em>`, `<s>` and `<u>`, innermost first. Runs without text
+   * are skipped.
+   *
+   * Hyperlinks become `<a href="...">`. A link that has no URL, or whose URL
+   * uses a script-capable scheme (`javascript:`, `vbscript:`, `data:`), is
+   * rendered as plain escaped text instead, so the output stays safe to embed
+   * in a web page. When a link has no text, its URL is used as the link text.
+   *
+   * Content items that are neither runs nor hyperlinks are ignored.
+   *
+   * @param para - Paragraph whose inline content is rendered
+   * @returns Concatenated HTML for the paragraph's inline content
+   * @internal
+   */
+  private paragraphContentToHTML(para: Paragraph): string {
+    // Hoisted so the patterns are not rebuilt for every content item.
+    const monoFont =
+      /^(courier|consolas|monaco|menlo|source code|fira code|jetbrains mono)/i;
+    const unsafeScheme = /^(javascript|vbscript|data):/i;
+    const parts: string[] = [];
+    for (const item of para.getContent()) {
+      if (item instanceof Run) {
+        const text = item.getText();
+        if (!text) continue;
+        const escaped = this.escapeHTML(text);
+        const fmt = item.getFormatting();
+        // Monospace runs are emitted as bare <code>
+        if (fmt.font && monoFont.test(fmt.font)) {
+          parts.push(`<code>${escaped}</code>`);
+          continue;
+        }
+        let html = escaped;
+        if (fmt.bold) html = `<strong>${html}</strong>`;
+        if (fmt.italic) html = `<em>${html}</em>`;
+        if (fmt.strike) html = `<s>${html}</s>`;
+        if (fmt.underline && fmt.underline !== 'none') {
+          html = `<u>${html}</u>`;
+        }
+        parts.push(html);
+      } else if (item instanceof Hyperlink) {
+        const rawUrl = item.getUrl() || '';
+        // Escape exactly once: escaping an already-escaped URL would turn
+        // `&` into `&amp;amp;` when the URL doubles as the link text.
+        const linkText = this.escapeHTML(item.getText() || rawUrl);
+        // URL parsers ignore leading control characters/spaces and embedded
+        // tabs/newlines, so strip them before inspecting the scheme.
+        const compactUrl = rawUrl.replace(/[\u0000-\u0020]/g, '');
+        if (compactUrl === '' || unsafeScheme.test(compactUrl)) {
+          // No usable or safe target: keep the visible text, drop the anchor.
+          parts.push(linkText);
+          continue;
+        }
+        parts.push(`<a href="${this.escapeHTML(rawUrl)}">${linkText}</a>`);
+      }
+    }
+    return parts.join('');
+  }
+  /**
+   * Converts a table to an HTML table string.
+   * @internal
+   */
+  private tableToHTML(table: Table): string {
+    const allRows = table.getRows();
+    if (allRows.length === 0) return '';
+    // Renders one <tr>, wrapping each cell's escaped text in the given cell tag.
+    const renderRow = (row: (typeof allRows)[number], tag: 'th' | 'td'): string[] => {
+      const out: string[] = ['<tr>'];
+      for (const cell of row.getCells()) {
+        out.push(`<${tag}>${this.escapeHTML(cell.getText())}</${tag}>`);
+      }
+      out.push('</tr>');
+      return out;
+    };
+    // The first row is always treated as the header.
+    const html: string[] = ['<table>', '<thead>', ...renderRow(allRows[0]!, 'th'), '</thead>'];
+    // <tbody> is only emitted when there are rows beyond the header.
+    if (allRows.length > 1) {
+      html.push('<tbody>');
+      for (let rowIndex = 1; rowIndex < allRows.length; rowIndex++) {
+        html.push(...renderRow(allRows[rowIndex]!, 'td'));
+      }
+      html.push('</tbody>');
+    }
+    html.push('</table>');
+    return html.join('\n');
+  }
+  /**
+   * Escapes HTML special characters.
+   * @internal
+   */
+  private escapeHTML(text: string): string {
+    // Single pass over the text; each special character maps to its entity.
+    const entities: Record<string, string> = {
+      '&': '&amp;',
+      '<': '&lt;',
+      '>': '&gt;',
+      '"': '&quot;',
+    };
+    return text.replace(/[&<>"]/g, (ch) => entities[ch] ?? ch);
+  }
+  /**
+   * Returns a JSON-serializable representation of the document structure.
+   * Useful for debugging, inspection, and logging.
+   *
+   * @returns Object with document properties, statistics, and content summary
+   *
+   * @example
+   * ```typescript
+   * const json = doc.toJSON();
+   * console.log(JSON.stringify(json, null, 2));
+   * ```
+   */
+  toJSON(): {
+    properties: DocumentProperties;
+    stats: {
+      paragraphs: number;
+      tables: number;
+      images: number;
+      headings: number;
+      sections: number;
+    };
+    headings: { level: number; text: string }[];
+    body: { type: string; text?: string; style?: string }[];
+  } {
+    const paragraphCount = this.getAllParagraphs().length;
+    const tableCount = this.getTables().length;
+    const headingEntries = this.getHeadingHierarchy();
+    const properties = this.getProperties();
+    const imageCount = this.imageManager.getImageCount();
+    // Count explicit Section elements in the body; report 1 when there are none.
+    let sectionCount = 0;
+    for (const el of this.bodyElements) {
+      if (el instanceof Section) sectionCount++;
+    }
+    if (sectionCount === 0) sectionCount = 1;
+    // Heading summaries omit the paragraph reference.
+    const headings = headingEntries.map(({ level, text }) => ({ level, text }));
+    const body = this.bodyElements.map((el) => {
+      if (el instanceof Paragraph) {
+        return { type: 'paragraph', text: el.getText(), style: el.getStyle() };
+      }
+      if (el instanceof Table) {
+        // Tables are summarised by their dimensions; columns come from the first row.
+        const rows = el.getRows();
+        const cols = rows[0]?.getCells().length ?? 0;
+        return { type: 'table', text: `${rows.length} rows x ${cols} cols` };
+      }
+      // Any other element is identified by its constructor name only.
+      return { type: el.constructor.name };
+    });
+    return {
+      properties,
+      stats: {
+        paragraphs: paragraphCount,
+        tables: tableCount,
+        images: imageCount,
+        headings: headingEntries.length,
+        sections: sectionCount,
+      },
+      headings,
+      body,
+    };
+  }
+  /**
+   * Finds all images in the document that have no alt text or only the default alt text.
+   * Useful for accessibility auditing.
+   *
+   * @returns Array of Image elements missing meaningful alt text
+   *
+   * @example
+   * ```typescript
+   * const missing = doc.findImagesWithoutAltText();
+   * console.log(`${missing.length} images need alt text`);
+   * for (const img of missing) {
+   *   img.setAltText('Description of the image');
+   * }
+   * ```
+   */
+  findImagesWithoutAltText(): Image[] {
+    const flagged: Image[] = [];
+    // Records the image behind an ImageRun when its alt text is empty or is
+    // still the default 'Image'; anything that is not an ImageRun is ignored.
+    const inspect = (candidate: unknown): void => {
+      if (!(candidate instanceof ImageRun)) return;
+      const img = candidate.getImageElement();
+      const alt = img.getAltText();
+      if (!alt || alt === 'Image') flagged.push(img);
+    };
+    for (const para of this.getAllParagraphs()) {
+      for (const item of para.getContent()) {
+        inspect(item);
+        // Images wrapped in a revision are checked one level deep.
+        if (item instanceof Revision) {
+          for (const nested of item.getContent()) inspect(nested);
+        }
+      }
+    }
+    return flagged;
+  }
+  /**
+   * Returns the heading hierarchy of the document as a flat list.
+   * Each entry includes the heading level, text content, and the paragraph object.
+   * Useful for accessibility auditing (detecting skipped levels) and TOC generation.
+   *
+   * @returns Array of heading entries sorted by document order
+   *
+   * @example
+   * ```typescript
+   * const headings = doc.getHeadingHierarchy();
+   * for (const h of headings) {
+   *   console.log(`${'  '.repeat(h.level - 1)}H${h.level}: ${h.text}`);
+   * }
+   *
+   * // Check for skipped levels (accessibility issue)
+   * for (let i = 1; i < headings.length; i++) {
+   *   if (headings[i].level - headings[i - 1].level > 1) {
+   *     console.warn(`Skipped heading level: H${headings[i - 1].level} -> H${headings[i].level}`);
+   *   }
+   * }
+   * ```
+   */
+  getHeadingHierarchy(): { level: number; text: string; paragraph: Paragraph }[] {
+    const entries: { level: number; text: string; paragraph: Paragraph }[] = [];
+    for (const paragraph of this.getAllParagraphs()) {
+      const level = paragraph.detectHeadingLevel();
+      // A null level means the paragraph is not a heading.
+      if (level === null) continue;
+      const text = paragraph.getText();
+      entries.push({ level, text, paragraph });
+    }
+    return entries;
+  }
+  /**
+   * Groups body elements into sections delimited by headings
+   *
+   * Walks the body elements in order and splits them at each heading paragraph
+   * at or above the specified level. Each section contains the heading paragraph
+   * and all subsequent body elements until the next heading at that level or higher.
+   *
+   * Content before the first matching heading is returned as a section with
+   * `heading: undefined` and `level: 0`.
+   *
+   * @param maxLevel - Maximum heading level to split on (default: 1, meaning only H1
+   *   starts a new section). Set to 2 to also split on H2, 3 for H1-H3, etc.
+   * @returns Array of sections, each with heading info and content elements
+   *
+   * @example
+   * ```typescript
+   * // Split document by H1 headings (chapters)
+   * const chapters = doc.extractByHeading(1);
+   * for (const chapter of chapters) {
+   *   console.log(`Chapter: ${chapter.heading?.getText() ?? '(preamble)'}`);
+   *   console.log(`  ${chapter.content.length} elements`);
+   * }
+   * ```
+   *
+   * @example
+   * ```typescript
+   * // Split by H1 and H2 (chapters and sections)
+   * const sections = doc.extractByHeading(2);
+   *
+   * // Extract a specific section's content as markdown
+   * const target = sections.find(s => s.heading?.getText() === 'Methods');
+   * ```
+   */
+  extractByHeading(maxLevel = 1): {
+    heading: Paragraph | undefined;
+    level: number;
+    content: BodyElement[];
+  }[] {
+    type Group = { heading: Paragraph | undefined; level: number; content: BodyElement[] };
+    const groups: Group[] = [];
+    // Keeps a group unless it is a heading-less preamble with no content.
+    const flush = (group: Group): void => {
+      if (group.heading || group.content.length > 0) groups.push(group);
+    };
+    // Starts as the preamble: everything before the first matching heading.
+    let open: Group = { heading: undefined, level: 0, content: [] };
+    for (const element of this.bodyElements) {
+      if (element instanceof Paragraph) {
+        const level = element.detectHeadingLevel();
+        if (level !== null && level <= maxLevel) {
+          // A matching heading closes the open group and opens a new one;
+          // the heading itself is not part of `content`.
+          flush(open);
+          open = { heading: element, level, content: [] };
+          continue;
+        }
+      }
+      open.content.push(element);
+    }
+    flush(open);
+    return groups;
+  }
+  /**
+   * Returns all body elements between two reference elements (exclusive)
+   *
+   * Finds both elements in the body and returns everything between them.
+   * The start and end elements themselves are NOT included in the result.
+   * Returns an empty array if either element is not found or if start
+   * appears after end.
+   *
+   * @param startElement - Element after which to begin collecting
+   * @param endElement - Element before which to stop collecting
+   * @returns Array of body elements between the two references
+   *
+   * @example
+   * ```typescript
+   * const headings = doc.getParagraphs().filter(p => p.detectHeadingLevel() === 1);
+   * const chapter1Content = doc.getElementsBetween(headings[0], headings[1]);
+   * ```
+   */
+  getElementsBetween(startElement: BodyElement, endElement: BodyElement): BodyElement[] {
+    const from = this.bodyElements.indexOf(startElement);
+    const to = this.bodyElements.indexOf(endElement);
+    const bothFound = from !== -1 && to !== -1;
+    // Start must strictly precede end; both boundaries are excluded from the slice.
+    return bothFound && from < to ? this.bodyElements.slice(from + 1, to) : [];
+  }
+  /**
+   * Removes a paragraph from the document
+   * @param paragraphOrIndex - The paragraph object or its index
+   * @returns True if the paragraph was removed, false otherwise
+   */
+  removeParagraph(paragraphOrIndex: Paragraph | number): boolean {
+    // A number is used directly as a body-element index; a paragraph is looked up.
+    const position =
+      typeof paragraphOrIndex === 'number'
+        ? paragraphOrIndex
+        : this.bodyElements.indexOf(paragraphOrIndex);
+    if (!(position >= 0 && position < this.bodyElements.length)) return false;
+    const target = this.bodyElements[position];
+    // Only paragraphs may be removed through this method.
+    if (!(target instanceof Paragraph)) return false;
+    const tracked = this.trackChangesEnabled && this.trackingContext.isEnabled();
+    if (!tracked) {
+      this.bodyElements.splice(position, 1);
+      return true;
+    }
+    // With tracking on, the paragraph stays in the body: its runs are wrapped in
+    // a registered deletion revision that is attached to the paragraph.
+    const runs = target.getRuns();
+    if (runs.length > 0) {
+      const author = this.trackingContext.getAuthor();
+      const deletion = Revision.createDeletion(author, runs);
+      this.trackingContext.getRevisionManager().register(deletion);
+      target.addRevision(deletion);
+    }
+    return true;
+  }
+  /**
+   * Removes a table from the document
+   * @param tableOrIndex - The table object or its index
+   * @returns True if the table was removed, false otherwise
+   */
+  removeTable(tableOrIndex: Table | number): boolean {
+    // A number selects the nth table as returned by getTables(), not a body index.
+    const candidate =
+      typeof tableOrIndex === 'number' ? this.getTables()[tableOrIndex] : tableOrIndex;
+    // Out-of-range indices yield no table.
+    if (!candidate) return false;
+    const position = this.bodyElements.indexOf(candidate);
+    // Only remove when the table is found directly in the body.
+    if (position !== -1 && this.bodyElements[position] instanceof Table) {
+      this.bodyElements.splice(position, 1);
+      return true;
+    }
     return false;
   }
@@ -14373,6 +16008,122 @@ export class Document {
     return false;
   }
+  /**
+   * Removes a body element by reference
+   *
+   * Finds the element in the body and removes it. More convenient than
+   * the index-based `removeBodyElementAt()` when you already have a
+   * reference to the element.
+   *
+   * @param element - The element to remove
+   * @returns True if removed, false if not found
+   *
+   * @example
+   * ```typescript
+   * // Remove a specific paragraph
+   * const para = doc.getParagraphs().find(p => p.getText() === 'Delete me');
+   * if (para) doc.removeElement(para);
+   *
+   * // Remove all tables
+   * for (const table of doc.getTables()) {
+   *   doc.removeElement(table);
+   * }
+   * ```
+   */
+  removeElement(element: BodyElement): boolean {
+    const position = this.bodyElements.indexOf(element);
+    const found = position !== -1;
+    // Only the first occurrence of the reference is removed.
+    if (found) {
+      this.bodyElements.splice(position, 1);
+    }
+    return found;
+  }
+  /**
+   * Inserts a body element after a reference element
+   *
+   * Finds the reference element in the body and inserts the new element
+   * immediately after it. Returns false if the reference is not found.
+   *
+   * @param reference - The existing element to insert after
+   * @param element - The element to insert
+   * @returns True if inserted, false if reference not found
+   *
+   * @example
+   * ```typescript
+   * // Find a heading and insert a table after it
+   * const heading = doc.getParagraphs().find(p => p.getText() === 'Data');
+   * if (heading) {
+   *   doc.insertAfter(heading, table);
+   * }
+   *
+   * // Split a paragraph and insert content between halves
+   * const tail = para.splitAt(offset);
+   * doc.insertAfter(para, newTable);
+   * doc.insertAfter(newTable, tail);
+   * ```
+   */
+  insertAfter(reference: BodyElement, element: BodyElement): boolean {
+    const anchor = this.bodyElements.indexOf(reference);
+    const found = anchor !== -1;
+    if (found) {
+      // Insert at the slot right after the reference, shifting later elements.
+      this.bodyElements.splice(anchor + 1, 0, element);
+    }
+    return found;
+  }
+  /**
+   * Inserts a body element before a reference element
+   *
+   * Finds the reference element in the body and inserts the new element
+   * immediately before it. Returns false if the reference is not found.
+   *
+   * @param reference - The existing element to insert before
+   * @param element - The element to insert
+   * @returns True if inserted, false if reference not found
+   *
+   * @example
+   * ```typescript
+   * // Insert a heading before a table
+   * const table = doc.getTables()[0];
+   * if (table) {
+   *   const heading = new Paragraph().addText('Table 1').setStyle('Heading2');
+   *   doc.insertBefore(table, heading);
+   * }
+   * ```
+   */
+  insertBefore(reference: BodyElement, element: BodyElement): boolean {
+    const anchor = this.bodyElements.indexOf(reference);
+    const found = anchor !== -1;
+    if (found) {
+      // Insert at the reference's own slot, pushing it and later elements back.
+      this.bodyElements.splice(anchor, 0, element);
+    }
+    return found;
+  }
+  /**
+   * Replaces a body element with another
+   *
+   * Finds the old element in the body and replaces it in-place with the
+   * new element. The new element occupies the same position. Returns false
+   * if the old element is not found.
+   *
+   * @param oldElement - The element to replace
+   * @param newElement - The replacement element
+   * @returns True if replaced, false if old element not found
+   *
+   * @example
+   * ```typescript
+   * // Replace a placeholder paragraph with a table
+   * const placeholder = doc.getParagraphs().find(
+   *   p => p.getText() === '{{INSERT_TABLE_HERE}}'
+   * );
+   * if (placeholder) {
+   *   doc.replaceElement(placeholder, dataTable);
+   * }
+   * ```
+   */
+  replaceElement(oldElement: BodyElement, newElement: BodyElement): boolean {
+    const slot = this.bodyElements.indexOf(oldElement);
+    const found = slot !== -1;
+    if (found) {
+      // Swap in place so the new element keeps the old element's position.
+      this.bodyElements.splice(slot, 1, newElement);
+    }
+    return found;
+  }
   /**
    * Inserts a body element at a specific index, shifting existing elements forward.
    * @param index - The zero-based index at which to insert. Clamped to valid range.