npm - docrev - Versions diffs - 0.9.18 → 0.10.1 - Mend

docrev 0.9.18 → 0.10.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (134)

package/.gitattributes +1 -1
package/CHANGELOG.md +173 -149
package/PLAN-tables-and-postprocess.md +850 -850
package/README.md +431 -406
package/bin/rev.js +11 -11
package/bin/rev.ts +145 -145
package/completions/rev.bash +127 -127
package/completions/rev.ps1 +210 -210
package/completions/rev.zsh +207 -207
package/dist/lib/build.d.ts +8 -0
package/dist/lib/build.d.ts.map +1 -1
package/dist/lib/build.js +62 -6
package/dist/lib/build.js.map +1 -1
package/dist/lib/commands/context.d.ts +1 -1
package/dist/lib/commands/context.d.ts.map +1 -1
package/dist/lib/commands/context.js +1 -1
package/dist/lib/commands/context.js.map +1 -1
package/dist/lib/commands/sections.js +7 -7
package/dist/lib/commands/sections.js.map +1 -1
package/dist/lib/commands/sync.d.ts.map +1 -1
package/dist/lib/commands/sync.js +15 -14
package/dist/lib/commands/sync.js.map +1 -1
package/dist/lib/commands/utilities.js +164 -164
package/dist/lib/commands/verify-anchors.js +6 -6
package/dist/lib/commands/verify-anchors.js.map +1 -1
package/dist/lib/commands/word-tools.js +8 -8
package/dist/lib/grammar.js +3 -3
package/dist/lib/macro-filter.lua +201 -0
package/dist/lib/macros.d.ts +102 -0
package/dist/lib/macros.d.ts.map +1 -0
package/dist/lib/macros.js +218 -0
package/dist/lib/macros.js.map +1 -0
package/dist/lib/pdf-comments.js +44 -44
package/dist/lib/plugins.js +57 -57
package/dist/lib/pptx-color-filter.lua +37 -0
package/dist/lib/pptx-themes.js +115 -115
package/dist/lib/schema.d.ts.map +1 -1
package/dist/lib/schema.js +34 -0
package/dist/lib/schema.js.map +1 -1
package/dist/lib/sections.d.ts +35 -0
package/dist/lib/sections.d.ts.map +1 -1
package/dist/lib/sections.js +81 -0
package/dist/lib/sections.js.map +1 -1
package/dist/lib/spelling.js +2 -2
package/dist/lib/templates.js +387 -387
package/dist/lib/themes.js +51 -51
package/eslint.config.js +27 -27
package/lib/anchor-match.ts +276 -276
package/lib/annotations.ts +644 -644
package/lib/build.ts +1766 -1694
package/lib/citations.ts +160 -160
package/lib/commands/build.ts +855 -855
package/lib/commands/citations.ts +515 -515
package/lib/commands/comments.ts +1050 -1050
package/lib/commands/context.ts +176 -174
package/lib/commands/core.ts +309 -309
package/lib/commands/doi.ts +435 -435
package/lib/commands/file-ops.ts +372 -372
package/lib/commands/history.ts +320 -320
package/lib/commands/index.ts +87 -87
package/lib/commands/init.ts +259 -259
package/lib/commands/merge-resolve.ts +378 -378
package/lib/commands/preview.ts +178 -178
package/lib/commands/project-info.ts +244 -244
package/lib/commands/quality.ts +517 -517
package/lib/commands/response.ts +454 -454
package/lib/commands/section-boundaries.ts +82 -82
package/lib/commands/sections.ts +451 -451
package/lib/commands/sync.ts +709 -706
package/lib/commands/text-ops.ts +449 -449
package/lib/commands/utilities.ts +448 -448
package/lib/commands/verify-anchors.ts +272 -272
package/lib/commands/word-tools.ts +340 -340
package/lib/comment-realign.ts +517 -517
package/lib/config.ts +84 -84
package/lib/crossref.ts +781 -781
package/lib/csl.ts +191 -191
package/lib/dependencies.ts +98 -98
package/lib/diff-engine.ts +465 -465
package/lib/doi-cache.ts +115 -115
package/lib/doi.ts +897 -897
package/lib/equations.ts +506 -506
package/lib/errors.ts +346 -346
package/lib/format.ts +541 -541
package/lib/git.ts +326 -326
package/lib/grammar.ts +303 -303
package/lib/image-registry.ts +180 -180
package/lib/import.ts +911 -911
package/lib/journals.ts +543 -543
package/lib/macro-filter.lua +201 -0
package/lib/macros.ts +273 -0
package/lib/merge.ts +633 -633
package/lib/orcid.ts +144 -144
package/lib/pdf-comments.ts +263 -263
package/lib/pdf-import.ts +524 -524
package/lib/plugins.ts +362 -362
package/lib/postprocess.ts +188 -188
package/lib/pptx-color-filter.lua +37 -37
package/lib/pptx-template.ts +469 -469
package/lib/pptx-themes.ts +483 -483
package/lib/protect-restore.ts +520 -520
package/lib/rate-limiter.ts +94 -94
package/lib/response.ts +197 -197
package/lib/restore-references.ts +240 -240
package/lib/review.ts +327 -327
package/lib/schema.ts +488 -454
package/lib/scientific-words.ts +73 -73
package/lib/sections.ts +425 -335
package/lib/slides.ts +756 -756
package/lib/spelling.ts +334 -334
package/lib/templates.ts +526 -526
package/lib/themes.ts +742 -742
package/lib/trackchanges.ts +247 -247
package/lib/tui.ts +450 -450
package/lib/types.ts +550 -550
package/lib/undo.ts +250 -250
package/lib/utils.ts +69 -69
package/lib/variables.ts +179 -179
package/lib/word-extraction.ts +806 -806
package/lib/word.ts +643 -643
package/lib/wordcomments.ts +840 -840
package/package.json +137 -137
package/scripts/postbuild.js +47 -28
package/skill/REFERENCE.md +539 -539
package/skill/SKILL.md +295 -295
package/tsconfig.json +26 -26
package/types/index.d.ts +525 -525
package/issues.md +0 -180
package/site/assets/extra.css +0 -208
package/site/commands.html +0 -926
package/site/configuration.html +0 -469
package/site/index.html +0 -288
package/site/troubleshooting.html +0 -461
package/site/workflow.html +0 -518

package/lib/commands/sections.ts CHANGED

@@ -1,451 +1,451 @@
-/**
- * Section commands: import, extract, split
- *
- * Commands for importing Word documents and splitting section files.
- * Sync and merge commands are in sync.ts and merge-resolve.ts respectively.
- */
-import {
-  chalk,
-  fs,
-  path,
-  countAnnotations,
-  loadConfig,
-  splitAnnotatedPaper,
-} from './context.js';
-import type { Command } from 'commander';
-interface DetectedSection {
-  header: string;
-  content: string;
-  file: string;
-}
-interface ImportStats {
-  insertions: number;
-  deletions: number;
-  substitutions: number;
-  comments: number;
-  total: number;
-}
-interface BootstrapOptions {
-  output: string;
-  dryRun?: boolean;
-}
-interface ImportOptions {
-  output?: string;
-  author?: string;
-  dryRun?: boolean;
-}
-interface ExtractOptions {
-  output?: string;
-}
-interface SplitOptions {
-  config: string;
-  dir: string;
-  dryRun?: boolean;
-}
-/**
- * Detect sections from Word document text
- * Looks for common academic paper section headers
- */
-function detectSectionsFromWord(text: string): DetectedSection[] {
-  const lines = text.split('\n');
-  const sections: DetectedSection[] = [];
-  const headerPatterns = [
-    /^(Abstract|Summary)$/i,
-    /^(Introduction|Background)$/i,
-    /^(Methods?|Materials?\s*(and|&)\s*Methods?|Methodology|Experimental\s*Methods?)$/i,
-    /^(Results?)$/i,
-    /^(Results?\s*(and|&)\s*Discussion)$/i,
-    /^(Discussion)$/i,
-    /^(Conclusions?|Summary\s*(and|&)?\s*Conclusions?)$/i,
-    /^(Acknowledgements?|Acknowledgments?)$/i,
-    /^(References|Bibliography|Literature\s*Cited|Works\s*Cited)$/i,
-    /^(Appendix|Appendices|Supplementary\s*(Materials?|Information)?|Supporting\s*Information)$/i,
-    /^(Literature\s*Review|Related\s*Work|Previous\s*Work)$/i,
-    /^(Study\s*Area|Study\s*Site|Site\s*Description)$/i,
-    /^(Data\s*Analysis|Statistical\s*Analysis|Data\s*Collection)$/i,
-    /^(Theoretical\s*Framework|Conceptual\s*Framework)$/i,
-    /^(Case\s*Study|Case\s*Studies)$/i,
-    /^(Limitations?)$/i,
-    /^(Future\s*Work|Future\s*Directions?)$/i,
-    /^(Funding|Author\s*Contributions?|Conflict\s*of\s*Interest|Data\s*Availability)$/i,
-  ];
-  const numberedHeaderPattern = /^(\d+\.?\s+)(Abstract|Introduction|Background|Methods?|Materials|Results?|Discussion|Conclusions?|References|Acknowledgements?|Appendix)/i;
-  let currentSection: string | null = null;
-  let currentContent: string[] = [];
-  let preambleContent: string[] = [];
-  for (const line of lines) {
-    const trimmed = line.trim();
-    if (!trimmed) {
-      if (currentSection) {
-        currentContent.push(line);
-      } else {
-        preambleContent.push(line);
-      }
-      continue;
-    }
-    let isHeader = false;
-    let headerText = trimmed;
-    for (const pattern of headerPatterns) {
-      if (pattern.test(trimmed)) {
-        isHeader = true;
-        break;
-      }
-    }
-    if (!isHeader) {
-      const match = trimmed.match(numberedHeaderPattern);
-      if (match) {
-        isHeader = true;
-        headerText = trimmed.replace(/^\d+\.?\s+/, '');
-      }
-    }
-    if (isHeader) {
-      if (currentSection) {
-        sections.push({
-          header: currentSection,
-          content: currentContent.join('\n'),
-          file: headerToFilename(currentSection),
-        });
-      } else if (preambleContent.some(l => l.trim())) {
-        sections.push({
-          header: 'Preamble',
-          content: preambleContent.join('\n'),
-          file: 'preamble.md',
-        });
-      }
-      currentSection = headerText;
-      currentContent = [];
-    } else if (currentSection) {
-      currentContent.push(line);
-    } else {
-      preambleContent.push(line);
-    }
-  }
-  if (currentSection) {
-    sections.push({
-      header: currentSection,
-      content: currentContent.join('\n'),
-      file: headerToFilename(currentSection),
-    });
-  }
-  if (sections.length === 0) {
-    const allContent = [...preambleContent, ...currentContent].join('\n');
-    if (allContent.trim()) {
-      sections.push({
-        header: 'Content',
-        content: allContent,
-        file: 'content.md',
-      });
-    }
-  }
-  return sections;
-}
-/**
- * Convert a section header to a filename
- */
-function headerToFilename(header: string): string {
-  return header
-    .toLowerCase()
-    .replace(/[^a-z0-9]+/g, '-')
-    .replace(/^-|-$/g, '')
-    .slice(0, 30) + '.md';
-}
-/**
- * Bootstrap a new project from a Word document
- */
-async function bootstrapFromWord(docx: string, options: BootstrapOptions): Promise<void> {
-  const outputDir = path.resolve(options.output);
-  console.log(chalk.cyan(`Bootstrapping project from ${path.basename(docx)}...\n`));
-  try {
-    const { extractTextFromWord } = await import('../word.js');
-    const { default: YAML } = await import('yaml');
-    const text = await extractTextFromWord(docx);
-    const sections = detectSectionsFromWord(text);
-    if (sections.length === 0) {
-      console.error(chalk.yellow('No sections detected. Creating single content.md file.'));
-      sections.push({ header: 'Content', content: text, file: 'content.md' });
-    }
-    console.log(chalk.green(`Detected ${sections.length} section(s):\n`));
-    if (!fs.existsSync(outputDir)) {
-      fs.mkdirSync(outputDir, { recursive: true });
-    }
-    const sectionFiles: string[] = [];
-    for (const section of sections) {
-      const filePath = path.join(outputDir, section.file);
-      const content = `# ${section.header}\n\n${section.content.trim()}\n`;
-      console.log(`  ${chalk.bold(section.file)} - "${section.header}" (${section.content.split('\n').length} lines)`);
-      if (!options.dryRun) {
-        fs.writeFileSync(filePath, content, 'utf-8');
-      }
-      sectionFiles.push(section.file);
-    }
-    const docxName = path.basename(docx, '.docx');
-    const title = docxName.replace(/[-_]/g, ' ').replace(/\b\w/g, (c) => c.toUpperCase());
-    const config = {
-      title: title,
-      authors: [],
-      sections: sectionFiles,
-      bibliography: null,
-      crossref: {
-        figureTitle: 'Figure',
-        tableTitle: 'Table',
-        figPrefix: ['Fig.', 'Figs.'],
-        tblPrefix: ['Table', 'Tables'],
-      },
-      pdf: {
-        documentclass: 'article',
-        fontsize: '12pt',
-        geometry: 'margin=1in',
-        linestretch: 1.5,
-      },
-      docx: {
-        keepComments: true,
-      },
-    };
-    const configPath = path.join(outputDir, 'rev.yaml');
-    console.log(`\n  ${chalk.bold('rev.yaml')} - project configuration`);
-    if (!options.dryRun) {
-      fs.writeFileSync(configPath, YAML.stringify(config), 'utf-8');
-    }
-    const figuresDir = path.join(outputDir, 'figures');
-    if (!fs.existsSync(figuresDir) && !options.dryRun) {
-      fs.mkdirSync(figuresDir, { recursive: true });
-      console.log(`  ${chalk.dim('figures/')} - image directory`);
-    }
-    if (options.dryRun) {
-      console.log(chalk.yellow('\n(Dry run - no files written)'));
-    } else {
-      console.log(chalk.green('\nProject created!'));
-      console.log(chalk.cyan('\nNext steps:'));
-      if (outputDir !== process.cwd()) {
-        console.log(chalk.dim(`  cd ${path.relative(process.cwd(), outputDir) || '.'}`));
-      }
-      console.log(chalk.dim('  # Edit rev.yaml to add authors and adjust settings'));
-      console.log(chalk.dim('  # Review and clean up section files'));
-      console.log(chalk.dim('  rev build          # Build PDF and DOCX'));
-    }
-  } catch (err) {
-    const error = err as Error;
-    console.error(chalk.red(`Error: ${error.message}`));
-    if (process.env.DEBUG) console.error(error.stack);
-    process.exit(1);
-  }
-}
-/**
- * Register section commands with the program
- */
-export function register(program: Command): void {
-  // ==========================================================================
-  // IMPORT command - Import from Word (bootstrap or diff mode)
-  // ==========================================================================
-  program
-    .command('import')
-    .description('Import from Word: creates sections from scratch, or diffs against existing MD')
-    .argument('<docx>', 'Word document')
-    .argument('[original]', 'Optional: original Markdown file to compare against')
-    .option('-o, --output <dir>', 'Output directory for bootstrap mode', '.')
-    .option('-a, --author <name>', 'Author name for changes (diff mode)', 'Reviewer')
-    .option('--dry-run', 'Preview without saving')
-    .action(async (docx: string, original: string | undefined, options: ImportOptions) => {
-      if (!fs.existsSync(docx)) {
-        console.error(chalk.red(`Error: Word file not found: ${docx}`));
-        process.exit(1);
-      }
-      if (!original) {
-        await bootstrapFromWord(docx, options as BootstrapOptions);
-        return;
-      }
-      if (!fs.existsSync(original)) {
-        console.error(chalk.red(`Error: Original MD not found: ${original}`));
-        process.exit(1);
-      }
-      console.log(chalk.cyan(`Comparing ${path.basename(docx)} against ${path.basename(original)}...`));
-      // Warn if pandoc is missing
-      const { hasPandoc: hasPandocImport, getInstallInstructions: getInstallImport } = await import('../dependencies.js');
-      if (!hasPandocImport()) {
-        console.log(chalk.yellow(`\n  Warning: Pandoc not installed. Track changes extracted from XML (formatting may differ).`));
-        console.log(chalk.dim(`  Install for best results: ${getInstallImport('pandoc')}\n`));
-      }
-      try {
-        const { importFromWord } = await import('../import.js');
-        const { annotated, stats } = await importFromWord(docx, original, {
-          author: options.author,
-        });
-        console.log(chalk.cyan('\nChanges detected:'));
-        if (stats.insertions > 0) console.log(chalk.green(`  + Insertions:    ${stats.insertions}`));
-        if (stats.deletions > 0) console.log(chalk.red(`  - Deletions:     ${stats.deletions}`));
-        if (stats.substitutions > 0) console.log(chalk.yellow(`  ~ Substitutions: ${stats.substitutions}`));
-        if (stats.comments > 0) console.log(chalk.blue(`  # Comments:      ${stats.comments}`));
-        if (stats.total === 0) {
-          console.log(chalk.green('\nNo changes detected.'));
-          return;
-        }
-        console.log(chalk.dim(`\n  Total: ${stats.total}`));
-        if (options.dryRun) {
-          console.log(chalk.cyan('\n--- Preview (first 1000 chars) ---\n'));
-          console.log(annotated.slice(0, 1000));
-          if (annotated.length > 1000) console.log(chalk.dim('\n... (truncated)'));
-          return;
-        }
-        const outputPath = options.output || original;
-        fs.writeFileSync(outputPath, annotated, 'utf-8');
-        console.log(chalk.green(`\nSaved annotated version to ${outputPath}`));
-        console.log(chalk.cyan('\nNext steps:'));
-        console.log(`  1. ${chalk.bold('rev review ' + outputPath)}  - Accept/reject track changes`);
-        console.log(`  2. Work with Claude to address comments`);
-        console.log(`  3. ${chalk.bold('rev build docx')}  - Rebuild Word doc`);
-      } catch (err) {
-        const error = err as Error;
-        console.error(chalk.red(`Error: ${error.message}`));
-        if (process.env.DEBUG) console.error(error.stack);
-        process.exit(1);
-      }
-    });
-  // ==========================================================================
-  // EXTRACT command - Just extract text from Word
-  // ==========================================================================
-  program
-    .command('extract')
-    .description('Extract plain text from Word document (no diff)')
-    .argument('<docx>', 'Word document')
-    .option('-o, --output <file>', 'Output file (default: stdout)')
-    .action(async (docx: string, options: ExtractOptions) => {
-      if (!fs.existsSync(docx)) {
-        console.error(chalk.red(`Error: File not found: ${docx}`));
-        process.exit(1);
-      }
-      try {
-        const { extractTextFromWord } = await import('../word.js');
-        const text = await extractTextFromWord(docx);
-        if (options.output) {
-          fs.writeFileSync(options.output, text, 'utf-8');
-          console.error(chalk.green(`Extracted to ${options.output}`));
-        } else {
-          process.stdout.write(text);
-        }
-      } catch (err) {
-        const error = err as Error;
-        console.error(chalk.red(`Error: ${error.message}`));
-        process.exit(1);
-      }
-    });
-  // ==========================================================================
-  // SPLIT command - Split annotated paper.md back to section files
-  // ==========================================================================
-  program
-    .command('split')
-    .description('Split annotated paper.md back to section files')
-    .argument('<file>', 'Annotated paper.md file')
-    .option('-c, --config <file>', 'Sections config file', 'sections.yaml')
-    .option('-d, --dir <directory>', 'Output directory for section files', '.')
-    .option('--dry-run', 'Preview without writing files')
-    .action((file: string, options: SplitOptions) => {
-      if (!fs.existsSync(file)) {
-        console.error(chalk.red(`File not found: ${file}`));
-        process.exit(1);
-      }
-      const configPath = path.resolve(options.dir, options.config);
-      if (!fs.existsSync(configPath)) {
-        console.error(chalk.red(`Config not found: ${configPath}`));
-        console.error(chalk.dim('Run "rev init" first to generate sections.yaml'));
-        process.exit(1);
-      }
-      console.log(chalk.cyan(`Splitting ${file} using ${options.config}...`));
-      const config = loadConfig(configPath);
-      const paperContent = fs.readFileSync(file, 'utf-8');
-      const sections = splitAnnotatedPaper(paperContent, config.sections);
-      if (sections.size === 0) {
-        console.error(chalk.yellow('No sections detected.'));
-        console.error(chalk.dim('Check that headers match sections.yaml'));
-        process.exit(1);
-      }
-      console.log(chalk.green(`\nFound ${sections.size} sections:\n`));
-      for (const [sectionFile, content] of sections) {
-        const outputPath = path.join(options.dir, sectionFile);
-        const lines = content.split('\n').length;
-        const annotations = countAnnotations(content);
-        console.log(`  ${chalk.bold(sectionFile)} (${lines} lines)`);
-        if (annotations.total > 0) {
-          const parts: string[] = [];
-          if (annotations.inserts > 0) parts.push(chalk.green(`+${annotations.inserts}`));
-          if (annotations.deletes > 0) parts.push(chalk.red(`-${annotations.deletes}`));
-          if (annotations.substitutes > 0) parts.push(chalk.yellow(`~${annotations.substitutes}`));
-          if (annotations.comments > 0) parts.push(chalk.blue(`#${annotations.comments}`));
-          console.log(chalk.dim(`    Annotations: ${parts.join(' ')}`));
-        }
-        if (!options.dryRun) {
-          fs.writeFileSync(outputPath, content, 'utf-8');
-        }
-      }
-      if (options.dryRun) {
-        console.log(chalk.yellow('\n(Dry run - no files written)'));
-      } else {
-        console.log(chalk.green('\nSection files updated.'));
-        console.log(chalk.cyan('\nNext: rev review <section.md> for each section'));
-      }
-    });
-}
+/**
+ * Section commands: import, extract, split
+ *
+ * Commands for importing Word documents and splitting section files.
+ * Sync and merge commands are in sync.ts and merge-resolve.ts respectively.
+ */
+import {
+  chalk,
+  fs,
+  path,
+  countAnnotations,
+  resolveSectionsConfig,
+  splitAnnotatedPaper,
+} from './context.js';
+import type { Command } from 'commander';
+interface DetectedSection {
+  header: string;
+  content: string;
+  file: string;
+}
+interface ImportStats {
+  insertions: number;
+  deletions: number;
+  substitutions: number;
+  comments: number;
+  total: number;
+}
+interface BootstrapOptions {
+  output: string;
+  dryRun?: boolean;
+}
+interface ImportOptions {
+  output?: string;
+  author?: string;
+  dryRun?: boolean;
+}
+interface ExtractOptions {
+  output?: string;
+}
+interface SplitOptions {
+  config: string;
+  dir: string;
+  dryRun?: boolean;
+}
+/**
+ * Detect sections from Word document text
+ * Looks for common academic paper section headers
+ */
+function detectSectionsFromWord(text: string): DetectedSection[] {
+  const lines = text.split('\n');
+  const sections: DetectedSection[] = [];
+  const headerPatterns = [
+    /^(Abstract|Summary)$/i,
+    /^(Introduction|Background)$/i,
+    /^(Methods?|Materials?\s*(and|&)\s*Methods?|Methodology|Experimental\s*Methods?)$/i,
+    /^(Results?)$/i,
+    /^(Results?\s*(and|&)\s*Discussion)$/i,
+    /^(Discussion)$/i,
+    /^(Conclusions?|Summary\s*(and|&)?\s*Conclusions?)$/i,
+    /^(Acknowledgements?|Acknowledgments?)$/i,
+    /^(References|Bibliography|Literature\s*Cited|Works\s*Cited)$/i,
+    /^(Appendix|Appendices|Supplementary\s*(Materials?|Information)?|Supporting\s*Information)$/i,
+    /^(Literature\s*Review|Related\s*Work|Previous\s*Work)$/i,
+    /^(Study\s*Area|Study\s*Site|Site\s*Description)$/i,
+    /^(Data\s*Analysis|Statistical\s*Analysis|Data\s*Collection)$/i,
+    /^(Theoretical\s*Framework|Conceptual\s*Framework)$/i,
+    /^(Case\s*Study|Case\s*Studies)$/i,
+    /^(Limitations?)$/i,
+    /^(Future\s*Work|Future\s*Directions?)$/i,
+    /^(Funding|Author\s*Contributions?|Conflict\s*of\s*Interest|Data\s*Availability)$/i,
+  ];
+  const numberedHeaderPattern = /^(\d+\.?\s+)(Abstract|Introduction|Background|Methods?|Materials|Results?|Discussion|Conclusions?|References|Acknowledgements?|Appendix)/i;
+  let currentSection: string | null = null;
+  let currentContent: string[] = [];
+  let preambleContent: string[] = [];
+  for (const line of lines) {
+    const trimmed = line.trim();
+    if (!trimmed) {
+      if (currentSection) {
+        currentContent.push(line);
+      } else {
+        preambleContent.push(line);
+      }
+      continue;
+    }
+    let isHeader = false;
+    let headerText = trimmed;
+    for (const pattern of headerPatterns) {
+      if (pattern.test(trimmed)) {
+        isHeader = true;
+        break;
+      }
+    }
+    if (!isHeader) {
+      const match = trimmed.match(numberedHeaderPattern);
+      if (match) {
+        isHeader = true;
+        headerText = trimmed.replace(/^\d+\.?\s+/, '');
+      }
+    }
+    if (isHeader) {
+      if (currentSection) {
+        sections.push({
+          header: currentSection,
+          content: currentContent.join('\n'),
+          file: headerToFilename(currentSection),
+        });
+      } else if (preambleContent.some(l => l.trim())) {
+        sections.push({
+          header: 'Preamble',
+          content: preambleContent.join('\n'),
+          file: 'preamble.md',
+        });
+      }
+      currentSection = headerText;
+      currentContent = [];
+    } else if (currentSection) {
+      currentContent.push(line);
+    } else {
+      preambleContent.push(line);
+    }
+  }
+  if (currentSection) {
+    sections.push({
+      header: currentSection,
+      content: currentContent.join('\n'),
+      file: headerToFilename(currentSection),
+    });
+  }
+  if (sections.length === 0) {
+    const allContent = [...preambleContent, ...currentContent].join('\n');
+    if (allContent.trim()) {
+      sections.push({
+        header: 'Content',
+        content: allContent,
+        file: 'content.md',
+      });
+    }
+  }
+  return sections;
+}
+/**
+ * Convert a section header to a filename
+ */
+function headerToFilename(header: string): string {
+  return header
+    .toLowerCase()
+    .replace(/[^a-z0-9]+/g, '-')
+    .replace(/^-|-$/g, '')
+    .slice(0, 30) + '.md';
+}
+/**
+ * Bootstrap a new project from a Word document
+ */
+async function bootstrapFromWord(docx: string, options: BootstrapOptions): Promise<void> {
+  const outputDir = path.resolve(options.output);
+  console.log(chalk.cyan(`Bootstrapping project from ${path.basename(docx)}...\n`));
+  try {
+    const { extractTextFromWord } = await import('../word.js');
+    const { default: YAML } = await import('yaml');
+    const text = await extractTextFromWord(docx);
+    const sections = detectSectionsFromWord(text);
+    if (sections.length === 0) {
+      console.error(chalk.yellow('No sections detected. Creating single content.md file.'));
+      sections.push({ header: 'Content', content: text, file: 'content.md' });
+    }
+    console.log(chalk.green(`Detected ${sections.length} section(s):\n`));
+    if (!fs.existsSync(outputDir)) {
+      fs.mkdirSync(outputDir, { recursive: true });
+    }
+    const sectionFiles: string[] = [];
+    for (const section of sections) {
+      const filePath = path.join(outputDir, section.file);
+      const content = `# ${section.header}\n\n${section.content.trim()}\n`;
+      console.log(`  ${chalk.bold(section.file)} - "${section.header}" (${section.content.split('\n').length} lines)`);
+      if (!options.dryRun) {
+        fs.writeFileSync(filePath, content, 'utf-8');
+      }
+      sectionFiles.push(section.file);
+    }
+    const docxName = path.basename(docx, '.docx');
+    const title = docxName.replace(/[-_]/g, ' ').replace(/\b\w/g, (c) => c.toUpperCase());
+    const config = {
+      title: title,
+      authors: [],
+      sections: sectionFiles,
+      bibliography: null,
+      crossref: {
+        figureTitle: 'Figure',
+        tableTitle: 'Table',
+        figPrefix: ['Fig.', 'Figs.'],
+        tblPrefix: ['Table', 'Tables'],
+      },
+      pdf: {
+        documentclass: 'article',
+        fontsize: '12pt',
+        geometry: 'margin=1in',
+        linestretch: 1.5,
+      },
+      docx: {
+        keepComments: true,
+      },
+    };
+    const configPath = path.join(outputDir, 'rev.yaml');
+    console.log(`\n  ${chalk.bold('rev.yaml')} - project configuration`);
+    if (!options.dryRun) {
+      fs.writeFileSync(configPath, YAML.stringify(config), 'utf-8');
+    }
+    const figuresDir = path.join(outputDir, 'figures');
+    if (!fs.existsSync(figuresDir) && !options.dryRun) {
+      fs.mkdirSync(figuresDir, { recursive: true });
+      console.log(`  ${chalk.dim('figures/')} - image directory`);
+    }
+    if (options.dryRun) {
+      console.log(chalk.yellow('\n(Dry run - no files written)'));
+    } else {
+      console.log(chalk.green('\nProject created!'));
+      console.log(chalk.cyan('\nNext steps:'));
+      if (outputDir !== process.cwd()) {
+        console.log(chalk.dim(`  cd ${path.relative(process.cwd(), outputDir) || '.'}`));
+      }
+      console.log(chalk.dim('  # Edit rev.yaml to add authors and adjust settings'));
+      console.log(chalk.dim('  # Review and clean up section files'));
+      console.log(chalk.dim('  rev build          # Build PDF and DOCX'));
+    }
+  } catch (err) {
+    const error = err as Error;
+    console.error(chalk.red(`Error: ${error.message}`));
+    if (process.env.DEBUG) console.error(error.stack);
+    process.exit(1);
+  }
+}
+/**
+ * Register section commands with the program
+ */
+export function register(program: Command): void {
+  // ==========================================================================
+  // IMPORT command - Import from Word (bootstrap or diff mode)
+  // ==========================================================================
+  program
+    .command('import')
+    .description('Import from Word: creates sections from scratch, or diffs against existing MD')
+    .argument('<docx>', 'Word document')
+    .argument('[original]', 'Optional: original Markdown file to compare against')
+    .option('-o, --output <dir>', 'Output directory for bootstrap mode', '.')
+    .option('-a, --author <name>', 'Author name for changes (diff mode)', 'Reviewer')
+    .option('--dry-run', 'Preview without saving')
+    .action(async (docx: string, original: string | undefined, options: ImportOptions) => {
+      if (!fs.existsSync(docx)) {
+        console.error(chalk.red(`Error: Word file not found: ${docx}`));
+        process.exit(1);
+      }
+      if (!original) {
+        await bootstrapFromWord(docx, options as BootstrapOptions);
+        return;
+      }
+      if (!fs.existsSync(original)) {
+        console.error(chalk.red(`Error: Original MD not found: ${original}`));
+        process.exit(1);
+      }
+      console.log(chalk.cyan(`Comparing ${path.basename(docx)} against ${path.basename(original)}...`));
+      // Warn if pandoc is missing
+      const { hasPandoc: hasPandocImport, getInstallInstructions: getInstallImport } = await import('../dependencies.js');
+      if (!hasPandocImport()) {
+        console.log(chalk.yellow(`\n  Warning: Pandoc not installed. Track changes extracted from XML (formatting may differ).`));
+        console.log(chalk.dim(`  Install for best results: ${getInstallImport('pandoc')}\n`));
+      }
+      try {
+        const { importFromWord } = await import('../import.js');
+        const { annotated, stats } = await importFromWord(docx, original, {
+          author: options.author,
+        });
+        console.log(chalk.cyan('\nChanges detected:'));
+        if (stats.insertions > 0) console.log(chalk.green(`  + Insertions:    ${stats.insertions}`));
+        if (stats.deletions > 0) console.log(chalk.red(`  - Deletions:     ${stats.deletions}`));
+        if (stats.substitutions > 0) console.log(chalk.yellow(`  ~ Substitutions: ${stats.substitutions}`));
+        if (stats.comments > 0) console.log(chalk.blue(`  # Comments:      ${stats.comments}`));
+        if (stats.total === 0) {
+          console.log(chalk.green('\nNo changes detected.'));
+          return;
+        }
+        console.log(chalk.dim(`\n  Total: ${stats.total}`));
+        if (options.dryRun) {
+          console.log(chalk.cyan('\n--- Preview (first 1000 chars) ---\n'));
+          console.log(annotated.slice(0, 1000));
+          if (annotated.length > 1000) console.log(chalk.dim('\n... (truncated)'));
+          return;
+        }
+        const outputPath = options.output || original;
+        fs.writeFileSync(outputPath, annotated, 'utf-8');
+        console.log(chalk.green(`\nSaved annotated version to ${outputPath}`));
+        console.log(chalk.cyan('\nNext steps:'));
+        console.log(`  1. ${chalk.bold('rev review ' + outputPath)}  - Accept/reject track changes`);
+        console.log(`  2. Work with Claude to address comments`);
+        console.log(`  3. ${chalk.bold('rev build docx')}  - Rebuild Word doc`);
+      } catch (err) {
+        const error = err as Error;
+        console.error(chalk.red(`Error: ${error.message}`));
+        if (process.env.DEBUG) console.error(error.stack);
+        process.exit(1);
+      }
+    });
+  // ==========================================================================
+  // EXTRACT command - Just extract text from Word
+  // ==========================================================================
+  // Registers `extract`: dumps the text of a Word document either to a file
+  // (when --output is given) or straight to stdout.
+  program
+    .command('extract')
+    .description('Extract plain text from Word document (no diff)')
+    .argument('<docx>', 'Word document')
+    .option('-o, --output <file>', 'Output file (default: stdout)')
+    .action(async (docx: string, options: ExtractOptions) => {
+      // Bail out before loading the Word module if the input is missing.
+      const inputExists = fs.existsSync(docx);
+      if (!inputExists) {
+        console.error(chalk.red(`Error: File not found: ${docx}`));
+        process.exit(1);
+      }
+      try {
+        // Loaded on demand, only when this command actually runs.
+        const { extractTextFromWord: readWordText } = await import('../word.js');
+        const plainText = await readWordText(docx);
+        const destination = options.output;
+        if (!destination) {
+          // No output file requested: emit the raw text on stdout.
+          process.stdout.write(plainText);
+          return;
+        }
+        fs.writeFileSync(destination, plainText, 'utf-8');
+        // The confirmation is sent through console.error (stderr).
+        console.error(chalk.green(`Extracted to ${options.output}`));
+      } catch (err) {
+        const { message } = err as Error;
+        console.error(chalk.red(`Error: ${message}`));
+        process.exit(1);
+      }
+    });
+  // ==========================================================================
+  // SPLIT command - Split annotated paper.md back to section files
+  // ==========================================================================
+  // Registers `split`: breaks an annotated combined paper back into the
+  // per-section files named by the resolved sections configuration.
+  program
+    .command('split')
+    .description('Split annotated paper.md back to section files')
+    .argument('<file>', 'Annotated paper.md file')
+    .option('-c, --config <file>', 'Sections config file', 'sections.yaml')
+    .option('-d, --dir <directory>', 'Output directory for section files', '.')
+    .option('--dry-run', 'Preview without writing files')
+    .action((file: string, options: SplitOptions) => {
+      const { dir: targetDir, config: configName, dryRun: previewOnly } = options;
+
+      // Guard: the annotated input must exist.
+      if (!fs.existsSync(file)) {
+        console.error(chalk.red(`File not found: ${file}`));
+        process.exit(1);
+      }
+
+      // Guard: a section configuration must be resolvable for the target directory.
+      const resolved = resolveSectionsConfig(targetDir, configName);
+      if (!resolved) {
+        console.error(chalk.red(`No section config found in ${path.resolve(targetDir)}`));
+        console.error(chalk.dim('Add a `sections:` list to rev.yaml, or run "rev init" to generate sections.yaml.'));
+        process.exit(1);
+      }
+
+      console.log(chalk.cyan(`Splitting ${file}...`));
+      const sectionDefs = resolved.config.sections;
+      const combinedText = fs.readFileSync(file, 'utf-8');
+      const sections = splitAnnotatedPaper(combinedText, sectionDefs);
+
+      // Guard: nothing matched, so there is nothing to report or write.
+      if (sections.size === 0) {
+        console.error(chalk.yellow('No sections detected.'));
+        console.error(chalk.dim('Check that headers match sections.yaml'));
+        process.exit(1);
+      }
+
+      console.log(chalk.green(`\nFound ${sections.size} sections:\n`));
+      for (const [sectionName, sectionBody] of sections) {
+        const destination = path.join(targetDir, sectionName);
+        const lineCount = sectionBody.split('\n').length;
+        const tally = countAnnotations(sectionBody);
+        console.log(`  ${chalk.bold(sectionName)} (${lineCount} lines)`);
+
+        if (tally.total > 0) {
+          // One colored badge per annotation kind that occurs; kinds with
+          // a zero count are left out of the summary line.
+          const badges = [
+            tally.inserts > 0 ? chalk.green(`+${tally.inserts}`) : '',
+            tally.deletes > 0 ? chalk.red(`-${tally.deletes}`) : '',
+            tally.substitutes > 0 ? chalk.yellow(`~${tally.substitutes}`) : '',
+            tally.comments > 0 ? chalk.blue(`#${tally.comments}`) : '',
+          ].filter((badge) => badge !== '');
+          console.log(chalk.dim(`    Annotations: ${badges.join(' ')}`));
+        }
+
+        // Dry runs report what would be produced but never touch disk.
+        if (previewOnly) continue;
+        fs.writeFileSync(destination, sectionBody, 'utf-8');
+      }
+
+      if (previewOnly) {
+        console.log(chalk.yellow('\n(Dry run - no files written)'));
+        return;
+      }
+      console.log(chalk.green('\nSection files updated.'));
+      console.log(chalk.cyan('\nNext: rev review <section.md> for each section'));
+    });
+}