docrev 0.9.11 → 0.9.14
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.claude/settings.local.json +9 -9
- package/.gitattributes +1 -1
- package/CHANGELOG.md +149 -149
- package/PLAN-tables-and-postprocess.md +850 -850
- package/README.md +391 -391
- package/bin/rev.js +11 -11
- package/bin/rev.ts +145 -145
- package/completions/rev.bash +127 -127
- package/completions/rev.ps1 +210 -210
- package/completions/rev.zsh +207 -207
- package/dev_notes/stress2/build_adversarial.ts +186 -186
- package/dev_notes/stress2/drift_matcher.ts +62 -62
- package/dev_notes/stress2/probe_anchors.ts +35 -35
- package/dev_notes/stress2/project/discussion.before.md +3 -3
- package/dev_notes/stress2/project/discussion.md +3 -3
- package/dev_notes/stress2/project/methods.before.md +20 -20
- package/dev_notes/stress2/project/methods.md +20 -20
- package/dev_notes/stress2/project/rev.yaml +5 -5
- package/dev_notes/stress2/project/sections.yaml +4 -4
- package/dev_notes/stress2/sections.yaml +5 -5
- package/dev_notes/stress2/trace_placement.ts +50 -50
- package/dev_notes/stresstest_boundaries.ts +27 -27
- package/dev_notes/stresstest_drift_apply.ts +43 -43
- package/dev_notes/stresstest_drift_compare.ts +43 -43
- package/dev_notes/stresstest_drift_v2.ts +54 -54
- package/dev_notes/stresstest_inspect.ts +54 -54
- package/dev_notes/stresstest_pstyle.ts +55 -55
- package/dev_notes/stresstest_section_debug.ts +23 -23
- package/dev_notes/stresstest_split.ts +70 -70
- package/dev_notes/stresstest_trace.ts +19 -19
- package/dev_notes/stresstest_verify_no_overwrite.ts +40 -40
- package/dist/lib/build.d.ts +50 -1
- package/dist/lib/build.d.ts.map +1 -1
- package/dist/lib/build.js +80 -30
- package/dist/lib/build.js.map +1 -1
- package/dist/lib/commands/build.d.ts.map +1 -1
- package/dist/lib/commands/build.js +38 -5
- package/dist/lib/commands/build.js.map +1 -1
- package/dist/lib/commands/utilities.js +164 -164
- package/dist/lib/commands/word-tools.js +8 -8
- package/dist/lib/grammar.js +3 -3
- package/dist/lib/import.d.ts.map +1 -1
- package/dist/lib/import.js +146 -24
- package/dist/lib/import.js.map +1 -1
- package/dist/lib/pdf-comments.js +44 -44
- package/dist/lib/plugins.js +57 -57
- package/dist/lib/pptx-themes.js +115 -115
- package/dist/lib/spelling.js +2 -2
- package/dist/lib/templates.js +387 -387
- package/dist/lib/themes.js +51 -51
- package/dist/lib/types.d.ts +20 -0
- package/dist/lib/types.d.ts.map +1 -1
- package/dist/lib/word-extraction.d.ts +6 -0
- package/dist/lib/word-extraction.d.ts.map +1 -1
- package/dist/lib/word-extraction.js +46 -3
- package/dist/lib/word-extraction.js.map +1 -1
- package/dist/lib/wordcomments.d.ts.map +1 -1
- package/dist/lib/wordcomments.js +23 -5
- package/dist/lib/wordcomments.js.map +1 -1
- package/eslint.config.js +27 -27
- package/lib/anchor-match.ts +276 -276
- package/lib/annotations.ts +644 -644
- package/lib/build.ts +1300 -1227
- package/lib/citations.ts +160 -160
- package/lib/commands/build.ts +833 -801
- package/lib/commands/citations.ts +515 -515
- package/lib/commands/comments.ts +1050 -1050
- package/lib/commands/context.ts +174 -174
- package/lib/commands/core.ts +309 -309
- package/lib/commands/doi.ts +435 -435
- package/lib/commands/file-ops.ts +372 -372
- package/lib/commands/history.ts +320 -320
- package/lib/commands/index.ts +87 -87
- package/lib/commands/init.ts +259 -259
- package/lib/commands/merge-resolve.ts +378 -378
- package/lib/commands/preview.ts +178 -178
- package/lib/commands/project-info.ts +244 -244
- package/lib/commands/quality.ts +517 -517
- package/lib/commands/response.ts +454 -454
- package/lib/commands/section-boundaries.ts +82 -82
- package/lib/commands/sections.ts +451 -451
- package/lib/commands/sync.ts +706 -706
- package/lib/commands/text-ops.ts +449 -449
- package/lib/commands/utilities.ts +448 -448
- package/lib/commands/verify-anchors.ts +272 -272
- package/lib/commands/word-tools.ts +340 -340
- package/lib/comment-realign.ts +517 -517
- package/lib/config.ts +84 -84
- package/lib/crossref.ts +781 -781
- package/lib/csl.ts +191 -191
- package/lib/dependencies.ts +98 -98
- package/lib/diff-engine.ts +465 -465
- package/lib/doi-cache.ts +115 -115
- package/lib/doi.ts +897 -897
- package/lib/equations.ts +506 -506
- package/lib/errors.ts +346 -346
- package/lib/format.ts +541 -541
- package/lib/git.ts +326 -326
- package/lib/grammar.ts +303 -303
- package/lib/image-registry.ts +180 -180
- package/lib/import.ts +911 -792
- package/lib/journals.ts +543 -543
- package/lib/merge.ts +633 -633
- package/lib/orcid.ts +144 -144
- package/lib/pdf-comments.ts +263 -263
- package/lib/pdf-import.ts +524 -524
- package/lib/plugins.ts +362 -362
- package/lib/postprocess.ts +188 -188
- package/lib/pptx-color-filter.lua +37 -37
- package/lib/pptx-template.ts +469 -469
- package/lib/pptx-themes.ts +483 -483
- package/lib/protect-restore.ts +520 -520
- package/lib/rate-limiter.ts +94 -94
- package/lib/response.ts +197 -197
- package/lib/restore-references.ts +240 -240
- package/lib/review.ts +327 -327
- package/lib/schema.ts +417 -417
- package/lib/scientific-words.ts +73 -73
- package/lib/sections.ts +335 -335
- package/lib/slides.ts +756 -756
- package/lib/spelling.ts +334 -334
- package/lib/templates.ts +526 -526
- package/lib/themes.ts +742 -742
- package/lib/trackchanges.ts +247 -247
- package/lib/tui.ts +450 -450
- package/lib/types.ts +550 -530
- package/lib/undo.ts +250 -250
- package/lib/utils.ts +69 -69
- package/lib/variables.ts +179 -179
- package/lib/word-extraction.ts +806 -759
- package/lib/word.ts +643 -643
- package/lib/wordcomments.ts +817 -798
- package/package.json +137 -137
- package/scripts/postbuild.js +28 -28
- package/skill/REFERENCE.md +431 -431
- package/skill/SKILL.md +258 -258
- package/tsconfig.json +26 -26
- package/types/index.d.ts +525 -525
|
@@ -1,272 +1,272 @@
|
|
|
1
|
-
/**
|
|
2
|
-
* VERIFY-ANCHORS command: report drift between Word comment anchors
|
|
3
|
-
* and the current markdown.
|
|
4
|
-
*
|
|
5
|
-
* Useful when prose has been revised between sending the docx out for
|
|
6
|
-
* review and receiving it back. Each comment is classified by how well
|
|
7
|
-
* its anchor still matches the current section prose:
|
|
8
|
-
*
|
|
9
|
-
* clean – exact or whitespace-normalized hit
|
|
10
|
-
* drift – anchor only matches via stripped/partial fallbacks
|
|
11
|
-
* context-only – anchor text is gone, only surrounding context survives
|
|
12
|
-
* ambiguous – multiple matches, can't pick one without context
|
|
13
|
-
* unmatched – nothing maps; user must place the comment manually
|
|
14
|
-
*/
|
|
15
|
-
|
|
16
|
-
import {
|
|
17
|
-
chalk,
|
|
18
|
-
fs,
|
|
19
|
-
path,
|
|
20
|
-
fmt,
|
|
21
|
-
loadConfig,
|
|
22
|
-
jsonMode,
|
|
23
|
-
jsonOutput,
|
|
24
|
-
} from './context.js';
|
|
25
|
-
import type { Command } from 'commander';
|
|
26
|
-
import { findAnchorInText, classifyStrategy, scoreContextAt, type AnchorMatchQuality } from '../anchor-match.js';
|
|
27
|
-
import type { CommentAnchorData } from '../word-extraction.js';
|
|
28
|
-
import { computeSectionBoundaries } from './section-boundaries.js';
|
|
29
|
-
|
|
30
|
-
interface VerifyOptions {
|
|
31
|
-
config: string;
|
|
32
|
-
dir: string;
|
|
33
|
-
json?: boolean;
|
|
34
|
-
}
|
|
35
|
-
|
|
36
|
-
interface CommentReport {
|
|
37
|
-
id: string;
|
|
38
|
-
author: string;
|
|
39
|
-
text: string;
|
|
40
|
-
section: string | null;
|
|
41
|
-
quality: AnchorMatchQuality | 'ambiguous';
|
|
42
|
-
strategy: string;
|
|
43
|
-
anchor: string;
|
|
44
|
-
occurrences: number;
|
|
45
|
-
}
|
|
46
|
-
|
|
47
|
-
export function register(program: Command): void {
|
|
48
|
-
program
|
|
49
|
-
.command('verify-anchors')
|
|
50
|
-
.description('Report drift between Word comment anchors and current markdown')
|
|
51
|
-
.argument('<file>', 'Word document with reviewer comments (.docx)')
|
|
52
|
-
.option('-c, --config <file>', 'Sections config file', 'sections.yaml')
|
|
53
|
-
.option('-d, --dir <directory>', 'Directory with section files', '.')
|
|
54
|
-
.option('--json', 'Output JSON report (for scripting)')
|
|
55
|
-
.action(async (docxPath: string, options: VerifyOptions) => {
|
|
56
|
-
if (!fs.existsSync(docxPath)) {
|
|
57
|
-
console.error(fmt.status('error', `File not found: ${docxPath}`));
|
|
58
|
-
process.exit(1);
|
|
59
|
-
}
|
|
60
|
-
|
|
61
|
-
const configPath = path.resolve(options.dir, options.config);
|
|
62
|
-
if (!fs.existsSync(configPath)) {
|
|
63
|
-
console.error(fmt.status('error', `Config not found: ${configPath}`));
|
|
64
|
-
console.error(chalk.dim(' Run "rev init" first to generate sections.yaml'));
|
|
65
|
-
process.exit(1);
|
|
66
|
-
}
|
|
67
|
-
|
|
68
|
-
const config = loadConfig(configPath);
|
|
69
|
-
const { extractWordComments, extractCommentAnchors, extractHeadings } = await import('../import.js');
|
|
70
|
-
|
|
71
|
-
let comments;
|
|
72
|
-
let anchors;
|
|
73
|
-
let headings;
|
|
74
|
-
let fullDocText = '';
|
|
75
|
-
try {
|
|
76
|
-
comments = await extractWordComments(docxPath);
|
|
77
|
-
const result = await extractCommentAnchors(docxPath);
|
|
78
|
-
anchors = result.anchors;
|
|
79
|
-
fullDocText = result.fullDocText;
|
|
80
|
-
headings = await extractHeadings(docxPath);
|
|
81
|
-
} catch (err) {
|
|
82
|
-
const error = err as Error;
|
|
83
|
-
console.error(fmt.status('error', `Failed to read ${path.basename(docxPath)}: ${error.message}`));
|
|
84
|
-
if (process.env.DEBUG) console.error(error.stack);
|
|
85
|
-
process.exit(1);
|
|
86
|
-
}
|
|
87
|
-
|
|
88
|
-
if (comments.length === 0) {
|
|
89
|
-
console.log(fmt.status('info', 'No comments found in document.'));
|
|
90
|
-
return;
|
|
91
|
-
}
|
|
92
|
-
|
|
93
|
-
const boundaries = computeSectionBoundaries(config.sections, headings, fullDocText.length);
|
|
94
|
-
|
|
95
|
-
// Cache section markdown contents on first read
|
|
96
|
-
const sectionCache = new Map<string, string>();
|
|
97
|
-
function loadSection(file: string): string | null {
|
|
98
|
-
if (sectionCache.has(file)) return sectionCache.get(file)!;
|
|
99
|
-
const sectionPath = path.join(options.dir, file);
|
|
100
|
-
if (!fs.existsSync(sectionPath)) return null;
|
|
101
|
-
const content = fs.readFileSync(sectionPath, 'utf-8');
|
|
102
|
-
sectionCache.set(file, content);
|
|
103
|
-
return content;
|
|
104
|
-
}
|
|
105
|
-
|
|
106
|
-
const firstBoundaryStart = boundaries.length > 0 ? boundaries[0].start : 0;
|
|
107
|
-
const reports: CommentReport[] = [];
|
|
108
|
-
|
|
109
|
-
for (const c of comments) {
|
|
110
|
-
const anchor: CommentAnchorData | undefined = anchors.get(c.id);
|
|
111
|
-
const anchorText = anchor?.anchor || '';
|
|
112
|
-
if (!anchor) {
|
|
113
|
-
reports.push({
|
|
114
|
-
id: c.id,
|
|
115
|
-
author: c.author,
|
|
116
|
-
text: c.text,
|
|
117
|
-
section: null,
|
|
118
|
-
quality: 'unmatched',
|
|
119
|
-
strategy: 'no-anchor',
|
|
120
|
-
anchor: '',
|
|
121
|
-
occurrences: 0,
|
|
122
|
-
});
|
|
123
|
-
continue;
|
|
124
|
-
}
|
|
125
|
-
|
|
126
|
-
// Determine which section file this comment lives in
|
|
127
|
-
let sectionFile: string | null = null;
|
|
128
|
-
for (const b of boundaries) {
|
|
129
|
-
if (anchor.docPosition >= b.start && anchor.docPosition < b.end) {
|
|
130
|
-
sectionFile = b.file;
|
|
131
|
-
break;
|
|
132
|
-
}
|
|
133
|
-
}
|
|
134
|
-
if (!sectionFile && boundaries.length > 0 && anchor.docPosition < firstBoundaryStart) {
|
|
135
|
-
sectionFile = boundaries[0].file;
|
|
136
|
-
}
|
|
137
|
-
|
|
138
|
-
if (!sectionFile) {
|
|
139
|
-
reports.push({
|
|
140
|
-
id: c.id,
|
|
141
|
-
author: c.author,
|
|
142
|
-
text: c.text,
|
|
143
|
-
section: null,
|
|
144
|
-
quality: 'unmatched',
|
|
145
|
-
strategy: 'no-section',
|
|
146
|
-
anchor: anchorText,
|
|
147
|
-
occurrences: 0,
|
|
148
|
-
});
|
|
149
|
-
continue;
|
|
150
|
-
}
|
|
151
|
-
|
|
152
|
-
const md = loadSection(sectionFile);
|
|
153
|
-
if (md === null) {
|
|
154
|
-
reports.push({
|
|
155
|
-
id: c.id,
|
|
156
|
-
author: c.author,
|
|
157
|
-
text: c.text,
|
|
158
|
-
section: sectionFile,
|
|
159
|
-
quality: 'unmatched',
|
|
160
|
-
strategy: 'missing-file',
|
|
161
|
-
anchor: anchorText,
|
|
162
|
-
occurrences: 0,
|
|
163
|
-
});
|
|
164
|
-
continue;
|
|
165
|
-
}
|
|
166
|
-
|
|
167
|
-
const search = findAnchorInText(anchor.anchor, md, anchor.before, anchor.after);
|
|
168
|
-
let quality: AnchorMatchQuality | 'ambiguous' = classifyStrategy(search.strategy, search.occurrences.length);
|
|
169
|
-
if (quality === 'clean' && search.occurrences.length > 1) {
|
|
170
|
-
// Multiple direct hits — only flag as ambiguous when before/after
|
|
171
|
-
// context can't pick a clear winner. If one candidate scores
|
|
172
|
-
// strictly higher than the others, sync will place it correctly.
|
|
173
|
-
const anchorLen = anchor.anchor.length;
|
|
174
|
-
const scores = search.occurrences.map(p => scoreContextAt(p, md, anchor.before, anchor.after, anchorLen));
|
|
175
|
-
const max = Math.max(...scores);
|
|
176
|
-
const winners = scores.filter(s => s === max).length;
|
|
177
|
-
if (max === 0 || winners > 1) {
|
|
178
|
-
quality = 'ambiguous';
|
|
179
|
-
}
|
|
180
|
-
}
|
|
181
|
-
|
|
182
|
-
reports.push({
|
|
183
|
-
id: c.id,
|
|
184
|
-
author: c.author,
|
|
185
|
-
text: c.text,
|
|
186
|
-
section: sectionFile,
|
|
187
|
-
quality,
|
|
188
|
-
strategy: search.strategy,
|
|
189
|
-
anchor: anchorText,
|
|
190
|
-
occurrences: search.occurrences.length,
|
|
191
|
-
});
|
|
192
|
-
}
|
|
193
|
-
|
|
194
|
-
if (options.json || jsonMode) {
|
|
195
|
-
jsonOutput({
|
|
196
|
-
file: docxPath,
|
|
197
|
-
totalComments: comments.length,
|
|
198
|
-
summary: tally(reports),
|
|
199
|
-
comments: reports,
|
|
200
|
-
});
|
|
201
|
-
return;
|
|
202
|
-
}
|
|
203
|
-
|
|
204
|
-
printReport(docxPath, reports);
|
|
205
|
-
});
|
|
206
|
-
}
|
|
207
|
-
|
|
208
|
-
function tally(reports: CommentReport[]): Record<string, number> {
|
|
209
|
-
const out: Record<string, number> = { clean: 0, drift: 0, 'context-only': 0, ambiguous: 0, unmatched: 0 };
|
|
210
|
-
for (const r of reports) out[r.quality] = (out[r.quality] || 0) + 1;
|
|
211
|
-
return out;
|
|
212
|
-
}
|
|
213
|
-
|
|
214
|
-
function printReport(docxPath: string, reports: CommentReport[]): void {
|
|
215
|
-
console.log(fmt.header(`Anchor Verification: ${path.basename(docxPath)}`));
|
|
216
|
-
console.log();
|
|
217
|
-
|
|
218
|
-
const totals = tally(reports);
|
|
219
|
-
const summaryLines: string[] = [];
|
|
220
|
-
summaryLines.push(`${chalk.green(totals.clean)} clean (anchor still matches)`);
|
|
221
|
-
if (totals.drift) summaryLines.push(`${chalk.cyan(totals.drift)} drifted (matched via fallback strategies)`);
|
|
222
|
-
if (totals['context-only']) summaryLines.push(`${chalk.yellow(totals['context-only'])} context-only (anchor text gone, neighbors survive)`);
|
|
223
|
-
if (totals.ambiguous) summaryLines.push(`${chalk.magenta(totals.ambiguous)} ambiguous (multiple candidate positions)`);
|
|
224
|
-
if (totals.unmatched) summaryLines.push(`${chalk.red(totals.unmatched)} unmatched (manual placement needed)`);
|
|
225
|
-
console.log(fmt.box(summaryLines.join('\n'), { title: 'Summary', padding: 0 }));
|
|
226
|
-
console.log();
|
|
227
|
-
|
|
228
|
-
// Per-comment table for everything that isn't a clean direct hit
|
|
229
|
-
const problems = reports.filter(r => r.quality !== 'clean');
|
|
230
|
-
if (problems.length === 0) {
|
|
231
|
-
console.log(fmt.status('success', 'All comment anchors match the current markdown.'));
|
|
232
|
-
return;
|
|
233
|
-
}
|
|
234
|
-
|
|
235
|
-
const rows = problems.map(r => [
|
|
236
|
-
chalk.dim(`#${r.id}`),
|
|
237
|
-
qualityColor(r.quality),
|
|
238
|
-
r.section ? chalk.bold(r.section) : chalk.dim('—'),
|
|
239
|
-
chalk.dim(r.strategy),
|
|
240
|
-
truncate(r.anchor, 35),
|
|
241
|
-
truncate(r.text, 35),
|
|
242
|
-
]);
|
|
243
|
-
|
|
244
|
-
console.log(fmt.table(
|
|
245
|
-
['ID', 'Quality', 'Section', 'Strategy', 'Anchor (Word)', 'Comment'],
|
|
246
|
-
rows,
|
|
247
|
-
{ align: ['right', 'left', 'left', 'left', 'left', 'left'] },
|
|
248
|
-
));
|
|
249
|
-
|
|
250
|
-
if (totals.unmatched > 0 || totals.ambiguous > 0) {
|
|
251
|
-
console.log();
|
|
252
|
-
console.log(chalk.dim('Comments flagged "unmatched" or "ambiguous" need manual placement.'));
|
|
253
|
-
console.log(chalk.dim('Run "rev sync --comments-only" to import the matched ones without touching prose.'));
|
|
254
|
-
}
|
|
255
|
-
}
|
|
256
|
-
|
|
257
|
-
function qualityColor(q: string): string {
|
|
258
|
-
switch (q) {
|
|
259
|
-
case 'clean': return chalk.green('clean');
|
|
260
|
-
case 'drift': return chalk.cyan('drift');
|
|
261
|
-
case 'context-only': return chalk.yellow('context');
|
|
262
|
-
case 'ambiguous': return chalk.magenta('ambiguous');
|
|
263
|
-
case 'unmatched': return chalk.red('unmatched');
|
|
264
|
-
default: return q;
|
|
265
|
-
}
|
|
266
|
-
}
|
|
267
|
-
|
|
268
|
-
function truncate(s: string, max: number): string {
|
|
269
|
-
if (!s) return chalk.dim('—');
|
|
270
|
-
const flat = s.replace(/\s+/g, ' ').trim();
|
|
271
|
-
return flat.length > max ? flat.slice(0, max - 1) + '…' : flat;
|
|
272
|
-
}
|
|
1
|
+
/**
|
|
2
|
+
* VERIFY-ANCHORS command: report drift between Word comment anchors
|
|
3
|
+
* and the current markdown.
|
|
4
|
+
*
|
|
5
|
+
* Useful when prose has been revised between sending the docx out for
|
|
6
|
+
* review and receiving it back. Each comment is classified by how well
|
|
7
|
+
* its anchor still matches the current section prose:
|
|
8
|
+
*
|
|
9
|
+
* clean – exact or whitespace-normalized hit
|
|
10
|
+
* drift – anchor only matches via stripped/partial fallbacks
|
|
11
|
+
* context-only – anchor text is gone, only surrounding context survives
|
|
12
|
+
* ambiguous – multiple matches, can't pick one without context
|
|
13
|
+
* unmatched – nothing maps; user must place the comment manually
|
|
14
|
+
*/
|
|
15
|
+
|
|
16
|
+
import {
|
|
17
|
+
chalk,
|
|
18
|
+
fs,
|
|
19
|
+
path,
|
|
20
|
+
fmt,
|
|
21
|
+
loadConfig,
|
|
22
|
+
jsonMode,
|
|
23
|
+
jsonOutput,
|
|
24
|
+
} from './context.js';
|
|
25
|
+
import type { Command } from 'commander';
|
|
26
|
+
import { findAnchorInText, classifyStrategy, scoreContextAt, type AnchorMatchQuality } from '../anchor-match.js';
|
|
27
|
+
import type { CommentAnchorData } from '../word-extraction.js';
|
|
28
|
+
import { computeSectionBoundaries } from './section-boundaries.js';
|
|
29
|
+
|
|
30
|
+
interface VerifyOptions {
|
|
31
|
+
config: string;
|
|
32
|
+
dir: string;
|
|
33
|
+
json?: boolean;
|
|
34
|
+
}
|
|
35
|
+
|
|
36
|
+
interface CommentReport {
|
|
37
|
+
id: string;
|
|
38
|
+
author: string;
|
|
39
|
+
text: string;
|
|
40
|
+
section: string | null;
|
|
41
|
+
quality: AnchorMatchQuality | 'ambiguous';
|
|
42
|
+
strategy: string;
|
|
43
|
+
anchor: string;
|
|
44
|
+
occurrences: number;
|
|
45
|
+
}
|
|
46
|
+
|
|
47
|
+
export function register(program: Command): void {
|
|
48
|
+
program
|
|
49
|
+
.command('verify-anchors')
|
|
50
|
+
.description('Report drift between Word comment anchors and current markdown')
|
|
51
|
+
.argument('<file>', 'Word document with reviewer comments (.docx)')
|
|
52
|
+
.option('-c, --config <file>', 'Sections config file', 'sections.yaml')
|
|
53
|
+
.option('-d, --dir <directory>', 'Directory with section files', '.')
|
|
54
|
+
.option('--json', 'Output JSON report (for scripting)')
|
|
55
|
+
.action(async (docxPath: string, options: VerifyOptions) => {
|
|
56
|
+
if (!fs.existsSync(docxPath)) {
|
|
57
|
+
console.error(fmt.status('error', `File not found: ${docxPath}`));
|
|
58
|
+
process.exit(1);
|
|
59
|
+
}
|
|
60
|
+
|
|
61
|
+
const configPath = path.resolve(options.dir, options.config);
|
|
62
|
+
if (!fs.existsSync(configPath)) {
|
|
63
|
+
console.error(fmt.status('error', `Config not found: ${configPath}`));
|
|
64
|
+
console.error(chalk.dim(' Run "rev init" first to generate sections.yaml'));
|
|
65
|
+
process.exit(1);
|
|
66
|
+
}
|
|
67
|
+
|
|
68
|
+
const config = loadConfig(configPath);
|
|
69
|
+
const { extractWordComments, extractCommentAnchors, extractHeadings } = await import('../import.js');
|
|
70
|
+
|
|
71
|
+
let comments;
|
|
72
|
+
let anchors;
|
|
73
|
+
let headings;
|
|
74
|
+
let fullDocText = '';
|
|
75
|
+
try {
|
|
76
|
+
comments = await extractWordComments(docxPath);
|
|
77
|
+
const result = await extractCommentAnchors(docxPath);
|
|
78
|
+
anchors = result.anchors;
|
|
79
|
+
fullDocText = result.fullDocText;
|
|
80
|
+
headings = await extractHeadings(docxPath);
|
|
81
|
+
} catch (err) {
|
|
82
|
+
const error = err as Error;
|
|
83
|
+
console.error(fmt.status('error', `Failed to read ${path.basename(docxPath)}: ${error.message}`));
|
|
84
|
+
if (process.env.DEBUG) console.error(error.stack);
|
|
85
|
+
process.exit(1);
|
|
86
|
+
}
|
|
87
|
+
|
|
88
|
+
if (comments.length === 0) {
|
|
89
|
+
console.log(fmt.status('info', 'No comments found in document.'));
|
|
90
|
+
return;
|
|
91
|
+
}
|
|
92
|
+
|
|
93
|
+
const boundaries = computeSectionBoundaries(config.sections, headings, fullDocText.length);
|
|
94
|
+
|
|
95
|
+
// Cache section markdown contents on first read
|
|
96
|
+
const sectionCache = new Map<string, string>();
|
|
97
|
+
function loadSection(file: string): string | null {
|
|
98
|
+
if (sectionCache.has(file)) return sectionCache.get(file)!;
|
|
99
|
+
const sectionPath = path.join(options.dir, file);
|
|
100
|
+
if (!fs.existsSync(sectionPath)) return null;
|
|
101
|
+
const content = fs.readFileSync(sectionPath, 'utf-8');
|
|
102
|
+
sectionCache.set(file, content);
|
|
103
|
+
return content;
|
|
104
|
+
}
|
|
105
|
+
|
|
106
|
+
const firstBoundaryStart = boundaries.length > 0 ? boundaries[0].start : 0;
|
|
107
|
+
const reports: CommentReport[] = [];
|
|
108
|
+
|
|
109
|
+
for (const c of comments) {
|
|
110
|
+
const anchor: CommentAnchorData | undefined = anchors.get(c.id);
|
|
111
|
+
const anchorText = anchor?.anchor || '';
|
|
112
|
+
if (!anchor) {
|
|
113
|
+
reports.push({
|
|
114
|
+
id: c.id,
|
|
115
|
+
author: c.author,
|
|
116
|
+
text: c.text,
|
|
117
|
+
section: null,
|
|
118
|
+
quality: 'unmatched',
|
|
119
|
+
strategy: 'no-anchor',
|
|
120
|
+
anchor: '',
|
|
121
|
+
occurrences: 0,
|
|
122
|
+
});
|
|
123
|
+
continue;
|
|
124
|
+
}
|
|
125
|
+
|
|
126
|
+
// Determine which section file this comment lives in
|
|
127
|
+
let sectionFile: string | null = null;
|
|
128
|
+
for (const b of boundaries) {
|
|
129
|
+
if (anchor.docPosition >= b.start && anchor.docPosition < b.end) {
|
|
130
|
+
sectionFile = b.file;
|
|
131
|
+
break;
|
|
132
|
+
}
|
|
133
|
+
}
|
|
134
|
+
if (!sectionFile && boundaries.length > 0 && anchor.docPosition < firstBoundaryStart) {
|
|
135
|
+
sectionFile = boundaries[0].file;
|
|
136
|
+
}
|
|
137
|
+
|
|
138
|
+
if (!sectionFile) {
|
|
139
|
+
reports.push({
|
|
140
|
+
id: c.id,
|
|
141
|
+
author: c.author,
|
|
142
|
+
text: c.text,
|
|
143
|
+
section: null,
|
|
144
|
+
quality: 'unmatched',
|
|
145
|
+
strategy: 'no-section',
|
|
146
|
+
anchor: anchorText,
|
|
147
|
+
occurrences: 0,
|
|
148
|
+
});
|
|
149
|
+
continue;
|
|
150
|
+
}
|
|
151
|
+
|
|
152
|
+
const md = loadSection(sectionFile);
|
|
153
|
+
if (md === null) {
|
|
154
|
+
reports.push({
|
|
155
|
+
id: c.id,
|
|
156
|
+
author: c.author,
|
|
157
|
+
text: c.text,
|
|
158
|
+
section: sectionFile,
|
|
159
|
+
quality: 'unmatched',
|
|
160
|
+
strategy: 'missing-file',
|
|
161
|
+
anchor: anchorText,
|
|
162
|
+
occurrences: 0,
|
|
163
|
+
});
|
|
164
|
+
continue;
|
|
165
|
+
}
|
|
166
|
+
|
|
167
|
+
const search = findAnchorInText(anchor.anchor, md, anchor.before, anchor.after);
|
|
168
|
+
let quality: AnchorMatchQuality | 'ambiguous' = classifyStrategy(search.strategy, search.occurrences.length);
|
|
169
|
+
if (quality === 'clean' && search.occurrences.length > 1) {
|
|
170
|
+
// Multiple direct hits — only flag as ambiguous when before/after
|
|
171
|
+
// context can't pick a clear winner. If one candidate scores
|
|
172
|
+
// strictly higher than the others, sync will place it correctly.
|
|
173
|
+
const anchorLen = anchor.anchor.length;
|
|
174
|
+
const scores = search.occurrences.map(p => scoreContextAt(p, md, anchor.before, anchor.after, anchorLen));
|
|
175
|
+
const max = Math.max(...scores);
|
|
176
|
+
const winners = scores.filter(s => s === max).length;
|
|
177
|
+
if (max === 0 || winners > 1) {
|
|
178
|
+
quality = 'ambiguous';
|
|
179
|
+
}
|
|
180
|
+
}
|
|
181
|
+
|
|
182
|
+
reports.push({
|
|
183
|
+
id: c.id,
|
|
184
|
+
author: c.author,
|
|
185
|
+
text: c.text,
|
|
186
|
+
section: sectionFile,
|
|
187
|
+
quality,
|
|
188
|
+
strategy: search.strategy,
|
|
189
|
+
anchor: anchorText,
|
|
190
|
+
occurrences: search.occurrences.length,
|
|
191
|
+
});
|
|
192
|
+
}
|
|
193
|
+
|
|
194
|
+
if (options.json || jsonMode) {
|
|
195
|
+
jsonOutput({
|
|
196
|
+
file: docxPath,
|
|
197
|
+
totalComments: comments.length,
|
|
198
|
+
summary: tally(reports),
|
|
199
|
+
comments: reports,
|
|
200
|
+
});
|
|
201
|
+
return;
|
|
202
|
+
}
|
|
203
|
+
|
|
204
|
+
printReport(docxPath, reports);
|
|
205
|
+
});
|
|
206
|
+
}
|
|
207
|
+
|
|
208
|
+
function tally(reports: CommentReport[]): Record<string, number> {
|
|
209
|
+
const out: Record<string, number> = { clean: 0, drift: 0, 'context-only': 0, ambiguous: 0, unmatched: 0 };
|
|
210
|
+
for (const r of reports) out[r.quality] = (out[r.quality] || 0) + 1;
|
|
211
|
+
return out;
|
|
212
|
+
}
|
|
213
|
+
|
|
214
|
+
function printReport(docxPath: string, reports: CommentReport[]): void {
|
|
215
|
+
console.log(fmt.header(`Anchor Verification: ${path.basename(docxPath)}`));
|
|
216
|
+
console.log();
|
|
217
|
+
|
|
218
|
+
const totals = tally(reports);
|
|
219
|
+
const summaryLines: string[] = [];
|
|
220
|
+
summaryLines.push(`${chalk.green(totals.clean)} clean (anchor still matches)`);
|
|
221
|
+
if (totals.drift) summaryLines.push(`${chalk.cyan(totals.drift)} drifted (matched via fallback strategies)`);
|
|
222
|
+
if (totals['context-only']) summaryLines.push(`${chalk.yellow(totals['context-only'])} context-only (anchor text gone, neighbors survive)`);
|
|
223
|
+
if (totals.ambiguous) summaryLines.push(`${chalk.magenta(totals.ambiguous)} ambiguous (multiple candidate positions)`);
|
|
224
|
+
if (totals.unmatched) summaryLines.push(`${chalk.red(totals.unmatched)} unmatched (manual placement needed)`);
|
|
225
|
+
console.log(fmt.box(summaryLines.join('\n'), { title: 'Summary', padding: 0 }));
|
|
226
|
+
console.log();
|
|
227
|
+
|
|
228
|
+
// Per-comment table for everything that isn't a clean direct hit
|
|
229
|
+
const problems = reports.filter(r => r.quality !== 'clean');
|
|
230
|
+
if (problems.length === 0) {
|
|
231
|
+
console.log(fmt.status('success', 'All comment anchors match the current markdown.'));
|
|
232
|
+
return;
|
|
233
|
+
}
|
|
234
|
+
|
|
235
|
+
const rows = problems.map(r => [
|
|
236
|
+
chalk.dim(`#${r.id}`),
|
|
237
|
+
qualityColor(r.quality),
|
|
238
|
+
r.section ? chalk.bold(r.section) : chalk.dim('—'),
|
|
239
|
+
chalk.dim(r.strategy),
|
|
240
|
+
truncate(r.anchor, 35),
|
|
241
|
+
truncate(r.text, 35),
|
|
242
|
+
]);
|
|
243
|
+
|
|
244
|
+
console.log(fmt.table(
|
|
245
|
+
['ID', 'Quality', 'Section', 'Strategy', 'Anchor (Word)', 'Comment'],
|
|
246
|
+
rows,
|
|
247
|
+
{ align: ['right', 'left', 'left', 'left', 'left', 'left'] },
|
|
248
|
+
));
|
|
249
|
+
|
|
250
|
+
if (totals.unmatched > 0 || totals.ambiguous > 0) {
|
|
251
|
+
console.log();
|
|
252
|
+
console.log(chalk.dim('Comments flagged "unmatched" or "ambiguous" need manual placement.'));
|
|
253
|
+
console.log(chalk.dim('Run "rev sync --comments-only" to import the matched ones without touching prose.'));
|
|
254
|
+
}
|
|
255
|
+
}
|
|
256
|
+
|
|
257
|
+
function qualityColor(q: string): string {
|
|
258
|
+
switch (q) {
|
|
259
|
+
case 'clean': return chalk.green('clean');
|
|
260
|
+
case 'drift': return chalk.cyan('drift');
|
|
261
|
+
case 'context-only': return chalk.yellow('context');
|
|
262
|
+
case 'ambiguous': return chalk.magenta('ambiguous');
|
|
263
|
+
case 'unmatched': return chalk.red('unmatched');
|
|
264
|
+
default: return q;
|
|
265
|
+
}
|
|
266
|
+
}
|
|
267
|
+
|
|
268
|
+
function truncate(s: string, max: number): string {
|
|
269
|
+
if (!s) return chalk.dim('—');
|
|
270
|
+
const flat = s.replace(/\s+/g, ' ').trim();
|
|
271
|
+
return flat.length > max ? flat.slice(0, max - 1) + '…' : flat;
|
|
272
|
+
}
|