docrev 0.9.13 → 0.9.15

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package contents as they appear in their respective public registries.
Files changed (126)
  1. package/.claude/settings.local.json +9 -9
  2. package/.gitattributes +1 -1
  3. package/CHANGELOG.md +149 -149
  4. package/PLAN-tables-and-postprocess.md +850 -850
  5. package/README.md +411 -391
  6. package/bin/rev.js +11 -11
  7. package/bin/rev.ts +145 -145
  8. package/completions/rev.bash +127 -127
  9. package/completions/rev.ps1 +210 -210
  10. package/completions/rev.zsh +207 -207
  11. package/dev_notes/stress2/build_adversarial.ts +186 -186
  12. package/dev_notes/stress2/drift_matcher.ts +62 -62
  13. package/dev_notes/stress2/probe_anchors.ts +35 -35
  14. package/dev_notes/stress2/project/discussion.before.md +3 -3
  15. package/dev_notes/stress2/project/discussion.md +3 -3
  16. package/dev_notes/stress2/project/methods.before.md +20 -20
  17. package/dev_notes/stress2/project/methods.md +20 -20
  18. package/dev_notes/stress2/project/rev.yaml +5 -5
  19. package/dev_notes/stress2/project/sections.yaml +4 -4
  20. package/dev_notes/stress2/sections.yaml +5 -5
  21. package/dev_notes/stress2/trace_placement.ts +50 -50
  22. package/dev_notes/stresstest_boundaries.ts +27 -27
  23. package/dev_notes/stresstest_drift_apply.ts +43 -43
  24. package/dev_notes/stresstest_drift_compare.ts +43 -43
  25. package/dev_notes/stresstest_drift_v2.ts +54 -54
  26. package/dev_notes/stresstest_inspect.ts +54 -54
  27. package/dev_notes/stresstest_pstyle.ts +55 -55
  28. package/dev_notes/stresstest_section_debug.ts +23 -23
  29. package/dev_notes/stresstest_split.ts +70 -70
  30. package/dev_notes/stresstest_trace.ts +19 -19
  31. package/dev_notes/stresstest_verify_no_overwrite.ts +40 -40
  32. package/dist/lib/build.d.ts +38 -1
  33. package/dist/lib/build.d.ts.map +1 -1
  34. package/dist/lib/build.js +68 -30
  35. package/dist/lib/build.js.map +1 -1
  36. package/dist/lib/commands/build.d.ts.map +1 -1
  37. package/dist/lib/commands/build.js +38 -5
  38. package/dist/lib/commands/build.js.map +1 -1
  39. package/dist/lib/commands/utilities.js +164 -164
  40. package/dist/lib/commands/word-tools.js +8 -8
  41. package/dist/lib/grammar.js +3 -3
  42. package/dist/lib/pdf-comments.js +44 -44
  43. package/dist/lib/plugins.js +57 -57
  44. package/dist/lib/pptx-themes.js +115 -115
  45. package/dist/lib/spelling.js +2 -2
  46. package/dist/lib/templates.js +387 -387
  47. package/dist/lib/themes.js +51 -51
  48. package/eslint.config.js +27 -27
  49. package/lib/anchor-match.ts +276 -276
  50. package/lib/annotations.ts +644 -644
  51. package/lib/build.ts +1300 -1251
  52. package/lib/citations.ts +160 -160
  53. package/lib/commands/build.ts +833 -801
  54. package/lib/commands/citations.ts +515 -515
  55. package/lib/commands/comments.ts +1050 -1050
  56. package/lib/commands/context.ts +174 -174
  57. package/lib/commands/core.ts +309 -309
  58. package/lib/commands/doi.ts +435 -435
  59. package/lib/commands/file-ops.ts +372 -372
  60. package/lib/commands/history.ts +320 -320
  61. package/lib/commands/index.ts +87 -87
  62. package/lib/commands/init.ts +259 -259
  63. package/lib/commands/merge-resolve.ts +378 -378
  64. package/lib/commands/preview.ts +178 -178
  65. package/lib/commands/project-info.ts +244 -244
  66. package/lib/commands/quality.ts +517 -517
  67. package/lib/commands/response.ts +454 -454
  68. package/lib/commands/section-boundaries.ts +82 -82
  69. package/lib/commands/sections.ts +451 -451
  70. package/lib/commands/sync.ts +706 -706
  71. package/lib/commands/text-ops.ts +449 -449
  72. package/lib/commands/utilities.ts +448 -448
  73. package/lib/commands/verify-anchors.ts +272 -272
  74. package/lib/commands/word-tools.ts +340 -340
  75. package/lib/comment-realign.ts +517 -517
  76. package/lib/config.ts +84 -84
  77. package/lib/crossref.ts +781 -781
  78. package/lib/csl.ts +191 -191
  79. package/lib/dependencies.ts +98 -98
  80. package/lib/diff-engine.ts +465 -465
  81. package/lib/doi-cache.ts +115 -115
  82. package/lib/doi.ts +897 -897
  83. package/lib/equations.ts +506 -506
  84. package/lib/errors.ts +346 -346
  85. package/lib/format.ts +541 -541
  86. package/lib/git.ts +326 -326
  87. package/lib/grammar.ts +303 -303
  88. package/lib/image-registry.ts +180 -180
  89. package/lib/import.ts +911 -911
  90. package/lib/journals.ts +543 -543
  91. package/lib/merge.ts +633 -633
  92. package/lib/orcid.ts +144 -144
  93. package/lib/pdf-comments.ts +263 -263
  94. package/lib/pdf-import.ts +524 -524
  95. package/lib/plugins.ts +362 -362
  96. package/lib/postprocess.ts +188 -188
  97. package/lib/pptx-color-filter.lua +37 -37
  98. package/lib/pptx-template.ts +469 -469
  99. package/lib/pptx-themes.ts +483 -483
  100. package/lib/protect-restore.ts +520 -520
  101. package/lib/rate-limiter.ts +94 -94
  102. package/lib/response.ts +197 -197
  103. package/lib/restore-references.ts +240 -240
  104. package/lib/review.ts +327 -327
  105. package/lib/schema.ts +417 -417
  106. package/lib/scientific-words.ts +73 -73
  107. package/lib/sections.ts +335 -335
  108. package/lib/slides.ts +756 -756
  109. package/lib/spelling.ts +334 -334
  110. package/lib/templates.ts +526 -526
  111. package/lib/themes.ts +742 -742
  112. package/lib/trackchanges.ts +247 -247
  113. package/lib/tui.ts +450 -450
  114. package/lib/types.ts +550 -550
  115. package/lib/undo.ts +250 -250
  116. package/lib/utils.ts +69 -69
  117. package/lib/variables.ts +179 -179
  118. package/lib/word-extraction.ts +806 -806
  119. package/lib/word.ts +643 -643
  120. package/lib/wordcomments.ts +817 -817
  121. package/package.json +137 -137
  122. package/scripts/postbuild.js +28 -28
  123. package/skill/REFERENCE.md +473 -431
  124. package/skill/SKILL.md +274 -258
  125. package/tsconfig.json +26 -26
  126. package/types/index.d.ts +525 -525
@@ -1,240 +1,240 @@
1
- /**
2
- * Post-extraction reference restoration and comment parsing
3
- */
4
-
5
- import { readImageRegistry } from './image-registry.js';
6
-
7
- // ============================================
8
- // Type Definitions
9
- // ============================================
10
-
11
- export interface RestoreCrossrefResult {
12
- text: string;
13
- restored: number;
14
- messages: string[];
15
- restoredLabels: Set<string>;
16
- }
17
-
18
- export interface RestoreImagesResult {
19
- text: string;
20
- restored: number;
21
- messages: string[];
22
- }
23
-
24
- // ============================================
25
- // Functions
26
- // ============================================
27
-
28
- /**
29
- * Parse visible comment markers from Word text
30
- */
31
- export function parseVisibleComments(text: string): Array<{ author: string; text: string; position: number }> {
32
- const comments: Array<{ author: string; text: string; position: number }> = [];
33
- const pattern = /\[([^\]:]+):\s*([^\]]+)\]/g;
34
-
35
- let match;
36
- while ((match = pattern.exec(text)) !== null) {
37
- comments.push({
38
- author: match[1].trim(),
39
- text: match[2].trim(),
40
- position: match.index,
41
- });
42
- }
43
-
44
- return comments;
45
- }
46
-
47
- /**
48
- * Convert visible comments to CriticMarkup format
49
- */
50
- export function convertVisibleComments(text: string): string {
51
- return text.replace(/\[([^\]:]+):\s*([^\]]+)\]/g, '{>>$1: $2<<}');
52
- }
53
-
54
- /**
55
- * Restore pandoc-crossref figure/table references from Word-rendered format
56
- */
57
- export function restoreCrossrefFromWord(
58
- text: string,
59
- projectDir: string,
60
- restoredLabels: Set<string> | null = null
61
- ): RestoreCrossrefResult {
62
- const messages: string[] = [];
63
- let restored = 0;
64
- let result = text;
65
-
66
- const registry = readImageRegistry(projectDir);
67
-
68
- if (!restoredLabels) {
69
- restoredLabels = new Set<string>();
70
- }
71
-
72
- // Pattern 1: [Figure]{.mark} [N]{.mark}
73
- result = result.replace(/\[(Figure|Table|Fig\.?)\]\{\.mark\}\s*\[(\d+|S\d+)\]\{\.mark\}/gi, (match, type, num) => {
74
- const prefix = type.toLowerCase().startsWith('tab') ? 'tbl' : 'fig';
75
- if (registry) {
76
- const entry = registry.byNumber?.get(`${prefix}:${num}`);
77
- if (entry && entry.label) {
78
- restored++;
79
- return `@${prefix}:${entry.label}`;
80
- }
81
- }
82
- restored++;
83
- messages.push(`Restored ${type} ${num} (no label found, using placeholder)`);
84
- return `@${prefix}:fig${num}`;
85
- });
86
-
87
- // Pattern 2: Plain "Figure N" or "Fig. N"
88
- result = result.replace(/(?<!!)\b(Figure|Fig\.?|Table|Tbl\.?)\s+(\d+|S\d+)\b(?!\s*:)/gi, (match, type, num) => {
89
- const prefix = type.toLowerCase().startsWith('tab') ? 'tbl' : 'fig';
90
- if (registry) {
91
- const entry = registry.byNumber?.get(`${prefix}:${num}`);
92
- if (entry && entry.label) {
93
- restored++;
94
- return `@${prefix}:${entry.label}`;
95
- }
96
- }
97
- return match;
98
- });
99
-
100
- // Pattern 3: Remove duplicate plain-text captions
101
- result = result.replace(/(\!\[[^\]]+\]\([^)]+\)(?:\{[^}]*\})?)\s*\n+\s*(?:Figure|Fig\.?|Table|Tbl\.?)\s+\d+[:\.]?\s*[^\n]+/gi, '$1');
102
-
103
- // Pattern 4: Clean up image captions that start with "Figure N: "
104
- result = result.replace(/!\[(Figure|Fig\.?|Table|Tbl\.?)\s+(\d+|S\d+)[:\.]?\s*([^\]]*)\]\(([^)]+)\)(?:\{[^}]*\})?/gi,
105
- (match, type, num, caption, imgPath) => {
106
- const prefix = type.toLowerCase().startsWith('tab') ? 'tbl' : 'fig';
107
- const labelKey = `${prefix}:${num}`;
108
-
109
- if (registry) {
110
- const entry = registry.byNumber?.get(labelKey);
111
- if (entry) {
112
- if (restoredLabels!.has(labelKey)) {
113
- messages.push(`Skipped duplicate ${prefix}:${entry.label} (already restored)`);
114
- return `![${entry.caption}](${entry.path})`;
115
- }
116
- restoredLabels!.add(labelKey);
117
- restored++;
118
- messages.push(`Restored image ${prefix}:${entry.label} from Figure ${num}`);
119
- return `![${entry.caption}](${entry.path}){#${prefix}:${entry.label}}`;
120
- }
121
- }
122
- const cleanCaption = caption.trim();
123
- return `![${cleanCaption}](${imgPath})`;
124
- });
125
-
126
- return { text: result, restored, messages, restoredLabels };
127
- }
128
-
129
- /**
130
- * Restore proper markdown image syntax from Word-extracted text using image registry
131
- */
132
- export function restoreImagesFromRegistry(
133
- text: string,
134
- projectDir: string,
135
- restoredLabels: Set<string> | null = null
136
- ): RestoreImagesResult {
137
- const messages: string[] = [];
138
- let restored = 0;
139
-
140
- const registry = readImageRegistry(projectDir);
141
- if (!registry || !registry.figures || registry.figures.length === 0) {
142
- return { text, restored: 0, messages: ['No image registry found'] };
143
- }
144
-
145
- if (!restoredLabels) {
146
- restoredLabels = new Set<string>();
147
- }
148
-
149
- let result = text;
150
-
151
- // Pattern 1: Caption-like text
152
- const captionPatterns = [
153
- /@(fig|tbl):([a-zA-Z0-9_-]+):\s*([^\n]+)/gi,
154
- /^(Figure|Fig\.?)\s+(\d+|S\d+)[.:]\s*([^\n]+)/gim,
155
- /\|\s*@(fig|tbl):([a-zA-Z0-9_-]+):\s*([^|]+)\s*\|/gi,
156
- ];
157
-
158
- // Fix @fig:label: caption patterns
159
- result = result.replace(captionPatterns[0], (match, type, label, caption) => {
160
- const key = `${type}:${label}`;
161
- const entry = registry.byLabel.get(key);
162
- if (entry) {
163
- if (restoredLabels!.has(key)) {
164
- messages.push(`Skipped duplicate ${key} (already restored)`);
165
- return `![${entry.caption}](${entry.path})`;
166
- }
167
- restoredLabels!.add(key);
168
- restored++;
169
- messages.push(`Restored ${type}:${label} from registry`);
170
- return `![${entry.caption}](${entry.path}){#${type}:${label}}`;
171
- }
172
- return match;
173
- });
174
-
175
- // Fix table-wrapped captions
176
- result = result.replace(captionPatterns[2], (match, type, label, caption) => {
177
- const key = `${type}:${label}`;
178
- const entry = registry.byLabel.get(key);
179
- if (entry) {
180
- if (restoredLabels!.has(key)) {
181
- messages.push(`Skipped duplicate ${key} from table wrapper`);
182
- return `![${entry.caption}](${entry.path})`;
183
- }
184
- restoredLabels!.add(key);
185
- restored++;
186
- messages.push(`Restored ${type}:${label} from table wrapper`);
187
- return `![${entry.caption}](${entry.path}){#${type}:${label}}`;
188
- }
189
- return match;
190
- });
191
-
192
- // Clean up empty table structures
193
- result = result.replace(/\|\s*\|\s*\n\|:--:\|\s*\n/g, '');
194
-
195
- // Fix "Figure N:" standalone lines
196
- result = result.replace(captionPatterns[1], (match, prefix, num, caption) => {
197
- const numKey = `fig:${num}`;
198
- const entry = registry.byNumber.get(numKey);
199
- if (entry) {
200
- const labelKey = `fig:${entry.label}`;
201
- if (restoredLabels!.has(labelKey)) {
202
- messages.push(`Skipped duplicate Figure ${num} (already restored)`);
203
- return `![${entry.caption}](${entry.path})`;
204
- }
205
- restoredLabels!.add(labelKey);
206
- restored++;
207
- messages.push(`Restored Figure ${num} by number lookup`);
208
- return `![${entry.caption}](${entry.path}){#fig:${entry.label}}`;
209
- }
210
- return match;
211
- });
212
-
213
- // Fix generic media paths by matching caption text
214
- const genericImagePattern = /!\[([^\]]*)\]\(media\/[^)]+\)/g;
215
- result = result.replace(genericImagePattern, (match, caption) => {
216
- if (!caption || caption.trim() === '') {
217
- return match;
218
- }
219
-
220
- const captionKey = caption.slice(0, 50).toLowerCase().trim();
221
- const entry = registry.byCaption.get(captionKey);
222
- if (entry) {
223
- const labelKey = entry.label ? `${entry.type}:${entry.label}` : null;
224
- if (labelKey && restoredLabels!.has(labelKey)) {
225
- messages.push(`Skipped duplicate by caption match: ${captionKey.slice(0, 30)}...`);
226
- return `![${entry.caption}](${entry.path})`;
227
- }
228
- if (labelKey) {
229
- restoredLabels!.add(labelKey);
230
- }
231
- restored++;
232
- messages.push(`Restored image by caption match: ${captionKey.slice(0, 30)}...`);
233
- const anchor = (entry.label && !restoredLabels!.has(labelKey!)) ? `{#${entry.type}:${entry.label}}` : '';
234
- return `![${entry.caption}](${entry.path})${anchor}`;
235
- }
236
- return match;
237
- });
238
-
239
- return { text: result, restored, messages };
240
- }
1
+ /**
2
+ * Post-extraction reference restoration and comment parsing
3
+ */
4
+
5
+ import { readImageRegistry } from './image-registry.js';
6
+
7
+ // ============================================
8
+ // Type Definitions
9
+ // ============================================
10
+
11
+ export interface RestoreCrossrefResult {
12
+ text: string;
13
+ restored: number;
14
+ messages: string[];
15
+ restoredLabels: Set<string>;
16
+ }
17
+
18
+ export interface RestoreImagesResult {
19
+ text: string;
20
+ restored: number;
21
+ messages: string[];
22
+ }
23
+
24
+ // ============================================
25
+ // Functions
26
+ // ============================================
27
+
28
+ /**
29
+ * Parse visible comment markers from Word text
30
+ */
31
+ export function parseVisibleComments(text: string): Array<{ author: string; text: string; position: number }> {
32
+ const comments: Array<{ author: string; text: string; position: number }> = [];
33
+ const pattern = /\[([^\]:]+):\s*([^\]]+)\]/g;
34
+
35
+ let match;
36
+ while ((match = pattern.exec(text)) !== null) {
37
+ comments.push({
38
+ author: match[1].trim(),
39
+ text: match[2].trim(),
40
+ position: match.index,
41
+ });
42
+ }
43
+
44
+ return comments;
45
+ }
46
+
47
+ /**
48
+ * Convert visible comments to CriticMarkup format
49
+ */
50
+ export function convertVisibleComments(text: string): string {
51
+ return text.replace(/\[([^\]:]+):\s*([^\]]+)\]/g, '{>>$1: $2<<}');
52
+ }
53
+
54
+ /**
55
+ * Restore pandoc-crossref figure/table references from Word-rendered format
56
+ */
57
+ export function restoreCrossrefFromWord(
58
+ text: string,
59
+ projectDir: string,
60
+ restoredLabels: Set<string> | null = null
61
+ ): RestoreCrossrefResult {
62
+ const messages: string[] = [];
63
+ let restored = 0;
64
+ let result = text;
65
+
66
+ const registry = readImageRegistry(projectDir);
67
+
68
+ if (!restoredLabels) {
69
+ restoredLabels = new Set<string>();
70
+ }
71
+
72
+ // Pattern 1: [Figure]{.mark} [N]{.mark}
73
+ result = result.replace(/\[(Figure|Table|Fig\.?)\]\{\.mark\}\s*\[(\d+|S\d+)\]\{\.mark\}/gi, (match, type, num) => {
74
+ const prefix = type.toLowerCase().startsWith('tab') ? 'tbl' : 'fig';
75
+ if (registry) {
76
+ const entry = registry.byNumber?.get(`${prefix}:${num}`);
77
+ if (entry && entry.label) {
78
+ restored++;
79
+ return `@${prefix}:${entry.label}`;
80
+ }
81
+ }
82
+ restored++;
83
+ messages.push(`Restored ${type} ${num} (no label found, using placeholder)`);
84
+ return `@${prefix}:fig${num}`;
85
+ });
86
+
87
+ // Pattern 2: Plain "Figure N" or "Fig. N"
88
+ result = result.replace(/(?<!!)\b(Figure|Fig\.?|Table|Tbl\.?)\s+(\d+|S\d+)\b(?!\s*:)/gi, (match, type, num) => {
89
+ const prefix = type.toLowerCase().startsWith('tab') ? 'tbl' : 'fig';
90
+ if (registry) {
91
+ const entry = registry.byNumber?.get(`${prefix}:${num}`);
92
+ if (entry && entry.label) {
93
+ restored++;
94
+ return `@${prefix}:${entry.label}`;
95
+ }
96
+ }
97
+ return match;
98
+ });
99
+
100
+ // Pattern 3: Remove duplicate plain-text captions
101
+ result = result.replace(/(\!\[[^\]]+\]\([^)]+\)(?:\{[^}]*\})?)\s*\n+\s*(?:Figure|Fig\.?|Table|Tbl\.?)\s+\d+[:\.]?\s*[^\n]+/gi, '$1');
102
+
103
+ // Pattern 4: Clean up image captions that start with "Figure N: "
104
+ result = result.replace(/!\[(Figure|Fig\.?|Table|Tbl\.?)\s+(\d+|S\d+)[:\.]?\s*([^\]]*)\]\(([^)]+)\)(?:\{[^}]*\})?/gi,
105
+ (match, type, num, caption, imgPath) => {
106
+ const prefix = type.toLowerCase().startsWith('tab') ? 'tbl' : 'fig';
107
+ const labelKey = `${prefix}:${num}`;
108
+
109
+ if (registry) {
110
+ const entry = registry.byNumber?.get(labelKey);
111
+ if (entry) {
112
+ if (restoredLabels!.has(labelKey)) {
113
+ messages.push(`Skipped duplicate ${prefix}:${entry.label} (already restored)`);
114
+ return `![${entry.caption}](${entry.path})`;
115
+ }
116
+ restoredLabels!.add(labelKey);
117
+ restored++;
118
+ messages.push(`Restored image ${prefix}:${entry.label} from Figure ${num}`);
119
+ return `![${entry.caption}](${entry.path}){#${prefix}:${entry.label}}`;
120
+ }
121
+ }
122
+ const cleanCaption = caption.trim();
123
+ return `![${cleanCaption}](${imgPath})`;
124
+ });
125
+
126
+ return { text: result, restored, messages, restoredLabels };
127
+ }
128
+
129
+ /**
130
+ * Restore proper markdown image syntax from Word-extracted text using image registry
131
+ */
132
+ export function restoreImagesFromRegistry(
133
+ text: string,
134
+ projectDir: string,
135
+ restoredLabels: Set<string> | null = null
136
+ ): RestoreImagesResult {
137
+ const messages: string[] = [];
138
+ let restored = 0;
139
+
140
+ const registry = readImageRegistry(projectDir);
141
+ if (!registry || !registry.figures || registry.figures.length === 0) {
142
+ return { text, restored: 0, messages: ['No image registry found'] };
143
+ }
144
+
145
+ if (!restoredLabels) {
146
+ restoredLabels = new Set<string>();
147
+ }
148
+
149
+ let result = text;
150
+
151
+ // Pattern 1: Caption-like text
152
+ const captionPatterns = [
153
+ /@(fig|tbl):([a-zA-Z0-9_-]+):\s*([^\n]+)/gi,
154
+ /^(Figure|Fig\.?)\s+(\d+|S\d+)[.:]\s*([^\n]+)/gim,
155
+ /\|\s*@(fig|tbl):([a-zA-Z0-9_-]+):\s*([^|]+)\s*\|/gi,
156
+ ];
157
+
158
+ // Fix @fig:label: caption patterns
159
+ result = result.replace(captionPatterns[0], (match, type, label, caption) => {
160
+ const key = `${type}:${label}`;
161
+ const entry = registry.byLabel.get(key);
162
+ if (entry) {
163
+ if (restoredLabels!.has(key)) {
164
+ messages.push(`Skipped duplicate ${key} (already restored)`);
165
+ return `![${entry.caption}](${entry.path})`;
166
+ }
167
+ restoredLabels!.add(key);
168
+ restored++;
169
+ messages.push(`Restored ${type}:${label} from registry`);
170
+ return `![${entry.caption}](${entry.path}){#${type}:${label}}`;
171
+ }
172
+ return match;
173
+ });
174
+
175
+ // Fix table-wrapped captions
176
+ result = result.replace(captionPatterns[2], (match, type, label, caption) => {
177
+ const key = `${type}:${label}`;
178
+ const entry = registry.byLabel.get(key);
179
+ if (entry) {
180
+ if (restoredLabels!.has(key)) {
181
+ messages.push(`Skipped duplicate ${key} from table wrapper`);
182
+ return `![${entry.caption}](${entry.path})`;
183
+ }
184
+ restoredLabels!.add(key);
185
+ restored++;
186
+ messages.push(`Restored ${type}:${label} from table wrapper`);
187
+ return `![${entry.caption}](${entry.path}){#${type}:${label}}`;
188
+ }
189
+ return match;
190
+ });
191
+
192
+ // Clean up empty table structures
193
+ result = result.replace(/\|\s*\|\s*\n\|:--:\|\s*\n/g, '');
194
+
195
+ // Fix "Figure N:" standalone lines
196
+ result = result.replace(captionPatterns[1], (match, prefix, num, caption) => {
197
+ const numKey = `fig:${num}`;
198
+ const entry = registry.byNumber.get(numKey);
199
+ if (entry) {
200
+ const labelKey = `fig:${entry.label}`;
201
+ if (restoredLabels!.has(labelKey)) {
202
+ messages.push(`Skipped duplicate Figure ${num} (already restored)`);
203
+ return `![${entry.caption}](${entry.path})`;
204
+ }
205
+ restoredLabels!.add(labelKey);
206
+ restored++;
207
+ messages.push(`Restored Figure ${num} by number lookup`);
208
+ return `![${entry.caption}](${entry.path}){#fig:${entry.label}}`;
209
+ }
210
+ return match;
211
+ });
212
+
213
+ // Fix generic media paths by matching caption text
214
+ const genericImagePattern = /!\[([^\]]*)\]\(media\/[^)]+\)/g;
215
+ result = result.replace(genericImagePattern, (match, caption) => {
216
+ if (!caption || caption.trim() === '') {
217
+ return match;
218
+ }
219
+
220
+ const captionKey = caption.slice(0, 50).toLowerCase().trim();
221
+ const entry = registry.byCaption.get(captionKey);
222
+ if (entry) {
223
+ const labelKey = entry.label ? `${entry.type}:${entry.label}` : null;
224
+ if (labelKey && restoredLabels!.has(labelKey)) {
225
+ messages.push(`Skipped duplicate by caption match: ${captionKey.slice(0, 30)}...`);
226
+ return `![${entry.caption}](${entry.path})`;
227
+ }
228
+ if (labelKey) {
229
+ restoredLabels!.add(labelKey);
230
+ }
231
+ restored++;
232
+ messages.push(`Restored image by caption match: ${captionKey.slice(0, 30)}...`);
233
+ const anchor = (entry.label && !restoredLabels!.has(labelKey!)) ? `{#${entry.type}:${entry.label}}` : '';
234
+ return `![${entry.caption}](${entry.path})${anchor}`;
235
+ }
236
+ return match;
237
+ });
238
+
239
+ return { text: result, restored, messages };
240
+ }