docrev 0.10.0 → 0.10.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (126) hide show
  1. package/.gitattributes +1 -1
  2. package/CHANGELOG.md +173 -164
  3. package/PLAN-tables-and-postprocess.md +850 -850
  4. package/README.md +431 -431
  5. package/bin/rev.js +11 -11
  6. package/bin/rev.ts +145 -145
  7. package/completions/rev.bash +127 -127
  8. package/completions/rev.ps1 +210 -210
  9. package/completions/rev.zsh +207 -207
  10. package/dist/lib/anchor-match.d.ts +1 -1
  11. package/dist/lib/anchor-match.d.ts.map +1 -1
  12. package/dist/lib/anchor-match.js +17 -47
  13. package/dist/lib/anchor-match.js.map +1 -1
  14. package/dist/lib/build.js +4 -4
  15. package/dist/lib/commands/context.d.ts +1 -1
  16. package/dist/lib/commands/context.d.ts.map +1 -1
  17. package/dist/lib/commands/context.js +1 -1
  18. package/dist/lib/commands/context.js.map +1 -1
  19. package/dist/lib/commands/sections.js +7 -7
  20. package/dist/lib/commands/sections.js.map +1 -1
  21. package/dist/lib/commands/sync.d.ts.map +1 -1
  22. package/dist/lib/commands/sync.js +15 -14
  23. package/dist/lib/commands/sync.js.map +1 -1
  24. package/dist/lib/commands/utilities.js +164 -164
  25. package/dist/lib/commands/verify-anchors.js +6 -6
  26. package/dist/lib/commands/verify-anchors.js.map +1 -1
  27. package/dist/lib/commands/word-tools.js +8 -8
  28. package/dist/lib/grammar.js +3 -3
  29. package/dist/lib/macro-filter.lua +201 -201
  30. package/dist/lib/pdf-comments.js +44 -44
  31. package/dist/lib/plugins.js +57 -57
  32. package/dist/lib/pptx-color-filter.lua +37 -37
  33. package/dist/lib/pptx-themes.js +115 -115
  34. package/dist/lib/sections.d.ts +35 -0
  35. package/dist/lib/sections.d.ts.map +1 -1
  36. package/dist/lib/sections.js +81 -0
  37. package/dist/lib/sections.js.map +1 -1
  38. package/dist/lib/spelling.js +2 -2
  39. package/dist/lib/templates.js +387 -387
  40. package/dist/lib/themes.js +51 -51
  41. package/docs-src/build.py +113 -113
  42. package/docs-src/extra.css +208 -208
  43. package/docs-src/md-to-html.lua +6 -6
  44. package/docs-src/template.html +116 -116
  45. package/eslint.config.js +27 -27
  46. package/lib/anchor-match.ts +276 -308
  47. package/lib/annotations.ts +644 -644
  48. package/lib/build.ts +1766 -1766
  49. package/lib/citations.ts +160 -160
  50. package/lib/commands/build.ts +855 -855
  51. package/lib/commands/citations.ts +515 -515
  52. package/lib/commands/comments.ts +1050 -1050
  53. package/lib/commands/context.ts +176 -174
  54. package/lib/commands/core.ts +309 -309
  55. package/lib/commands/doi.ts +435 -435
  56. package/lib/commands/file-ops.ts +372 -372
  57. package/lib/commands/history.ts +320 -320
  58. package/lib/commands/index.ts +87 -87
  59. package/lib/commands/init.ts +259 -259
  60. package/lib/commands/merge-resolve.ts +378 -378
  61. package/lib/commands/preview.ts +178 -178
  62. package/lib/commands/project-info.ts +244 -244
  63. package/lib/commands/quality.ts +517 -517
  64. package/lib/commands/response.ts +454 -454
  65. package/lib/commands/section-boundaries.ts +82 -82
  66. package/lib/commands/sections.ts +451 -451
  67. package/lib/commands/sync.ts +709 -706
  68. package/lib/commands/text-ops.ts +449 -449
  69. package/lib/commands/utilities.ts +448 -448
  70. package/lib/commands/verify-anchors.ts +272 -272
  71. package/lib/commands/word-tools.ts +340 -340
  72. package/lib/comment-realign.ts +517 -517
  73. package/lib/config.ts +84 -84
  74. package/lib/crossref.ts +781 -781
  75. package/lib/csl.ts +191 -191
  76. package/lib/dependencies.ts +98 -98
  77. package/lib/diff-engine.ts +465 -465
  78. package/lib/doi-cache.ts +115 -115
  79. package/lib/doi.ts +897 -897
  80. package/lib/equations.ts +506 -506
  81. package/lib/errors.ts +346 -346
  82. package/lib/format.ts +541 -541
  83. package/lib/git.ts +326 -326
  84. package/lib/grammar.ts +303 -303
  85. package/lib/image-registry.ts +180 -180
  86. package/lib/import.ts +911 -911
  87. package/lib/journals.ts +543 -543
  88. package/lib/macro-filter.lua +201 -201
  89. package/lib/macros.ts +273 -273
  90. package/lib/merge.ts +633 -633
  91. package/lib/orcid.ts +144 -144
  92. package/lib/pdf-comments.ts +263 -263
  93. package/lib/pdf-import.ts +524 -524
  94. package/lib/plugins.ts +362 -362
  95. package/lib/postprocess.ts +188 -188
  96. package/lib/pptx-color-filter.lua +37 -37
  97. package/lib/pptx-template.ts +469 -469
  98. package/lib/pptx-themes.ts +483 -483
  99. package/lib/protect-restore.ts +520 -520
  100. package/lib/rate-limiter.ts +94 -94
  101. package/lib/response.ts +197 -197
  102. package/lib/restore-references.ts +240 -240
  103. package/lib/review.ts +327 -327
  104. package/lib/schema.ts +488 -488
  105. package/lib/scientific-words.ts +73 -73
  106. package/lib/sections.ts +425 -335
  107. package/lib/slides.ts +756 -756
  108. package/lib/spelling.ts +334 -334
  109. package/lib/templates.ts +526 -526
  110. package/lib/themes.ts +742 -742
  111. package/lib/trackchanges.ts +247 -247
  112. package/lib/tui.ts +450 -450
  113. package/lib/types.ts +550 -550
  114. package/lib/undo.ts +250 -250
  115. package/lib/utils.ts +69 -69
  116. package/lib/variables.ts +179 -179
  117. package/lib/word-extraction.ts +806 -806
  118. package/lib/word.ts +643 -643
  119. package/lib/wordcomments.ts +840 -840
  120. package/mkdocs.yml +64 -64
  121. package/package.json +137 -137
  122. package/scripts/postbuild.js +47 -47
  123. package/skill/REFERENCE.md +539 -539
  124. package/skill/SKILL.md +295 -295
  125. package/tsconfig.json +26 -26
  126. package/types/index.d.ts +525 -525
@@ -1,240 +1,240 @@
1
- /**
2
- * Post-extraction reference restoration and comment parsing
3
- */
4
-
5
- import { readImageRegistry } from './image-registry.js';
6
-
7
- // ============================================
8
- // Type Definitions
9
- // ============================================
10
-
11
- export interface RestoreCrossrefResult {
12
- text: string;
13
- restored: number;
14
- messages: string[];
15
- restoredLabels: Set<string>;
16
- }
17
-
18
- export interface RestoreImagesResult {
19
- text: string;
20
- restored: number;
21
- messages: string[];
22
- }
23
-
24
- // ============================================
25
- // Functions
26
- // ============================================
27
-
28
- /**
29
- * Parse visible comment markers from Word text
30
- */
31
- export function parseVisibleComments(text: string): Array<{ author: string; text: string; position: number }> {
32
- const comments: Array<{ author: string; text: string; position: number }> = [];
33
- const pattern = /\[([^\]:]+):\s*([^\]]+)\]/g;
34
-
35
- let match;
36
- while ((match = pattern.exec(text)) !== null) {
37
- comments.push({
38
- author: match[1].trim(),
39
- text: match[2].trim(),
40
- position: match.index,
41
- });
42
- }
43
-
44
- return comments;
45
- }
46
-
47
- /**
48
- * Convert visible comments to CriticMarkup format
49
- */
50
- export function convertVisibleComments(text: string): string {
51
- return text.replace(/\[([^\]:]+):\s*([^\]]+)\]/g, '{>>$1: $2<<}');
52
- }
53
-
54
- /**
55
- * Restore pandoc-crossref figure/table references from Word-rendered format
56
- */
57
- export function restoreCrossrefFromWord(
58
- text: string,
59
- projectDir: string,
60
- restoredLabels: Set<string> | null = null
61
- ): RestoreCrossrefResult {
62
- const messages: string[] = [];
63
- let restored = 0;
64
- let result = text;
65
-
66
- const registry = readImageRegistry(projectDir);
67
-
68
- if (!restoredLabels) {
69
- restoredLabels = new Set<string>();
70
- }
71
-
72
- // Pattern 1: [Figure]{.mark} [N]{.mark}
73
- result = result.replace(/\[(Figure|Table|Fig\.?)\]\{\.mark\}\s*\[(\d+|S\d+)\]\{\.mark\}/gi, (match, type, num) => {
74
- const prefix = type.toLowerCase().startsWith('tab') ? 'tbl' : 'fig';
75
- if (registry) {
76
- const entry = registry.byNumber?.get(`${prefix}:${num}`);
77
- if (entry && entry.label) {
78
- restored++;
79
- return `@${prefix}:${entry.label}`;
80
- }
81
- }
82
- restored++;
83
- messages.push(`Restored ${type} ${num} (no label found, using placeholder)`);
84
- return `@${prefix}:fig${num}`;
85
- });
86
-
87
- // Pattern 2: Plain "Figure N" or "Fig. N"
88
- result = result.replace(/(?<!!)\b(Figure|Fig\.?|Table|Tbl\.?)\s+(\d+|S\d+)\b(?!\s*:)/gi, (match, type, num) => {
89
- const prefix = type.toLowerCase().startsWith('tab') ? 'tbl' : 'fig';
90
- if (registry) {
91
- const entry = registry.byNumber?.get(`${prefix}:${num}`);
92
- if (entry && entry.label) {
93
- restored++;
94
- return `@${prefix}:${entry.label}`;
95
- }
96
- }
97
- return match;
98
- });
99
-
100
- // Pattern 3: Remove duplicate plain-text captions
101
- result = result.replace(/(\!\[[^\]]+\]\([^)]+\)(?:\{[^}]*\})?)\s*\n+\s*(?:Figure|Fig\.?|Table|Tbl\.?)\s+\d+[:\.]?\s*[^\n]+/gi, '$1');
102
-
103
- // Pattern 4: Clean up image captions that start with "Figure N: "
104
- result = result.replace(/!\[(Figure|Fig\.?|Table|Tbl\.?)\s+(\d+|S\d+)[:\.]?\s*([^\]]*)\]\(([^)]+)\)(?:\{[^}]*\})?/gi,
105
- (match, type, num, caption, imgPath) => {
106
- const prefix = type.toLowerCase().startsWith('tab') ? 'tbl' : 'fig';
107
- const labelKey = `${prefix}:${num}`;
108
-
109
- if (registry) {
110
- const entry = registry.byNumber?.get(labelKey);
111
- if (entry) {
112
- if (restoredLabels!.has(labelKey)) {
113
- messages.push(`Skipped duplicate ${prefix}:${entry.label} (already restored)`);
114
- return `![${entry.caption}](${entry.path})`;
115
- }
116
- restoredLabels!.add(labelKey);
117
- restored++;
118
- messages.push(`Restored image ${prefix}:${entry.label} from Figure ${num}`);
119
- return `![${entry.caption}](${entry.path}){#${prefix}:${entry.label}}`;
120
- }
121
- }
122
- const cleanCaption = caption.trim();
123
- return `![${cleanCaption}](${imgPath})`;
124
- });
125
-
126
- return { text: result, restored, messages, restoredLabels };
127
- }
128
-
129
- /**
130
- * Restore proper markdown image syntax from Word-extracted text using image registry
131
- */
132
- export function restoreImagesFromRegistry(
133
- text: string,
134
- projectDir: string,
135
- restoredLabels: Set<string> | null = null
136
- ): RestoreImagesResult {
137
- const messages: string[] = [];
138
- let restored = 0;
139
-
140
- const registry = readImageRegistry(projectDir);
141
- if (!registry || !registry.figures || registry.figures.length === 0) {
142
- return { text, restored: 0, messages: ['No image registry found'] };
143
- }
144
-
145
- if (!restoredLabels) {
146
- restoredLabels = new Set<string>();
147
- }
148
-
149
- let result = text;
150
-
151
- // Pattern 1: Caption-like text
152
- const captionPatterns = [
153
- /@(fig|tbl):([a-zA-Z0-9_-]+):\s*([^\n]+)/gi,
154
- /^(Figure|Fig\.?)\s+(\d+|S\d+)[.:]\s*([^\n]+)/gim,
155
- /\|\s*@(fig|tbl):([a-zA-Z0-9_-]+):\s*([^|]+)\s*\|/gi,
156
- ];
157
-
158
- // Fix @fig:label: caption patterns
159
- result = result.replace(captionPatterns[0], (match, type, label, caption) => {
160
- const key = `${type}:${label}`;
161
- const entry = registry.byLabel.get(key);
162
- if (entry) {
163
- if (restoredLabels!.has(key)) {
164
- messages.push(`Skipped duplicate ${key} (already restored)`);
165
- return `![${entry.caption}](${entry.path})`;
166
- }
167
- restoredLabels!.add(key);
168
- restored++;
169
- messages.push(`Restored ${type}:${label} from registry`);
170
- return `![${entry.caption}](${entry.path}){#${type}:${label}}`;
171
- }
172
- return match;
173
- });
174
-
175
- // Fix table-wrapped captions
176
- result = result.replace(captionPatterns[2], (match, type, label, caption) => {
177
- const key = `${type}:${label}`;
178
- const entry = registry.byLabel.get(key);
179
- if (entry) {
180
- if (restoredLabels!.has(key)) {
181
- messages.push(`Skipped duplicate ${key} from table wrapper`);
182
- return `![${entry.caption}](${entry.path})`;
183
- }
184
- restoredLabels!.add(key);
185
- restored++;
186
- messages.push(`Restored ${type}:${label} from table wrapper`);
187
- return `![${entry.caption}](${entry.path}){#${type}:${label}}`;
188
- }
189
- return match;
190
- });
191
-
192
- // Clean up empty table structures
193
- result = result.replace(/\|\s*\|\s*\n\|:--:\|\s*\n/g, '');
194
-
195
- // Fix "Figure N:" standalone lines
196
- result = result.replace(captionPatterns[1], (match, prefix, num, caption) => {
197
- const numKey = `fig:${num}`;
198
- const entry = registry.byNumber.get(numKey);
199
- if (entry) {
200
- const labelKey = `fig:${entry.label}`;
201
- if (restoredLabels!.has(labelKey)) {
202
- messages.push(`Skipped duplicate Figure ${num} (already restored)`);
203
- return `![${entry.caption}](${entry.path})`;
204
- }
205
- restoredLabels!.add(labelKey);
206
- restored++;
207
- messages.push(`Restored Figure ${num} by number lookup`);
208
- return `![${entry.caption}](${entry.path}){#fig:${entry.label}}`;
209
- }
210
- return match;
211
- });
212
-
213
- // Fix generic media paths by matching caption text
214
- const genericImagePattern = /!\[([^\]]*)\]\(media\/[^)]+\)/g;
215
- result = result.replace(genericImagePattern, (match, caption) => {
216
- if (!caption || caption.trim() === '') {
217
- return match;
218
- }
219
-
220
- const captionKey = caption.slice(0, 50).toLowerCase().trim();
221
- const entry = registry.byCaption.get(captionKey);
222
- if (entry) {
223
- const labelKey = entry.label ? `${entry.type}:${entry.label}` : null;
224
- if (labelKey && restoredLabels!.has(labelKey)) {
225
- messages.push(`Skipped duplicate by caption match: ${captionKey.slice(0, 30)}...`);
226
- return `![${entry.caption}](${entry.path})`;
227
- }
228
- if (labelKey) {
229
- restoredLabels!.add(labelKey);
230
- }
231
- restored++;
232
- messages.push(`Restored image by caption match: ${captionKey.slice(0, 30)}...`);
233
- const anchor = (entry.label && !restoredLabels!.has(labelKey!)) ? `{#${entry.type}:${entry.label}}` : '';
234
- return `![${entry.caption}](${entry.path})${anchor}`;
235
- }
236
- return match;
237
- });
238
-
239
- return { text: result, restored, messages };
240
- }
1
+ /**
2
+ * Post-extraction reference restoration and comment parsing
3
+ */
4
+
5
+ import { readImageRegistry } from './image-registry.js';
6
+
7
+ // ============================================
8
+ // Type Definitions
9
+ // ============================================
10
+
/**
 * Outcome of `restoreCrossrefFromWord`.
 */
export interface RestoreCrossrefResult {
  /** The input text after all reference/caption rewrites have been applied. */
  text: string;

  /** Human-readable notes pushed while rewriting (placeholders used, duplicates skipped, images restored). */
  messages: string[];

  /** Number of replacements that were counted as a restoration. */
  restored: number;

  /** Dedupe keys of images that received an anchor; the same Set that was passed in, or a fresh one. */
  restoredLabels: Set<string>;
}
17
+
/**
 * Outcome of `restoreImagesFromRegistry`.
 */
export interface RestoreImagesResult {
  /** The input text after image restoration (unchanged when no registry is available). */
  text: string;

  /** Human-readable notes pushed while restoring (or a single "no registry" note). */
  messages: string[];

  /** Number of images that were counted as restored. */
  restored: number;
}
23
+
24
+ // ============================================
25
+ // Functions
26
+ // ============================================
27
+
/**
 * Collect every visible `[Author: comment]` marker found in Word-extracted text.
 *
 * @param text - Text to scan.
 * @returns One record per marker, in order of appearance. `author` and `text`
 *   are whitespace-trimmed; `position` is the offset of the opening `[`.
 */
export function parseVisibleComments(text: string): Array<{ author: string; text: string; position: number }> {
  // `[` author (no `]` or `:`) `:` optional whitespace, body (no `]`) `]`
  const markerRe = /\[([^\]:]+):\s*([^\]]+)\]/g;
  const found: Array<{ author: string; text: string; position: number }> = [];

  // The regex literal is created per call, so its stateful lastIndex always starts at 0.
  for (let hit = markerRe.exec(text); hit !== null; hit = markerRe.exec(text)) {
    const [, rawAuthor, rawBody] = hit;
    found.push({
      author: rawAuthor.trim(),
      text: rawBody.trim(),
      position: hit.index,
    });
  }

  return found;
}
46
+
/**
 * Rewrite visible `[Author: comment]` markers as CriticMarkup comments
 * (`{>>Author: comment<<}`).
 *
 * The captured author and comment text are inserted as matched (not trimmed).
 *
 * @param text - Text containing visible comment markers.
 * @returns The text with every marker converted.
 */
export function convertVisibleComments(text: string): string {
  const markerRe = /\[([^\]:]+):\s*([^\]]+)\]/g;
  const toCritic = (_whole: string, author: string, body: string): string => `{>>${author}: ${body}<<}`;
  return text.replace(markerRe, toCritic);
}
53
+
/**
 * Restore pandoc-crossref figure/table references from Word-rendered format.
 *
 * Four rewrites run in order over `text`:
 *  1. `[Figure]{.mark} [N]{.mark}` pairs become `@fig:<label>` / `@tbl:<label>`
 *     (or a placeholder reference when the registry has no label).
 *  2. Plain "Figure N" / "Fig. N" / "Table N" / "Tbl. N" mentions become
 *     `@prefix:<label>` when the registry knows the number.
 *  3. A plain-text "Figure N ..." line directly following an image is dropped.
 *  4. Images whose alt text starts with "Figure N:" are rebuilt from the
 *     registry entry, or just stripped of the "Figure N:" lead-in.
 *
 * @param text - Markdown extracted from Word.
 * @param projectDir - Directory passed to `readImageRegistry`.
 * @param restoredLabels - Optional shared dedupe set; it is mutated in place so
 *   that callers can thread it through several restoration passes.
 * @returns The rewritten text, the restoration count, notes, and the dedupe set.
 */
export function restoreCrossrefFromWord(
  text: string,
  projectDir: string,
  restoredLabels: Set<string> | null = null
): RestoreCrossrefResult {
  const messages: string[] = [];
  let restored = 0;

  const registry = readImageRegistry(projectDir);
  const labels = restoredLabels ?? new Set<string>();

  // Every accepted type word is Figure/Fig/Table/Tbl, so the first letter decides.
  // (Testing for 'tab' would classify "Tbl." as a figure.)
  const prefixFor = (type: string): 'fig' | 'tbl' =>
    type.toLowerCase().startsWith('t') ? 'tbl' : 'fig';

  // Pattern 1: [Figure]{.mark} [N]{.mark}
  let result = text.replace(
    /\[(Figure|Table|Fig\.?)\]\{\.mark\}\s*\[(\d+|S\d+)\]\{\.mark\}/gi,
    (_match: string, type: string, num: string) => {
      const prefix = prefixFor(type);
      const entry = registry?.byNumber?.get(`${prefix}:${num}`);
      restored++;
      if (entry?.label) {
        return `@${prefix}:${entry.label}`;
      }
      messages.push(`Restored ${type} ${num} (no label found, using placeholder)`);
      // The placeholder label is `fig<N>` for figures and tables alike.
      return `@${prefix}:fig${num}`;
    }
  );

  // Pattern 2: Plain "Figure N" or "Fig. N".
  // The lookbehind skips mentions that open an image's alt text (`![Figure N ...`)
  // so Pattern 4 can handle them; the lookahead skips "Figure N:" caption lead-ins.
  result = result.replace(
    /(?<!!\[)\b(Figure|Fig\.?|Table|Tbl\.?)\s+(\d+|S\d+)\b(?!\s*:)/gi,
    (match: string, type: string, num: string) => {
      const prefix = prefixFor(type);
      const entry = registry?.byNumber?.get(`${prefix}:${num}`);
      if (entry?.label) {
        restored++;
        return `@${prefix}:${entry.label}`;
      }
      return match;
    }
  );

  // Pattern 3: Remove duplicate plain-text captions that directly follow an image
  result = result.replace(
    /(\!\[[^\]]+\]\([^)]+\)(?:\{[^}]*\})?)\s*\n+\s*(?:Figure|Fig\.?|Table|Tbl\.?)\s+\d+[:\.]?\s*[^\n]+/gi,
    '$1'
  );

  // Pattern 4: Clean up image captions that start with "Figure N: "
  result = result.replace(
    /!\[(Figure|Fig\.?|Table|Tbl\.?)\s+(\d+|S\d+)[:\.]?\s*([^\]]*)\]\(([^)]+)\)(?:\{[^}]*\})?/gi,
    (_match: string, type: string, num: string, caption: string, imgPath: string) => {
      const prefix = prefixFor(type);
      const numberKey = `${prefix}:${num}`;
      const entry = registry?.byNumber?.get(numberKey);

      if (!entry) {
        return `![${caption.trim()}](${imgPath})`;
      }

      // Dedupe on `prefix:label` (the key format restoreImagesFromRegistry uses) so a
      // shared set works across both passes; fall back to the number for unlabeled entries.
      const dedupeKey = entry.label ? `${prefix}:${entry.label}` : numberKey;
      if (labels.has(dedupeKey)) {
        messages.push(`Skipped duplicate ${prefix}:${entry.label} (already restored)`);
        return `![${entry.caption}](${entry.path})`;
      }

      labels.add(dedupeKey);
      restored++;
      messages.push(`Restored image ${prefix}:${entry.label} from Figure ${num}`);
      return `![${entry.caption}](${entry.path}){#${prefix}:${entry.label}}`;
    }
  );

  return { text: result, restored, messages, restoredLabels: labels };
}
128
+
/**
 * Restore proper markdown image syntax from Word-extracted text using the image registry.
 *
 * Rewrites, in order:
 *  1. Table-wrapped captions `| @fig:label: caption |`.
 *  2. Bare captions `@fig:label: caption`.
 *  3. Leftover empty one-cell table scaffolding.
 *  4. Standalone "Figure N: caption" lines (looked up by number).
 *  5. `![caption](media/...)` images, matched by the first 50 characters of the
 *     caption (lowercased, trimmed).
 *
 * The first time a label is restored the image gets a `{#type:label}` anchor; later
 * occurrences of the same label are emitted without one.
 *
 * @param text - Markdown extracted from Word.
 * @param projectDir - Directory passed to `readImageRegistry`.
 * @param restoredLabels - Optional shared dedupe set of `type:label` keys; mutated in place.
 * @returns The rewritten text, the restoration count, and notes. When the registry is
 *   missing or has no figures, the text is returned unchanged with a single note.
 */
export function restoreImagesFromRegistry(
  text: string,
  projectDir: string,
  restoredLabels: Set<string> | null = null
): RestoreImagesResult {
  const registry = readImageRegistry(projectDir);
  if (!registry || !registry.figures || registry.figures.length === 0) {
    return { text, restored: 0, messages: ['No image registry found'] };
  }

  const messages: string[] = [];
  let restored = 0;
  const labels = restoredLabels ?? new Set<string>();

  // Shared replacer for the two `@type:label: caption` shapes; only the notes differ.
  const restoreByLabel = (skipNote: string, sourceNote: string) =>
    (match: string, type: string, label: string): string => {
      const key = `${type}:${label}`;
      const entry = registry.byLabel.get(key);
      if (!entry) {
        return match;
      }
      if (labels.has(key)) {
        messages.push(`Skipped duplicate ${key} ${skipNote}`);
        return `![${entry.caption}](${entry.path})`;
      }
      labels.add(key);
      restored++;
      messages.push(`Restored ${key} ${sourceNote}`);
      return `![${entry.caption}](${entry.path}){#${key}}`;
    };

  let result = text;

  // Fix table-wrapped captions. This must run before the bare pattern below: the bare
  // pattern consumes to end of line, so it would swallow the closing `|`, leave the
  // opening `| ` behind, and this branch would never see a known label.
  result = result.replace(
    /\|\s*@(fig|tbl):([a-zA-Z0-9_-]+):\s*([^|]+)\s*\|/gi,
    restoreByLabel('from table wrapper', 'from table wrapper')
  );

  // Fix @fig:label: caption patterns
  result = result.replace(
    /@(fig|tbl):([a-zA-Z0-9_-]+):\s*([^\n]+)/gi,
    restoreByLabel('(already restored)', 'from registry')
  );

  // Clean up empty table structures
  result = result.replace(/\|\s*\|\s*\n\|:--:\|\s*\n/g, '');

  // Fix "Figure N:" standalone lines
  result = result.replace(
    /^(Figure|Fig\.?)\s+(\d+|S\d+)[.:]\s*([^\n]+)/gim,
    (match: string, _kind: string, num: string) => {
      const entry = registry.byNumber.get(`fig:${num}`);
      if (!entry) {
        return match;
      }
      const labelKey = `fig:${entry.label}`;
      if (labels.has(labelKey)) {
        messages.push(`Skipped duplicate Figure ${num} (already restored)`);
        return `![${entry.caption}](${entry.path})`;
      }
      labels.add(labelKey);
      restored++;
      messages.push(`Restored Figure ${num} by number lookup`);
      return `![${entry.caption}](${entry.path}){#fig:${entry.label}}`;
    }
  );

  // Fix generic media paths by matching caption text
  result = result.replace(/!\[([^\]]*)\]\(media\/[^)]+\)/g, (match: string, caption: string) => {
    if (!caption || caption.trim() === '') {
      return match;
    }

    const captionKey = caption.slice(0, 50).toLowerCase().trim();
    const entry = registry.byCaption.get(captionKey);
    if (!entry) {
      return match;
    }

    const labelKey = entry.label ? `${entry.type}:${entry.label}` : null;
    if (labelKey && labels.has(labelKey)) {
      messages.push(`Skipped duplicate by caption match: ${captionKey.slice(0, 30)}...`);
      return `![${entry.caption}](${entry.path})`;
    }

    restored++;
    messages.push(`Restored image by caption match: ${captionKey.slice(0, 30)}...`);

    if (!labelKey) {
      return `![${entry.caption}](${entry.path})`;
    }
    // First restoration of this label: record it and attach the anchor. (Checking the
    // set only after adding the key would always suppress the anchor.)
    labels.add(labelKey);
    return `![${entry.caption}](${entry.path}){#${labelKey}}`;
  });

  return { text: result, restored, messages };
}