@beyondwork/docx-react-component 1.0.28 → 1.0.29

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (354) hide show
  1. package/dist/canonical-document-BLEbzL2J.d.cts +844 -0
  2. package/dist/canonical-document-BLEbzL2J.d.ts +844 -0
  3. package/dist/chunk-2FJS5GZM.js +763 -0
  4. package/dist/chunk-2FJS5GZM.js.map +1 -0
  5. package/{src/core/commands/section-layout-commands.ts → dist/chunk-2OQBZS3F.js} +106 -340
  6. package/dist/chunk-2OQBZS3F.js.map +1 -0
  7. package/dist/chunk-2S7W4KFO.js +127 -0
  8. package/dist/chunk-2S7W4KFO.js.map +1 -0
  9. package/dist/chunk-2TG72QSW.js +3874 -0
  10. package/dist/chunk-2TG72QSW.js.map +1 -0
  11. package/{src/core/commands/table-structure-commands.ts → dist/chunk-36QNIZBO.js} +126 -315
  12. package/dist/chunk-36QNIZBO.js.map +1 -0
  13. package/dist/chunk-4AQOYAW4.js +3069 -0
  14. package/dist/chunk-4AQOYAW4.js.map +1 -0
  15. package/dist/chunk-4D5EWJ3P.js +77 -0
  16. package/dist/chunk-4D5EWJ3P.js.map +1 -0
  17. package/dist/chunk-5FN54NDH.js +2257 -0
  18. package/dist/chunk-5FN54NDH.js.map +1 -0
  19. package/dist/chunk-BOYGQYRQ.js +7306 -0
  20. package/dist/chunk-BOYGQYRQ.js.map +1 -0
  21. package/dist/chunk-CN3XMECL.js +212 -0
  22. package/dist/chunk-CN3XMECL.js.map +1 -0
  23. package/dist/chunk-EBI3BX6U.js +164 -0
  24. package/dist/chunk-EBI3BX6U.js.map +1 -0
  25. package/dist/chunk-EILUG3VB.js +1275 -0
  26. package/dist/chunk-EILUG3VB.js.map +1 -0
  27. package/dist/chunk-FUDY333O.js +70 -0
  28. package/dist/chunk-FUDY333O.js.map +1 -0
  29. package/dist/chunk-GBVOWFIK.js +1237 -0
  30. package/dist/chunk-GBVOWFIK.js.map +1 -0
  31. package/dist/chunk-H4TQ3H3Y.js +262 -0
  32. package/dist/chunk-H4TQ3H3Y.js.map +1 -0
  33. package/{src/core/commands/style-commands.ts → dist/chunk-JGB3IXZO.js} +40 -113
  34. package/dist/chunk-JGB3IXZO.js.map +1 -0
  35. package/dist/chunk-KD2QRQPY.js +4342 -0
  36. package/dist/chunk-KD2QRQPY.js.map +1 -0
  37. package/dist/chunk-KLMXQVYK.js +369 -0
  38. package/dist/chunk-KLMXQVYK.js.map +1 -0
  39. package/dist/chunk-KZUG5KFQ.js +214 -0
  40. package/dist/chunk-KZUG5KFQ.js.map +1 -0
  41. package/{src/core/state/text-transaction.ts → dist/chunk-QDAQ4CJU.js} +79 -236
  42. package/dist/chunk-QDAQ4CJU.js.map +1 -0
  43. package/{src/legal/bookmarks.ts → dist/chunk-RMH72RZI.js} +44 -130
  44. package/dist/chunk-RMH72RZI.js.map +1 -0
  45. package/dist/chunk-SWKWQZXM.js +117 -0
  46. package/dist/chunk-SWKWQZXM.js.map +1 -0
  47. package/{src/core/commands/formatting-commands.ts → dist/chunk-TJBP2K4T.js} +196 -536
  48. package/dist/chunk-TJBP2K4T.js.map +1 -0
  49. package/dist/chunk-TLCEAQDQ.js +542 -0
  50. package/dist/chunk-TLCEAQDQ.js.map +1 -0
  51. package/{src/core/commands/text-commands.ts → dist/chunk-UZXBISGO.js} +86 -142
  52. package/dist/chunk-UZXBISGO.js.map +1 -0
  53. package/dist/chunk-WGBAKP3Q.js +3220 -0
  54. package/dist/chunk-WGBAKP3Q.js.map +1 -0
  55. package/dist/compare/index.cjs +5475 -0
  56. package/dist/compare/index.cjs.map +1 -0
  57. package/dist/compare/index.d.cts +114 -0
  58. package/dist/compare/index.d.ts +114 -0
  59. package/dist/compare/index.js +731 -0
  60. package/dist/compare/index.js.map +1 -0
  61. package/dist/core/commands/formatting-commands.cjs +828 -0
  62. package/dist/core/commands/formatting-commands.cjs.map +1 -0
  63. package/dist/core/commands/formatting-commands.d.cts +63 -0
  64. package/dist/core/commands/formatting-commands.d.ts +63 -0
  65. package/dist/core/commands/formatting-commands.js +37 -0
  66. package/dist/core/commands/formatting-commands.js.map +1 -0
  67. package/dist/core/commands/image-commands.cjs +2023 -0
  68. package/dist/core/commands/image-commands.cjs.map +1 -0
  69. package/dist/core/commands/image-commands.d.cts +58 -0
  70. package/dist/core/commands/image-commands.d.ts +58 -0
  71. package/dist/core/commands/image-commands.js +18 -0
  72. package/dist/core/commands/image-commands.js.map +1 -0
  73. package/dist/core/commands/section-layout-commands.cjs +477 -0
  74. package/dist/core/commands/section-layout-commands.cjs.map +1 -0
  75. package/dist/core/commands/section-layout-commands.d.cts +62 -0
  76. package/dist/core/commands/section-layout-commands.d.ts +62 -0
  77. package/dist/core/commands/section-layout-commands.js +21 -0
  78. package/dist/core/commands/section-layout-commands.js.map +1 -0
  79. package/dist/core/commands/style-commands.cjs +214 -0
  80. package/dist/core/commands/style-commands.cjs.map +1 -0
  81. package/dist/core/commands/style-commands.d.cts +13 -0
  82. package/dist/core/commands/style-commands.d.ts +13 -0
  83. package/dist/core/commands/style-commands.js +9 -0
  84. package/dist/core/commands/style-commands.js.map +1 -0
  85. package/dist/core/commands/table-structure-commands.cjs +1883 -0
  86. package/dist/core/commands/table-structure-commands.cjs.map +1 -0
  87. package/dist/core/commands/table-structure-commands.d.cts +59 -0
  88. package/dist/core/commands/table-structure-commands.d.ts +59 -0
  89. package/dist/core/commands/table-structure-commands.js +12 -0
  90. package/dist/core/commands/table-structure-commands.js.map +1 -0
  91. package/dist/core/commands/text-commands.cjs +2391 -0
  92. package/dist/core/commands/text-commands.cjs.map +1 -0
  93. package/dist/core/commands/text-commands.d.cts +24 -0
  94. package/dist/core/commands/text-commands.d.ts +24 -0
  95. package/dist/core/commands/text-commands.js +28 -0
  96. package/dist/core/commands/text-commands.js.map +1 -0
  97. package/dist/core/selection/mapping.cjs +200 -0
  98. package/dist/core/selection/mapping.cjs.map +1 -0
  99. package/dist/core/selection/mapping.d.cts +2 -0
  100. package/dist/core/selection/mapping.d.ts +2 -0
  101. package/dist/core/selection/mapping.js +31 -0
  102. package/dist/core/selection/mapping.js.map +1 -0
  103. package/dist/core/state/editor-state.cjs +2278 -0
  104. package/dist/core/state/editor-state.cjs.map +1 -0
  105. package/dist/core/state/editor-state.d.cts +2 -0
  106. package/dist/core/state/editor-state.d.ts +2 -0
  107. package/dist/core/state/editor-state.js +26 -0
  108. package/dist/core/state/editor-state.js.map +1 -0
  109. package/dist/index.cjs +38553 -0
  110. package/dist/index.cjs.map +1 -0
  111. package/dist/index.d.cts +15 -0
  112. package/dist/index.d.ts +15 -0
  113. package/dist/index.js +7856 -0
  114. package/dist/index.js.map +1 -0
  115. package/dist/io/docx-session.cjs +16236 -0
  116. package/dist/io/docx-session.cjs.map +1 -0
  117. package/dist/io/docx-session.d.cts +21 -0
  118. package/dist/io/docx-session.d.ts +21 -0
  119. package/dist/io/docx-session.js +18 -0
  120. package/dist/io/docx-session.js.map +1 -0
  121. package/dist/legal/index.cjs +3900 -0
  122. package/dist/legal/index.cjs.map +1 -0
  123. package/dist/legal/index.d.cts +86 -0
  124. package/dist/legal/index.d.ts +86 -0
  125. package/dist/legal/index.js +616 -0
  126. package/dist/legal/index.js.map +1 -0
  127. package/dist/public-types-7ZL_94cz.d.ts +1573 -0
  128. package/dist/public-types-CeMaDueh.d.cts +1573 -0
  129. package/dist/public-types.cjs +19 -0
  130. package/dist/public-types.cjs.map +1 -0
  131. package/dist/public-types.d.cts +2 -0
  132. package/dist/public-types.d.ts +2 -0
  133. package/dist/public-types.js +1 -0
  134. package/dist/public-types.js.map +1 -0
  135. package/dist/runtime/document-runtime.cjs +11140 -0
  136. package/dist/runtime/document-runtime.cjs.map +1 -0
  137. package/dist/runtime/document-runtime.d.cts +231 -0
  138. package/dist/runtime/document-runtime.d.ts +231 -0
  139. package/dist/runtime/document-runtime.js +21 -0
  140. package/dist/runtime/document-runtime.js.map +1 -0
  141. package/dist/structural-helpers-CilgOVhh.d.cts +10 -0
  142. package/dist/structural-helpers-q0Gd-eBN.d.ts +10 -0
  143. package/dist/ui-tailwind/editor-surface/search-plugin.cjs +313 -0
  144. package/dist/ui-tailwind/editor-surface/search-plugin.cjs.map +1 -0
  145. package/dist/ui-tailwind/editor-surface/search-plugin.d.cts +67 -0
  146. package/dist/ui-tailwind/editor-surface/search-plugin.d.ts +67 -0
  147. package/dist/ui-tailwind/editor-surface/search-plugin.js +23 -0
  148. package/dist/ui-tailwind/editor-surface/search-plugin.js.map +1 -0
  149. package/dist/ui-tailwind/index.cjs +4833 -0
  150. package/dist/ui-tailwind/index.cjs.map +1 -0
  151. package/dist/ui-tailwind/index.d.cts +617 -0
  152. package/dist/ui-tailwind/index.d.ts +617 -0
  153. package/dist/ui-tailwind/index.js +575 -0
  154. package/dist/ui-tailwind/index.js.map +1 -0
  155. package/package.json +61 -41
  156. package/src/README.md +0 -85
  157. package/src/api/README.md +0 -26
  158. package/src/api/public-types.ts +0 -1421
  159. package/src/api/session-state.ts +0 -60
  160. package/src/compare/diff-engine.ts +0 -623
  161. package/src/compare/export-redlines.ts +0 -280
  162. package/src/compare/index.ts +0 -25
  163. package/src/compare/snapshot.ts +0 -97
  164. package/src/component-inventory.md +0 -99
  165. package/src/core/README.md +0 -10
  166. package/src/core/commands/README.md +0 -3
  167. package/src/core/commands/image-commands.ts +0 -373
  168. package/src/core/commands/index.ts +0 -1757
  169. package/src/core/commands/list-commands.ts +0 -565
  170. package/src/core/commands/paragraph-layout-commands.ts +0 -339
  171. package/src/core/commands/review-commands.ts +0 -108
  172. package/src/core/commands/structural-helpers.ts +0 -309
  173. package/src/core/schema/README.md +0 -3
  174. package/src/core/schema/text-schema.ts +0 -516
  175. package/src/core/search/search-text.ts +0 -357
  176. package/src/core/selection/README.md +0 -3
  177. package/src/core/selection/mapping.ts +0 -289
  178. package/src/core/selection/review-anchors.ts +0 -183
  179. package/src/core/state/README.md +0 -3
  180. package/src/core/state/editor-state.ts +0 -892
  181. package/src/formats/xlsx/io/parse-shared-strings.ts +0 -41
  182. package/src/formats/xlsx/io/parse-sheet.ts +0 -459
  183. package/src/formats/xlsx/io/parse-styles.ts +0 -59
  184. package/src/formats/xlsx/io/parse-workbook.ts +0 -75
  185. package/src/formats/xlsx/io/serialize-shared-strings.ts +0 -72
  186. package/src/formats/xlsx/io/serialize-sheet.ts +0 -333
  187. package/src/formats/xlsx/io/serialize-styles.ts +0 -98
  188. package/src/formats/xlsx/io/serialize-workbook.ts +0 -429
  189. package/src/formats/xlsx/io/xlsx-session.ts +0 -314
  190. package/src/formats/xlsx/model/cell.ts +0 -189
  191. package/src/formats/xlsx/model/sheet.ts +0 -326
  192. package/src/formats/xlsx/model/styles.ts +0 -118
  193. package/src/formats/xlsx/model/workbook.ts +0 -453
  194. package/src/formats/xlsx/runtime/cell-commands.ts +0 -567
  195. package/src/formats/xlsx/runtime/sheet-commands.ts +0 -206
  196. package/src/formats/xlsx/runtime/workbook-runtime.ts +0 -177
  197. package/src/formats/xlsx/runtime/workbook-transaction.ts +0 -822
  198. package/src/index.ts +0 -101
  199. package/src/io/README.md +0 -10
  200. package/src/io/docx-session.ts +0 -2882
  201. package/src/io/export/README.md +0 -3
  202. package/src/io/export/export-session.ts +0 -220
  203. package/src/io/export/minimal-docx.ts +0 -115
  204. package/src/io/export/reattach-preserved-parts.ts +0 -54
  205. package/src/io/export/serialize-comments.ts +0 -947
  206. package/src/io/export/serialize-footnotes.ts +0 -399
  207. package/src/io/export/serialize-headers-footers.ts +0 -372
  208. package/src/io/export/serialize-main-document.ts +0 -1376
  209. package/src/io/export/serialize-numbering.ts +0 -118
  210. package/src/io/export/serialize-revisions.ts +0 -389
  211. package/src/io/export/serialize-runtime-revisions.ts +0 -269
  212. package/src/io/export/serialize-tables.ts +0 -174
  213. package/src/io/export/split-review-boundaries.ts +0 -356
  214. package/src/io/normalize/README.md +0 -3
  215. package/src/io/normalize/normalize-text.ts +0 -639
  216. package/src/io/ooxml/README.md +0 -3
  217. package/src/io/ooxml/highlight-colors.ts +0 -39
  218. package/src/io/ooxml/numbering-sentinels.ts +0 -44
  219. package/src/io/ooxml/parse-comments.ts +0 -846
  220. package/src/io/ooxml/parse-complex-content.ts +0 -287
  221. package/src/io/ooxml/parse-fields.ts +0 -834
  222. package/src/io/ooxml/parse-footnotes.ts +0 -896
  223. package/src/io/ooxml/parse-headers-footers.ts +0 -1169
  224. package/src/io/ooxml/parse-inline-media.ts +0 -461
  225. package/src/io/ooxml/parse-main-document.ts +0 -2877
  226. package/src/io/ooxml/parse-numbering.ts +0 -432
  227. package/src/io/ooxml/parse-revisions.ts +0 -931
  228. package/src/io/ooxml/parse-settings.ts +0 -184
  229. package/src/io/ooxml/parse-shapes.ts +0 -296
  230. package/src/io/ooxml/parse-styles.ts +0 -463
  231. package/src/io/ooxml/parse-tables.ts +0 -618
  232. package/src/io/ooxml/parse-theme.ts +0 -346
  233. package/src/io/ooxml/part-manifest.ts +0 -136
  234. package/src/io/ooxml/revision-boundaries.ts +0 -351
  235. package/src/io/opc/README.md +0 -3
  236. package/src/io/opc/corrupt-package.ts +0 -166
  237. package/src/io/opc/docx-package.ts +0 -74
  238. package/src/io/opc/package-reader.ts +0 -325
  239. package/src/io/opc/package-writer.ts +0 -273
  240. package/src/io/source-package-provenance.ts +0 -241
  241. package/src/legal/cross-references.ts +0 -414
  242. package/src/legal/defined-terms.ts +0 -203
  243. package/src/legal/index.ts +0 -32
  244. package/src/legal/signature-blocks.ts +0 -259
  245. package/src/model/README.md +0 -3
  246. package/src/model/canonical-document.ts +0 -2632
  247. package/src/model/cds-1.0.0.ts +0 -212
  248. package/src/model/snapshot.ts +0 -649
  249. package/src/preservation/README.md +0 -3
  250. package/src/preservation/markup-compatibility.ts +0 -48
  251. package/src/preservation/opaque-fragment-store.ts +0 -89
  252. package/src/preservation/opaque-region.ts +0 -233
  253. package/src/preservation/package-preservation.ts +0 -113
  254. package/src/preservation/preserved-part-manifest.ts +0 -56
  255. package/src/preservation/relationship-retention.ts +0 -57
  256. package/src/preservation/store.ts +0 -185
  257. package/src/review/README.md +0 -16
  258. package/src/review/store/README.md +0 -3
  259. package/src/review/store/comment-anchors.ts +0 -70
  260. package/src/review/store/comment-remapping.ts +0 -154
  261. package/src/review/store/comment-store.ts +0 -331
  262. package/src/review/store/comment-thread.ts +0 -109
  263. package/src/review/store/revision-actions.ts +0 -394
  264. package/src/review/store/revision-store.ts +0 -312
  265. package/src/review/store/revision-types.ts +0 -171
  266. package/src/review/store/runtime-comment-store.ts +0 -43
  267. package/src/runtime/README.md +0 -3
  268. package/src/runtime/ai-action-policy.ts +0 -764
  269. package/src/runtime/document-layout.ts +0 -332
  270. package/src/runtime/document-navigation.ts +0 -603
  271. package/src/runtime/document-runtime.ts +0 -3159
  272. package/src/runtime/document-search.ts +0 -145
  273. package/src/runtime/numbering-prefix.ts +0 -216
  274. package/src/runtime/page-layout-estimation.ts +0 -212
  275. package/src/runtime/read-only-diagnostics-runtime.ts +0 -241
  276. package/src/runtime/review-runtime.ts +0 -44
  277. package/src/runtime/revision-runtime.ts +0 -107
  278. package/src/runtime/session-capabilities.ts +0 -192
  279. package/src/runtime/story-context.ts +0 -164
  280. package/src/runtime/story-targeting.ts +0 -162
  281. package/src/runtime/surface-projection.ts +0 -1357
  282. package/src/runtime/table-commands.ts +0 -173
  283. package/src/runtime/table-schema.ts +0 -309
  284. package/src/runtime/view-state.ts +0 -477
  285. package/src/runtime/virtualized-rendering.ts +0 -258
  286. package/src/runtime/workflow-markup.ts +0 -353
  287. package/src/ui/README.md +0 -30
  288. package/src/ui/WordReviewEditor.tsx +0 -4086
  289. package/src/ui/browser-export.ts +0 -52
  290. package/src/ui/comments/README.md +0 -3
  291. package/src/ui/compatibility/README.md +0 -3
  292. package/src/ui/editor-command-bag.ts +0 -120
  293. package/src/ui/editor-runtime-boundary.ts +0 -1457
  294. package/src/ui/editor-shell-view.tsx +0 -142
  295. package/src/ui/editor-surface/README.md +0 -3
  296. package/src/ui/editor-surface-controller.tsx +0 -61
  297. package/src/ui/headless/comment-decoration-model.ts +0 -124
  298. package/src/ui/headless/preserve-editor-selection.ts +0 -5
  299. package/src/ui/headless/revision-decoration-model.ts +0 -128
  300. package/src/ui/headless/selection-helpers.ts +0 -54
  301. package/src/ui/headless/selection-toolbar-model.ts +0 -34
  302. package/src/ui/headless/use-editor-keyboard.ts +0 -103
  303. package/src/ui/review/README.md +0 -3
  304. package/src/ui/runtime-snapshot-selectors.ts +0 -197
  305. package/src/ui/shared/revision-filters.ts +0 -31
  306. package/src/ui/status/README.md +0 -3
  307. package/src/ui/theme/README.md +0 -3
  308. package/src/ui/toolbar/README.md +0 -3
  309. package/src/ui/workflow-surface-blocked-rails.ts +0 -94
  310. package/src/ui-tailwind/chrome/tw-alert-banner.tsx +0 -64
  311. package/src/ui-tailwind/chrome/tw-image-context-toolbar.tsx +0 -129
  312. package/src/ui-tailwind/chrome/tw-layout-panel.tsx +0 -114
  313. package/src/ui-tailwind/chrome/tw-object-context-toolbar.tsx +0 -34
  314. package/src/ui-tailwind/chrome/tw-page-ruler.tsx +0 -386
  315. package/src/ui-tailwind/chrome/tw-selection-toolbar.tsx +0 -186
  316. package/src/ui-tailwind/chrome/tw-suggestion-card.tsx +0 -139
  317. package/src/ui-tailwind/chrome/tw-table-context-toolbar.tsx +0 -128
  318. package/src/ui-tailwind/chrome/tw-unsaved-modal.tsx +0 -58
  319. package/src/ui-tailwind/chrome/use-before-unload.ts +0 -20
  320. package/src/ui-tailwind/editor-surface/perf-probe.ts +0 -179
  321. package/src/ui-tailwind/editor-surface/pm-command-bridge.ts +0 -184
  322. package/src/ui-tailwind/editor-surface/pm-contextual-ui.ts +0 -31
  323. package/src/ui-tailwind/editor-surface/pm-decorations.ts +0 -427
  324. package/src/ui-tailwind/editor-surface/pm-position-map.ts +0 -123
  325. package/src/ui-tailwind/editor-surface/pm-schema.ts +0 -876
  326. package/src/ui-tailwind/editor-surface/pm-state-from-snapshot.ts +0 -504
  327. package/src/ui-tailwind/editor-surface/search-plugin.ts +0 -168
  328. package/src/ui-tailwind/editor-surface/surface-build-keys.ts +0 -61
  329. package/src/ui-tailwind/editor-surface/tw-caret.tsx +0 -12
  330. package/src/ui-tailwind/editor-surface/tw-editor-surface.tsx +0 -150
  331. package/src/ui-tailwind/editor-surface/tw-inline-token.tsx +0 -129
  332. package/src/ui-tailwind/editor-surface/tw-opaque-block.tsx +0 -58
  333. package/src/ui-tailwind/editor-surface/tw-paragraph-block.tsx +0 -151
  334. package/src/ui-tailwind/editor-surface/tw-prosemirror-surface.tsx +0 -944
  335. package/src/ui-tailwind/editor-surface/tw-segment-view.tsx +0 -111
  336. package/src/ui-tailwind/editor-surface/tw-table-node-view.tsx +0 -436
  337. package/src/ui-tailwind/index.ts +0 -62
  338. package/src/ui-tailwind/page-chrome-model.ts +0 -27
  339. package/src/ui-tailwind/review/tw-comment-sidebar.tsx +0 -406
  340. package/src/ui-tailwind/review/tw-health-panel.tsx +0 -149
  341. package/src/ui-tailwind/review/tw-review-rail.tsx +0 -120
  342. package/src/ui-tailwind/review/tw-revision-sidebar.tsx +0 -164
  343. package/src/ui-tailwind/status/tw-status-bar.tsx +0 -61
  344. package/src/ui-tailwind/toolbar/tw-toolbar-icon-button.tsx +0 -52
  345. package/src/ui-tailwind/toolbar/tw-toolbar.tsx +0 -1064
  346. package/src/ui-tailwind/tw-review-workspace.tsx +0 -1417
  347. package/src/validation/README.md +0 -3
  348. package/src/validation/compatibility-engine.ts +0 -634
  349. package/src/validation/compatibility-report.ts +0 -161
  350. package/src/validation/diagnostics.ts +0 -204
  351. package/src/validation/docx-comment-proof.ts +0 -707
  352. package/src/validation/import-diagnostics.ts +0 -128
  353. package/src/validation/low-priority-word-surfaces.ts +0 -373
  354. /package/{src → dist}/ui-tailwind/theme/editor-theme.css +0 -0
@@ -1,834 +0,0 @@
1
- /**
2
- * parse-fields.ts
3
- *
4
- * Standalone parsers for OOXML field codes (w:fldSimple, complex fldChar sequences)
5
- * and bookmarks (w:bookmarkStart / w:bookmarkEnd).
6
- *
7
- * These types mirror the canonical FieldNode / BookmarkStartNode / BookmarkEndNode
8
- * shapes from canonical-document.ts, but carry raw XML for preservation and are
9
- * pre-normalization (no fragmentId / warningId yet).
10
- *
11
- * Usage: call parseFieldsFromParagraphXml() or parseBookmarksFromXml() for
12
- * independent field/bookmark extraction. The functions are designed to be
13
- * imported by parse-main-document.ts when full pipeline integration is ready.
14
- */
15
-
16
- // ─── Parsed types ────────────────────────────────────────────────────────────
17
-
18
/** Members shared by both parsed field variants. */
interface ParsedFieldCommon {
  type: "field";
  /** Field instruction text. */
  instruction: string;
}

/** A field captured from a single <w:fldSimple> element. */
export interface ParsedSimpleFieldNode extends ParsedFieldCommon {
  fieldType: "simple";
  /** Raw XML of the content runs inside <w:fldSimple>. */
  contentXml: string;
  /** Source XML slice covering the whole element. */
  rawXml: string;
}

/** A field assembled from a begin / separate / end fldChar sequence. */
export interface ParsedComplexFieldNode extends ParsedFieldCommon {
  fieldType: "complex";
  /** Raw XML of the content runs between the "separate" and "end" fldChar. */
  contentXml: string;
  /** Start index in the source document XML. */
  start: number;
  /** End index (exclusive) in the source document XML. */
  end: number;
}

/** Either kind of parsed field; discriminate on `fieldType`. */
export type ParsedFieldNode = ParsedSimpleFieldNode | ParsedComplexFieldNode;

/** Members shared by bookmark start and end markers. */
interface ParsedBookmarkCommon {
  /** Identifier that pairs a start marker with its end marker. */
  bookmarkId: string;
  /** Source XML slice covering the marker element. */
  rawXml: string;
}

/** A parsed <w:bookmarkStart> marker. */
export interface ParsedBookmarkStartNode extends ParsedBookmarkCommon {
  type: "bookmark_start";
  /** Bookmark name; empty when the element carries no name attribute. */
  name: string;
}

/** A parsed <w:bookmarkEnd> marker. */
export interface ParsedBookmarkEndNode extends ParsedBookmarkCommon {
  type: "bookmark_end";
}

/** Either bookmark marker; discriminate on `type`. */
export type ParsedBookmarkNode = ParsedBookmarkStartNode | ParsedBookmarkEndNode;
55
-
56
- // ─── Internal XML types ───────────────────────────────────────────────────────
57
-
58
/** Offsets of a node in the XML string it was parsed from (used with `slice(start, end)`). */
interface XmlNodeSpan {
  start: number;
  end: number;
}

/** An element node: tag name as written, attribute map, and ordered children. */
interface XmlElementNode extends XmlNodeSpan {
  type: "element";
  name: string;
  attributes: Record<string, string>;
  children: XmlNode[];
}

/** A text node. */
interface XmlTextNode extends XmlNodeSpan {
  type: "text";
  text: string;
}

/** Any node of the lightweight XML tree; discriminate on `type`. */
type XmlNode = XmlElementNode | XmlTextNode;
75
-
76
- // ─── Public API ───────────────────────────────────────────────────────────────
77
-
78
/**
 * Collect the simple fields and bookmark markers that sit directly under a
 * paragraph element.
 *
 * Only direct element children are inspected. Complex fields are not handled
 * here; use extractComplexFieldsFromBodyXml for those.
 *
 * @param paragraphXml Raw XML string of a <w:p> element.
 * @returns The simple fields and bookmark markers, each in document order.
 */
export function parseFieldsFromParagraphXml(paragraphXml: string): {
  simpleFields: ParsedSimpleFieldNode[];
  bookmarks: ParsedBookmarkNode[];
} {
  const parsedRoot = parseXml(paragraphXml);
  // When no <w:p> child is found, scan the parse root itself.
  const container = findFirstChild(parsedRoot, "p") ?? parsedRoot;

  const simpleFields: ParsedSimpleFieldNode[] = [];
  const bookmarks: ParsedBookmarkNode[] = [];

  for (const node of container.children) {
    if (node.type !== "element") continue;

    switch (localName(node.name)) {
      case "fldSimple": {
        const parsedField = parseFldSimple(node, paragraphXml);
        if (parsedField) simpleFields.push(parsedField);
        break;
      }
      case "bookmarkStart": {
        const marker = parseBookmarkStart(node, paragraphXml);
        if (marker) bookmarks.push(marker);
        break;
      }
      case "bookmarkEnd": {
        const marker = parseBookmarkEnd(node, paragraphXml);
        if (marker) bookmarks.push(marker);
        break;
      }
      default:
        break;
    }
  }

  return { simpleFields, bookmarks };
}
114
-
115
/**
 * Gather complex fields (begin / instrText* / separate / content / end runs
 * spread over several <w:r> siblings) from body-level XML.
 *
 * Only <w:p> elements that are direct children of the scan target are visited.
 *
 * @param bodyXml Raw XML string of a <w:body> element (or full document).
 * @returns Every complex field reported by the per-paragraph extractor.
 */
export function extractComplexFieldsFromBodyXml(bodyXml: string): ParsedComplexFieldNode[] {
  const parsedRoot = parseXml(bodyXml);
  // Scan target preference: <w:body>, then <w:document>, then the parse root.
  // NOTE(review): when only <w:document> matches, its direct children are
  // scanned for paragraphs — confirm how findFirstChild searches.
  const container =
    findFirstChild(parsedRoot, "body") ?? findFirstChild(parsedRoot, "document") ?? parsedRoot;

  const collected: ParsedComplexFieldNode[] = [];
  for (const node of container.children) {
    if (node.type === "element" && localName(node.name) === "p") {
      extractComplexFieldsFromParagraph(node, bodyXml, collected);
    }
  }
  return collected;
}
138
-
139
/**
 * Collect every bookmark start/end marker found in a full document or body
 * XML string.
 *
 * @param bodyXml Raw XML to parse; also the string the markers' rawXml is sliced from.
 * @returns The markers gathered by collectBookmarks.
 */
export function extractBookmarksFromBodyXml(bodyXml: string): ParsedBookmarkNode[] {
  const collected: ParsedBookmarkNode[] = [];
  collectBookmarks(parseXml(bodyXml), bodyXml, collected);
  return collected;
}
148
-
149
- // ─── Element-level parsers (exported for unit testing) ────────────────────────
150
-
151
/**
 * Look up an attribute by its local name.
 *
 * Elements in this module are matched by local name, so attributes should not
 * depend on the conventional `w:` prefix either. Resolution order:
 * `w:<local>`, then unprefixed `<local>`, then the first attribute under any
 * other prefix whose local name matches.
 */
function attributeByLocalName(
  attributes: Record<string, string>,
  local: string,
): string | undefined {
  const direct = attributes[`w:${local}`] ?? attributes[local];
  if (direct !== undefined) return direct;

  const suffix = `:${local}`;
  for (const [key, value] of Object.entries(attributes)) {
    if (key.endsWith(suffix)) return value;
  }
  return undefined;
}

/**
 * Build a ParsedSimpleFieldNode from a <w:fldSimple> element.
 *
 * @param element   The element's attributes, children and source offsets.
 * @param sourceXml The XML string that the offsets index into.
 * @returns The parsed field. The instruction is trimmed and may be empty;
 *          contentXml is the concatenated source of element children only
 *          (text children are skipped). The current implementation always
 *          returns a node; `undefined` stays in the signature for callers
 *          that already guard on it.
 */
export function parseFldSimple(
  element: { attributes: Record<string, string>; children: XmlNode[]; start: number; end: number },
  sourceXml: string,
): ParsedSimpleFieldNode | undefined {
  const instruction = (attributeByLocalName(element.attributes, "instr") ?? "").trim();
  const contentXml = element.children
    .filter((c): c is XmlElementNode => c.type === "element")
    .map((c) => sourceXml.slice(c.start, c.end))
    .join("");
  return {
    type: "field",
    fieldType: "simple",
    instruction,
    contentXml,
    rawXml: sourceXml.slice(element.start, element.end),
  };
}

/**
 * Build a ParsedBookmarkStartNode from a <w:bookmarkStart> element.
 *
 * @param element   The element's attributes and source offsets.
 * @param sourceXml The XML string that the offsets index into.
 * @returns The parsed marker, or `undefined` when the element has no id.
 *          A missing name is reported as an empty string.
 */
export function parseBookmarkStart(
  element: { attributes: Record<string, string>; start: number; end: number },
  sourceXml: string,
): ParsedBookmarkStartNode | undefined {
  const bookmarkId = attributeByLocalName(element.attributes, "id") ?? "";
  const name = attributeByLocalName(element.attributes, "name") ?? "";
  if (!bookmarkId) return undefined;
  return {
    type: "bookmark_start",
    bookmarkId,
    name,
    rawXml: sourceXml.slice(element.start, element.end),
  };
}

/**
 * Build a ParsedBookmarkEndNode from a <w:bookmarkEnd> element.
 *
 * @param element   The element's attributes and source offsets.
 * @param sourceXml The XML string that the offsets index into.
 * @returns The parsed marker, or `undefined` when the element has no id.
 */
export function parseBookmarkEnd(
  element: { attributes: Record<string, string>; start: number; end: number },
  sourceXml: string,
): ParsedBookmarkEndNode | undefined {
  const bookmarkId = attributeByLocalName(element.attributes, "id") ?? "";
  if (!bookmarkId) return undefined;
  return {
    type: "bookmark_end",
    bookmarkId,
    rawXml: sourceXml.slice(element.start, element.end),
  };
}
196
-
197
- // ─── Field family classification ─────────────────────────────────────────────
198
-
199
- import type {
200
- CanonicalDocument,
201
- DocumentNode,
202
- FieldFamily,
203
- FieldNode,
204
- FieldRegistry,
205
- FieldRegistryEntry,
206
- FieldRefreshStatus,
207
- InlineNode,
208
- ParagraphNode,
209
- SubPartsCatalog,
210
- SupportedFieldFamily,
211
- TocEntry,
212
- TocStructure,
213
- } from "../../model/canonical-document.ts";
214
-
215
/** Recognised field keywords; matched case-insensitively at the start of an instruction. */
const FIELD_FAMILY_PATTERN =
  /^\s*(REF|PAGEREF|NOTEREF|TOC|PAGE|NUMPAGES|DATE|TIME|AUTHOR|FILENAME|MERGEFIELD|IF|SEQ|INDEX|TC|STYLEREF)\b/i;

/** Families that belong to the supported slice. */
const SUPPORTED_FAMILIES = new Set<string>(["REF", "PAGEREF", "NOTEREF", "TOC"]);

/**
 * First argument of a REF / PAGEREF / NOTEREF instruction: either a quoted
 * string or a bare token. A bare token starting with a backslash is a switch
 * (e.g. `\h`), not a bookmark name, so it is deliberately not matched.
 */
const REFERENCE_TARGET_PATTERN = /^\s*(?:REF|PAGEREF|NOTEREF)\s+(?:"([^"]+)"|([^\s\\]\S*))/i;

/**
 * Classify a field instruction into its field family.
 *
 * @param instruction Field instruction text, e.g. `REF Clause_1 \h`.
 * @returns `family` is the upper-cased keyword, or "UNKNOWN" when the
 *          instruction does not start with a recognised keyword; `supported`
 *          tells whether the family is in the supported slice; `target` is
 *          the trimmed first argument of a REF / PAGEREF / NOTEREF
 *          instruction, and is `undefined` for other families or when the
 *          first argument is missing or is a switch.
 */
export function classifyFieldInstruction(instruction: string): {
  family: FieldFamily;
  supported: boolean;
  target?: string;
} {
  const trimmed = instruction.trim();
  const keyword = FIELD_FAMILY_PATTERN.exec(trimmed)?.[1];
  if (keyword === undefined) {
    return { family: "UNKNOWN", supported: false };
  }

  const family = keyword.toUpperCase() as FieldFamily;
  const supported = SUPPORTED_FAMILIES.has(family);

  let target: string | undefined;
  if (family === "REF" || family === "PAGEREF" || family === "NOTEREF") {
    const targetMatch = REFERENCE_TARGET_PATTERN.exec(trimmed);
    target = (targetMatch?.[1] ?? targetMatch?.[2])?.trim();
  }

  return { family, supported, target };
}
246
-
247
/**
 * Type guard: tells whether a field family belongs to the supported refresh
 * slice, i.e. whether it is a member of SUPPORTED_FAMILIES.
 *
 * @param family The family to test.
 */
export function isSupportedFieldFamily(family: FieldFamily): family is SupportedFieldFamily {
  const inSupportedSlice = SUPPORTED_FAMILIES.has(family);
  return inSupportedSlice;
}
253
-
254
- // ─── Field registry builder ─────────────────────────────────────────────────
255
-
256
/**
 * Build the registry entry for one field node.
 *
 * A classification already stored on the node (`fieldFamily` / `fieldTarget`)
 * takes precedence; otherwise the instruction text is classified. When the
 * node has no refresh status, supported fields default to "stale" and all
 * others to "preserve-only".
 */
function createFieldRegistryEntry(
  node: FieldNode,
  fieldIndex: number,
  paragraphIndex: number,
): FieldRegistryEntry {
  const classification = node.fieldFamily
    ? { family: node.fieldFamily, supported: isSupportedFieldFamily(node.fieldFamily), target: node.fieldTarget }
    : classifyFieldInstruction(node.instruction);
  const displayText = flattenFieldText(node.children);
  return {
    fieldIndex,
    fieldFamily: classification.family,
    supported: classification.supported,
    instruction: node.instruction,
    ...(classification.target ? { fieldTarget: classification.target } : {}),
    displayText,
    paragraphIndex,
    refreshStatus: node.refreshStatus ?? (classification.supported ? "stale" : "preserve-only"),
  };
}

/**
 * Build a field registry from a canonical document, cataloging every field
 * instance with its classification, dependency metadata, and refresh status.
 *
 * Fields are numbered with one running `fieldIndex`: main content first, then
 * the sub-parts when `subParts` is provided. Entries are partitioned into
 * `supported` (REF, PAGEREF, NOTEREF, TOC) and `preserveOnly` (all others).
 * A `tocStructure` is attached when the main content contains a supported TOC
 * field; the first such field's instruction is used. TOC fields found in
 * sub-parts do not trigger it.
 *
 * @param document Document content and styles, plus optional sub-parts.
 * @returns The populated registry.
 */
export function buildFieldRegistry(
  document: Pick<CanonicalDocument, "content" | "styles"> & {
    subParts?: SubPartsCatalog;
  },
): FieldRegistry {
  const supported: FieldRegistryEntry[] = [];
  const preserveOnly: FieldRegistryEntry[] = [];
  let fieldIndex = 0;
  let tocInstruction: string | undefined;

  // Shared by both walks so numbering and partitioning cannot drift apart.
  const register = (node: FieldNode, paragraphIndex: number): FieldRegistryEntry => {
    const entry = createFieldRegistryEntry(node, fieldIndex, paragraphIndex);
    (entry.supported ? supported : preserveOnly).push(entry);
    fieldIndex += 1;
    return entry;
  };

  walkFieldDocument(document.content, (node, pIdx) => {
    if (node.type !== "field") return;
    const entry = register(node, pIdx);
    // Remember only the first supported TOC instruction of the main content.
    if (entry.supported && entry.fieldFamily === "TOC" && !tocInstruction) {
      tocInstruction = node.instruction;
    }
  });

  if (document.subParts) {
    walkSubPartFields(document.subParts, (node, pIdx) => {
      if (node.type === "field") {
        register(node, pIdx);
      }
    });
  }

  const tocStructure = tocInstruction
    ? buildTocStructure(document, tocInstruction)
    : undefined;

  return {
    supported,
    preserveOnly,
    ...(tocStructure ? { tocStructure } : {}),
  };
}
341
-
342
/**
 * Parse the heading level range from a TOC field instruction.
 *
 * The `\o` switch carries the outline level range, e.g. `\o "1-3"`. Field
 * arguments only need quotes when they contain spaces, so the unquoted form
 * (`\o 1-3`) is accepted too, as is optional whitespace around the numbers.
 *
 * @param instruction - Raw TOC field instruction text.
 * @returns The level range as written in the instruction, or
 *   `{ from: 1, to: 9 }` when no `\o` range is present.
 */
export function parseTocLevelRange(instruction: string): { from: number; to: number } {
  // Opening quote is optional; the closing quote does not need to be matched
  // because the two digit groups already delimit the range.
  const match = /\\o\s*"?\s*(\d+)\s*-\s*(\d+)/.exec(instruction);
  if (!match) {
    return { from: 1, to: 9 };
  }
  const [, from = "", to = ""] = match;
  return { from: Number.parseInt(from, 10), to: Number.parseInt(to, 10) };
}
354
-
355
/**
 * Derive a TocStructure from the heading paragraphs of a document and a TOC
 * field instruction.
 *
 * A paragraph becomes an entry when it has an outline level (its own, or the
 * one declared by its paragraph style), that level falls inside the range
 * parsed from the instruction, and its flattened text is not blank. The
 * returned structure is always marked `"stale"`.
 *
 * @param document - Source of the content tree and the paragraph styles.
 * @param instruction - Raw TOC field instruction; stored verbatim in the result.
 * @returns The instruction, its parsed level range and the collected entries.
 */
export function buildTocStructure(
  document: Pick<CanonicalDocument, "content" | "styles">,
  instruction: string,
): TocStructure {
  const levelRange = parseTocLevelRange(instruction);
  const entries: TocEntry[] = [];

  // Paragraph's own outline level wins; the style is only consulted as a fallback.
  const outlineLevelOf = (p: ParagraphNode): number | undefined => {
    if (p.outlineLevel !== undefined) return p.outlineLevel;
    if (!p.styleId) return undefined;
    return document.styles.paragraphs[p.styleId]?.outlineLevel;
  };

  // Name of the first named bookmark_start directly inside the paragraph.
  const firstBookmarkName = (p: ParagraphNode): string | undefined => {
    for (const child of p.children) {
      if (child.type === "bookmark_start" && child.name) {
        return child.name;
      }
    }
    return undefined;
  };

  walkFieldDocument(document.content, (node, pIdx) => {
    if (node.type !== "paragraph") return;
    const heading = node as ParagraphNode;

    const outline = outlineLevelOf(heading);
    if (outline === undefined) return;

    // Outline levels are 0-based internally, 1-based in TOC notation.
    const tocLevel = outline + 1;
    const outOfRange = tocLevel < levelRange.from || tocLevel > levelRange.to;
    if (outOfRange) return;

    const title = flattenParagraphInlineText(heading.children).trim();
    if (title.length === 0) return;

    const bookmarkName = firstBookmarkName(heading);
    entries.push({
      text: title,
      level: tocLevel,
      paragraphIndex: pIdx,
      ...(heading.styleId ? { styleId: heading.styleId } : {}),
      ...(bookmarkName ? { bookmarkName } : {}),
    });
  });

  return { instruction, levelRange, entries, status: "stale" };
}
415
-
416
/**
 * Deterministic refresh helper for REF fields.
 *
 * Looks up `fieldTarget` in the bookmark name map, then walks the document to
 * the paragraph whose index matches the bookmark and extracts the bookmarked
 * text from it.
 *
 * @param document - Source of the content tree to walk.
 * @param bookmarkNameMap - Bookmark name → bookmark id and paragraph index.
 * @param fieldTarget - Bookmark name the REF field points at.
 * @returns `{ text, refreshStatus: "current" }` when the paragraph was found;
 *   `{ text: "", refreshStatus: "unresolvable" }` when the bookmark is unknown
 *   or no paragraph has the recorded index. The declared return type allows
 *   `undefined`, but no code path produces it.
 */
export function resolveRefFieldText(
  document: Pick<CanonicalDocument, "content">,
  bookmarkNameMap: Map<string, { bookmarkId: string; paragraphIndex: number }>,
  fieldTarget: string,
): { text: string; refreshStatus: "current" | "unresolvable" } | undefined {
  const target = bookmarkNameMap.get(fieldTarget);
  if (!target) {
    return { text: "", refreshStatus: "unresolvable" };
  }

  let resolvedText: string | undefined;
  walkFieldDocument(document.content, (node, pIdx) => {
    // Only the paragraph node itself is of interest, not the inline nodes that share its index.
    if (node.type === "paragraph" && pIdx === target.paragraphIndex) {
      resolvedText = flattenBookmarkContent(node as ParagraphNode, target.bookmarkId);
    }
  });

  if (resolvedText === undefined) {
    return { text: "", refreshStatus: "unresolvable" };
  }
  return { text: resolvedText, refreshStatus: "current" };
}
450
-
451
/**
 * Recompute the refresh status of every supported entry in a field registry.
 *
 * Nothing is mutated: a new registry object with fresh entry copies is
 * returned, while `preserveOnly` and `tocStructure` are carried over as-is.
 *
 * Status rules:
 * - TOC entries are `"current"` when the registry has a `tocStructure`,
 *   otherwise `"stale"`.
 * - Other entries are `"current"` only when they have a `fieldTarget` that is
 *   present in `bookmarkNameMap`; otherwise `"unresolvable"`.
 *
 * @param registry - Registry to refresh.
 * @param bookmarkNameMap - Known bookmarks keyed by name.
 * @returns A new registry with updated statuses.
 */
export function refreshFieldRegistry(
  registry: FieldRegistry,
  bookmarkNameMap: Map<string, { bookmarkId: string; paragraphIndex: number }>,
): FieldRegistry {
  const statusFor = (entry: FieldRegistryEntry): FieldRefreshStatus => {
    if (entry.fieldFamily === "TOC") {
      // TOC refresh is driven by tocStructure rather than by the entry itself.
      return registry.tocStructure ? "current" : "stale";
    }
    if (!entry.fieldTarget) {
      return "unresolvable";
    }
    return bookmarkNameMap.get(entry.fieldTarget) ? "current" : "unresolvable";
  };

  const supported = registry.supported.map(
    (entry): FieldRegistryEntry => ({ ...entry, refreshStatus: statusFor(entry) }),
  );

  return {
    supported,
    preserveOnly: registry.preserveOnly,
    ...(registry.tocStructure ? { tocStructure: registry.tocStructure } : {}),
  };
}
484
-
485
- // ─── Field registry internal helpers ────────────────────────────────────────
486
-
487
/**
 * Pre-order walk over a document subtree that keeps a running paragraph index.
 *
 * The index is bumped before a paragraph node is visited, so a paragraph and
 * all nodes visited after it (until the next paragraph) share the same index.
 * Descends through `children` arrays, table `rows` and table-row `cells`.
 *
 * @param node - Subtree root.
 * @param visit - Called for every node with the paragraph index in effect.
 * @param paragraphIndex - Index in effect before `node`; defaults to -1.
 * @returns The paragraph index in effect after the whole subtree was walked.
 */
function walkFieldDocument(
  node: DocumentNode,
  visit: (node: DocumentNode, paragraphIndex: number) => void,
  paragraphIndex = -1,
): number {
  let index = node.type === "paragraph" ? paragraphIndex + 1 : paragraphIndex;
  visit(node, index);

  // Walk a list of nested nodes, threading the running index through each one.
  const descend = (nested: readonly DocumentNode[]): void => {
    for (const item of nested) {
      index = walkFieldDocument(item, visit, index);
    }
  };

  if ("children" in node && Array.isArray(node.children)) {
    descend(node.children as DocumentNode[]);
  }

  switch (node.type) {
    case "table":
      descend(node.rows);
      break;
    case "table_row":
      descend(node.cells);
      break;
    default:
      break;
  }

  return index;
}
513
-
514
/**
 * Walk every block of every sub-part: headers, footers, then (when a footnote
 * collection exists) footnotes and endnotes.
 *
 * Each block is walked on its own, so the paragraph index passed to `visit`
 * restarts for every block.
 *
 * @param subParts - Catalog of headers, footers and notes.
 * @param visit - Called for every node found in those blocks.
 */
function walkSubPartFields(
  subParts: SubPartsCatalog,
  visit: (node: DocumentNode, paragraphIndex: number) => void,
): void {
  const walkBlocks = (blocks: readonly DocumentNode[]): void => {
    for (const block of blocks) {
      walkFieldDocument(block, visit);
    }
  };

  for (const header of subParts.headers) {
    walkBlocks(header.blocks);
  }
  for (const footer of subParts.footers) {
    walkBlocks(footer.blocks);
  }

  const notes = subParts.footnoteCollection;
  if (!notes) {
    return;
  }
  for (const footnote of Object.values(notes.footnotes)) {
    walkBlocks(footnote.blocks);
  }
  for (const endnote of Object.values(notes.endnotes)) {
    walkBlocks(endnote.blocks);
  }
}
541
-
542
/**
 * Flatten the direct inline children of a field into plain text.
 *
 * Text nodes contribute their text, tabs a `\t`, hard and column breaks a
 * `\n`; every other node type contributes nothing (no recursion).
 */
function flattenFieldText(children: InlineNode[]): string {
  const pieces: string[] = [];
  for (const child of children) {
    switch (child.type) {
      case "text":
        pieces.push(child.text);
        break;
      case "tab":
        pieces.push("\t");
        break;
      case "hard_break":
      case "column_break":
        pieces.push("\n");
        break;
      default:
        break;
    }
  }
  return pieces.join("");
}
552
-
553
/**
 * Flatten the inline children of a paragraph into plain text.
 *
 * Uses the same rules as `flattenFieldText` for text, tabs and breaks, and
 * additionally descends one level into hyperlinks and fields by flattening
 * their children with `flattenFieldText`. Other node types contribute nothing.
 */
function flattenParagraphInlineText(children: InlineNode[]): string {
  const pieces: string[] = [];
  for (const child of children) {
    switch (child.type) {
      case "text":
        pieces.push(child.text);
        break;
      case "tab":
        pieces.push("\t");
        break;
      case "hard_break":
      case "column_break":
        pieces.push("\n");
        break;
      case "hyperlink":
      case "field":
        pieces.push(flattenFieldText(child.children));
        break;
      default:
        break;
    }
  }
  return pieces.join("");
}
565
-
566
/**
 * Extract the plain text enclosed by a bookmark inside a single paragraph.
 *
 * Collection starts after the `bookmark_start` whose id matches and stops at
 * the matching `bookmark_end` (or at the end of the paragraph when the end
 * marker is not among its direct children). Enclosed nodes are flattened with
 * the same rules as whole-paragraph text, so column breaks, hyperlink text and
 * field result text inside the bookmark are kept rather than dropped.
 *
 * @param paragraph - Paragraph expected to contain the bookmark.
 * @param bookmarkId - Id shared by the bookmark's start and end markers.
 * @returns The bookmarked text, or the full paragraph text when no matching
 *   start marker is found before the scan ends.
 */
function flattenBookmarkContent(
  paragraph: ParagraphNode,
  bookmarkId: string,
): string {
  let inside = false;
  const parts: string[] = [];
  for (const child of paragraph.children) {
    if (child.type === "bookmark_start" && child.bookmarkId === bookmarkId) {
      inside = true;
      continue;
    }
    if (child.type === "bookmark_end" && child.bookmarkId === bookmarkId) {
      break;
    }
    if (inside) {
      // Reuse the paragraph flattener so both code paths agree on what counts as text.
      parts.push(flattenParagraphInlineText([child]));
    }
  }
  // If no bookmark boundaries were found in this paragraph, return the full paragraph text.
  if (!inside) {
    return flattenParagraphInlineText(paragraph.children);
  }
  return parts.join("");
}
592
-
593
- // ─── Internal helpers ─────────────────────────────────────────────────────────
594
-
595
/**
 * Scan the runs (`r` elements) of a paragraph for complex fields delimited by
 * `fldChar` begin / separate / end markers and append one node per completed
 * field to `results`.
 *
 * State machine:
 * - `begin` starts a field (discarding any field still in progress).
 * - `instrText` runs seen before `separate` accumulate the instruction.
 * - `separate` marks where the field's result content starts.
 * - `end` emits the field; `contentXml` is the source slice between the
 *   `separate` run and the `end` run, or `""` when there was no `separate`.
 *
 * A run that carries a `fldChar` is never read for `instrText`.
 *
 * @param paragraph - Parsed paragraph element.
 * @param sourceXml - XML text the element offsets refer to.
 * @param results - Output array; completed fields are pushed in order.
 */
function extractComplexFieldsFromParagraph(
  paragraph: XmlElementNode,
  sourceXml: string,
  results: ParsedComplexFieldNode[],
): void {
  type FieldState = "idle" | "in-instr" | "in-content";
  let state: FieldState = "idle";
  let instruction: string[] = [];
  let fieldStart = -1;
  let contentStart = -1;
  let contentEnd = -1;

  for (const run of paragraph.children) {
    if (run.type !== "element" || localName(run.name) !== "r") continue;

    const marker = findFirstChildEl(run, "fldChar");
    const instrText = findFirstChildEl(run, "instrText");

    if (!marker) {
      if (instrText && state === "in-instr") {
        const pieces: string[] = [];
        for (const piece of instrText.children) {
          if (piece.type === "text") pieces.push(piece.text);
        }
        instruction.push(pieces.join(""));
      }
      continue;
    }

    const markerKind = (
      marker.attributes["w:fldCharType"] ??
      marker.attributes.fldCharType ??
      ""
    ).toLowerCase();

    switch (markerKind) {
      case "begin":
        state = "in-instr";
        instruction = [];
        fieldStart = run.start;
        contentStart = -1;
        contentEnd = -1;
        break;

      case "separate":
        if (state === "in-instr") {
          state = "in-content";
          contentStart = run.end;
        }
        break;

      case "end":
        if (state !== "idle") {
          if (state === "in-content") {
            contentEnd = run.start;
          }
          const hasContent = contentStart >= 0 && contentEnd >= contentStart;
          results.push({
            type: "field",
            fieldType: "complex",
            instruction: instruction.join("").trim(),
            contentXml: hasContent ? sourceXml.slice(contentStart, contentEnd) : "",
            start: fieldStart,
            end: run.end,
          });
        }
        state = "idle";
        instruction = [];
        break;

      default:
        break;
    }
  }
}
660
-
661
/**
 * Depth-first collection of bookmark markers below `node`.
 *
 * `bookmarkStart` / `bookmarkEnd` elements are parsed and, when the parser
 * yields a value, appended to `results`; they are not descended into. Every
 * other element is searched recursively.
 *
 * @param node - Element whose descendants are searched.
 * @param sourceXml - XML text handed through to the bookmark parsers.
 * @param results - Output array, filled in document order.
 */
function collectBookmarks(
  node: XmlElementNode,
  sourceXml: string,
  results: ParsedBookmarkNode[],
): void {
  for (const child of node.children) {
    if (child.type !== "element") continue;

    switch (localName(child.name)) {
      case "bookmarkStart": {
        const parsed = parseBookmarkStart(child, sourceXml);
        if (parsed) results.push(parsed);
        break;
      }
      case "bookmarkEnd": {
        const parsed = parseBookmarkEnd(child, sourceXml);
        if (parsed) results.push(parsed);
        break;
      }
      default:
        collectBookmarks(child, sourceXml, results);
        break;
    }
  }
}
680
-
681
/**
 * Return the first direct child element whose local (prefix-stripped) name
 * equals `childLocalName`, or `undefined` when there is none.
 */
function findFirstChild(node: XmlElementNode, childLocalName: string): XmlElementNode | undefined {
  for (const candidate of node.children) {
    if (candidate.type === "element" && localName(candidate.name) === childLocalName) {
      return candidate;
    }
  }
  return undefined;
}
686
-
687
/**
 * Return the first direct child element whose local (prefix-stripped) name
 * equals `childLocalName`, or `undefined` when there is none.
 *
 * Same lookup as `findFirstChild`; kept as a separate name for existing callers.
 */
function findFirstChildEl(node: XmlElementNode, childLocalName: string): XmlElementNode | undefined {
  return findFirstChild(node, childLocalName);
}
692
-
693
/**
 * Strip the namespace prefix from a qualified XML name: everything up to and
 * including the first `:` is removed. Names without a colon are returned as-is.
 */
function localName(name: string): string {
  // indexOf yields -1 when there is no colon, which makes the slice start at 0.
  return name.slice(name.indexOf(":") + 1);
}
697
-
698
- // ─── Minimal XML parser (same pattern as parse-tables.ts) ────────────────────
699
-
700
/**
 * Minimal, offset-preserving XML parser.
 *
 * Builds a tree of element and text nodes under a synthetic `__root__`
 * element. Every node records its `start`/`end` offsets into `xml`.
 *
 * - Comments and processing instructions are skipped.
 * - CDATA sections become text nodes with their content taken verbatim.
 * - Other text has its entities decoded; empty text is not recorded.
 * - A closing tag must match the innermost open element by local name.
 *
 * @param xml - XML source text.
 * @returns The synthetic root element.
 * @throws Error when a tag is missing its `>`, a closing tag does not match,
 *   or elements remain open at the end of the input.
 */
function parseXml(xml: string): XmlElementNode {
  const total = xml.length;
  const root: XmlElementNode = {
    type: "element",
    name: "__root__",
    attributes: {},
    children: [],
    start: 0,
    end: total,
  };
  const open: XmlElementNode[] = [root];
  const trailingSlash = /\/\s*$/;

  // Offset just past the next `terminator` at or after `from`, or end of input if absent.
  const offsetAfter = (terminator: string, from: number): number => {
    const at = xml.indexOf(terminator, from);
    return at >= 0 ? at + terminator.length : total;
  };

  let pos = 0;
  while (pos < total) {
    const parent = open[open.length - 1];

    if (xml.startsWith("<!--", pos)) {
      pos = offsetAfter("-->", pos);
      continue;
    }

    if (xml.startsWith("<?", pos)) {
      pos = offsetAfter("?>", pos);
      continue;
    }

    if (xml.startsWith("<![CDATA[", pos)) {
      const close = xml.indexOf("]]>", pos);
      const sectionEnd = close >= 0 ? close + 3 : total;
      parent?.children.push({
        type: "text",
        text: xml.slice(pos + 9, close >= 0 ? close : total),
        start: pos,
        end: sectionEnd,
      });
      pos = sectionEnd;
      continue;
    }

    if (xml[pos] !== "<") {
      const nextTag = xml.indexOf("<", pos);
      const textEnd = nextTag >= 0 ? nextTag : total;
      const text = decodeXmlEntities(xml.slice(pos, textEnd));
      if (text.length > 0) {
        parent?.children.push({ type: "text", text, start: pos, end: textEnd });
      }
      pos = textEnd;
      continue;
    }

    if (xml[pos + 1] === "/") {
      const gt = xml.indexOf(">", pos);
      if (gt < 0) throw new Error("Malformed XML: missing >.");
      const name = xml.slice(pos + 2, gt).trim();
      const closed = open.pop();
      if (!closed || localName(closed.name) !== localName(name)) {
        throw new Error(`Malformed XML: unexpected closing tag </${name}>.`);
      }
      // The element now spans through its closing tag.
      closed.end = gt + 1;
      pos = gt + 1;
      continue;
    }

    // Opening or self-closing tag.
    const tagEnd = findTagEnd(xml, pos);
    const tagBody = xml.slice(pos + 1, tagEnd);
    const selfClosing = trailingSlash.test(tagBody);
    const { name, attributes } = parseTag(tagBody.replace(trailingSlash, "").trim());
    const element: XmlElementNode = {
      type: "element",
      name,
      attributes,
      children: [],
      start: pos,
      end: tagEnd + 1,
    };
    parent?.children.push(element);
    if (!selfClosing) {
      open.push(element);
    }
    pos = tagEnd + 1;
  }

  if (open.length !== 1) throw new Error("Malformed XML: unclosed element.");
  return root;
}
777
-
778
/**
 * Split the inside of a start tag (without `<`, `>` or a trailing `/`) into
 * the element name and its attributes.
 *
 * Attribute values may be single- or double-quoted and have their entities
 * decoded. An attribute without `=` is stored with an empty string value.
 *
 * @param tagBody - Tag text, e.g. `w:p w:rsidR="00A1"`.
 * @returns The qualified element name and an attribute map.
 * @throws Error when an `=` is not followed by a quoted value.
 */
function parseTag(tagBody: string): { name: string; attributes: Record<string, string> } {
  const limit = tagBody.length;
  let pos = 0;

  // Move `pos` forward while the current character satisfies `keepGoing`.
  const advanceWhile = (keepGoing: (ch: string) => boolean): void => {
    while (pos < limit && keepGoing(tagBody[pos] ?? "")) pos += 1;
  };
  const isSpace = (ch: string): boolean => /\s/.test(ch);
  const skipSpaces = (): void => advanceWhile(isSpace);

  skipSpaces();
  const nameStart = pos;
  advanceWhile((ch) => !isSpace(ch));
  const name = tagBody.slice(nameStart, pos);

  const attributes: Record<string, string> = {};
  while (pos < limit) {
    skipSpaces();
    if (pos >= limit) break;

    const keyStart = pos;
    advanceWhile((ch) => !/[\s=]/.test(ch));
    const key = tagBody.slice(keyStart, pos);

    skipSpaces();
    if (tagBody[pos] !== "=") {
      // Valueless attribute.
      attributes[key] = "";
      continue;
    }
    pos += 1;

    skipSpaces();
    const quote = tagBody[pos];
    if (quote !== `"` && quote !== `'`) throw new Error(`Malformed XML attribute ${key}.`);
    pos += 1;

    const valueStart = pos;
    advanceWhile((ch) => ch !== quote);
    attributes[key] = decodeXmlEntities(tagBody.slice(valueStart, pos));
    pos += 1; // step over the closing quote
  }

  return { name, attributes };
}
806
-
807
/**
 * Find the `>` that closes the tag opening at `start`, ignoring any `>` that
 * appears inside a single- or double-quoted attribute value.
 *
 * @param xml - XML source text.
 * @param start - Offset of the tag's `<`.
 * @returns Offset of the closing `>`.
 * @throws Error when the input ends before an unquoted `>` is found.
 */
function findTagEnd(xml: string, start: number): number {
  let openQuote: string | null = null;
  for (let i = start + 1; i < xml.length; i += 1) {
    const ch = xml[i];
    if (openQuote) {
      if (ch === openQuote) openQuote = null;
    } else if (ch === `"` || ch === `'`) {
      openQuote = ch;
    } else if (ch === ">") {
      return i;
    }
  }
  throw new Error("Malformed XML: missing >.");
}
819
-
820
/**
 * Decode the five predefined XML entities and numeric character references
 * (decimal `&#N;` and hexadecimal `&#xN;`) in `value`.
 *
 * Anything else, including unknown named entities, is left untouched. Numeric
 * references above U+10FFFF are also left as written, because
 * `String.fromCodePoint` would throw a `RangeError` for them and abort the
 * whole parse over a single bad reference.
 *
 * @param value - Text or attribute value as it appears in the XML source.
 * @returns The decoded string.
 */
function decodeXmlEntities(value: string): string {
  return value.replace(
    /&(#x[0-9a-fA-F]+|#\d+|amp|lt|gt|quot|apos);/g,
    (match: string, entity: string): string => {
      switch (entity) {
        case "amp": return "&";
        case "lt": return "<";
        case "gt": return ">";
        case "quot": return `"`;
        case "apos": return `'`;
        default: {
          // The pattern only lets numeric references reach this branch.
          const isHex = entity.startsWith("#x");
          const codePoint = Number.parseInt(entity.slice(isHex ? 2 : 1), isHex ? 16 : 10);
          return codePoint <= 0x10ffff ? String.fromCodePoint(codePoint) : match;
        }
      }
    },
  );
}