@beyondwork/docx-react-component 1.0.27 → 1.0.29

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (356)
  1. package/dist/canonical-document-BLEbzL2J.d.cts +844 -0
  2. package/dist/canonical-document-BLEbzL2J.d.ts +844 -0
  3. package/dist/chunk-2FJS5GZM.js +763 -0
  4. package/dist/chunk-2FJS5GZM.js.map +1 -0
  5. package/{src/core/commands/section-layout-commands.ts → dist/chunk-2OQBZS3F.js} +106 -340
  6. package/dist/chunk-2OQBZS3F.js.map +1 -0
  7. package/dist/chunk-2S7W4KFO.js +127 -0
  8. package/dist/chunk-2S7W4KFO.js.map +1 -0
  9. package/dist/chunk-2TG72QSW.js +3874 -0
  10. package/dist/chunk-2TG72QSW.js.map +1 -0
  11. package/{src/core/commands/table-structure-commands.ts → dist/chunk-36QNIZBO.js} +126 -315
  12. package/dist/chunk-36QNIZBO.js.map +1 -0
  13. package/dist/chunk-4AQOYAW4.js +3069 -0
  14. package/dist/chunk-4AQOYAW4.js.map +1 -0
  15. package/dist/chunk-4D5EWJ3P.js +77 -0
  16. package/dist/chunk-4D5EWJ3P.js.map +1 -0
  17. package/dist/chunk-5FN54NDH.js +2257 -0
  18. package/dist/chunk-5FN54NDH.js.map +1 -0
  19. package/dist/chunk-BOYGQYRQ.js +7306 -0
  20. package/dist/chunk-BOYGQYRQ.js.map +1 -0
  21. package/dist/chunk-CN3XMECL.js +212 -0
  22. package/dist/chunk-CN3XMECL.js.map +1 -0
  23. package/dist/chunk-EBI3BX6U.js +164 -0
  24. package/dist/chunk-EBI3BX6U.js.map +1 -0
  25. package/dist/chunk-EILUG3VB.js +1275 -0
  26. package/dist/chunk-EILUG3VB.js.map +1 -0
  27. package/dist/chunk-FUDY333O.js +70 -0
  28. package/dist/chunk-FUDY333O.js.map +1 -0
  29. package/dist/chunk-GBVOWFIK.js +1237 -0
  30. package/dist/chunk-GBVOWFIK.js.map +1 -0
  31. package/dist/chunk-H4TQ3H3Y.js +262 -0
  32. package/dist/chunk-H4TQ3H3Y.js.map +1 -0
  33. package/{src/core/commands/style-commands.ts → dist/chunk-JGB3IXZO.js} +40 -113
  34. package/dist/chunk-JGB3IXZO.js.map +1 -0
  35. package/dist/chunk-KD2QRQPY.js +4342 -0
  36. package/dist/chunk-KD2QRQPY.js.map +1 -0
  37. package/dist/chunk-KLMXQVYK.js +369 -0
  38. package/dist/chunk-KLMXQVYK.js.map +1 -0
  39. package/dist/chunk-KZUG5KFQ.js +214 -0
  40. package/dist/chunk-KZUG5KFQ.js.map +1 -0
  41. package/{src/core/state/text-transaction.ts → dist/chunk-QDAQ4CJU.js} +79 -236
  42. package/dist/chunk-QDAQ4CJU.js.map +1 -0
  43. package/{src/legal/bookmarks.ts → dist/chunk-RMH72RZI.js} +44 -130
  44. package/dist/chunk-RMH72RZI.js.map +1 -0
  45. package/dist/chunk-SWKWQZXM.js +117 -0
  46. package/dist/chunk-SWKWQZXM.js.map +1 -0
  47. package/{src/core/commands/formatting-commands.ts → dist/chunk-TJBP2K4T.js} +196 -536
  48. package/dist/chunk-TJBP2K4T.js.map +1 -0
  49. package/dist/chunk-TLCEAQDQ.js +542 -0
  50. package/dist/chunk-TLCEAQDQ.js.map +1 -0
  51. package/{src/core/commands/text-commands.ts → dist/chunk-UZXBISGO.js} +86 -142
  52. package/dist/chunk-UZXBISGO.js.map +1 -0
  53. package/dist/chunk-WGBAKP3Q.js +3220 -0
  54. package/dist/chunk-WGBAKP3Q.js.map +1 -0
  55. package/dist/compare/index.cjs +5475 -0
  56. package/dist/compare/index.cjs.map +1 -0
  57. package/dist/compare/index.d.cts +114 -0
  58. package/dist/compare/index.d.ts +114 -0
  59. package/dist/compare/index.js +731 -0
  60. package/dist/compare/index.js.map +1 -0
  61. package/dist/core/commands/formatting-commands.cjs +828 -0
  62. package/dist/core/commands/formatting-commands.cjs.map +1 -0
  63. package/dist/core/commands/formatting-commands.d.cts +63 -0
  64. package/dist/core/commands/formatting-commands.d.ts +63 -0
  65. package/dist/core/commands/formatting-commands.js +37 -0
  66. package/dist/core/commands/formatting-commands.js.map +1 -0
  67. package/dist/core/commands/image-commands.cjs +2023 -0
  68. package/dist/core/commands/image-commands.cjs.map +1 -0
  69. package/dist/core/commands/image-commands.d.cts +58 -0
  70. package/dist/core/commands/image-commands.d.ts +58 -0
  71. package/dist/core/commands/image-commands.js +18 -0
  72. package/dist/core/commands/image-commands.js.map +1 -0
  73. package/dist/core/commands/section-layout-commands.cjs +477 -0
  74. package/dist/core/commands/section-layout-commands.cjs.map +1 -0
  75. package/dist/core/commands/section-layout-commands.d.cts +62 -0
  76. package/dist/core/commands/section-layout-commands.d.ts +62 -0
  77. package/dist/core/commands/section-layout-commands.js +21 -0
  78. package/dist/core/commands/section-layout-commands.js.map +1 -0
  79. package/dist/core/commands/style-commands.cjs +214 -0
  80. package/dist/core/commands/style-commands.cjs.map +1 -0
  81. package/dist/core/commands/style-commands.d.cts +13 -0
  82. package/dist/core/commands/style-commands.d.ts +13 -0
  83. package/dist/core/commands/style-commands.js +9 -0
  84. package/dist/core/commands/style-commands.js.map +1 -0
  85. package/dist/core/commands/table-structure-commands.cjs +1883 -0
  86. package/dist/core/commands/table-structure-commands.cjs.map +1 -0
  87. package/dist/core/commands/table-structure-commands.d.cts +59 -0
  88. package/dist/core/commands/table-structure-commands.d.ts +59 -0
  89. package/dist/core/commands/table-structure-commands.js +12 -0
  90. package/dist/core/commands/table-structure-commands.js.map +1 -0
  91. package/dist/core/commands/text-commands.cjs +2391 -0
  92. package/dist/core/commands/text-commands.cjs.map +1 -0
  93. package/dist/core/commands/text-commands.d.cts +24 -0
  94. package/dist/core/commands/text-commands.d.ts +24 -0
  95. package/dist/core/commands/text-commands.js +28 -0
  96. package/dist/core/commands/text-commands.js.map +1 -0
  97. package/dist/core/selection/mapping.cjs +200 -0
  98. package/dist/core/selection/mapping.cjs.map +1 -0
  99. package/dist/core/selection/mapping.d.cts +2 -0
  100. package/dist/core/selection/mapping.d.ts +2 -0
  101. package/dist/core/selection/mapping.js +31 -0
  102. package/dist/core/selection/mapping.js.map +1 -0
  103. package/dist/core/state/editor-state.cjs +2278 -0
  104. package/dist/core/state/editor-state.cjs.map +1 -0
  105. package/dist/core/state/editor-state.d.cts +2 -0
  106. package/dist/core/state/editor-state.d.ts +2 -0
  107. package/dist/core/state/editor-state.js +26 -0
  108. package/dist/core/state/editor-state.js.map +1 -0
  109. package/dist/index.cjs +38553 -0
  110. package/dist/index.cjs.map +1 -0
  111. package/dist/index.d.cts +15 -0
  112. package/dist/index.d.ts +15 -0
  113. package/dist/index.js +7856 -0
  114. package/dist/index.js.map +1 -0
  115. package/dist/io/docx-session.cjs +16236 -0
  116. package/dist/io/docx-session.cjs.map +1 -0
  117. package/dist/io/docx-session.d.cts +21 -0
  118. package/dist/io/docx-session.d.ts +21 -0
  119. package/dist/io/docx-session.js +18 -0
  120. package/dist/io/docx-session.js.map +1 -0
  121. package/dist/legal/index.cjs +3900 -0
  122. package/dist/legal/index.cjs.map +1 -0
  123. package/dist/legal/index.d.cts +86 -0
  124. package/dist/legal/index.d.ts +86 -0
  125. package/dist/legal/index.js +616 -0
  126. package/dist/legal/index.js.map +1 -0
  127. package/dist/public-types-7ZL_94cz.d.ts +1573 -0
  128. package/dist/public-types-CeMaDueh.d.cts +1573 -0
  129. package/dist/public-types.cjs +19 -0
  130. package/dist/public-types.cjs.map +1 -0
  131. package/dist/public-types.d.cts +2 -0
  132. package/dist/public-types.d.ts +2 -0
  133. package/dist/public-types.js +1 -0
  134. package/dist/public-types.js.map +1 -0
  135. package/dist/runtime/document-runtime.cjs +11140 -0
  136. package/dist/runtime/document-runtime.cjs.map +1 -0
  137. package/dist/runtime/document-runtime.d.cts +231 -0
  138. package/dist/runtime/document-runtime.d.ts +231 -0
  139. package/dist/runtime/document-runtime.js +21 -0
  140. package/dist/runtime/document-runtime.js.map +1 -0
  141. package/dist/structural-helpers-CilgOVhh.d.cts +10 -0
  142. package/dist/structural-helpers-q0Gd-eBN.d.ts +10 -0
  143. package/dist/ui-tailwind/editor-surface/search-plugin.cjs +313 -0
  144. package/dist/ui-tailwind/editor-surface/search-plugin.cjs.map +1 -0
  145. package/dist/ui-tailwind/editor-surface/search-plugin.d.cts +67 -0
  146. package/dist/ui-tailwind/editor-surface/search-plugin.d.ts +67 -0
  147. package/dist/ui-tailwind/editor-surface/search-plugin.js +23 -0
  148. package/dist/ui-tailwind/editor-surface/search-plugin.js.map +1 -0
  149. package/dist/ui-tailwind/index.cjs +4833 -0
  150. package/dist/ui-tailwind/index.cjs.map +1 -0
  151. package/dist/ui-tailwind/index.d.cts +617 -0
  152. package/dist/ui-tailwind/index.d.ts +617 -0
  153. package/dist/ui-tailwind/index.js +575 -0
  154. package/dist/ui-tailwind/index.js.map +1 -0
  155. package/package.json +64 -54
  156. package/src/README.md +0 -85
  157. package/src/api/README.md +0 -26
  158. package/src/api/public-types.ts +0 -1418
  159. package/src/api/session-state.ts +0 -60
  160. package/src/compare/diff-engine.ts +0 -623
  161. package/src/compare/export-redlines.ts +0 -280
  162. package/src/compare/index.ts +0 -25
  163. package/src/compare/snapshot.ts +0 -97
  164. package/src/component-inventory.md +0 -99
  165. package/src/core/README.md +0 -10
  166. package/src/core/commands/README.md +0 -3
  167. package/src/core/commands/image-commands.ts +0 -373
  168. package/src/core/commands/index.ts +0 -1757
  169. package/src/core/commands/list-commands.ts +0 -565
  170. package/src/core/commands/paragraph-layout-commands.ts +0 -339
  171. package/src/core/commands/review-commands.ts +0 -108
  172. package/src/core/commands/structural-helpers.ts +0 -309
  173. package/src/core/schema/README.md +0 -3
  174. package/src/core/schema/text-schema.ts +0 -516
  175. package/src/core/search/search-text.ts +0 -357
  176. package/src/core/selection/README.md +0 -3
  177. package/src/core/selection/mapping.ts +0 -289
  178. package/src/core/selection/review-anchors.ts +0 -183
  179. package/src/core/state/README.md +0 -3
  180. package/src/core/state/editor-state.ts +0 -892
  181. package/src/formats/xlsx/io/parse-shared-strings.ts +0 -41
  182. package/src/formats/xlsx/io/parse-sheet.ts +0 -459
  183. package/src/formats/xlsx/io/parse-styles.ts +0 -59
  184. package/src/formats/xlsx/io/parse-workbook.ts +0 -75
  185. package/src/formats/xlsx/io/serialize-shared-strings.ts +0 -72
  186. package/src/formats/xlsx/io/serialize-sheet.ts +0 -333
  187. package/src/formats/xlsx/io/serialize-styles.ts +0 -98
  188. package/src/formats/xlsx/io/serialize-workbook.ts +0 -429
  189. package/src/formats/xlsx/io/xlsx-session.ts +0 -314
  190. package/src/formats/xlsx/model/cell.ts +0 -189
  191. package/src/formats/xlsx/model/sheet.ts +0 -326
  192. package/src/formats/xlsx/model/styles.ts +0 -118
  193. package/src/formats/xlsx/model/workbook.ts +0 -453
  194. package/src/formats/xlsx/runtime/cell-commands.ts +0 -567
  195. package/src/formats/xlsx/runtime/sheet-commands.ts +0 -206
  196. package/src/formats/xlsx/runtime/workbook-runtime.ts +0 -177
  197. package/src/formats/xlsx/runtime/workbook-transaction.ts +0 -822
  198. package/src/index.ts +0 -101
  199. package/src/io/README.md +0 -10
  200. package/src/io/docx-session.ts +0 -2882
  201. package/src/io/export/README.md +0 -3
  202. package/src/io/export/export-session.ts +0 -220
  203. package/src/io/export/minimal-docx.ts +0 -115
  204. package/src/io/export/reattach-preserved-parts.ts +0 -54
  205. package/src/io/export/serialize-comments.ts +0 -947
  206. package/src/io/export/serialize-footnotes.ts +0 -399
  207. package/src/io/export/serialize-headers-footers.ts +0 -372
  208. package/src/io/export/serialize-main-document.ts +0 -1376
  209. package/src/io/export/serialize-numbering.ts +0 -118
  210. package/src/io/export/serialize-revisions.ts +0 -389
  211. package/src/io/export/serialize-runtime-revisions.ts +0 -269
  212. package/src/io/export/serialize-tables.ts +0 -174
  213. package/src/io/export/split-review-boundaries.ts +0 -356
  214. package/src/io/normalize/README.md +0 -3
  215. package/src/io/normalize/normalize-text.ts +0 -639
  216. package/src/io/ooxml/README.md +0 -3
  217. package/src/io/ooxml/highlight-colors.ts +0 -39
  218. package/src/io/ooxml/numbering-sentinels.ts +0 -44
  219. package/src/io/ooxml/parse-comments.ts +0 -846
  220. package/src/io/ooxml/parse-complex-content.ts +0 -287
  221. package/src/io/ooxml/parse-fields.ts +0 -834
  222. package/src/io/ooxml/parse-footnotes.ts +0 -896
  223. package/src/io/ooxml/parse-headers-footers.ts +0 -1169
  224. package/src/io/ooxml/parse-inline-media.ts +0 -461
  225. package/src/io/ooxml/parse-main-document.ts +0 -2877
  226. package/src/io/ooxml/parse-numbering.ts +0 -432
  227. package/src/io/ooxml/parse-revisions.ts +0 -931
  228. package/src/io/ooxml/parse-settings.ts +0 -184
  229. package/src/io/ooxml/parse-shapes.ts +0 -296
  230. package/src/io/ooxml/parse-styles.ts +0 -463
  231. package/src/io/ooxml/parse-tables.ts +0 -618
  232. package/src/io/ooxml/parse-theme.ts +0 -346
  233. package/src/io/ooxml/part-manifest.ts +0 -136
  234. package/src/io/ooxml/revision-boundaries.ts +0 -351
  235. package/src/io/opc/README.md +0 -3
  236. package/src/io/opc/corrupt-package.ts +0 -166
  237. package/src/io/opc/docx-package.ts +0 -74
  238. package/src/io/opc/package-reader.ts +0 -325
  239. package/src/io/opc/package-writer.ts +0 -273
  240. package/src/io/source-package-provenance.ts +0 -241
  241. package/src/legal/cross-references.ts +0 -414
  242. package/src/legal/defined-terms.ts +0 -203
  243. package/src/legal/index.ts +0 -32
  244. package/src/legal/signature-blocks.ts +0 -259
  245. package/src/model/README.md +0 -3
  246. package/src/model/canonical-document.ts +0 -2632
  247. package/src/model/cds-1.0.0.ts +0 -212
  248. package/src/model/snapshot.ts +0 -649
  249. package/src/preservation/README.md +0 -3
  250. package/src/preservation/markup-compatibility.ts +0 -48
  251. package/src/preservation/opaque-fragment-store.ts +0 -89
  252. package/src/preservation/opaque-region.ts +0 -233
  253. package/src/preservation/package-preservation.ts +0 -113
  254. package/src/preservation/preserved-part-manifest.ts +0 -56
  255. package/src/preservation/relationship-retention.ts +0 -57
  256. package/src/preservation/store.ts +0 -185
  257. package/src/review/README.md +0 -16
  258. package/src/review/store/README.md +0 -3
  259. package/src/review/store/comment-anchors.ts +0 -70
  260. package/src/review/store/comment-remapping.ts +0 -154
  261. package/src/review/store/comment-store.ts +0 -331
  262. package/src/review/store/comment-thread.ts +0 -109
  263. package/src/review/store/revision-actions.ts +0 -394
  264. package/src/review/store/revision-store.ts +0 -312
  265. package/src/review/store/revision-types.ts +0 -171
  266. package/src/review/store/runtime-comment-store.ts +0 -43
  267. package/src/runtime/README.md +0 -3
  268. package/src/runtime/ai-action-policy.ts +0 -764
  269. package/src/runtime/collab-review-sync.ts +0 -254
  270. package/src/runtime/document-layout.ts +0 -332
  271. package/src/runtime/document-navigation.ts +0 -603
  272. package/src/runtime/document-runtime.ts +0 -3159
  273. package/src/runtime/document-search.ts +0 -145
  274. package/src/runtime/numbering-prefix.ts +0 -216
  275. package/src/runtime/page-layout-estimation.ts +0 -212
  276. package/src/runtime/read-only-diagnostics-runtime.ts +0 -241
  277. package/src/runtime/review-runtime.ts +0 -44
  278. package/src/runtime/revision-runtime.ts +0 -107
  279. package/src/runtime/session-capabilities.ts +0 -192
  280. package/src/runtime/story-context.ts +0 -164
  281. package/src/runtime/story-targeting.ts +0 -162
  282. package/src/runtime/surface-projection.ts +0 -1357
  283. package/src/runtime/table-commands.ts +0 -173
  284. package/src/runtime/table-schema.ts +0 -309
  285. package/src/runtime/view-state.ts +0 -477
  286. package/src/runtime/virtualized-rendering.ts +0 -258
  287. package/src/runtime/workflow-markup.ts +0 -353
  288. package/src/ui/README.md +0 -30
  289. package/src/ui/WordReviewEditor.tsx +0 -4097
  290. package/src/ui/browser-export.ts +0 -52
  291. package/src/ui/comments/README.md +0 -3
  292. package/src/ui/compatibility/README.md +0 -3
  293. package/src/ui/editor-command-bag.ts +0 -120
  294. package/src/ui/editor-runtime-boundary.ts +0 -1457
  295. package/src/ui/editor-shell-view.tsx +0 -142
  296. package/src/ui/editor-surface/README.md +0 -3
  297. package/src/ui/editor-surface-controller.tsx +0 -63
  298. package/src/ui/headless/comment-decoration-model.ts +0 -124
  299. package/src/ui/headless/preserve-editor-selection.ts +0 -5
  300. package/src/ui/headless/revision-decoration-model.ts +0 -128
  301. package/src/ui/headless/selection-helpers.ts +0 -54
  302. package/src/ui/headless/selection-toolbar-model.ts +0 -34
  303. package/src/ui/headless/use-editor-keyboard.ts +0 -103
  304. package/src/ui/review/README.md +0 -3
  305. package/src/ui/runtime-snapshot-selectors.ts +0 -197
  306. package/src/ui/shared/revision-filters.ts +0 -31
  307. package/src/ui/status/README.md +0 -3
  308. package/src/ui/theme/README.md +0 -3
  309. package/src/ui/toolbar/README.md +0 -3
  310. package/src/ui/workflow-surface-blocked-rails.ts +0 -94
  311. package/src/ui-tailwind/chrome/tw-alert-banner.tsx +0 -64
  312. package/src/ui-tailwind/chrome/tw-image-context-toolbar.tsx +0 -129
  313. package/src/ui-tailwind/chrome/tw-layout-panel.tsx +0 -114
  314. package/src/ui-tailwind/chrome/tw-object-context-toolbar.tsx +0 -34
  315. package/src/ui-tailwind/chrome/tw-page-ruler.tsx +0 -386
  316. package/src/ui-tailwind/chrome/tw-selection-toolbar.tsx +0 -186
  317. package/src/ui-tailwind/chrome/tw-suggestion-card.tsx +0 -139
  318. package/src/ui-tailwind/chrome/tw-table-context-toolbar.tsx +0 -128
  319. package/src/ui-tailwind/chrome/tw-unsaved-modal.tsx +0 -58
  320. package/src/ui-tailwind/chrome/use-before-unload.ts +0 -20
  321. package/src/ui-tailwind/editor-surface/perf-probe.ts +0 -179
  322. package/src/ui-tailwind/editor-surface/pm-collab-plugins.ts +0 -40
  323. package/src/ui-tailwind/editor-surface/pm-command-bridge.ts +0 -178
  324. package/src/ui-tailwind/editor-surface/pm-contextual-ui.ts +0 -31
  325. package/src/ui-tailwind/editor-surface/pm-decorations.ts +0 -427
  326. package/src/ui-tailwind/editor-surface/pm-position-map.ts +0 -123
  327. package/src/ui-tailwind/editor-surface/pm-schema.ts +0 -876
  328. package/src/ui-tailwind/editor-surface/pm-state-from-snapshot.ts +0 -504
  329. package/src/ui-tailwind/editor-surface/search-plugin.ts +0 -168
  330. package/src/ui-tailwind/editor-surface/surface-build-keys.ts +0 -61
  331. package/src/ui-tailwind/editor-surface/tw-caret.tsx +0 -12
  332. package/src/ui-tailwind/editor-surface/tw-editor-surface.tsx +0 -150
  333. package/src/ui-tailwind/editor-surface/tw-inline-token.tsx +0 -129
  334. package/src/ui-tailwind/editor-surface/tw-opaque-block.tsx +0 -58
  335. package/src/ui-tailwind/editor-surface/tw-paragraph-block.tsx +0 -151
  336. package/src/ui-tailwind/editor-surface/tw-prosemirror-surface.tsx +0 -973
  337. package/src/ui-tailwind/editor-surface/tw-segment-view.tsx +0 -111
  338. package/src/ui-tailwind/editor-surface/tw-table-node-view.tsx +0 -436
  339. package/src/ui-tailwind/index.ts +0 -62
  340. package/src/ui-tailwind/page-chrome-model.ts +0 -27
  341. package/src/ui-tailwind/review/tw-comment-sidebar.tsx +0 -406
  342. package/src/ui-tailwind/review/tw-health-panel.tsx +0 -149
  343. package/src/ui-tailwind/review/tw-review-rail.tsx +0 -120
  344. package/src/ui-tailwind/review/tw-revision-sidebar.tsx +0 -164
  345. package/src/ui-tailwind/status/tw-status-bar.tsx +0 -61
  346. package/src/ui-tailwind/toolbar/tw-toolbar-icon-button.tsx +0 -52
  347. package/src/ui-tailwind/toolbar/tw-toolbar.tsx +0 -1064
  348. package/src/ui-tailwind/tw-review-workspace.tsx +0 -1417
  349. package/src/validation/README.md +0 -3
  350. package/src/validation/compatibility-engine.ts +0 -634
  351. package/src/validation/compatibility-report.ts +0 -161
  352. package/src/validation/diagnostics.ts +0 -204
  353. package/src/validation/docx-comment-proof.ts +0 -707
  354. package/src/validation/import-diagnostics.ts +0 -128
  355. package/src/validation/low-priority-word-surfaces.ts +0 -373
  356. /package/{src → dist}/ui-tailwind/theme/editor-theme.css +0 -0
@@ -1,834 +0,0 @@
1
- /**
2
- * parse-fields.ts
3
- *
4
- * Standalone parsers for OOXML field codes (w:fldSimple, complex fldChar sequences)
5
- * and bookmarks (w:bookmarkStart / w:bookmarkEnd).
6
- *
7
- * These types mirror the canonical FieldNode / BookmarkStartNode / BookmarkEndNode
8
- * shapes from canonical-document.ts, but carry raw XML for preservation and are
9
- * pre-normalization (no fragmentId / warningId yet).
10
- *
11
- * Usage: call parseFieldsFromParagraphXml() or parseBookmarksFromXml() for
12
- * independent field/bookmark extraction. The functions are designed to be
13
- * imported by parse-main-document.ts when full pipeline integration is ready.
14
- */
15
-
16
- // ─── Parsed types ────────────────────────────────────────────────────────────
17
-
18
/**
 * A `<w:fldSimple>` field as read from the XML, before normalization.
 */
export interface ParsedSimpleFieldNode {
  type: "field";
  fieldType: "simple";
  /** Trimmed value of the element's `w:instr` (or unprefixed `instr`) attribute. */
  instruction: string;
  /** Raw XML of the content runs inside <w:fldSimple>. */
  contentXml: string;
  /** Slice of the source XML covering the whole `<w:fldSimple>` element. */
  rawXml: string;
}
26
-
27
/**
 * A complex field (begin / instrText / separate / content / end `fldChar`
 * sequence) as read from the XML, before normalization.
 */
export interface ParsedComplexFieldNode {
  type: "field";
  fieldType: "complex";
  /** Field instruction text. */
  instruction: string;
  /** Raw XML of the content runs between the "separate" and "end" fldChar. */
  contentXml: string;
  /** Start index in the source document XML. */
  start: number;
  /** End index (exclusive) in the source document XML. */
  end: number;
}
38
-
39
/** Any field produced by the standalone parsers; discriminate on `fieldType`. */
export type ParsedFieldNode =
  | ParsedSimpleFieldNode
  | ParsedComplexFieldNode;
40
-
41
/**
 * A `<w:bookmarkStart>` marker as read from the XML, before normalization.
 */
export interface ParsedBookmarkStartNode {
  type: "bookmark_start";
  /** Value of the element's `w:id` (or unprefixed `id`) attribute. */
  bookmarkId: string;
  /** Value of the element's `w:name` (or unprefixed `name`) attribute; empty when absent. */
  name: string;
  /** Slice of the source XML covering the marker element. */
  rawXml: string;
}
47
-
48
/**
 * A `<w:bookmarkEnd>` marker as read from the XML, before normalization.
 */
export interface ParsedBookmarkEndNode {
  type: "bookmark_end";
  /** Value of the element's `w:id` (or unprefixed `id`) attribute. */
  bookmarkId: string;
  /** Slice of the source XML covering the marker element. */
  rawXml: string;
}
53
-
54
/** Either half of a bookmark pair; discriminate on `type`. */
export type ParsedBookmarkNode =
  | ParsedBookmarkStartNode
  | ParsedBookmarkEndNode;
55
-
56
- // ─── Internal XML types ───────────────────────────────────────────────────────
57
-
58
/** Element node of the internal XML tree used by the parsers in this file. */
interface XmlElementNode {
  type: "element";
  /** Element name as written in the XML; callers pass it through `localName` before comparing. */
  name: string;
  /** Attribute values keyed by attribute name as written (e.g. `"w:id"`). */
  attributes: Record<string, string>;
  children: XmlNode[];
  /** Start offset of this element in the source XML string. */
  start: number;
  /** End offset of this element in the source XML string (used as the exclusive bound of `slice`). */
  end: number;
}
66
-
67
/** Text node of the internal XML tree used by the parsers in this file. */
interface XmlTextNode {
  type: "text";
  text: string;
  // Presumably offsets into the source XML string, like XmlElementNode — confirm against parseXml.
  start: number;
  end: number;
}
73
-
74
/** Any node of the internal XML tree; discriminate on `type`. */
type XmlNode =
  | XmlElementNode
  | XmlTextNode;
75
-
76
- // ─── Public API ───────────────────────────────────────────────────────────────
77
-
78
/**
 * Collect the simple fields and bookmark markers found among the children of
 * a single paragraph element.
 *
 * Only the immediate children of the element returned by
 * `findFirstChild(root, "p")` (or of the parsed root when that lookup yields
 * nothing) are inspected. Complex fields that span paragraphs are not fully
 * resolved here; use extractComplexFieldsFromBodyXml for body-level extraction.
 *
 * @param paragraphXml Raw XML string of a <w:p> element.
 * @returns The `<w:fldSimple>` fields and the bookmark start/end markers, each
 *   in the order they were encountered.
 */
export function parseFieldsFromParagraphXml(paragraphXml: string): {
  simpleFields: ParsedSimpleFieldNode[];
  bookmarks: ParsedBookmarkNode[];
} {
  const parsedRoot = parseXml(paragraphXml);
  const container = findFirstChild(parsedRoot, "p") ?? parsedRoot;

  const simpleFields: ParsedSimpleFieldNode[] = [];
  const bookmarks: ParsedBookmarkNode[] = [];

  for (const node of container.children) {
    if (node.type !== "element") continue;

    // Dispatch on the namespace-stripped element name.
    switch (localName(node.name)) {
      case "fldSimple": {
        const parsedField = parseFldSimple(node, paragraphXml);
        if (parsedField) simpleFields.push(parsedField);
        break;
      }
      case "bookmarkStart": {
        const marker = parseBookmarkStart(node, paragraphXml);
        if (marker) bookmarks.push(marker);
        break;
      }
      case "bookmarkEnd": {
        const marker = parseBookmarkEnd(node, paragraphXml);
        if (marker) bookmarks.push(marker);
        break;
      }
      default:
        break;
    }
  }

  return { simpleFields, bookmarks };
}
114
-
115
/**
 * Extract complex field sequences from a body element XML string.
 * A complex field is a begin / instrText* / separate / content / end sequence
 * spread across multiple <w:r> siblings.
 *
 * Only `p` elements that are immediate children of the scan target are
 * visited. The scan target is the first of: the `body` lookup, the `document`
 * lookup, or the parsed root itself.
 *
 * @param bodyXml Raw XML string of a <w:body> element (or full document).
 * @returns Every complex field collected from the visited paragraphs.
 */
export function extractComplexFieldsFromBodyXml(bodyXml: string): ParsedComplexFieldNode[] {
  const parsedRoot = parseXml(bodyXml);
  const collected: ParsedComplexFieldNode[] = [];

  const container =
    findFirstChild(parsedRoot, "body") ?? findFirstChild(parsedRoot, "document") ?? parsedRoot;

  container.children.forEach((block) => {
    if (block.type === "element" && localName(block.name) === "p") {
      extractComplexFieldsFromParagraph(block, bodyXml, collected);
    }
  });

  return collected;
}
138
-
139
/**
 * Parse all bookmark start/end nodes from a full document or body XML.
 *
 * @param bodyXml Raw XML string to scan.
 * @returns The bookmark markers gathered by `collectBookmarks` from the parsed tree.
 */
export function extractBookmarksFromBodyXml(bodyXml: string): ParsedBookmarkNode[] {
  const collected: ParsedBookmarkNode[] = [];
  collectBookmarks(parseXml(bodyXml), bodyXml, collected);
  return collected;
}
148
-
149
- // ─── Element-level parsers (exported for unit testing) ────────────────────────
150
-
151
/**
 * Build a ParsedSimpleFieldNode from an already-parsed `<w:fldSimple>` element.
 *
 * @param element Parsed element; `start`/`end` and the children's offsets index into `sourceXml`.
 * @param sourceXml The XML string the element was parsed from.
 * @returns The parsed field. The signature allows `undefined`, but this
 *   implementation always returns a node.
 */
export function parseFldSimple(
  element: { attributes: Record<string, string>; children: XmlNode[]; start: number; end: number },
  sourceXml: string,
): ParsedSimpleFieldNode | undefined {
  const { attributes, children, start, end } = element;
  const rawInstruction = attributes["w:instr"] ?? attributes.instr ?? "";

  // Concatenate the source text of element children only; text nodes are skipped.
  let contentXml = "";
  for (const child of children) {
    if (child.type === "element") {
      contentXml += sourceXml.slice(child.start, child.end);
    }
  }

  return {
    type: "field",
    fieldType: "simple",
    instruction: rawInstruction.trim(),
    contentXml,
    rawXml: sourceXml.slice(start, end),
  };
}
168
-
169
/**
 * Build a ParsedBookmarkStartNode from an already-parsed `<w:bookmarkStart>` element.
 *
 * @param element Parsed element; `start`/`end` index into `sourceXml`.
 * @param sourceXml The XML string the element was parsed from.
 * @returns The parsed marker, or `undefined` when the element has no (or an empty) id.
 */
export function parseBookmarkStart(
  element: { attributes: Record<string, string>; start: number; end: number },
  sourceXml: string,
): ParsedBookmarkStartNode | undefined {
  const { attributes } = element;
  const bookmarkId = attributes["w:id"] ?? attributes.id ?? "";

  if (bookmarkId) {
    return {
      type: "bookmark_start",
      bookmarkId,
      // A missing name is tolerated and recorded as an empty string.
      name: attributes["w:name"] ?? attributes.name ?? "",
      rawXml: sourceXml.slice(element.start, element.end),
    };
  }
  return undefined;
}
183
-
184
/**
 * Build a ParsedBookmarkEndNode from an already-parsed `<w:bookmarkEnd>` element.
 *
 * @param element Parsed element; `start`/`end` index into `sourceXml`.
 * @param sourceXml The XML string the element was parsed from.
 * @returns The parsed marker, or `undefined` when the element has no (or an empty) id.
 */
export function parseBookmarkEnd(
  element: { attributes: Record<string, string>; start: number; end: number },
  sourceXml: string,
): ParsedBookmarkEndNode | undefined {
  const { attributes, start, end } = element;
  const bookmarkId = attributes["w:id"] ?? attributes.id ?? "";

  if (bookmarkId) {
    return {
      type: "bookmark_end",
      bookmarkId,
      rawXml: sourceXml.slice(start, end),
    };
  }
  return undefined;
}
196
-
197
- // ─── Field family classification ─────────────────────────────────────────────
198
-
199
- import type {
200
- CanonicalDocument,
201
- DocumentNode,
202
- FieldFamily,
203
- FieldNode,
204
- FieldRegistry,
205
- FieldRegistryEntry,
206
- FieldRefreshStatus,
207
- InlineNode,
208
- ParagraphNode,
209
- SubPartsCatalog,
210
- SupportedFieldFamily,
211
- TocEntry,
212
- TocStructure,
213
- } from "../../model/canonical-document.ts";
214
-
215
/**
 * Matches the leading keyword of a field instruction, case-insensitively and
 * after optional leading whitespace. Capture group 1 holds the keyword as it
 * was written in the instruction.
 */
const FIELD_FAMILY_PATTERN =
  /^\s*(REF|PAGEREF|NOTEREF|TOC|PAGE|NUMPAGES|DATE|TIME|AUTHOR|FILENAME|MERGEFIELD|IF|SEQ|INDEX|TC|STYLEREF)\b/i;

/** Upper-case family names that belong to the supported slice. */
const SUPPORTED_FAMILIES = new Set<string>([
  "REF",
  "PAGEREF",
  "NOTEREF",
  "TOC",
]);
219
-
220
/**
 * Classify a field instruction into its field family.
 *
 * The family is the instruction's leading keyword as matched by
 * FIELD_FAMILY_PATTERN, upper-cased. For REF / PAGEREF / NOTEREF the first
 * argument after the keyword is returned as `target`; it may be quoted or bare.
 * A bare token that starts with a backslash is a field switch (for example
 * `\h`), not a bookmark name, so it is never reported as the target.
 *
 * @param instruction Field instruction text; surrounding whitespace is ignored.
 * @returns The family, whether it is in the supported slice, and the target
 *   when one was found. `{ family: "UNKNOWN", supported: false }` is returned
 *   when the keyword is not recognized.
 */
export function classifyFieldInstruction(instruction: string): {
  family: FieldFamily;
  supported: boolean;
  target?: string;
} {
  const trimmed = instruction.trim();
  const keyword = FIELD_FAMILY_PATTERN.exec(trimmed)?.[1];
  if (keyword === undefined) {
    return { family: "UNKNOWN", supported: false };
  }

  // The pattern only admits the keywords it lists, so the upper-cased capture
  // is expected to be a FieldFamily member (the union itself is declared elsewhere).
  const family = keyword.toUpperCase() as FieldFamily;
  const supported = SUPPORTED_FAMILIES.has(family);

  let target: string | undefined;
  if (family === "REF" || family === "PAGEREF" || family === "NOTEREF") {
    // Group 1: quoted argument. Group 2: bare argument that does not begin
    // with "\" — otherwise `REF \h` would report the switch as its target.
    const targetMatch = /^\s*(?:REF|PAGEREF|NOTEREF)\s+(?:"([^"]+)"|([^\s\\]\S*))/i.exec(trimmed);
    target = (targetMatch?.[1] ?? targetMatch?.[2])?.trim();
  }

  return { family, supported, target };
}
246
-
247
/**
 * Type guard: reports whether `family` is one of the families listed in
 * SUPPORTED_FAMILIES, i.e. part of the supported refresh slice.
 */
export function isSupportedFieldFamily(family: FieldFamily): family is SupportedFieldFamily {
  const inSupportedSlice = SUPPORTED_FAMILIES.has(family);
  return inSupportedSlice;
}
253
-
254
- // ─── Field registry builder ─────────────────────────────────────────────────
255
-
256
/**
 * Build a field registry from a canonical document, cataloging every field
 * instance with its classification, dependency metadata, and refresh status.
 *
 * The registry partitions fields into `supported` (REF, PAGEREF, NOTEREF, TOC)
 * and `preserveOnly` (all others) slices. Fields of the main content are
 * visited first, then fields of `subParts` when present; `fieldIndex` counts
 * across both walks.
 *
 * @param document Document content and styles, optionally with sub-parts.
 * @returns The two slices, plus `tocStructure` when the main content contains
 *   a supported TOC field.
 */
export function buildFieldRegistry(
  document: Pick<CanonicalDocument, "content" | "styles"> & {
    subParts?: SubPartsCatalog;
  },
): FieldRegistry {
  const supported: FieldRegistryEntry[] = [];
  const preserveOnly: FieldRegistryEntry[] = [];
  let fieldIndex = 0;
  let tocInstruction: string | undefined;

  // Classify one field, append its entry to the matching slice and advance the
  // running index. `trackToc` is true only for the main-content walk: the first
  // supported TOC instruction seen there seeds the TOC structure, while TOC
  // fields found in sub-parts are cataloged but never used for it.
  const recordField = (field: FieldNode, paragraphIndex: number, trackToc: boolean): void => {
    // Prefer the classification already stored on the node; otherwise derive
    // it from the instruction text.
    const classification = field.fieldFamily
      ? {
          family: field.fieldFamily,
          supported: isSupportedFieldFamily(field.fieldFamily),
          target: field.fieldTarget,
        }
      : classifyFieldInstruction(field.instruction);
    const displayText = flattenFieldText(field.children);

    const entry: FieldRegistryEntry = {
      fieldIndex,
      fieldFamily: classification.family,
      supported: classification.supported,
      instruction: field.instruction,
      ...(classification.target ? { fieldTarget: classification.target } : {}),
      displayText,
      paragraphIndex,
      refreshStatus: field.refreshStatus ?? (classification.supported ? "stale" : "preserve-only"),
    };

    if (classification.supported) {
      supported.push(entry);
      if (trackToc && classification.family === "TOC" && !tocInstruction) {
        tocInstruction = field.instruction;
      }
    } else {
      preserveOnly.push(entry);
    }
    fieldIndex += 1;
  };

  walkFieldDocument(document.content, (node, pIdx) => {
    if (node.type === "field") recordField(node, pIdx, true);
  });

  if (document.subParts) {
    walkSubPartFields(document.subParts, (node, pIdx) => {
      if (node.type === "field") recordField(node, pIdx, false);
    });
  }

  const tocStructure = tocInstruction
    ? buildTocStructure(document, tocInstruction)
    : undefined;

  return {
    supported,
    preserveOnly,
    ...(tocStructure ? { tocStructure } : {}),
  };
}
341
-
342
/**
 * Extract the heading level range requested by a TOC field instruction.
 *
 * The range is read from an `\o "<from>-<to>"` switch (for example
 * `\o "1-3"`); both bounds are parsed as base-10 integers. When the
 * instruction carries no such switch the full range 1-9 is returned.
 *
 * @param instruction Raw TOC field instruction text.
 * @returns The inclusive `from`/`to` level bounds.
 */
export function parseTocLevelRange(instruction: string): { from: number; to: number } {
  const outlineSwitch = /\\o\s+"(\d+)-(\d+)"/.exec(instruction);
  if (outlineSwitch === null) {
    return { from: 1, to: 9 };
  }
  const [, fromText, toText] = outlineSwitch;
  return {
    from: Number.parseInt(fromText, 10),
    to: Number.parseInt(toText, 10),
  };
}
354
-
355
/**
 * Derive a TocStructure from the heading paragraphs of a document and a
 * TOC field instruction.
 *
 * Every paragraph reached by `walkFieldDocument` is considered. A paragraph
 * becomes a TOC entry when it has an outline level (its own, or failing that
 * the one declared by its paragraph style), that level falls inside the range
 * parsed from the instruction, and its flattened text is not blank.
 *
 * @param document Document content plus the style catalog used for lookups.
 * @param instruction The TOC field instruction the structure is built for.
 * @returns The instruction, its level range, and the collected entries; the
 *          status is always reported as "stale".
 */
export function buildTocStructure(
  document: Pick<CanonicalDocument, "content" | "styles">,
  instruction: string,
): TocStructure {
  const levelRange = parseTocLevelRange(instruction);
  const entries: TocEntry[] = [];

  walkFieldDocument(document.content, (node, paragraphIndex) => {
    if (node.type !== "paragraph") return;
    const paragraph = node as ParagraphNode;

    // The paragraph's own outline level wins; the style's level is a fallback.
    let outlineLevel: number | undefined = paragraph.outlineLevel;
    if (outlineLevel === undefined && paragraph.styleId) {
      const styleLevel = document.styles.paragraphs[paragraph.styleId]?.outlineLevel;
      if (styleLevel !== undefined) {
        outlineLevel = styleLevel;
      }
    }
    if (outlineLevel === undefined) return;

    // Stored outline levels are 0-based; TOC switches count from 1.
    const tocLevel = outlineLevel + 1;
    if (tocLevel < levelRange.from || tocLevel > levelRange.to) return;

    const headingText = flattenParagraphInlineText(paragraph.children).trim();
    if (headingText.length === 0) return;

    // Use the first named bookmark that starts directly inside the paragraph.
    let bookmarkName: string | undefined;
    for (const inline of paragraph.children) {
      if (inline.type === "bookmark_start" && inline.name) {
        bookmarkName = inline.name;
        break;
      }
    }

    entries.push({
      text: headingText,
      level: tocLevel,
      paragraphIndex,
      ...(paragraph.styleId ? { styleId: paragraph.styleId } : {}),
      ...(bookmarkName ? { bookmarkName } : {}),
    });
  });

  return { instruction, levelRange, entries, status: "stale" };
}
415
-
416
/**
 * Deterministic refresh helper for REF fields.
 *
 * Looks `fieldTarget` up in the bookmark name map, then walks the document
 * to the paragraph whose index matches the bookmark's `paragraphIndex` and
 * extracts the bookmarked text from it via `flattenBookmarkContent`.
 *
 * @param document Document whose content tree is searched.
 * @param bookmarkNameMap Bookmark name -> bookmark id and paragraph index.
 * @param fieldTarget Bookmark name the REF field points at.
 * @returns `{ text, refreshStatus: "current" }` when the paragraph is found.
 *          When the bookmark name is unknown, or no paragraph has the recorded
 *          index, the result is `{ text: "", refreshStatus: "unresolvable" }`.
 *          The declared `undefined` in the return type is kept for
 *          compatibility with callers, but this implementation never
 *          returns it.
 */
export function resolveRefFieldText(
  document: Pick<CanonicalDocument, "content">,
  bookmarkNameMap: Map<string, { bookmarkId: string; paragraphIndex: number }>,
  fieldTarget: string,
): { text: string; refreshStatus: "current" | "unresolvable" } | undefined {
  const bookmark = bookmarkNameMap.get(fieldTarget);
  if (!bookmark) {
    return { text: "", refreshStatus: "unresolvable" };
  }

  // Locate the paragraph at bookmark.paragraphIndex and extract its text.
  let resolvedText: string | undefined;
  walkFieldDocument(document.content, (node, paragraphIndex) => {
    // Inline nodes are visited with their paragraph's index too; skip them.
    if (node.type !== "paragraph") return;
    if (paragraphIndex === bookmark.paragraphIndex) {
      resolvedText = flattenBookmarkContent(node as ParagraphNode, bookmark.bookmarkId);
    }
  });

  if (resolvedText === undefined) {
    return { text: "", refreshStatus: "unresolvable" };
  }
  return { text: resolvedText, refreshStatus: "current" };
}
450
-
451
/**
 * Produce a copy of a field registry whose supported entries carry a
 * freshly computed refresh status.
 *
 * Status rules, in order:
 * - TOC entries are "current" when the registry has a `tocStructure`,
 *   otherwise "stale" (TOC refresh is driven by the structure, not the entry).
 * - Entries without a `fieldTarget` are "unresolvable".
 * - Remaining entries are "current" when their target is present in
 *   `bookmarkNameMap`, otherwise "unresolvable".
 *
 * Nothing is mutated: each supported entry is shallow-copied, while
 * `preserveOnly` and `tocStructure` are passed through by reference.
 *
 * @param registry Registry to refresh.
 * @param bookmarkNameMap Bookmark name -> bookmark id and paragraph index.
 * @returns A new registry object with updated supported entries.
 */
export function refreshFieldRegistry(
  registry: FieldRegistry,
  bookmarkNameMap: Map<string, { bookmarkId: string; paragraphIndex: number }>,
): FieldRegistry {
  const statusFor = (entry: FieldRegistryEntry): FieldRefreshStatus => {
    if (entry.fieldFamily === "TOC") {
      return registry.tocStructure ? "current" : "stale";
    }
    if (!entry.fieldTarget) {
      return "unresolvable";
    }
    return bookmarkNameMap.get(entry.fieldTarget) ? "current" : "unresolvable";
  };

  const supported: FieldRegistryEntry[] = registry.supported.map((entry) => ({
    ...entry,
    refreshStatus: statusFor(entry),
  }));

  return {
    supported,
    preserveOnly: registry.preserveOnly,
    ...(registry.tocStructure ? { tocStructure: registry.tocStructure } : {}),
  };
}
484
-
485
- // ─── Field registry internal helpers ────────────────────────────────────────
486
-
487
/**
 * Depth-first, pre-order walk over a document node tree that keeps a running
 * paragraph counter.
 *
 * The counter is incremented before a paragraph node is visited, so the first
 * paragraph is reported with index 0. Non-paragraph nodes are visited with
 * the index of the most recent paragraph (or the incoming value if none has
 * been seen yet). After `children`, table rows and table-row cells are
 * descended into as well.
 *
 * @param node Subtree root to walk.
 * @param visit Callback invoked for every node with the current index.
 * @param paragraphIndex Counter value on entry; defaults to -1.
 * @returns The counter value after the whole subtree has been walked.
 */
function walkFieldDocument(
  node: DocumentNode,
  visit: (node: DocumentNode, paragraphIndex: number) => void,
  paragraphIndex = -1,
): number {
  let current = node.type === "paragraph" ? paragraphIndex + 1 : paragraphIndex;
  visit(node, current);

  if ("children" in node && Array.isArray(node.children)) {
    for (const child of node.children) {
      current = walkFieldDocument(child as DocumentNode, visit, current);
    }
  }

  if (node.type === "table") {
    for (const row of node.rows) {
      current = walkFieldDocument(row, visit, current);
    }
  } else if (node.type === "table_row") {
    for (const cell of node.cells) {
      current = walkFieldDocument(cell, visit, current);
    }
  }

  return current;
}
513
-
514
/**
 * Walk every block of the document's sub-parts: headers first, then footers,
 * then (when a footnote collection exists) footnotes followed by endnotes.
 *
 * Each block is walked on its own with `walkFieldDocument`'s default starting
 * counter, so the paragraph index reported to `visit` restarts for every
 * block rather than continuing across blocks or parts.
 *
 * @param subParts Catalog of header, footer and note parts.
 * @param visit Callback forwarded to `walkFieldDocument` for every node.
 */
function walkSubPartFields(
  subParts: SubPartsCatalog,
  visit: (node: DocumentNode, paragraphIndex: number) => void,
): void {
  const walkBlocks = (blocks: readonly DocumentNode[]): void => {
    for (const block of blocks) {
      walkFieldDocument(block, visit);
    }
  };

  for (const header of subParts.headers) {
    walkBlocks(header.blocks);
  }
  for (const footer of subParts.footers) {
    walkBlocks(footer.blocks);
  }

  if (subParts.footnoteCollection) {
    for (const note of Object.values(subParts.footnoteCollection.footnotes)) {
      walkBlocks(note.blocks);
    }
    for (const note of Object.values(subParts.footnoteCollection.endnotes)) {
      walkBlocks(note.blocks);
    }
  }
}
541
-
542
/**
 * Concatenate the plain-text rendering of a list of inline nodes.
 *
 * Text nodes contribute their text, tabs become "\t", hard breaks and column
 * breaks become "\n"; every other node type contributes nothing. Nested
 * containers are not descended into.
 */
function flattenFieldText(children: InlineNode[]): string {
  const pieces: string[] = [];
  for (const child of children) {
    switch (child.type) {
      case "text":
        pieces.push(child.text);
        break;
      case "tab":
        pieces.push("\t");
        break;
      case "hard_break":
      case "column_break":
        pieces.push("\n");
        break;
      default:
        pieces.push("");
        break;
    }
  }
  return pieces.join("");
}
552
-
553
/**
 * Concatenate the plain-text rendering of a paragraph's inline nodes.
 *
 * Same mapping as `flattenFieldText` (text, tab -> "\t", hard/column break
 * -> "\n"), and additionally includes the flattened children of hyperlink
 * and field nodes, one level deep. All other node types contribute nothing.
 */
function flattenParagraphInlineText(children: InlineNode[]): string {
  const pieces: string[] = [];
  for (const child of children) {
    switch (child.type) {
      case "text":
        pieces.push(child.text);
        break;
      case "tab":
        pieces.push("\t");
        break;
      case "hard_break":
      case "column_break":
        pieces.push("\n");
        break;
      case "hyperlink":
      case "field":
        pieces.push(flattenFieldText(child.children));
        break;
      default:
        pieces.push("");
        break;
    }
  }
  return pieces.join("");
}
565
-
566
/**
 * Extract the text covered by a bookmark inside a single paragraph.
 *
 * Collects the inline nodes that sit between the `bookmark_start` and the
 * `bookmark_end` carrying `bookmarkId` (scanning direct children only) and
 * flattens them with `flattenParagraphInlineText`. This keeps the bounded
 * range consistent with the whole-paragraph fallback below: hyperlink text,
 * nested field text and column breaks inside the bookmark are included
 * rather than silently dropped.
 *
 * If the paragraph contains no matching `bookmark_start`, or the matching
 * `bookmark_end` comes first, the whole paragraph's text is returned. If the
 * start marker is present but no end marker follows, everything after the
 * start is used.
 *
 * @param paragraph Paragraph to read from.
 * @param bookmarkId Id shared by the bookmark's start and end markers.
 * @returns The flattened text of the bookmarked range (possibly empty).
 */
function flattenBookmarkContent(
  paragraph: ParagraphNode,
  bookmarkId: string,
): string {
  let inside = false;
  const bookmarked: InlineNode[] = [];

  for (const child of paragraph.children) {
    if (child.type === "bookmark_start" && child.bookmarkId === bookmarkId) {
      inside = true;
      continue;
    }
    if (child.type === "bookmark_end" && child.bookmarkId === bookmarkId) {
      break;
    }
    if (inside) {
      bookmarked.push(child);
    }
  }

  // No start marker in this paragraph: fall back to the full paragraph text.
  if (!inside) {
    return flattenParagraphInlineText(paragraph.children);
  }
  return flattenParagraphInlineText(bookmarked);
}
592
-
593
- // ─── Internal helpers ─────────────────────────────────────────────────────────
594
-
595
/**
 * Collect the complex fields (fldChar begin / separate / end sequences) found
 * among the direct run (`r`) children of a paragraph element.
 *
 * A small state machine drives the scan:
 * - `begin` opens a field and resets all bookkeeping; a `begin` seen while a
 *   field is already open therefore discards the one in progress.
 * - `instrText` runs seen before `separate` accumulate the instruction.
 * - `separate` marks where the field's result content starts.
 * - `end` emits a field if one is open, then returns to idle.
 *
 * For every emitted field, `contentXml` is the slice of `sourceXml` between
 * the end of the `separate` run and the start of the `end` run, or "" when
 * there was no `separate`. `start`/`end` span from the `begin` run to the
 * `end` run.
 *
 * @param paragraph Parsed paragraph element whose runs are scanned.
 * @param sourceXml XML text that the node offsets refer to.
 * @param results Output array; parsed fields are appended in document order.
 */
function extractComplexFieldsFromParagraph(
  paragraph: XmlElementNode,
  sourceXml: string,
  results: ParsedComplexFieldNode[],
): void {
  type FieldState = "idle" | "in-instr" | "in-content";
  let state: FieldState = "idle";
  let instrParts: string[] = [];
  let fieldStart = -1;
  let contentStart = -1;
  let contentEnd = -1;

  for (const run of paragraph.children) {
    if (run.type !== "element" || localName(run.name) !== "r") continue;

    const fldChar = findFirstChildEl(run, "fldChar");
    const instrText = findFirstChildEl(run, "instrText");

    if (!fldChar) {
      // Instruction text only counts between `begin` and `separate`.
      if (instrText && state === "in-instr") {
        for (const piece of instrText.children) {
          if (piece.type === "text") instrParts.push(piece.text);
        }
      }
      continue;
    }

    const rawType =
      fldChar.attributes["w:fldCharType"] ?? fldChar.attributes.fldCharType ?? "";

    switch (rawType.toLowerCase()) {
      case "begin":
        state = "in-instr";
        instrParts = [];
        fieldStart = run.start;
        contentStart = -1;
        contentEnd = -1;
        break;

      case "separate":
        if (state === "in-instr") {
          state = "in-content";
          contentStart = run.end;
        }
        break;

      case "end":
        if (state !== "idle") {
          if (state === "in-content") {
            contentEnd = run.start;
          }
          const hasContent = contentStart >= 0 && contentEnd >= contentStart;
          results.push({
            type: "field",
            fieldType: "complex",
            instruction: instrParts.join("").trim(),
            contentXml: hasContent ? sourceXml.slice(contentStart, contentEnd) : "",
            start: fieldStart,
            end: run.end,
          });
        }
        state = "idle";
        instrParts = [];
        break;

      default:
        break;
    }
  }
}
660
-
661
/**
 * Recursively gather bookmark markers beneath an XML element.
 *
 * `bookmarkStart` and `bookmarkEnd` elements are handed to their respective
 * parsers and appended to `results` when the parser returns a value; they are
 * not descended into. Every other element is searched recursively. Text
 * nodes are ignored.
 *
 * @param node Element whose descendants are searched.
 * @param sourceXml XML text forwarded to the bookmark parsers.
 * @param results Output array; markers are appended in document order.
 */
function collectBookmarks(
  node: XmlElementNode,
  sourceXml: string,
  results: ParsedBookmarkNode[],
): void {
  for (const child of node.children) {
    if (child.type !== "element") continue;

    switch (localName(child.name)) {
      case "bookmarkStart": {
        const parsed = parseBookmarkStart(child, sourceXml);
        if (parsed) results.push(parsed);
        break;
      }
      case "bookmarkEnd": {
        const parsed = parseBookmarkEnd(child, sourceXml);
        if (parsed) results.push(parsed);
        break;
      }
      default:
        collectBookmarks(child, sourceXml, results);
        break;
    }
  }
}
680
-
681
/**
 * Return the first direct child element whose namespace-stripped name equals
 * `childLocalName`, or `undefined` when there is none.
 */
function findFirstChild(node: XmlElementNode, childLocalName: string): XmlElementNode | undefined {
  for (const candidate of node.children) {
    if (candidate.type === "element" && localName(candidate.name) === childLocalName) {
      return candidate;
    }
  }
  return undefined;
}
686
-
687
/**
 * Return the first direct child element whose namespace-stripped name equals
 * `childLocalName`, or `undefined` when there is none.
 *
 * This is an alias of `findFirstChild`, kept under its own name for existing
 * callers; it delegates so the lookup logic lives in one place.
 */
function findFirstChildEl(node: XmlElementNode, childLocalName: string): XmlElementNode | undefined {
  return findFirstChild(node, childLocalName);
}
692
-
693
/**
 * Strip the namespace prefix from a qualified XML name.
 *
 * Everything up to and including the first ":" is removed; a name without a
 * colon is returned unchanged.
 */
function localName(name: string): string {
  const colon = name.indexOf(":");
  if (colon < 0) {
    return name;
  }
  return name.slice(colon + 1);
}
697
-
698
- // ─── Minimal XML parser (same pattern as parse-tables.ts) ────────────────────
699
-
700
/**
 * Minimal, offset-preserving XML parser.
 *
 * Builds a tree of element and text nodes under a synthetic `__root__`
 * element, recording `start`/`end` offsets into `xml` for every node.
 * - Comments and processing instructions are skipped.
 * - CDATA sections become text nodes with their content taken verbatim.
 * - Other character data is entity-decoded and kept when non-empty.
 * - Closing tags are matched against the open element by local name only.
 *
 * @param xml XML source text.
 * @returns The synthetic root element containing the parsed nodes.
 * @throws Error when a tag is never terminated, a closing tag does not match
 *         the open element, or an element is left unclosed.
 */
function parseXml(xml: string): XmlElementNode {
  const root: XmlElementNode = {
    type: "element",
    name: "__root__",
    attributes: {},
    children: [],
    start: 0,
    end: xml.length,
  };
  const openElements: XmlElementNode[] = [root];
  const total = xml.length;

  // Offset just past `terminator`, or end of input when it never appears.
  const skipPast = (terminator: string, from: number): number => {
    const at = xml.indexOf(terminator, from);
    return at >= 0 ? at + terminator.length : total;
  };

  let pos = 0;
  while (pos < total) {
    const parent = openElements[openElements.length - 1];

    if (xml.startsWith("<!--", pos)) {
      pos = skipPast("-->", pos);
      continue;
    }

    if (xml.startsWith("<?", pos)) {
      pos = skipPast("?>", pos);
      continue;
    }

    if (xml.startsWith("<![CDATA[", pos)) {
      const close = xml.indexOf("]]>", pos);
      const after = close >= 0 ? close + 3 : total;
      parent?.children.push({
        type: "text",
        text: xml.slice(pos + 9, close >= 0 ? close : total),
        start: pos,
        end: after,
      });
      pos = after;
      continue;
    }

    if (xml[pos] !== "<") {
      // Character data runs up to the next tag (or end of input).
      const nextTag = xml.indexOf("<", pos);
      const stop = nextTag >= 0 ? nextTag : total;
      const text = decodeXmlEntities(xml.slice(pos, stop));
      if (text.length > 0) {
        parent?.children.push({ type: "text", text, start: pos, end: stop });
      }
      pos = stop;
      continue;
    }

    if (xml[pos + 1] === "/") {
      const gt = xml.indexOf(">", pos);
      if (gt < 0) throw new Error("Malformed XML: missing >.");
      const name = xml.slice(pos + 2, gt).trim();
      const closed = openElements.pop();
      if (!closed || localName(closed.name) !== localName(name)) {
        throw new Error(`Malformed XML: unexpected closing tag </${name}>.`);
      }
      // Extend the element's span to cover its closing tag.
      closed.end = gt + 1;
      pos = gt + 1;
      continue;
    }

    // Opening or self-closing tag.
    const tagEnd = findTagEnd(xml, pos);
    const rawBody = xml.slice(pos + 1, tagEnd);
    const selfClosing = /\/\s*$/.test(rawBody);
    const { name, attributes } = parseTag(rawBody.replace(/\/\s*$/, "").trim());
    const element: XmlElementNode = {
      type: "element",
      name,
      attributes,
      children: [],
      start: pos,
      end: tagEnd + 1,
    };
    parent?.children.push(element);
    if (!selfClosing) {
      openElements.push(element);
    }
    pos = tagEnd + 1;
  }

  if (openElements.length !== 1) throw new Error("Malformed XML: unclosed element.");
  return root;
}
777
-
778
/**
 * Split the inside of a start tag (without the angle brackets and any
 * trailing "/") into its element name and attribute map.
 *
 * The name is the first whitespace-delimited token. Attributes are read as
 * `key="value"` or `key='value'` pairs with optional whitespace around "=";
 * values are entity-decoded. A key with no "=" is stored with an empty
 * string value. An unterminated quoted value runs to the end of the tag body.
 *
 * @param tagBody Tag text between "<" and ">".
 * @returns The tag name and its decoded attributes.
 * @throws Error when an attribute value is not quoted.
 */
function parseTag(tagBody: string): { name: string; attributes: Record<string, string> } {
  const length = tagBody.length;
  let pos = 0;

  const skipWhitespace = (): void => {
    while (pos < length && /\s/.test(tagBody[pos] ?? "")) pos += 1;
  };
  // Consume characters until `stop` matches; returns the consumed token.
  const readUntil = (stop: RegExp): string => {
    const from = pos;
    while (pos < length && !stop.test(tagBody[pos] ?? "")) pos += 1;
    return tagBody.slice(from, pos);
  };

  skipWhitespace();
  const name = readUntil(/\s/);
  const attributes: Record<string, string> = {};

  while (pos < length) {
    skipWhitespace();
    if (pos >= length) break;

    const key = readUntil(/[\s=]/);
    skipWhitespace();
    if (tagBody[pos] !== "=") {
      // Bare attribute without a value.
      attributes[key] = "";
      continue;
    }
    pos += 1;
    skipWhitespace();

    const quote = tagBody[pos];
    if (quote !== `"` && quote !== `'`) throw new Error(`Malformed XML attribute ${key}.`);
    pos += 1;

    const closing = tagBody.indexOf(quote, pos);
    const valueEnd = closing >= 0 ? closing : length;
    attributes[key] = decodeXmlEntities(tagBody.slice(pos, valueEnd));
    pos = valueEnd + 1;
  }

  return { name, attributes };
}
806
-
807
/**
 * Find the offset of the ">" that terminates the tag opening at `start`.
 *
 * Scanning begins one character after `start`. A ">" inside a single- or
 * double-quoted attribute value is ignored.
 *
 * @param xml XML source text.
 * @param start Offset of the tag's opening "<".
 * @returns Offset of the terminating ">".
 * @throws Error when the input ends before an unquoted ">" is found.
 */
function findTagEnd(xml: string, start: number): number {
  let openQuote: string | null = null;
  for (let pos = start + 1; pos < xml.length; pos += 1) {
    const ch = xml[pos];
    if (openQuote !== null) {
      if (ch === openQuote) openQuote = null;
    } else if (ch === `"` || ch === `'`) {
      openQuote = ch;
    } else if (ch === ">") {
      return pos;
    }
  }
  throw new Error("Malformed XML: missing >.");
}
819
-
820
/**
 * Replace the five predefined XML entities (`&amp;`, `&lt;`, `&gt;`,
 * `&quot;`, `&apos;`) and numeric character references (decimal `&#N;`,
 * hexadecimal `&#xN;`) with the characters they denote.
 *
 * Entity names outside that set are not matched by the pattern and are left
 * untouched. A numeric reference whose value is not a valid Unicode code
 * point (above U+10FFFF) is also left verbatim instead of letting
 * `String.fromCodePoint` throw a RangeError on malformed input.
 *
 * @param value Raw XML text or attribute value.
 * @returns The text with recognised references decoded.
 */
function decodeXmlEntities(value: string): string {
  return value.replace(
    /&(#x[0-9a-fA-F]+|#\d+|amp|lt|gt|quot|apos);/g,
    (match: string, entity: string): string => {
      switch (entity) {
        case "amp":
          return "&";
        case "lt":
          return "<";
        case "gt":
          return ">";
        case "quot":
          return `"`;
        case "apos":
          return `'`;
        default: {
          // Only numeric references reach here: "#x<hex>" or "#<decimal>".
          const isHex = entity.startsWith("#x");
          const codePoint = Number.parseInt(entity.slice(isHex ? 2 : 1), isHex ? 16 : 10);
          const isValid =
            Number.isInteger(codePoint) && codePoint >= 0 && codePoint <= 0x10ffff;
          return isValid ? String.fromCodePoint(codePoint) : match;
        }
      }
    },
  );
}