@intlayer/cli 8.4.3 → 8.4.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (301) hide show
  1. package/dist/cjs/IntlayerEventListener.cjs +186 -1
  2. package/dist/cjs/IntlayerEventListener.cjs.map +1 -1
  3. package/dist/cjs/_virtual/_rolldown/runtime.cjs +29 -0
  4. package/dist/cjs/_virtual/_utils_asset.cjs +98 -0
  5. package/dist/cjs/auth/login.cjs +90 -2
  6. package/dist/cjs/auth/login.cjs.map +1 -1
  7. package/dist/cjs/build.cjs +30 -1
  8. package/dist/cjs/build.cjs.map +1 -1
  9. package/dist/cjs/ci.cjs +76 -1
  10. package/dist/cjs/ci.cjs.map +1 -1
  11. package/dist/cjs/cli.cjs +485 -1
  12. package/dist/cjs/cli.cjs.map +1 -1
  13. package/dist/cjs/config.cjs +15 -1
  14. package/dist/cjs/config.cjs.map +1 -1
  15. package/dist/cjs/editor.cjs +50 -1
  16. package/dist/cjs/editor.cjs.map +1 -1
  17. package/dist/cjs/extract.cjs +108 -1
  18. package/dist/cjs/extract.cjs.map +1 -1
  19. package/dist/cjs/fill/deepMergeContent.cjs +27 -1
  20. package/dist/cjs/fill/deepMergeContent.cjs.map +1 -1
  21. package/dist/cjs/fill/fill.cjs +84 -1
  22. package/dist/cjs/fill/fill.cjs.map +1 -1
  23. package/dist/cjs/fill/formatAutoFilledFilePath.cjs +32 -1
  24. package/dist/cjs/fill/formatAutoFilledFilePath.cjs.map +1 -1
  25. package/dist/cjs/fill/formatFillData.cjs +87 -1
  26. package/dist/cjs/fill/formatFillData.cjs.map +1 -1
  27. package/dist/cjs/fill/getAvailableLocalesInDictionary.cjs +26 -1
  28. package/dist/cjs/fill/getAvailableLocalesInDictionary.cjs.map +1 -1
  29. package/dist/cjs/fill/getFilterMissingContentPerLocale.cjs +51 -1
  30. package/dist/cjs/fill/getFilterMissingContentPerLocale.cjs.map +1 -1
  31. package/dist/cjs/fill/index.cjs +6 -1
  32. package/dist/cjs/fill/listTranslationsTasks.cjs +72 -1
  33. package/dist/cjs/fill/listTranslationsTasks.cjs.map +1 -1
  34. package/dist/cjs/fill/translateDictionary.cjs +240 -1
  35. package/dist/cjs/fill/translateDictionary.cjs.map +1 -1
  36. package/dist/cjs/fill/writeFill.cjs +55 -1
  37. package/dist/cjs/fill/writeFill.cjs.map +1 -1
  38. package/dist/cjs/getTargetDictionary.cjs +36 -1
  39. package/dist/cjs/getTargetDictionary.cjs.map +1 -1
  40. package/dist/cjs/index.cjs +44 -1
  41. package/dist/cjs/init.cjs +22 -1
  42. package/dist/cjs/init.cjs.map +1 -1
  43. package/dist/cjs/initMCP.cjs +69 -1
  44. package/dist/cjs/initMCP.cjs.map +1 -1
  45. package/dist/cjs/initSkills.cjs +93 -1
  46. package/dist/cjs/initSkills.cjs.map +1 -1
  47. package/dist/cjs/listContentDeclaration.cjs +42 -1
  48. package/dist/cjs/listContentDeclaration.cjs.map +1 -1
  49. package/dist/cjs/listProjects.cjs +28 -1
  50. package/dist/cjs/listProjects.cjs.map +1 -1
  51. package/dist/cjs/liveSync.cjs +153 -8
  52. package/dist/cjs/liveSync.cjs.map +1 -1
  53. package/dist/cjs/pull.cjs +153 -1
  54. package/dist/cjs/pull.cjs.map +1 -1
  55. package/dist/cjs/push/pullLog.cjs +105 -3
  56. package/dist/cjs/push/pullLog.cjs.map +1 -1
  57. package/dist/cjs/push/push.cjs +212 -1
  58. package/dist/cjs/push/push.cjs.map +1 -1
  59. package/dist/cjs/pushConfig.cjs +22 -1
  60. package/dist/cjs/pushConfig.cjs.map +1 -1
  61. package/dist/cjs/pushLog.cjs +86 -3
  62. package/dist/cjs/pushLog.cjs.map +1 -1
  63. package/dist/cjs/reviewDoc/reviewDoc.cjs +73 -1
  64. package/dist/cjs/reviewDoc/reviewDoc.cjs.map +1 -1
  65. package/dist/cjs/reviewDoc/reviewDocBlockAware.cjs +98 -1
  66. package/dist/cjs/reviewDoc/reviewDocBlockAware.cjs.map +1 -1
  67. package/dist/cjs/searchDoc.cjs +41 -1
  68. package/dist/cjs/searchDoc.cjs.map +1 -1
  69. package/dist/cjs/test/index.cjs +7 -1
  70. package/dist/cjs/test/listMissingTranslations.cjs +52 -1
  71. package/dist/cjs/test/listMissingTranslations.cjs.map +1 -1
  72. package/dist/cjs/test/test.cjs +56 -1
  73. package/dist/cjs/test/test.cjs.map +1 -1
  74. package/dist/cjs/translateDoc/index.cjs +9 -1
  75. package/dist/cjs/translateDoc/translateDoc.cjs +79 -1
  76. package/dist/cjs/translateDoc/translateDoc.cjs.map +1 -1
  77. package/dist/cjs/translateDoc/translateFile.cjs +106 -2
  78. package/dist/cjs/translateDoc/translateFile.cjs.map +1 -1
  79. package/dist/cjs/translateDoc/validation.cjs +49 -5
  80. package/dist/cjs/translateDoc/validation.cjs.map +1 -1
  81. package/dist/cjs/translation-alignment/alignBlocks.cjs +67 -1
  82. package/dist/cjs/translation-alignment/alignBlocks.cjs.map +1 -1
  83. package/dist/cjs/translation-alignment/computeSimilarity.cjs +25 -1
  84. package/dist/cjs/translation-alignment/computeSimilarity.cjs.map +1 -1
  85. package/dist/cjs/translation-alignment/fingerprintBlock.cjs +23 -1
  86. package/dist/cjs/translation-alignment/fingerprintBlock.cjs.map +1 -1
  87. package/dist/cjs/translation-alignment/index.cjs +22 -1
  88. package/dist/cjs/translation-alignment/mapChangedLinesToBlocks.cjs +18 -1
  89. package/dist/cjs/translation-alignment/mapChangedLinesToBlocks.cjs.map +1 -1
  90. package/dist/cjs/translation-alignment/normalizeBlock.cjs +22 -1
  91. package/dist/cjs/translation-alignment/normalizeBlock.cjs.map +1 -1
  92. package/dist/cjs/translation-alignment/pipeline.cjs +37 -1
  93. package/dist/cjs/translation-alignment/pipeline.cjs.map +1 -1
  94. package/dist/cjs/translation-alignment/planActions.cjs +46 -1
  95. package/dist/cjs/translation-alignment/planActions.cjs.map +1 -1
  96. package/dist/cjs/translation-alignment/rebuildDocument.cjs +49 -2
  97. package/dist/cjs/translation-alignment/rebuildDocument.cjs.map +1 -1
  98. package/dist/cjs/translation-alignment/segmentDocument.cjs +66 -5
  99. package/dist/cjs/translation-alignment/segmentDocument.cjs.map +1 -1
  100. package/dist/cjs/utils/calculateChunks.cjs +89 -2
  101. package/dist/cjs/utils/calculateChunks.cjs.map +1 -1
  102. package/dist/cjs/utils/checkAccess.cjs +83 -1
  103. package/dist/cjs/utils/checkAccess.cjs.map +1 -1
  104. package/dist/cjs/utils/checkConfigConsistency.cjs +16 -1
  105. package/dist/cjs/utils/checkConfigConsistency.cjs.map +1 -1
  106. package/dist/cjs/utils/checkFileModifiedRange.cjs +81 -1
  107. package/dist/cjs/utils/checkFileModifiedRange.cjs.map +1 -1
  108. package/dist/cjs/utils/checkLastUpdateTime.cjs +19 -1
  109. package/dist/cjs/utils/checkLastUpdateTime.cjs.map +1 -1
  110. package/dist/cjs/utils/chunkInference.cjs +45 -1
  111. package/dist/cjs/utils/chunkInference.cjs.map +1 -1
  112. package/dist/cjs/utils/fixChunkStartEndChars.cjs +27 -3
  113. package/dist/cjs/utils/fixChunkStartEndChars.cjs.map +1 -1
  114. package/dist/cjs/utils/formatTimeDiff.cjs +20 -1
  115. package/dist/cjs/utils/formatTimeDiff.cjs.map +1 -1
  116. package/dist/cjs/utils/getIsFileUpdatedRecently.cjs +16 -1
  117. package/dist/cjs/utils/getIsFileUpdatedRecently.cjs.map +1 -1
  118. package/dist/cjs/utils/getOutputFilePath.cjs +74 -1
  119. package/dist/cjs/utils/getOutputFilePath.cjs.map +1 -1
  120. package/dist/cjs/utils/getParentPackageJSON.cjs +20 -1
  121. package/dist/cjs/utils/getParentPackageJSON.cjs.map +1 -1
  122. package/dist/cjs/utils/listSpecialChars.cjs +54 -2
  123. package/dist/cjs/utils/listSpecialChars.cjs.map +1 -1
  124. package/dist/cjs/utils/mapChunksBetweenFiles.cjs +102 -1
  125. package/dist/cjs/utils/mapChunksBetweenFiles.cjs.map +1 -1
  126. package/dist/cjs/utils/openBrowser.cjs +19 -1
  127. package/dist/cjs/utils/openBrowser.cjs.map +1 -1
  128. package/dist/cjs/utils/reorderParagraphs.cjs +91 -3
  129. package/dist/cjs/utils/reorderParagraphs.cjs.map +1 -1
  130. package/dist/cjs/utils/setupAI.cjs +66 -1
  131. package/dist/cjs/utils/setupAI.cjs.map +1 -1
  132. package/dist/cjs/watch.cjs +47 -1
  133. package/dist/cjs/watch.cjs.map +1 -1
  134. package/dist/esm/IntlayerEventListener.mjs +183 -1
  135. package/dist/esm/IntlayerEventListener.mjs.map +1 -1
  136. package/dist/esm/_virtual/_rolldown/runtime.mjs +8 -0
  137. package/dist/esm/_virtual/_utils_asset.mjs +97 -0
  138. package/dist/esm/auth/login.mjs +86 -2
  139. package/dist/esm/auth/login.mjs.map +1 -1
  140. package/dist/esm/build.mjs +28 -1
  141. package/dist/esm/build.mjs.map +1 -1
  142. package/dist/esm/ci.mjs +74 -1
  143. package/dist/esm/ci.mjs.map +1 -1
  144. package/dist/esm/cli.mjs +482 -1
  145. package/dist/esm/cli.mjs.map +1 -1
  146. package/dist/esm/config.mjs +13 -1
  147. package/dist/esm/config.mjs.map +1 -1
  148. package/dist/esm/editor.mjs +50 -1
  149. package/dist/esm/editor.mjs.map +1 -0
  150. package/dist/esm/extract.mjs +104 -1
  151. package/dist/esm/extract.mjs.map +1 -1
  152. package/dist/esm/fill/deepMergeContent.mjs +25 -1
  153. package/dist/esm/fill/deepMergeContent.mjs.map +1 -1
  154. package/dist/esm/fill/fill.mjs +81 -1
  155. package/dist/esm/fill/fill.mjs.map +1 -1
  156. package/dist/esm/fill/formatAutoFilledFilePath.mjs +30 -1
  157. package/dist/esm/fill/formatAutoFilledFilePath.mjs.map +1 -1
  158. package/dist/esm/fill/formatFillData.mjs +85 -1
  159. package/dist/esm/fill/formatFillData.mjs.map +1 -1
  160. package/dist/esm/fill/getAvailableLocalesInDictionary.mjs +24 -1
  161. package/dist/esm/fill/getAvailableLocalesInDictionary.mjs.map +1 -1
  162. package/dist/esm/fill/getFilterMissingContentPerLocale.mjs +49 -1
  163. package/dist/esm/fill/getFilterMissingContentPerLocale.mjs.map +1 -1
  164. package/dist/esm/fill/index.mjs +4 -1
  165. package/dist/esm/fill/listTranslationsTasks.mjs +69 -1
  166. package/dist/esm/fill/listTranslationsTasks.mjs.map +1 -1
  167. package/dist/esm/fill/translateDictionary.mjs +237 -1
  168. package/dist/esm/fill/translateDictionary.mjs.map +1 -1
  169. package/dist/esm/fill/writeFill.mjs +53 -1
  170. package/dist/esm/fill/writeFill.mjs.map +1 -1
  171. package/dist/esm/getTargetDictionary.mjs +33 -1
  172. package/dist/esm/getTargetDictionary.mjs.map +1 -1
  173. package/dist/esm/index.mjs +20 -1
  174. package/dist/esm/init.mjs +19 -1
  175. package/dist/esm/init.mjs.map +1 -1
  176. package/dist/esm/initMCP.mjs +65 -1
  177. package/dist/esm/initMCP.mjs.map +1 -1
  178. package/dist/esm/initSkills.mjs +87 -1
  179. package/dist/esm/initSkills.mjs.map +1 -1
  180. package/dist/esm/listContentDeclaration.mjs +39 -1
  181. package/dist/esm/listContentDeclaration.mjs.map +1 -1
  182. package/dist/esm/listProjects.mjs +26 -1
  183. package/dist/esm/listProjects.mjs.map +1 -1
  184. package/dist/esm/liveSync.mjs +150 -8
  185. package/dist/esm/liveSync.mjs.map +1 -1
  186. package/dist/esm/pull.mjs +150 -1
  187. package/dist/esm/pull.mjs.map +1 -1
  188. package/dist/esm/push/pullLog.mjs +102 -3
  189. package/dist/esm/push/pullLog.mjs.map +1 -1
  190. package/dist/esm/push/push.mjs +208 -1
  191. package/dist/esm/push/push.mjs.map +1 -1
  192. package/dist/esm/pushConfig.mjs +20 -1
  193. package/dist/esm/pushConfig.mjs.map +1 -1
  194. package/dist/esm/pushLog.mjs +83 -3
  195. package/dist/esm/pushLog.mjs.map +1 -1
  196. package/dist/esm/reviewDoc/reviewDoc.mjs +69 -1
  197. package/dist/esm/reviewDoc/reviewDoc.mjs.map +1 -1
  198. package/dist/esm/reviewDoc/reviewDocBlockAware.mjs +95 -1
  199. package/dist/esm/reviewDoc/reviewDocBlockAware.mjs.map +1 -1
  200. package/dist/esm/searchDoc.mjs +39 -1
  201. package/dist/esm/searchDoc.mjs.map +1 -1
  202. package/dist/esm/test/index.mjs +4 -1
  203. package/dist/esm/test/listMissingTranslations.mjs +49 -1
  204. package/dist/esm/test/listMissingTranslations.mjs.map +1 -1
  205. package/dist/esm/test/test.mjs +53 -1
  206. package/dist/esm/test/test.mjs.map +1 -1
  207. package/dist/esm/translateDoc/index.mjs +5 -1
  208. package/dist/esm/translateDoc/translateDoc.mjs +75 -1
  209. package/dist/esm/translateDoc/translateDoc.mjs.map +1 -1
  210. package/dist/esm/translateDoc/translateFile.mjs +103 -2
  211. package/dist/esm/translateDoc/translateFile.mjs.map +1 -1
  212. package/dist/esm/translateDoc/validation.mjs +46 -5
  213. package/dist/esm/translateDoc/validation.mjs.map +1 -1
  214. package/dist/esm/translation-alignment/alignBlocks.mjs +66 -1
  215. package/dist/esm/translation-alignment/alignBlocks.mjs.map +1 -1
  216. package/dist/esm/translation-alignment/computeSimilarity.mjs +22 -1
  217. package/dist/esm/translation-alignment/computeSimilarity.mjs.map +1 -1
  218. package/dist/esm/translation-alignment/fingerprintBlock.mjs +20 -1
  219. package/dist/esm/translation-alignment/fingerprintBlock.mjs.map +1 -1
  220. package/dist/esm/translation-alignment/index.mjs +11 -1
  221. package/dist/esm/translation-alignment/mapChangedLinesToBlocks.mjs +16 -1
  222. package/dist/esm/translation-alignment/mapChangedLinesToBlocks.mjs.map +1 -1
  223. package/dist/esm/translation-alignment/normalizeBlock.mjs +20 -1
  224. package/dist/esm/translation-alignment/normalizeBlock.mjs.map +1 -1
  225. package/dist/esm/translation-alignment/pipeline.mjs +35 -1
  226. package/dist/esm/translation-alignment/pipeline.mjs.map +1 -1
  227. package/dist/esm/translation-alignment/planActions.mjs +44 -1
  228. package/dist/esm/translation-alignment/planActions.mjs.map +1 -1
  229. package/dist/esm/translation-alignment/rebuildDocument.mjs +46 -2
  230. package/dist/esm/translation-alignment/rebuildDocument.mjs.map +1 -1
  231. package/dist/esm/translation-alignment/segmentDocument.mjs +64 -5
  232. package/dist/esm/translation-alignment/segmentDocument.mjs.map +1 -1
  233. package/dist/esm/utils/calculateChunks.mjs +87 -2
  234. package/dist/esm/utils/calculateChunks.mjs.map +1 -1
  235. package/dist/esm/utils/checkAccess.mjs +79 -1
  236. package/dist/esm/utils/checkAccess.mjs.map +1 -1
  237. package/dist/esm/utils/checkConfigConsistency.mjs +14 -1
  238. package/dist/esm/utils/checkConfigConsistency.mjs.map +1 -1
  239. package/dist/esm/utils/checkFileModifiedRange.mjs +80 -1
  240. package/dist/esm/utils/checkFileModifiedRange.mjs.map +1 -1
  241. package/dist/esm/utils/checkLastUpdateTime.mjs +17 -1
  242. package/dist/esm/utils/checkLastUpdateTime.mjs.map +1 -1
  243. package/dist/esm/utils/chunkInference.mjs +43 -1
  244. package/dist/esm/utils/chunkInference.mjs.map +1 -1
  245. package/dist/esm/utils/fixChunkStartEndChars.mjs +25 -3
  246. package/dist/esm/utils/fixChunkStartEndChars.mjs.map +1 -1
  247. package/dist/esm/utils/formatTimeDiff.mjs +18 -1
  248. package/dist/esm/utils/formatTimeDiff.mjs.map +1 -1
  249. package/dist/esm/utils/getIsFileUpdatedRecently.mjs +14 -1
  250. package/dist/esm/utils/getIsFileUpdatedRecently.mjs.map +1 -1
  251. package/dist/esm/utils/getOutputFilePath.mjs +72 -1
  252. package/dist/esm/utils/getOutputFilePath.mjs.map +1 -1
  253. package/dist/esm/utils/getParentPackageJSON.mjs +18 -1
  254. package/dist/esm/utils/getParentPackageJSON.mjs.map +1 -1
  255. package/dist/esm/utils/listSpecialChars.mjs +52 -2
  256. package/dist/esm/utils/listSpecialChars.mjs.map +1 -1
  257. package/dist/esm/utils/mapChunksBetweenFiles.mjs +100 -1
  258. package/dist/esm/utils/mapChunksBetweenFiles.mjs.map +1 -1
  259. package/dist/esm/utils/openBrowser.mjs +17 -1
  260. package/dist/esm/utils/openBrowser.mjs.map +1 -1
  261. package/dist/esm/utils/reorderParagraphs.mjs +90 -3
  262. package/dist/esm/utils/reorderParagraphs.mjs.map +1 -1
  263. package/dist/esm/utils/setupAI.mjs +63 -1
  264. package/dist/esm/utils/setupAI.mjs.map +1 -1
  265. package/dist/esm/watch.mjs +45 -1
  266. package/dist/esm/watch.mjs.map +1 -1
  267. package/dist/types/fill/fill.d.ts +1 -1
  268. package/dist/types/fill/translateDictionary.d.ts +1 -1
  269. package/dist/types/getTargetDictionary.d.ts +19 -2
  270. package/dist/types/getTargetDictionary.d.ts.map +1 -0
  271. package/dist/types/index.d.ts +2 -2
  272. package/dist/types/reviewDoc/reviewDocBlockAware.d.ts +1 -1
  273. package/dist/types/test/index.d.ts +2 -2
  274. package/dist/types/test/listMissingTranslations.d.ts +28 -2
  275. package/dist/types/test/listMissingTranslations.d.ts.map +1 -0
  276. package/dist/types/test/test.d.ts +11 -2
  277. package/dist/types/test/test.d.ts.map +1 -0
  278. package/dist/types/translateDoc/index.d.ts +1 -1
  279. package/dist/types/translateDoc/translateDoc.d.ts +1 -1
  280. package/dist/types/translateDoc/translateFile.d.ts +1 -1
  281. package/dist/types/translateDoc/types.d.ts +48 -2
  282. package/dist/types/translateDoc/types.d.ts.map +1 -0
  283. package/dist/types/utils/chunkInference.d.ts +1 -1
  284. package/dist/types/utils/setupAI.d.ts +21 -2
  285. package/dist/types/utils/setupAI.d.ts.map +1 -0
  286. package/package.json +12 -12
  287. package/dist/cjs/_utils_asset-ghp_Cjwk.cjs +0 -2
  288. package/dist/cjs/chunk-Bmb41Sf3.cjs +0 -1
  289. package/dist/esm/_utils_asset-B187VPMw.mjs +0 -2
  290. package/dist/esm/editor-D8BGlLzF.mjs +0 -2
  291. package/dist/esm/editor-D8BGlLzF.mjs.map +0 -1
  292. package/dist/types/getTargetDictionary-RBSRtaQj.d.ts +0 -19
  293. package/dist/types/getTargetDictionary-RBSRtaQj.d.ts.map +0 -1
  294. package/dist/types/listMissingTranslations-DxKw7nqI.d.ts +0 -28
  295. package/dist/types/listMissingTranslations-DxKw7nqI.d.ts.map +0 -1
  296. package/dist/types/setupAI-Bosjx7ah.d.ts +0 -21
  297. package/dist/types/setupAI-Bosjx7ah.d.ts.map +0 -1
  298. package/dist/types/test-DUTiJR5_.d.ts +0 -11
  299. package/dist/types/test-DUTiJR5_.d.ts.map +0 -1
  300. package/dist/types/types-BKvc3FmV.d.ts +0 -48
  301. package/dist/types/types-BKvc3FmV.d.ts.map +0 -1
@@ -1,2 +1,67 @@
1
- import{computeJaccardSimilarity as e}from"./computeSimilarity.mjs";const t=(t,n)=>{let r=t.length,i=n.length,a=Array.from({length:r+1},()=>Array.from({length:i+1},()=>0)),o=Array.from({length:r+1},()=>Array.from({length:i+1},()=>`diagonal`)),s=(r,i)=>{let a=t[r],o=n[i],s=a.type===o.type?2:0,c=e(a.anchorText,o.anchorText,3);return s+(Math.min(a.content.length,o.content.length)/Math.max(a.content.length,o.content.length)>.75?1:0)+c*8};for(let e=1;e<=r;e+=1)a[e][0]=a[e-1][0]+-2,o[e][0]=`up`;for(let e=1;e<=i;e+=1)a[0][e]=a[0][e-1]+-2,o[0][e]=`left`;for(let e=1;e<=r;e+=1)for(let t=1;t<=i;t+=1){let n=a[e-1][t-1]+s(e-1,t-1),r=a[e-1][t]+-2,i=a[e][t-1]+-2,c=Math.max(n,r,i);a[e][t]=c,o[e][t]=c===n?`diagonal`:c===r?`up`:`left`}let c=[],l=r,u=i;for(;l>0||u>0;)if(l>0&&u>0&&o[l][u]===`diagonal`){let r=l-1,i=u-1,a=e(t[r].anchorText,n[i].anchorText,3);c.unshift({englishIndex:r,frenchIndex:i,similarityScore:a}),--l,--u}else l>0&&(u===0||o[l][u]===`up`)?(c.unshift({englishIndex:l-1,frenchIndex:null,similarityScore:0}),--l):u>0&&(l===0||o[l][u]===`left`)&&(c.unshift({englishIndex:-1,frenchIndex:u-1,similarityScore:0}),--u);return c};export{t as alignEnglishAndFrenchBlocks};
1
+ import { computeJaccardSimilarity } from "./computeSimilarity.mjs";
2
+
3
+ //#region src/translation-alignment/alignBlocks.ts
4
+ const alignEnglishAndFrenchBlocks = (defaultBlocks, secondaryBlocks) => {
5
+ const defaultLength = defaultBlocks.length;
6
+ const secondaryLength = secondaryBlocks.length;
7
+ const scoreMatrix = Array.from({ length: defaultLength + 1 }, () => Array.from({ length: secondaryLength + 1 }, () => 0));
8
+ const traceMatrix = Array.from({ length: defaultLength + 1 }, () => Array.from({ length: secondaryLength + 1 }, () => "diagonal"));
9
+ const gapPenalty = -2;
10
+ const computeMatchScore = (defaultIndex, secondaryIndex) => {
11
+ const defaultBlock = defaultBlocks[defaultIndex];
12
+ const secondaryBlock = secondaryBlocks[secondaryIndex];
13
+ const typeBonus = defaultBlock.type === secondaryBlock.type ? 2 : 0;
14
+ const anchorSimilarity = computeJaccardSimilarity(defaultBlock.anchorText, secondaryBlock.anchorText, 3);
15
+ return typeBonus + (Math.min(defaultBlock.content.length, secondaryBlock.content.length) / Math.max(defaultBlock.content.length, secondaryBlock.content.length) > .75 ? 1 : 0) + anchorSimilarity * 8;
16
+ };
17
+ for (let i = 1; i <= defaultLength; i += 1) {
18
+ scoreMatrix[i][0] = scoreMatrix[i - 1][0] + gapPenalty;
19
+ traceMatrix[i][0] = "up";
20
+ }
21
+ for (let j = 1; j <= secondaryLength; j += 1) {
22
+ scoreMatrix[0][j] = scoreMatrix[0][j - 1] + gapPenalty;
23
+ traceMatrix[0][j] = "left";
24
+ }
25
+ for (let i = 1; i <= defaultLength; i += 1) for (let j = 1; j <= secondaryLength; j += 1) {
26
+ const match = scoreMatrix[i - 1][j - 1] + computeMatchScore(i - 1, j - 1);
27
+ const deleteGap = scoreMatrix[i - 1][j] + gapPenalty;
28
+ const insertGap = scoreMatrix[i][j - 1] + gapPenalty;
29
+ const best = Math.max(match, deleteGap, insertGap);
30
+ scoreMatrix[i][j] = best;
31
+ traceMatrix[i][j] = best === match ? "diagonal" : best === deleteGap ? "up" : "left";
32
+ }
33
+ const result = [];
34
+ let i = defaultLength;
35
+ let j = secondaryLength;
36
+ while (i > 0 || j > 0) if (i > 0 && j > 0 && traceMatrix[i][j] === "diagonal") {
37
+ const englishIndex = i - 1;
38
+ const frenchIndex = j - 1;
39
+ const similarityScore = computeJaccardSimilarity(defaultBlocks[englishIndex].anchorText, secondaryBlocks[frenchIndex].anchorText, 3);
40
+ result.unshift({
41
+ englishIndex,
42
+ frenchIndex,
43
+ similarityScore
44
+ });
45
+ i -= 1;
46
+ j -= 1;
47
+ } else if (i > 0 && (j === 0 || traceMatrix[i][j] === "up")) {
48
+ result.unshift({
49
+ englishIndex: i - 1,
50
+ frenchIndex: null,
51
+ similarityScore: 0
52
+ });
53
+ i -= 1;
54
+ } else if (j > 0 && (i === 0 || traceMatrix[i][j] === "left")) {
55
+ result.unshift({
56
+ englishIndex: -1,
57
+ frenchIndex: j - 1,
58
+ similarityScore: 0
59
+ });
60
+ j -= 1;
61
+ }
62
+ return result;
63
+ };
64
+
65
+ //#endregion
66
+ export { alignEnglishAndFrenchBlocks };
2
67
  //# sourceMappingURL=alignBlocks.mjs.map
@@ -1 +1 @@
1
- {"version":3,"file":"alignBlocks.mjs","names":[],"sources":["../../../src/translation-alignment/alignBlocks.ts"],"sourcesContent":["import { computeJaccardSimilarity } from './computeSimilarity';\nimport type { AlignmentPair, FingerprintedBlock } from './types';\n\nexport const alignEnglishAndFrenchBlocks = (\n defaultBlocks: FingerprintedBlock[],\n secondaryBlocks: FingerprintedBlock[]\n): AlignmentPair[] => {\n // Needleman–Wunsch style global alignment using anchor similarity and type equality\n const defaultLength = defaultBlocks.length;\n const secondaryLength = secondaryBlocks.length;\n\n const scoreMatrix: number[][] = Array.from(\n { length: defaultLength + 1 },\n () => Array.from({ length: secondaryLength + 1 }, () => 0)\n );\n const traceMatrix: ('diagonal' | 'up' | 'left')[][] = Array.from(\n { length: defaultLength + 1 },\n () => Array.from({ length: secondaryLength + 1 }, () => 'diagonal')\n );\n\n const gapPenalty = -2;\n\n const computeMatchScore = (\n defaultIndex: number,\n secondaryIndex: number\n ): number => {\n const defaultBlock = defaultBlocks[defaultIndex];\n const secondaryBlock = secondaryBlocks[secondaryIndex];\n const typeBonus = defaultBlock.type === secondaryBlock.type ? 2 : 0;\n const anchorSimilarity = computeJaccardSimilarity(\n defaultBlock.anchorText,\n secondaryBlock.anchorText,\n 3\n );\n const lengthRatio =\n Math.min(defaultBlock.content.length, secondaryBlock.content.length) /\n Math.max(defaultBlock.content.length, secondaryBlock.content.length);\n const lengthBonus = lengthRatio > 0.75 ? 1 : 0;\n return typeBonus + lengthBonus + anchorSimilarity * 8; // weighted toward anchor similarity\n };\n\n // initialize first row and column\n for (let i = 1; i <= defaultLength; i += 1) {\n scoreMatrix[i][0] = scoreMatrix[i - 1][0] + gapPenalty;\n traceMatrix[i][0] = 'up';\n }\n for (let j = 1; j <= secondaryLength; j += 1) {\n scoreMatrix[0][j] = scoreMatrix[0][j - 1] + gapPenalty;\n traceMatrix[0][j] = 'left';\n }\n\n // fill\n for (let i = 1; i <= defaultLength; i += 1) {\n for (let j = 1; j <= secondaryLength; j += 1) {\n const match = scoreMatrix[i - 1][j - 1] + computeMatchScore(i - 1, j - 1);\n const deleteGap = scoreMatrix[i - 1][j] + gapPenalty;\n const insertGap = scoreMatrix[i][j - 1] + gapPenalty;\n\n const best = Math.max(match, deleteGap, insertGap);\n scoreMatrix[i][j] = best;\n traceMatrix[i][j] =\n best === match ? 'diagonal' : best === deleteGap ? 'up' : 'left';\n }\n }\n\n // traceback\n const result: AlignmentPair[] = [];\n let i = defaultLength;\n let j = secondaryLength;\n while (i > 0 || j > 0) {\n if (i > 0 && j > 0 && traceMatrix[i][j] === 'diagonal') {\n const englishIndex = i - 1;\n const frenchIndex = j - 1;\n const similarityScore = computeJaccardSimilarity(\n defaultBlocks[englishIndex].anchorText,\n secondaryBlocks[frenchIndex].anchorText,\n 3\n );\n result.unshift({ englishIndex, frenchIndex, similarityScore });\n i -= 1;\n j -= 1;\n } else if (i > 0 && (j === 0 || traceMatrix[i][j] === 'up')) {\n result.unshift({\n englishIndex: i - 1,\n frenchIndex: null,\n similarityScore: 0,\n });\n i -= 1;\n } else if (j > 0 && (i === 0 || traceMatrix[i][j] === 'left')) {\n // french block has no corresponding english block (deleted)\n result.unshift({\n englishIndex: -1,\n frenchIndex: j - 1,\n similarityScore: 0,\n });\n j -= 1;\n }\n }\n return result;\n};\n"],"mappings":"mEAGA,MAAa,GACX,EACA,IACoB,CAEpB,IAAM,EAAgB,EAAc,OAC9B,EAAkB,EAAgB,OAElC,EAA0B,MAAM,KACpC,CAAE,OAAQ,EAAgB,EAAG,KACvB,MAAM,KAAK,CAAE,OAAQ,EAAkB,EAAG,KAAQ,EAAE,CAC3D,CACK,EAAgD,MAAM,KAC1D,CAAE,OAAQ,EAAgB,EAAG,KACvB,MAAM,KAAK,CAAE,OAAQ,EAAkB,EAAG,KAAQ,WAAW,CACpE,CAIK,GACJ,EACA,IACW,CACX,IAAM,EAAe,EAAc,GAC7B,EAAiB,EAAgB,GACjC,EAAY,EAAa,OAAS,EAAe,KAAO,EAAI,EAC5D,EAAmB,EACvB,EAAa,WACb,EAAe,WACf,EACD,CAKD,OAAO,GAHL,KAAK,IAAI,EAAa,QAAQ,OAAQ,EAAe,QAAQ,OAAO,CACpE,KAAK,IAAI,EAAa,QAAQ,OAAQ,EAAe,QAAQ,OAAO,CACpC,IAAO,EAAI,GACZ,EAAmB,GAItD,IAAK,IAAI,EAAI,EAAG,GAAK,EAAe,GAAK,EACvC,EAAY,GAAG,GAAK,EAAY,EAAI,GAAG,GAAK,GAC5C,EAAY,GAAG,GAAK,KAEtB,IAAK,IAAI,EAAI,EAAG,GAAK,EAAiB,GAAK,EACzC,EAAY,GAAG,GAAK,EAAY,GAAG,EAAI,GAAK,GAC5C,EAAY,GAAG,GAAK,OAItB,IAAK,IAAI,EAAI,EAAG,GAAK,EAAe,GAAK,EACvC,IAAK,IAAI,EAAI,EAAG,GAAK,EAAiB,GAAK,EAAG,CAC5C,IAAM,EAAQ,EAAY,EAAI,GAAG,EAAI,GAAK,EAAkB,EAAI,EAAG,EAAI,EAAE,CACnE,EAAY,EAAY,EAAI,GAAG,GAAK,GACpC,EAAY,EAAY,GAAG,EAAI,GAAK,GAEpC,EAAO,KAAK,IAAI,EAAO,EAAW,EAAU,CAClD,EAAY,GAAG,GAAK,EACpB,EAAY,GAAG,GACb,IAAS,EAAQ,WAAa,IAAS,EAAY,KAAO,OAKhE,IAAM,EAA0B,EAAE,CAC9B,EAAI,EACJ,EAAI,EACR,KAAO,EAAI,GAAK,EAAI,GAClB,GAAI,EAAI,GAAK,EAAI,GAAK,EAAY,GAAG,KAAO,WAAY,CACtD,IAAM,EAAe,EAAI,EACnB,EAAc,EAAI,EAClB,EAAkB,EACtB,EAAc,GAAc,WAC5B,EAAgB,GAAa,WAC7B,EACD,CACD,EAAO,QAAQ,CAAE,eAAc,cAAa,kBAAiB,CAAC,CAC9D,IACA,SACS,EAAI,IAAM,IAAM,GAAK,EAAY,GAAG,KAAO,OACpD,EAAO,QAAQ,CACb,aAAc,EAAI,EAClB,YAAa,KACb,gBAAiB,EAClB,CAAC,CACF,KACS,EAAI,IAAM,IAAM,GAAK,EAAY,GAAG,KAAO,UAEpD,EAAO,QAAQ,CACb,aAAc,GACd,YAAa,EAAI,EACjB,gBAAiB,EAClB,CAAC,CACF,KAGJ,OAAO"}
1
+ {"version":3,"file":"alignBlocks.mjs","names":[],"sources":["../../../src/translation-alignment/alignBlocks.ts"],"sourcesContent":["import { computeJaccardSimilarity } from './computeSimilarity';\nimport type { AlignmentPair, FingerprintedBlock } from './types';\n\nexport const alignEnglishAndFrenchBlocks = (\n defaultBlocks: FingerprintedBlock[],\n secondaryBlocks: FingerprintedBlock[]\n): AlignmentPair[] => {\n // Needleman–Wunsch style global alignment using anchor similarity and type equality\n const defaultLength = defaultBlocks.length;\n const secondaryLength = secondaryBlocks.length;\n\n const scoreMatrix: number[][] = Array.from(\n { length: defaultLength + 1 },\n () => Array.from({ length: secondaryLength + 1 }, () => 0)\n );\n const traceMatrix: ('diagonal' | 'up' | 'left')[][] = Array.from(\n { length: defaultLength + 1 },\n () => Array.from({ length: secondaryLength + 1 }, () => 'diagonal')\n );\n\n const gapPenalty = -2;\n\n const computeMatchScore = (\n defaultIndex: number,\n secondaryIndex: number\n ): number => {\n const defaultBlock = defaultBlocks[defaultIndex];\n const secondaryBlock = secondaryBlocks[secondaryIndex];\n const typeBonus = defaultBlock.type === secondaryBlock.type ? 2 : 0;\n const anchorSimilarity = computeJaccardSimilarity(\n defaultBlock.anchorText,\n secondaryBlock.anchorText,\n 3\n );\n const lengthRatio =\n Math.min(defaultBlock.content.length, secondaryBlock.content.length) /\n Math.max(defaultBlock.content.length, secondaryBlock.content.length);\n const lengthBonus = lengthRatio > 0.75 ? 1 : 0;\n return typeBonus + lengthBonus + anchorSimilarity * 8; // weighted toward anchor similarity\n };\n\n // initialize first row and column\n for (let i = 1; i <= defaultLength; i += 1) {\n scoreMatrix[i][0] = scoreMatrix[i - 1][0] + gapPenalty;\n traceMatrix[i][0] = 'up';\n }\n for (let j = 1; j <= secondaryLength; j += 1) {\n scoreMatrix[0][j] = scoreMatrix[0][j - 1] + gapPenalty;\n traceMatrix[0][j] = 'left';\n }\n\n // fill\n for (let i = 1; i <= defaultLength; i += 1) {\n for (let j = 1; j <= secondaryLength; j += 1) {\n const match = scoreMatrix[i - 1][j - 1] + computeMatchScore(i - 1, j - 1);\n const deleteGap = scoreMatrix[i - 1][j] + gapPenalty;\n const insertGap = scoreMatrix[i][j - 1] + gapPenalty;\n\n const best = Math.max(match, deleteGap, insertGap);\n scoreMatrix[i][j] = best;\n traceMatrix[i][j] =\n best === match ? 'diagonal' : best === deleteGap ? 'up' : 'left';\n }\n }\n\n // traceback\n const result: AlignmentPair[] = [];\n let i = defaultLength;\n let j = secondaryLength;\n while (i > 0 || j > 0) {\n if (i > 0 && j > 0 && traceMatrix[i][j] === 'diagonal') {\n const englishIndex = i - 1;\n const frenchIndex = j - 1;\n const similarityScore = computeJaccardSimilarity(\n defaultBlocks[englishIndex].anchorText,\n secondaryBlocks[frenchIndex].anchorText,\n 3\n );\n result.unshift({ englishIndex, frenchIndex, similarityScore });\n i -= 1;\n j -= 1;\n } else if (i > 0 && (j === 0 || traceMatrix[i][j] === 'up')) {\n result.unshift({\n englishIndex: i - 1,\n frenchIndex: null,\n similarityScore: 0,\n });\n i -= 1;\n } else if (j > 0 && (i === 0 || traceMatrix[i][j] === 'left')) {\n // french block has no corresponding english block (deleted)\n result.unshift({\n englishIndex: -1,\n frenchIndex: j - 1,\n similarityScore: 0,\n });\n j -= 1;\n }\n }\n return result;\n};\n"],"mappings":";;;AAGA,MAAa,+BACX,eACA,oBACoB;CAEpB,MAAM,gBAAgB,cAAc;CACpC,MAAM,kBAAkB,gBAAgB;CAExC,MAAM,cAA0B,MAAM,KACpC,EAAE,QAAQ,gBAAgB,GAAG,QACvB,MAAM,KAAK,EAAE,QAAQ,kBAAkB,GAAG,QAAQ,EAAE,CAC3D;CACD,MAAM,cAAgD,MAAM,KAC1D,EAAE,QAAQ,gBAAgB,GAAG,QACvB,MAAM,KAAK,EAAE,QAAQ,kBAAkB,GAAG,QAAQ,WAAW,CACpE;CAED,MAAM,aAAa;CAEnB,MAAM,qBACJ,cACA,mBACW;EACX,MAAM,eAAe,cAAc;EACnC,MAAM,iBAAiB,gBAAgB;EACvC,MAAM,YAAY,aAAa,SAAS,eAAe,OAAO,IAAI;EAClE,MAAM,mBAAmB,yBACvB,aAAa,YACb,eAAe,YACf,EACD;AAKD,SAAO,aAHL,KAAK,IAAI,aAAa,QAAQ,QAAQ,eAAe,QAAQ,OAAO,GACpE,KAAK,IAAI,aAAa,QAAQ,QAAQ,eAAe,QAAQ,OAAO,GACpC,MAAO,IAAI,KACZ,mBAAmB;;AAItD,MAAK,IAAI,IAAI,GAAG,KAAK,eAAe,KAAK,GAAG;AAC1C,cAAY,GAAG,KAAK,YAAY,IAAI,GAAG,KAAK;AAC5C,cAAY,GAAG,KAAK;;AAEtB,MAAK,IAAI,IAAI,GAAG,KAAK,iBAAiB,KAAK,GAAG;AAC5C,cAAY,GAAG,KAAK,YAAY,GAAG,IAAI,KAAK;AAC5C,cAAY,GAAG,KAAK;;AAItB,MAAK,IAAI,IAAI,GAAG,KAAK,eAAe,KAAK,EACvC,MAAK,IAAI,IAAI,GAAG,KAAK,iBAAiB,KAAK,GAAG;EAC5C,MAAM,QAAQ,YAAY,IAAI,GAAG,IAAI,KAAK,kBAAkB,IAAI,GAAG,IAAI,EAAE;EACzE,MAAM,YAAY,YAAY,IAAI,GAAG,KAAK;EAC1C,MAAM,YAAY,YAAY,GAAG,IAAI,KAAK;EAE1C,MAAM,OAAO,KAAK,IAAI,OAAO,WAAW,UAAU;AAClD,cAAY,GAAG,KAAK;AACpB,cAAY,GAAG,KACb,SAAS,QAAQ,aAAa,SAAS,YAAY,OAAO;;CAKhE,MAAM,SAA0B,EAAE;CAClC,IAAI,IAAI;CACR,IAAI,IAAI;AACR,QAAO,IAAI,KAAK,IAAI,EAClB,KAAI,IAAI,KAAK,IAAI,KAAK,YAAY,GAAG,OAAO,YAAY;EACtD,MAAM,eAAe,IAAI;EACzB,MAAM,cAAc,IAAI;EACxB,MAAM,kBAAkB,yBACtB,cAAc,cAAc,YAC5B,gBAAgB,aAAa,YAC7B,EACD;AACD,SAAO,QAAQ;GAAE;GAAc;GAAa;GAAiB,CAAC;AAC9D,OAAK;AACL,OAAK;YACI,IAAI,MAAM,MAAM,KAAK,YAAY,GAAG,OAAO,OAAO;AAC3D,SAAO,QAAQ;GACb,cAAc,IAAI;GAClB,aAAa;GACb,iBAAiB;GAClB,CAAC;AACF,OAAK;YACI,IAAI,MAAM,MAAM,KAAK,YAAY,GAAG,OAAO,SAAS;AAE7D,SAAO,QAAQ;GACb,cAAc;GACd,aAAa,IAAI;GACjB,iBAAiB;GAClB,CAAC;AACF,OAAK;;AAGT,QAAO"}
@@ -1,2 +1,23 @@
1
- const e=(e,t)=>{let n=e.replace(/\s+/g,` `).trim(),r=new Set;if(n.length<t)return n.length>0&&r.add(n),r;for(let e=0;e<=n.length-t;e+=1)r.add(n.slice(e,e+t));return r},t=(t,n,r=3)=>{let i=e(t,r),a=e(n,r);if(i.size===0&&a.size===0)return 1;let o=Array.from(i).filter(e=>a.has(e)).length,s=new Set([...Array.from(i),...Array.from(a)]).size;return s===0?0:o/s};export{t as computeJaccardSimilarity,e as generateCharacterShingles};
1
+ //#region src/translation-alignment/computeSimilarity.ts
2
+ const generateCharacterShingles = (text, shingleLength) => {
3
+ const normalized = text.replace(/\s+/g, " ").trim();
4
+ const set = /* @__PURE__ */ new Set();
5
+ if (normalized.length < shingleLength) {
6
+ if (normalized.length > 0) set.add(normalized);
7
+ return set;
8
+ }
9
+ for (let index = 0; index <= normalized.length - shingleLength; index += 1) set.add(normalized.slice(index, index + shingleLength));
10
+ return set;
11
+ };
12
+ const computeJaccardSimilarity = (a, b, shingleLength = 3) => {
13
+ const setA = generateCharacterShingles(a, shingleLength);
14
+ const setB = generateCharacterShingles(b, shingleLength);
15
+ if (setA.size === 0 && setB.size === 0) return 1;
16
+ const intersectionSize = Array.from(setA).filter((token) => setB.has(token)).length;
17
+ const unionSize = new Set([...Array.from(setA), ...Array.from(setB)]).size;
18
+ return unionSize === 0 ? 0 : intersectionSize / unionSize;
19
+ };
20
+
21
+ //#endregion
22
+ export { computeJaccardSimilarity, generateCharacterShingles };
2
23
  //# sourceMappingURL=computeSimilarity.mjs.map
@@ -1 +1 @@
1
- {"version":3,"file":"computeSimilarity.mjs","names":[],"sources":["../../../src/translation-alignment/computeSimilarity.ts"],"sourcesContent":["// Character shingle Jaccard similarity (language agnostic)\nexport const generateCharacterShingles = (\n text: string,\n shingleLength: number\n): Set<string> => {\n const normalized = text.replace(/\\s+/g, ' ').trim();\n const set = new Set<string>();\n if (normalized.length < shingleLength) {\n if (normalized.length > 0) {\n set.add(normalized);\n }\n return set;\n }\n for (let index = 0; index <= normalized.length - shingleLength; index += 1) {\n set.add(normalized.slice(index, index + shingleLength));\n }\n return set;\n};\n\nexport const computeJaccardSimilarity = (\n a: string,\n b: string,\n shingleLength: number = 3\n): number => {\n const setA = generateCharacterShingles(a, shingleLength);\n const setB = generateCharacterShingles(b, shingleLength);\n if (setA.size === 0 && setB.size === 0) return 1;\n const intersectionSize = Array.from(setA).filter((token) =>\n setB.has(token)\n ).length;\n const unionSize = new Set([...Array.from(setA), ...Array.from(setB)]).size;\n return unionSize === 0 ? 0 : intersectionSize / unionSize;\n};\n"],"mappings":"AACA,MAAa,GACX,EACA,IACgB,CAChB,IAAM,EAAa,EAAK,QAAQ,OAAQ,IAAI,CAAC,MAAM,CAC7C,EAAM,IAAI,IAChB,GAAI,EAAW,OAAS,EAItB,OAHI,EAAW,OAAS,GACtB,EAAI,IAAI,EAAW,CAEd,EAET,IAAK,IAAI,EAAQ,EAAG,GAAS,EAAW,OAAS,EAAe,GAAS,EACvE,EAAI,IAAI,EAAW,MAAM,EAAO,EAAQ,EAAc,CAAC,CAEzD,OAAO,GAGI,GACX,EACA,EACA,EAAwB,IACb,CACX,IAAM,EAAO,EAA0B,EAAG,EAAc,CAClD,EAAO,EAA0B,EAAG,EAAc,CACxD,GAAI,EAAK,OAAS,GAAK,EAAK,OAAS,EAAG,MAAO,GAC/C,IAAM,EAAmB,MAAM,KAAK,EAAK,CAAC,OAAQ,GAChD,EAAK,IAAI,EAAM,CAChB,CAAC,OACI,EAAY,IAAI,IAAI,CAAC,GAAG,MAAM,KAAK,EAAK,CAAE,GAAG,MAAM,KAAK,EAAK,CAAC,CAAC,CAAC,KACtE,OAAO,IAAc,EAAI,EAAI,EAAmB"}
1
+ {"version":3,"file":"computeSimilarity.mjs","names":[],"sources":["../../../src/translation-alignment/computeSimilarity.ts"],"sourcesContent":["// Character shingle Jaccard similarity (language agnostic)\nexport const generateCharacterShingles = (\n text: string,\n shingleLength: number\n): Set<string> => {\n const normalized = text.replace(/\\s+/g, ' ').trim();\n const set = new Set<string>();\n if (normalized.length < shingleLength) {\n if (normalized.length > 0) {\n set.add(normalized);\n }\n return set;\n }\n for (let index = 0; index <= normalized.length - shingleLength; index += 1) {\n set.add(normalized.slice(index, index + shingleLength));\n }\n return set;\n};\n\nexport const computeJaccardSimilarity = (\n a: string,\n b: string,\n shingleLength: number = 3\n): number => {\n const setA = generateCharacterShingles(a, shingleLength);\n const setB = generateCharacterShingles(b, shingleLength);\n if (setA.size === 0 && setB.size === 0) return 1;\n const intersectionSize = Array.from(setA).filter((token) =>\n setB.has(token)\n ).length;\n const unionSize = new Set([...Array.from(setA), ...Array.from(setB)]).size;\n return unionSize === 0 ? 0 : intersectionSize / unionSize;\n};\n"],"mappings":";AACA,MAAa,6BACX,MACA,kBACgB;CAChB,MAAM,aAAa,KAAK,QAAQ,QAAQ,IAAI,CAAC,MAAM;CACnD,MAAM,sBAAM,IAAI,KAAa;AAC7B,KAAI,WAAW,SAAS,eAAe;AACrC,MAAI,WAAW,SAAS,EACtB,KAAI,IAAI,WAAW;AAErB,SAAO;;AAET,MAAK,IAAI,QAAQ,GAAG,SAAS,WAAW,SAAS,eAAe,SAAS,EACvE,KAAI,IAAI,WAAW,MAAM,OAAO,QAAQ,cAAc,CAAC;AAEzD,QAAO;;AAGT,MAAa,4BACX,GACA,GACA,gBAAwB,MACb;CACX,MAAM,OAAO,0BAA0B,GAAG,cAAc;CACxD,MAAM,OAAO,0BAA0B,GAAG,cAAc;AACxD,KAAI,KAAK,SAAS,KAAK,KAAK,SAAS,EAAG,QAAO;CAC/C,MAAM,mBAAmB,MAAM,KAAK,KAAK,CAAC,QAAQ,UAChD,KAAK,IAAI,MAAM,CAChB,CAAC;CACF,MAAM,YAAY,IAAI,IAAI,CAAC,GAAG,MAAM,KAAK,KAAK,EAAE,GAAG,MAAM,KAAK,KAAK,CAAC,CAAC,CAAC;AACtE,QAAO,cAAc,IAAI,IAAI,mBAAmB"}
@@ -1,2 +1,21 @@
1
- import e from"node:crypto";const t=t=>e.createHash(`sha256`).update(t).digest(`hex`),n=(e,n,r)=>{let i=t(e.semanticText),a=t(e.anchorText),o=`${i}:${a}`,s=t(`${t(n?.semanticText??``)}:${t(r?.semanticText??``)}`);return{...e,semanticDigest:i,anchorDigest:a,compositeKey:o,contextKey:s}};export{n as fingerprintBlock};
1
+ import crypto from "node:crypto";
2
+
3
+ //#region src/translation-alignment/fingerprintBlock.ts
4
+ const computeStringDigest = (text) => crypto.createHash("sha256").update(text).digest("hex");
5
+ const fingerprintBlock = (block, previousBlock, nextBlock) => {
6
+ const semanticDigest = computeStringDigest(block.semanticText);
7
+ const anchorDigest = computeStringDigest(block.anchorText);
8
+ const compositeKey = `${semanticDigest}:${anchorDigest}`;
9
+ const contextKey = computeStringDigest(`${computeStringDigest(previousBlock?.semanticText ?? "")}:${computeStringDigest(nextBlock?.semanticText ?? "")}`);
10
+ return {
11
+ ...block,
12
+ semanticDigest,
13
+ anchorDigest,
14
+ compositeKey,
15
+ contextKey
16
+ };
17
+ };
18
+
19
+ //#endregion
20
+ export { fingerprintBlock };
2
21
  //# sourceMappingURL=fingerprintBlock.mjs.map
@@ -1 +1 @@
1
- {"version":3,"file":"fingerprintBlock.mjs","names":[],"sources":["../../../src/translation-alignment/fingerprintBlock.ts"],"sourcesContent":["import crypto from 'node:crypto';\nimport type { FingerprintedBlock, NormalizedBlock } from './types';\n\nconst computeStringDigest = (text: string): string =>\n crypto.createHash('sha256').update(text).digest('hex');\n\nexport const fingerprintBlock = (\n block: NormalizedBlock,\n previousBlock: NormalizedBlock | null,\n nextBlock: NormalizedBlock | null\n): FingerprintedBlock => {\n const semanticDigest = computeStringDigest(block.semanticText);\n const anchorDigest = computeStringDigest(block.anchorText);\n const compositeKey = `${semanticDigest}:${anchorDigest}`;\n\n const previousDigest = computeStringDigest(previousBlock?.semanticText ?? '');\n const nextDigest = computeStringDigest(nextBlock?.semanticText ?? '');\n const contextKey = computeStringDigest(`${previousDigest}:${nextDigest}`);\n\n return {\n ...block,\n semanticDigest,\n anchorDigest,\n compositeKey,\n contextKey,\n };\n};\n"],"mappings":"2BAGA,MAAM,EAAuB,GAC3B,EAAO,WAAW,SAAS,CAAC,OAAO,EAAK,CAAC,OAAO,MAAM,CAE3C,GACX,EACA,EACA,IACuB,CACvB,IAAM,EAAiB,EAAoB,EAAM,aAAa,CACxD,EAAe,EAAoB,EAAM,WAAW,CACpD,EAAe,GAAG,EAAe,GAAG,IAIpC,EAAa,EAAoB,GAFhB,EAAoB,GAAe,cAAgB,GAAG,CAEpB,GADtC,EAAoB,GAAW,cAAgB,GAAG,GACI,CAEzE,MAAO,CACL,GAAG,EACH,iBACA,eACA,eACA,aACD"}
1
+ {"version":3,"file":"fingerprintBlock.mjs","names":[],"sources":["../../../src/translation-alignment/fingerprintBlock.ts"],"sourcesContent":["import crypto from 'node:crypto';\nimport type { FingerprintedBlock, NormalizedBlock } from './types';\n\nconst computeStringDigest = (text: string): string =>\n crypto.createHash('sha256').update(text).digest('hex');\n\nexport const fingerprintBlock = (\n block: NormalizedBlock,\n previousBlock: NormalizedBlock | null,\n nextBlock: NormalizedBlock | null\n): FingerprintedBlock => {\n const semanticDigest = computeStringDigest(block.semanticText);\n const anchorDigest = computeStringDigest(block.anchorText);\n const compositeKey = `${semanticDigest}:${anchorDigest}`;\n\n const previousDigest = computeStringDigest(previousBlock?.semanticText ?? '');\n const nextDigest = computeStringDigest(nextBlock?.semanticText ?? '');\n const contextKey = computeStringDigest(`${previousDigest}:${nextDigest}`);\n\n return {\n ...block,\n semanticDigest,\n anchorDigest,\n compositeKey,\n contextKey,\n };\n};\n"],"mappings":";;;AAGA,MAAM,uBAAuB,SAC3B,OAAO,WAAW,SAAS,CAAC,OAAO,KAAK,CAAC,OAAO,MAAM;AAExD,MAAa,oBACX,OACA,eACA,cACuB;CACvB,MAAM,iBAAiB,oBAAoB,MAAM,aAAa;CAC9D,MAAM,eAAe,oBAAoB,MAAM,WAAW;CAC1D,MAAM,eAAe,GAAG,eAAe,GAAG;CAI1C,MAAM,aAAa,oBAAoB,GAFhB,oBAAoB,eAAe,gBAAgB,GAAG,CAEpB,GADtC,oBAAoB,WAAW,gBAAgB,GAAG,GACI;AAEzE,QAAO;EACL,GAAG;EACH;EACA;EACA;EACA;EACD"}
@@ -1 +1,11 @@
1
- import{computeJaccardSimilarity as e,generateCharacterShingles as t}from"./computeSimilarity.mjs";import{alignEnglishAndFrenchBlocks as n}from"./alignBlocks.mjs";import{fingerprintBlock as r}from"./fingerprintBlock.mjs";import{mapChangedLinesToBlocks as i}from"./mapChangedLinesToBlocks.mjs";import{normalizeBlock as a}from"./normalizeBlock.mjs";import{planAlignmentActions as o}from"./planActions.mjs";import{identifySegmentsToReview as s,mergeReviewedSegments as c}from"./rebuildDocument.mjs";import{segmentDocument as l}from"./segmentDocument.mjs";import{buildAlignmentPlan as u}from"./pipeline.mjs";export{n as alignEnglishAndFrenchBlocks,u as buildAlignmentPlan,e as computeJaccardSimilarity,r as fingerprintBlock,t as generateCharacterShingles,s as identifySegmentsToReview,i as mapChangedLinesToBlocks,c as mergeReviewedSegments,a as normalizeBlock,o as planAlignmentActions,l as segmentDocument};
1
+ import { computeJaccardSimilarity, generateCharacterShingles } from "./computeSimilarity.mjs";
2
+ import { alignEnglishAndFrenchBlocks } from "./alignBlocks.mjs";
3
+ import { fingerprintBlock } from "./fingerprintBlock.mjs";
4
+ import { mapChangedLinesToBlocks } from "./mapChangedLinesToBlocks.mjs";
5
+ import { normalizeBlock } from "./normalizeBlock.mjs";
6
+ import { planAlignmentActions } from "./planActions.mjs";
7
+ import { identifySegmentsToReview, mergeReviewedSegments } from "./rebuildDocument.mjs";
8
+ import { segmentDocument } from "./segmentDocument.mjs";
9
+ import { buildAlignmentPlan } from "./pipeline.mjs";
10
+
11
+ export { alignEnglishAndFrenchBlocks, buildAlignmentPlan, computeJaccardSimilarity, fingerprintBlock, generateCharacterShingles, identifySegmentsToReview, mapChangedLinesToBlocks, mergeReviewedSegments, normalizeBlock, planAlignmentActions, segmentDocument };
@@ -1,2 +1,17 @@
1
- const e=(e,t)=>{let n=new Set;if(!t||t.length===0)return n;let r=new Set(t);return e.forEach((e,t)=>{for(let i=e.lineStart;i<=e.lineEnd;i+=1)if(r.has(i)){n.add(t);break}}),n};export{e as mapChangedLinesToBlocks};
1
+ //#region src/translation-alignment/mapChangedLinesToBlocks.ts
2
+ const mapChangedLinesToBlocks = (blocks, changedLines) => {
3
+ const changedSet = /* @__PURE__ */ new Set();
4
+ if (!changedLines || changedLines.length === 0) return changedSet;
5
+ const changedLookup = new Set(changedLines);
6
+ blocks.forEach((block, index) => {
7
+ for (let line = block.lineStart; line <= block.lineEnd; line += 1) if (changedLookup.has(line)) {
8
+ changedSet.add(index);
9
+ break;
10
+ }
11
+ });
12
+ return changedSet;
13
+ };
14
+
15
+ //#endregion
16
+ export { mapChangedLinesToBlocks };
2
17
  //# sourceMappingURL=mapChangedLinesToBlocks.mjs.map
@@ -1 +1 @@
1
- {"version":3,"file":"mapChangedLinesToBlocks.mjs","names":[],"sources":["../../../src/translation-alignment/mapChangedLinesToBlocks.ts"],"sourcesContent":["import type { Block, LineChange } from './types';\n\nexport const mapChangedLinesToBlocks = (\n blocks: Block[],\n changedLines: LineChange[]\n): Set<number> => {\n const changedSet = new Set<number>();\n if (!changedLines || changedLines.length === 0) return changedSet;\n\n const changedLookup = new Set<number>(changedLines);\n\n blocks.forEach((block, index) => {\n for (let line = block.lineStart; line <= block.lineEnd; line += 1) {\n if (changedLookup.has(line)) {\n changedSet.add(index);\n break;\n }\n }\n });\n\n return changedSet;\n};\n"],"mappings":"AAEA,MAAa,GACX,EACA,IACgB,CAChB,IAAM,EAAa,IAAI,IACvB,GAAI,CAAC,GAAgB,EAAa,SAAW,EAAG,OAAO,EAEvD,IAAM,EAAgB,IAAI,IAAY,EAAa,CAWnD,OATA,EAAO,SAAS,EAAO,IAAU,CAC/B,IAAK,IAAI,EAAO,EAAM,UAAW,GAAQ,EAAM,QAAS,GAAQ,EAC9D,GAAI,EAAc,IAAI,EAAK,CAAE,CAC3B,EAAW,IAAI,EAAM,CACrB,QAGJ,CAEK"}
1
+ {"version":3,"file":"mapChangedLinesToBlocks.mjs","names":[],"sources":["../../../src/translation-alignment/mapChangedLinesToBlocks.ts"],"sourcesContent":["import type { Block, LineChange } from './types';\n\nexport const mapChangedLinesToBlocks = (\n blocks: Block[],\n changedLines: LineChange[]\n): Set<number> => {\n const changedSet = new Set<number>();\n if (!changedLines || changedLines.length === 0) return changedSet;\n\n const changedLookup = new Set<number>(changedLines);\n\n blocks.forEach((block, index) => {\n for (let line = block.lineStart; line <= block.lineEnd; line += 1) {\n if (changedLookup.has(line)) {\n changedSet.add(index);\n break;\n }\n }\n });\n\n return changedSet;\n};\n"],"mappings":";AAEA,MAAa,2BACX,QACA,iBACgB;CAChB,MAAM,6BAAa,IAAI,KAAa;AACpC,KAAI,CAAC,gBAAgB,aAAa,WAAW,EAAG,QAAO;CAEvD,MAAM,gBAAgB,IAAI,IAAY,aAAa;AAEnD,QAAO,SAAS,OAAO,UAAU;AAC/B,OAAK,IAAI,OAAO,MAAM,WAAW,QAAQ,MAAM,SAAS,QAAQ,EAC9D,KAAI,cAAc,IAAI,KAAK,EAAE;AAC3B,cAAW,IAAI,MAAM;AACrB;;GAGJ;AAEF,QAAO"}
@@ -1,2 +1,21 @@
1
- const e=e=>e.replace(/`{1,3}[^`]*`{1,3}/g,` `).replace(/\*\*([^*]+)\*\*/g,`$1`).replace(/\*([^*]+)\*/g,`$1`).replace(/_([^_]+)_/g,`$1`).replace(/~~([^~]+)~~/g,`$1`).replace(/!?\[[^\]]*\]\([^)]*\)/g,` `).replace(/^\s*#{1,6}\s+/gm,``).replace(/^\s*>\s?/gm,``).replace(/^\s*[-*+]\s+/gm,``).replace(/^\s*\d+\.\s+/gm,``),t=e=>e.replace(/\s+/g,` `).trim(),n=e=>e.replace(/\p{L}+/gu,``),r=r=>{let i=t(e(r.content).toLowerCase()),a=t(n(r.content));return{...r,semanticText:i,anchorText:a}};export{r as normalizeBlock};
1
+ //#region src/translation-alignment/normalizeBlock.ts
2
+ const removeMarkdownFormatting = (text) => {
3
+ return text.replace(/`{1,3}[^`]*`{1,3}/g, " ").replace(/\*\*([^*]+)\*\*/g, "$1").replace(/\*([^*]+)\*/g, "$1").replace(/_([^_]+)_/g, "$1").replace(/~~([^~]+)~~/g, "$1").replace(/!?\[[^\]]*\]\([^)]*\)/g, " ").replace(/^\s*#{1,6}\s+/gm, "").replace(/^\s*>\s?/gm, "").replace(/^\s*[-*+]\s+/gm, "").replace(/^\s*\d+\.\s+/gm, "");
4
+ };
5
+ const collapseWhitespace = (text) => text.replace(/\s+/g, " ").trim();
6
+ const stripLettersKeepDigitsAndSymbols = (text) => {
7
+ return text.replace(/\p{L}+/gu, "");
8
+ };
9
+ const normalizeBlock = (block) => {
10
+ const semanticCollapsed = collapseWhitespace(removeMarkdownFormatting(block.content).toLowerCase());
11
+ const anchorCollapsed = collapseWhitespace(stripLettersKeepDigitsAndSymbols(block.content));
12
+ return {
13
+ ...block,
14
+ semanticText: semanticCollapsed,
15
+ anchorText: anchorCollapsed
16
+ };
17
+ };
18
+
19
+ //#endregion
20
+ export { normalizeBlock };
2
21
  //# sourceMappingURL=normalizeBlock.mjs.map
@@ -1 +1 @@
1
- {"version":3,"file":"normalizeBlock.mjs","names":[],"sources":["../../../src/translation-alignment/normalizeBlock.ts"],"sourcesContent":["import type { Block, NormalizedBlock } from './types';\n\nconst removeMarkdownFormatting = (text: string): string => {\n return text\n .replace(/`{1,3}[^`]*`{1,3}/g, ' ')\n .replace(/\\*\\*([^*]+)\\*\\*/g, '$1')\n .replace(/\\*([^*]+)\\*/g, '$1')\n .replace(/_([^_]+)_/g, '$1')\n .replace(/~~([^~]+)~~/g, '$1')\n .replace(/!?\\[[^\\]]*\\]\\([^)]*\\)/g, ' ')\n .replace(/^\\s*#{1,6}\\s+/gm, '')\n .replace(/^\\s*>\\s?/gm, '')\n .replace(/^\\s*[-*+]\\s+/gm, '')\n .replace(/^\\s*\\d+\\.\\s+/gm, '');\n};\n\nconst collapseWhitespace = (text: string): string =>\n text.replace(/\\s+/g, ' ').trim();\n\nconst stripLettersKeepDigitsAndSymbols = (text: string): string => {\n // Keep digits and non-letter characters, remove all letters (including accents)\n return text.replace(/\\p{L}+/gu, '');\n};\n\nexport const normalizeBlock = (block: Block): NormalizedBlock => {\n const contentWithoutMarkdown = removeMarkdownFormatting(block.content);\n const semanticLowercased = contentWithoutMarkdown.toLowerCase();\n const semanticCollapsed = collapseWhitespace(semanticLowercased);\n\n const anchorOnlySymbols = stripLettersKeepDigitsAndSymbols(block.content);\n const anchorCollapsed = collapseWhitespace(anchorOnlySymbols);\n\n return {\n ...block,\n semanticText: semanticCollapsed,\n anchorText: anchorCollapsed,\n };\n};\n"],"mappings":"AAEA,MAAM,EAA4B,GACzB,EACJ,QAAQ,qBAAsB,IAAI,CAClC,QAAQ,mBAAoB,KAAK,CACjC,QAAQ,eAAgB,KAAK,CAC7B,QAAQ,aAAc,KAAK,CAC3B,QAAQ,eAAgB,KAAK,CAC7B,QAAQ,yBAA0B,IAAI,CACtC,QAAQ,kBAAmB,GAAG,CAC9B,QAAQ,aAAc,GAAG,CACzB,QAAQ,iBAAkB,GAAG,CAC7B,QAAQ,iBAAkB,GAAG,CAG5B,EAAsB,GAC1B,EAAK,QAAQ,OAAQ,IAAI,CAAC,MAAM,CAE5B,EAAoC,GAEjC,EAAK,QAAQ,WAAY,GAAG,CAGxB,EAAkB,GAAkC,CAG/D,IAAM,EAAoB,EAFK,EAAyB,EAAM,QAAQ,CACpB,aAAa,CACC,CAG1D,EAAkB,EADE,EAAiC,EAAM,QAAQ,CACZ,CAE7D,MAAO,CACL,GAAG,EACH,aAAc,EACd,WAAY,EACb"}
1
+ {"version":3,"file":"normalizeBlock.mjs","names":[],"sources":["../../../src/translation-alignment/normalizeBlock.ts"],"sourcesContent":["import type { Block, NormalizedBlock } from './types';\n\nconst removeMarkdownFormatting = (text: string): string => {\n return text\n .replace(/`{1,3}[^`]*`{1,3}/g, ' ')\n .replace(/\\*\\*([^*]+)\\*\\*/g, '$1')\n .replace(/\\*([^*]+)\\*/g, '$1')\n .replace(/_([^_]+)_/g, '$1')\n .replace(/~~([^~]+)~~/g, '$1')\n .replace(/!?\\[[^\\]]*\\]\\([^)]*\\)/g, ' ')\n .replace(/^\\s*#{1,6}\\s+/gm, '')\n .replace(/^\\s*>\\s?/gm, '')\n .replace(/^\\s*[-*+]\\s+/gm, '')\n .replace(/^\\s*\\d+\\.\\s+/gm, '');\n};\n\nconst collapseWhitespace = (text: string): string =>\n text.replace(/\\s+/g, ' ').trim();\n\nconst stripLettersKeepDigitsAndSymbols = (text: string): string => {\n // Keep digits and non-letter characters, remove all letters (including accents)\n return text.replace(/\\p{L}+/gu, '');\n};\n\nexport const normalizeBlock = (block: Block): NormalizedBlock => {\n const contentWithoutMarkdown = removeMarkdownFormatting(block.content);\n const semanticLowercased = contentWithoutMarkdown.toLowerCase();\n const semanticCollapsed = collapseWhitespace(semanticLowercased);\n\n const anchorOnlySymbols = stripLettersKeepDigitsAndSymbols(block.content);\n const anchorCollapsed = collapseWhitespace(anchorOnlySymbols);\n\n return {\n ...block,\n semanticText: semanticCollapsed,\n anchorText: anchorCollapsed,\n };\n};\n"],"mappings":";AAEA,MAAM,4BAA4B,SAAyB;AACzD,QAAO,KACJ,QAAQ,sBAAsB,IAAI,CAClC,QAAQ,oBAAoB,KAAK,CACjC,QAAQ,gBAAgB,KAAK,CAC7B,QAAQ,cAAc,KAAK,CAC3B,QAAQ,gBAAgB,KAAK,CAC7B,QAAQ,0BAA0B,IAAI,CACtC,QAAQ,mBAAmB,GAAG,CAC9B,QAAQ,cAAc,GAAG,CACzB,QAAQ,kBAAkB,GAAG,CAC7B,QAAQ,kBAAkB,GAAG;;AAGlC,MAAM,sBAAsB,SAC1B,KAAK,QAAQ,QAAQ,IAAI,CAAC,MAAM;AAElC,MAAM,oCAAoC,SAAyB;AAEjE,QAAO,KAAK,QAAQ,YAAY,GAAG;;AAGrC,MAAa,kBAAkB,UAAkC;CAG/D,MAAM,oBAAoB,mBAFK,yBAAyB,MAAM,QAAQ,CACpB,aAAa,CACC;CAGhE,MAAM,kBAAkB,mBADE,iCAAiC,MAAM,QAAQ,CACZ;AAE7D,QAAO;EACL,GAAG;EACH,cAAc;EACd,YAAY;EACb"}
@@ -1,2 +1,36 @@
1
- import{alignEnglishAndFrenchBlocks as e}from"./alignBlocks.mjs";import{fingerprintBlock as t}from"./fingerprintBlock.mjs";import{mapChangedLinesToBlocks as n}from"./mapChangedLinesToBlocks.mjs";import{normalizeBlock as r}from"./normalizeBlock.mjs";import{planAlignmentActions as i}from"./planActions.mjs";import{identifySegmentsToReview as a,mergeReviewedSegments as o}from"./rebuildDocument.mjs";import{segmentDocument as s}from"./segmentDocument.mjs";const c=({englishText:o,frenchText:c,changedLines:l,similarityOptions:u})=>{let d=s(o),f=s(c),p=d.map(r),m=f.map(r),h=p.map((e,n,r)=>t(e,r[n-1]??null,r[n+1]??null)),g=m.map((e,n,r)=>t(e,r[n-1]??null,r[n+1]??null)),_=i(e(h,g),n(h,Array.isArray(l)?l:[]),{minimumMatchForReuse:u?.minimumMatchForReuse??.9,minimumMatchForNearDuplicate:u?.minimumMatchForNearDuplicate??.8}),{segmentsToReview:v}=a({englishBlocks:h,frenchBlocks:g,plan:_});return{englishBlocks:h,frenchBlocks:g,plan:_,segmentsToReview:v}};export{c as buildAlignmentPlan,o as mergeReviewedSegments};
1
+ import { alignEnglishAndFrenchBlocks } from "./alignBlocks.mjs";
2
+ import { fingerprintBlock } from "./fingerprintBlock.mjs";
3
+ import { mapChangedLinesToBlocks } from "./mapChangedLinesToBlocks.mjs";
4
+ import { normalizeBlock } from "./normalizeBlock.mjs";
5
+ import { planAlignmentActions } from "./planActions.mjs";
6
+ import { identifySegmentsToReview, mergeReviewedSegments } from "./rebuildDocument.mjs";
7
+ import { segmentDocument } from "./segmentDocument.mjs";
8
+
9
+ //#region src/translation-alignment/pipeline.ts
10
+ const buildAlignmentPlan = ({ englishText, frenchText, changedLines, similarityOptions }) => {
11
+ const englishBlocksRaw = segmentDocument(englishText);
12
+ const frenchBlocksRaw = segmentDocument(frenchText);
13
+ const englishNormalized = englishBlocksRaw.map(normalizeBlock);
14
+ const frenchNormalized = frenchBlocksRaw.map(normalizeBlock);
15
+ const englishBlocks = englishNormalized.map((block, index, array) => fingerprintBlock(block, array[index - 1] ?? null, array[index + 1] ?? null));
16
+ const frenchBlocks = frenchNormalized.map((block, index, array) => fingerprintBlock(block, array[index - 1] ?? null, array[index + 1] ?? null));
17
+ const plan = planAlignmentActions(alignEnglishAndFrenchBlocks(englishBlocks, frenchBlocks), mapChangedLinesToBlocks(englishBlocks, Array.isArray(changedLines) ? changedLines : []), {
18
+ minimumMatchForReuse: similarityOptions?.minimumMatchForReuse ?? .9,
19
+ minimumMatchForNearDuplicate: similarityOptions?.minimumMatchForNearDuplicate ?? .8
20
+ });
21
+ const { segmentsToReview } = identifySegmentsToReview({
22
+ englishBlocks,
23
+ frenchBlocks,
24
+ plan
25
+ });
26
+ return {
27
+ englishBlocks,
28
+ frenchBlocks,
29
+ plan,
30
+ segmentsToReview
31
+ };
32
+ };
33
+
34
+ //#endregion
35
+ export { buildAlignmentPlan, mergeReviewedSegments };
2
36
  //# sourceMappingURL=pipeline.mjs.map
@@ -1 +1 @@
1
- {"version":3,"file":"pipeline.mjs","names":[],"sources":["../../../src/translation-alignment/pipeline.ts"],"sourcesContent":["import { alignEnglishAndFrenchBlocks } from './alignBlocks';\nimport { fingerprintBlock } from './fingerprintBlock';\nimport { mapChangedLinesToBlocks } from './mapChangedLinesToBlocks';\nimport { normalizeBlock } from './normalizeBlock';\nimport { planAlignmentActions } from './planActions';\nimport {\n identifySegmentsToReview,\n mergeReviewedSegments,\n type SegmentToReview,\n} from './rebuildDocument';\nimport { segmentDocument } from './segmentDocument';\nimport type {\n AlignmentPlan,\n FingerprintedBlock,\n SimilarityOptions,\n} from './types';\n\nexport type BuildAlignmentPlanInput = {\n englishText: string;\n frenchText: string;\n changedLines: number[] | undefined;\n similarityOptions?: Partial<SimilarityOptions>;\n};\n\nexport type BuildAlignmentPlanOutput = {\n englishBlocks: FingerprintedBlock[];\n frenchBlocks: FingerprintedBlock[];\n plan: AlignmentPlan;\n segmentsToReview: SegmentToReview[];\n};\n\nexport const buildAlignmentPlan = ({\n englishText,\n frenchText,\n changedLines,\n similarityOptions,\n}: BuildAlignmentPlanInput): BuildAlignmentPlanOutput => {\n const englishBlocksRaw = segmentDocument(englishText);\n const frenchBlocksRaw = segmentDocument(frenchText);\n\n const englishNormalized = englishBlocksRaw.map(normalizeBlock);\n const frenchNormalized = frenchBlocksRaw.map(normalizeBlock);\n\n const englishBlocks: FingerprintedBlock[] = englishNormalized.map(\n (block, index, array) =>\n fingerprintBlock(\n block,\n array[index - 1] ?? null,\n array[index + 1] ?? null\n )\n );\n const frenchBlocks: FingerprintedBlock[] = frenchNormalized.map(\n (block, index, array) =>\n fingerprintBlock(\n block,\n array[index - 1] ?? null,\n array[index + 1] ?? null\n )\n );\n\n const alignment = alignEnglishAndFrenchBlocks(englishBlocks, frenchBlocks);\n\n const changedIndexes = mapChangedLinesToBlocks(\n englishBlocks,\n Array.isArray(changedLines) ? changedLines : []\n );\n\n const plan = planAlignmentActions(alignment, changedIndexes, {\n minimumMatchForReuse: similarityOptions?.minimumMatchForReuse ?? 0.9,\n minimumMatchForNearDuplicate:\n similarityOptions?.minimumMatchForNearDuplicate ?? 0.8,\n });\n\n const { segmentsToReview } = identifySegmentsToReview({\n englishBlocks,\n frenchBlocks,\n plan,\n });\n\n return { englishBlocks, frenchBlocks, plan, segmentsToReview };\n};\n\nexport { mergeReviewedSegments };\nexport type { SegmentToReview };\n"],"mappings":"qcA+BA,MAAa,GAAsB,CACjC,cACA,aACA,eACA,uBACuD,CACvD,IAAM,EAAmB,EAAgB,EAAY,CAC/C,EAAkB,EAAgB,EAAW,CAE7C,EAAoB,EAAiB,IAAI,EAAe,CACxD,EAAmB,EAAgB,IAAI,EAAe,CAEtD,EAAsC,EAAkB,KAC3D,EAAO,EAAO,IACb,EACE,EACA,EAAM,EAAQ,IAAM,KACpB,EAAM,EAAQ,IAAM,KACrB,CACJ,CACK,EAAqC,EAAiB,KACzD,EAAO,EAAO,IACb,EACE,EACA,EAAM,EAAQ,IAAM,KACpB,EAAM,EAAQ,IAAM,KACrB,CACJ,CASK,EAAO,EAPK,EAA4B,EAAe,EAAa,CAEnD,EACrB,EACA,MAAM,QAAQ,EAAa,CAAG,EAAe,EAAE,CAChD,CAE4D,CAC3D,qBAAsB,GAAmB,sBAAwB,GACjE,6BACE,GAAmB,8BAAgC,GACtD,CAAC,CAEI,CAAE,oBAAqB,EAAyB,CACpD,gBACA,eACA,OACD,CAAC,CAEF,MAAO,CAAE,gBAAe,eAAc,OAAM,mBAAkB"}
1
+ {"version":3,"file":"pipeline.mjs","names":[],"sources":["../../../src/translation-alignment/pipeline.ts"],"sourcesContent":["import { alignEnglishAndFrenchBlocks } from './alignBlocks';\nimport { fingerprintBlock } from './fingerprintBlock';\nimport { mapChangedLinesToBlocks } from './mapChangedLinesToBlocks';\nimport { normalizeBlock } from './normalizeBlock';\nimport { planAlignmentActions } from './planActions';\nimport {\n identifySegmentsToReview,\n mergeReviewedSegments,\n type SegmentToReview,\n} from './rebuildDocument';\nimport { segmentDocument } from './segmentDocument';\nimport type {\n AlignmentPlan,\n FingerprintedBlock,\n SimilarityOptions,\n} from './types';\n\nexport type BuildAlignmentPlanInput = {\n englishText: string;\n frenchText: string;\n changedLines: number[] | undefined;\n similarityOptions?: Partial<SimilarityOptions>;\n};\n\nexport type BuildAlignmentPlanOutput = {\n englishBlocks: FingerprintedBlock[];\n frenchBlocks: FingerprintedBlock[];\n plan: AlignmentPlan;\n segmentsToReview: SegmentToReview[];\n};\n\nexport const buildAlignmentPlan = ({\n englishText,\n frenchText,\n changedLines,\n similarityOptions,\n}: BuildAlignmentPlanInput): BuildAlignmentPlanOutput => {\n const englishBlocksRaw = segmentDocument(englishText);\n const frenchBlocksRaw = segmentDocument(frenchText);\n\n const englishNormalized = englishBlocksRaw.map(normalizeBlock);\n const frenchNormalized = frenchBlocksRaw.map(normalizeBlock);\n\n const englishBlocks: FingerprintedBlock[] = englishNormalized.map(\n (block, index, array) =>\n fingerprintBlock(\n block,\n array[index - 1] ?? null,\n array[index + 1] ?? null\n )\n );\n const frenchBlocks: FingerprintedBlock[] = frenchNormalized.map(\n (block, index, array) =>\n fingerprintBlock(\n block,\n array[index - 1] ?? null,\n array[index + 1] ?? null\n )\n );\n\n const alignment = alignEnglishAndFrenchBlocks(englishBlocks, frenchBlocks);\n\n const changedIndexes = mapChangedLinesToBlocks(\n englishBlocks,\n Array.isArray(changedLines) ? changedLines : []\n );\n\n const plan = planAlignmentActions(alignment, changedIndexes, {\n minimumMatchForReuse: similarityOptions?.minimumMatchForReuse ?? 0.9,\n minimumMatchForNearDuplicate:\n similarityOptions?.minimumMatchForNearDuplicate ?? 0.8,\n });\n\n const { segmentsToReview } = identifySegmentsToReview({\n englishBlocks,\n frenchBlocks,\n plan,\n });\n\n return { englishBlocks, frenchBlocks, plan, segmentsToReview };\n};\n\nexport { mergeReviewedSegments };\nexport type { SegmentToReview };\n"],"mappings":";;;;;;;;;AA+BA,MAAa,sBAAsB,EACjC,aACA,YACA,cACA,wBACuD;CACvD,MAAM,mBAAmB,gBAAgB,YAAY;CACrD,MAAM,kBAAkB,gBAAgB,WAAW;CAEnD,MAAM,oBAAoB,iBAAiB,IAAI,eAAe;CAC9D,MAAM,mBAAmB,gBAAgB,IAAI,eAAe;CAE5D,MAAM,gBAAsC,kBAAkB,KAC3D,OAAO,OAAO,UACb,iBACE,OACA,MAAM,QAAQ,MAAM,MACpB,MAAM,QAAQ,MAAM,KACrB,CACJ;CACD,MAAM,eAAqC,iBAAiB,KACzD,OAAO,OAAO,UACb,iBACE,OACA,MAAM,QAAQ,MAAM,MACpB,MAAM,QAAQ,MAAM,KACrB,CACJ;CASD,MAAM,OAAO,qBAPK,4BAA4B,eAAe,aAAa,EAEnD,wBACrB,eACA,MAAM,QAAQ,aAAa,GAAG,eAAe,EAAE,CAChD,EAE4D;EAC3D,sBAAsB,mBAAmB,wBAAwB;EACjE,8BACE,mBAAmB,gCAAgC;EACtD,CAAC;CAEF,MAAM,EAAE,qBAAqB,yBAAyB;EACpD;EACA;EACA;EACD,CAAC;AAEF,QAAO;EAAE;EAAe;EAAc;EAAM;EAAkB"}
@@ -1,2 +1,45 @@
1
- const e=(e,t)=>{let n=[],r=new Set;return e.forEach(e=>{let i=e.englishIndex,a=e.frenchIndex;if(i===-1&&a!==null){r.has(a)||(n.push({kind:`delete`,frenchIndex:a}),r.add(a));return}if(i>=0&&a===null){n.push({kind:`insert_new`,englishIndex:i});return}if(i>=0&&a!==null){t.has(i)?n.push({kind:`review`,englishIndex:i,frenchIndex:a}):n.push({kind:`reuse`,englishIndex:i,frenchIndex:a}),r.add(a);return}}),{actions:n}};export{e as planAlignmentActions};
1
+ //#region src/translation-alignment/planActions.ts
2
+ const planAlignmentActions = (alignment, changedEnglishBlockIndexes) => {
3
+ const actions = [];
4
+ const seenFrench = /* @__PURE__ */ new Set();
5
+ alignment.forEach((pair) => {
6
+ const englishIndex = pair.englishIndex;
7
+ const frenchIndex = pair.frenchIndex;
8
+ if (englishIndex === -1 && frenchIndex !== null) {
9
+ if (!seenFrench.has(frenchIndex)) {
10
+ actions.push({
11
+ kind: "delete",
12
+ frenchIndex
13
+ });
14
+ seenFrench.add(frenchIndex);
15
+ }
16
+ return;
17
+ }
18
+ if (englishIndex >= 0 && frenchIndex === null) {
19
+ actions.push({
20
+ kind: "insert_new",
21
+ englishIndex
22
+ });
23
+ return;
24
+ }
25
+ if (englishIndex >= 0 && frenchIndex !== null) {
26
+ if (!changedEnglishBlockIndexes.has(englishIndex)) actions.push({
27
+ kind: "reuse",
28
+ englishIndex,
29
+ frenchIndex
30
+ });
31
+ else actions.push({
32
+ kind: "review",
33
+ englishIndex,
34
+ frenchIndex
35
+ });
36
+ seenFrench.add(frenchIndex);
37
+ return;
38
+ }
39
+ });
40
+ return { actions };
41
+ };
42
+
43
+ //#endregion
44
+ export { planAlignmentActions };
2
45
  //# sourceMappingURL=planActions.mjs.map
@@ -1 +1 @@
1
- {"version":3,"file":"planActions.mjs","names":[],"sources":["../../../src/translation-alignment/planActions.ts"],"sourcesContent":["import type { AlignmentPair, AlignmentPlan, PlannedAction } from './types';\n\nexport const planAlignmentActions = (\n alignment: AlignmentPair[],\n changedEnglishBlockIndexes: Set<number>\n): AlignmentPlan => {\n const actions: PlannedAction[] = [];\n const seenFrench = new Set<number>();\n\n alignment.forEach((pair) => {\n const englishIndex = pair.englishIndex;\n const frenchIndex = pair.frenchIndex;\n\n // Case 1: Deletion (Exists in FR, not in EN)\n if (englishIndex === -1 && frenchIndex !== null) {\n if (!seenFrench.has(frenchIndex)) {\n actions.push({ kind: 'delete', frenchIndex });\n seenFrench.add(frenchIndex);\n }\n return;\n }\n\n // Case 2: New Insertion (Exists in EN, not in FR)\n if (englishIndex >= 0 && frenchIndex === null) {\n actions.push({ kind: 'insert_new', englishIndex });\n return;\n }\n\n // Case 3: Alignment (Exists in both)\n if (englishIndex >= 0 && frenchIndex !== null) {\n const isChanged = changedEnglishBlockIndexes.has(englishIndex);\n\n // If the block is NOT marked as changed by Git, we REUSE it.\n // We assume the existing translation is correct because the source hasn't been touched.\n // We ignore 'similarityScore' here because EN vs UK text will always have low similarity.\n if (!isChanged) {\n actions.push({ kind: 'reuse', englishIndex, frenchIndex });\n } else {\n // If the block IS changed, we normally Review.\n // OPTIONAL: You could add a check here for 'similarityScore > 0.99'\n // to detect whitespace-only changes, but generally, if Git says changed, we Review.\n actions.push({ kind: 'review', englishIndex, frenchIndex });\n }\n\n seenFrench.add(frenchIndex);\n return;\n }\n });\n\n return { actions };\n};\n"],"mappings":"AAEA,MAAa,GACX,EACA,IACkB,CAClB,IAAM,EAA2B,EAAE,CAC7B,EAAa,IAAI,IA0CvB,OAxCA,EAAU,QAAS,GAAS,CAC1B,IAAM,EAAe,EAAK,aACpB,EAAc,EAAK,YAGzB,GAAI,IAAiB,IAAM,IAAgB,KAAM,CAC1C,EAAW,IAAI,EAAY,GAC9B,EAAQ,KAAK,CAAE,KAAM,SAAU,cAAa,CAAC,CAC7C,EAAW,IAAI,EAAY,EAE7B,OAIF,GAAI,GAAgB,GAAK,IAAgB,KAAM,CAC7C,EAAQ,KAAK,CAAE,KAAM,aAAc,eAAc,CAAC,CAClD,OAIF,GAAI,GAAgB,GAAK,IAAgB,KAAM,CAC3B,EAA2B,IAAI,EAAa,CAW5D,EAAQ,KAAK,CAAE,KAAM,SAAU,eAAc,cAAa,CAAC,CAL3D,EAAQ,KAAK,CAAE,KAAM,QAAS,eAAc,cAAa,CAAC,CAQ5D,EAAW,IAAI,EAAY,CAC3B,SAEF,CAEK,CAAE,UAAS"}
1
+ {"version":3,"file":"planActions.mjs","names":[],"sources":["../../../src/translation-alignment/planActions.ts"],"sourcesContent":["import type { AlignmentPair, AlignmentPlan, PlannedAction } from './types';\n\nexport const planAlignmentActions = (\n alignment: AlignmentPair[],\n changedEnglishBlockIndexes: Set<number>\n): AlignmentPlan => {\n const actions: PlannedAction[] = [];\n const seenFrench = new Set<number>();\n\n alignment.forEach((pair) => {\n const englishIndex = pair.englishIndex;\n const frenchIndex = pair.frenchIndex;\n\n // Case 1: Deletion (Exists in FR, not in EN)\n if (englishIndex === -1 && frenchIndex !== null) {\n if (!seenFrench.has(frenchIndex)) {\n actions.push({ kind: 'delete', frenchIndex });\n seenFrench.add(frenchIndex);\n }\n return;\n }\n\n // Case 2: New Insertion (Exists in EN, not in FR)\n if (englishIndex >= 0 && frenchIndex === null) {\n actions.push({ kind: 'insert_new', englishIndex });\n return;\n }\n\n // Case 3: Alignment (Exists in both)\n if (englishIndex >= 0 && frenchIndex !== null) {\n const isChanged = changedEnglishBlockIndexes.has(englishIndex);\n\n // If the block is NOT marked as changed by Git, we REUSE it.\n // We assume the existing translation is correct because the source hasn't been touched.\n // We ignore 'similarityScore' here because EN vs UK text will always have low similarity.\n if (!isChanged) {\n actions.push({ kind: 'reuse', englishIndex, frenchIndex });\n } else {\n // If the block IS changed, we normally Review.\n // OPTIONAL: You could add a check here for 'similarityScore > 0.99'\n // to detect whitespace-only changes, but generally, if Git says changed, we Review.\n actions.push({ kind: 'review', englishIndex, frenchIndex });\n }\n\n seenFrench.add(frenchIndex);\n return;\n }\n });\n\n return { actions };\n};\n"],"mappings":";AAEA,MAAa,wBACX,WACA,+BACkB;CAClB,MAAM,UAA2B,EAAE;CACnC,MAAM,6BAAa,IAAI,KAAa;AAEpC,WAAU,SAAS,SAAS;EAC1B,MAAM,eAAe,KAAK;EAC1B,MAAM,cAAc,KAAK;AAGzB,MAAI,iBAAiB,MAAM,gBAAgB,MAAM;AAC/C,OAAI,CAAC,WAAW,IAAI,YAAY,EAAE;AAChC,YAAQ,KAAK;KAAE,MAAM;KAAU;KAAa,CAAC;AAC7C,eAAW,IAAI,YAAY;;AAE7B;;AAIF,MAAI,gBAAgB,KAAK,gBAAgB,MAAM;AAC7C,WAAQ,KAAK;IAAE,MAAM;IAAc;IAAc,CAAC;AAClD;;AAIF,MAAI,gBAAgB,KAAK,gBAAgB,MAAM;AAM7C,OAAI,CALc,2BAA2B,IAAI,aAAa,CAM5D,SAAQ,KAAK;IAAE,MAAM;IAAS;IAAc;IAAa,CAAC;OAK1D,SAAQ,KAAK;IAAE,MAAM;IAAU;IAAc;IAAa,CAAC;AAG7D,cAAW,IAAI,YAAY;AAC3B;;GAEF;AAEF,QAAO,EAAE,SAAS"}
@@ -1,3 +1,47 @@
1
- const e=({englishBlocks:e,frenchBlocks:t,plan:n})=>{let r=[];return n.actions.forEach((n,i)=>{if(n.kind===`review`){let a=e[n.englishIndex],o=n.frenchIndex===null?null:t[n.frenchIndex].content;r.push({englishBlock:a,frenchBlockText:o,actionIndex:i})}else if(n.kind===`insert_new`){let t=e[n.englishIndex];r.push({englishBlock:t,frenchBlockText:null,actionIndex:i})}}),{segmentsToReview:r}},t=(e,t,n)=>{let r=[];return e.actions.forEach((e,i)=>{if(e.kind===`reuse`)r.push(t[e.frenchIndex].content);else if(e.kind===`review`||e.kind===`insert_new`){let a=n.get(i);a===void 0?e.kind===`review`&&e.frenchIndex!==null?r.push(t[e.frenchIndex].content):r.push(`
2
- `):r.push(a)}}),r.join(``)};export{e as identifySegmentsToReview,t as mergeReviewedSegments};
1
+ //#region src/translation-alignment/rebuildDocument.ts
2
+ /**
3
+ * Analyzes the alignment plan and returns only the segments that need review/translation.
4
+ * Does not generate output text - that's done by mergeReviewedSegments after translation.
5
+ */
6
+ const identifySegmentsToReview = ({ englishBlocks, frenchBlocks, plan }) => {
7
+ const segmentsToReview = [];
8
+ plan.actions.forEach((action, actionIndex) => {
9
+ if (action.kind === "review") {
10
+ const englishBlock = englishBlocks[action.englishIndex];
11
+ const frenchBlockText = action.frenchIndex !== null ? frenchBlocks[action.frenchIndex].content : null;
12
+ segmentsToReview.push({
13
+ englishBlock,
14
+ frenchBlockText,
15
+ actionIndex
16
+ });
17
+ } else if (action.kind === "insert_new") {
18
+ const englishBlock = englishBlocks[action.englishIndex];
19
+ segmentsToReview.push({
20
+ englishBlock,
21
+ frenchBlockText: null,
22
+ actionIndex
23
+ });
24
+ }
25
+ });
26
+ return { segmentsToReview };
27
+ };
28
+ /**
29
+ * Merges reviewed translations back into the final document following the alignment plan.
30
+ */
31
+ const mergeReviewedSegments = (plan, frenchBlocks, reviewedSegments) => {
32
+ const outputParts = [];
33
+ plan.actions.forEach((action, actionIndex) => {
34
+ if (action.kind === "reuse") outputParts.push(frenchBlocks[action.frenchIndex].content);
35
+ else if (action.kind === "review" || action.kind === "insert_new") {
36
+ const reviewedContent = reviewedSegments.get(actionIndex);
37
+ if (reviewedContent !== void 0) outputParts.push(reviewedContent);
38
+ else if (action.kind === "review" && action.frenchIndex !== null) outputParts.push(frenchBlocks[action.frenchIndex].content);
39
+ else outputParts.push("\n");
40
+ }
41
+ });
42
+ return outputParts.join("");
43
+ };
44
+
45
+ //#endregion
46
+ export { identifySegmentsToReview, mergeReviewedSegments };
3
47
  //# sourceMappingURL=rebuildDocument.mjs.map
@@ -1 +1 @@
1
- {"version":3,"file":"rebuildDocument.mjs","names":[],"sources":["../../../src/translation-alignment/rebuildDocument.ts"],"sourcesContent":["import type { AlignmentPlan, FingerprintedBlock } from './types';\n\nexport type SegmentToReview = {\n englishBlock: FingerprintedBlock;\n frenchBlockText: string | null;\n actionIndex: number;\n};\n\nexport type RebuildInput = {\n englishBlocks: FingerprintedBlock[];\n frenchBlocks: FingerprintedBlock[];\n plan: AlignmentPlan;\n};\n\nexport type RebuildResult = {\n segmentsToReview: SegmentToReview[];\n};\n\n/**\n * Analyzes the alignment plan and returns only the segments that need review/translation.\n * Does not generate output text - that's done by mergeReviewedSegments after translation.\n */\nexport const identifySegmentsToReview = ({\n englishBlocks,\n frenchBlocks,\n plan,\n}: RebuildInput): RebuildResult => {\n const segmentsToReview: SegmentToReview[] = [];\n\n plan.actions.forEach((action, actionIndex) => {\n if (action.kind === 'review') {\n const englishBlock = englishBlocks[action.englishIndex];\n const frenchBlockText =\n action.frenchIndex !== null\n ? frenchBlocks[action.frenchIndex].content\n : null;\n\n segmentsToReview.push({ englishBlock, frenchBlockText, actionIndex });\n } else if (action.kind === 'insert_new') {\n const englishBlock = englishBlocks[action.englishIndex];\n\n segmentsToReview.push({\n englishBlock,\n frenchBlockText: null,\n actionIndex,\n });\n }\n });\n\n return { segmentsToReview };\n};\n\n/**\n * Merges reviewed translations back into the final document following the alignment plan.\n */\nexport const mergeReviewedSegments = (\n plan: AlignmentPlan,\n frenchBlocks: FingerprintedBlock[],\n reviewedSegments: Map<number, string>\n): string => {\n const outputParts: string[] = [];\n\n plan.actions.forEach((action, actionIndex) => {\n if (action.kind === 'reuse') {\n outputParts.push(frenchBlocks[action.frenchIndex].content);\n } else if (action.kind === 'review' || action.kind === 'insert_new') {\n const reviewedContent = reviewedSegments.get(actionIndex);\n\n if (reviewedContent !== undefined) {\n outputParts.push(reviewedContent);\n } else {\n // Fallback: if review failed, use existing or blank\n if (action.kind === 'review' && action.frenchIndex !== null) {\n outputParts.push(frenchBlocks[action.frenchIndex].content);\n } else {\n outputParts.push('\\n');\n }\n }\n }\n // \"delete\" actions are simply skipped - no output\n });\n\n return outputParts.join('');\n};\n"],"mappings":"AAsBA,MAAa,GAA4B,CACvC,gBACA,eACA,UACiC,CACjC,IAAM,EAAsC,EAAE,CAsB9C,OApBA,EAAK,QAAQ,SAAS,EAAQ,IAAgB,CAC5C,GAAI,EAAO,OAAS,SAAU,CAC5B,IAAM,EAAe,EAAc,EAAO,cACpC,EACJ,EAAO,cAAgB,KAEnB,KADA,EAAa,EAAO,aAAa,QAGvC,EAAiB,KAAK,CAAE,eAAc,kBAAiB,cAAa,CAAC,SAC5D,EAAO,OAAS,aAAc,CACvC,IAAM,EAAe,EAAc,EAAO,cAE1C,EAAiB,KAAK,CACpB,eACA,gBAAiB,KACjB,cACD,CAAC,GAEJ,CAEK,CAAE,mBAAkB,EAMhB,GACX,EACA,EACA,IACW,CACX,IAAM,EAAwB,EAAE,CAsBhC,OApBA,EAAK,QAAQ,SAAS,EAAQ,IAAgB,CAC5C,GAAI,EAAO,OAAS,QAClB,EAAY,KAAK,EAAa,EAAO,aAAa,QAAQ,SACjD,EAAO,OAAS,UAAY,EAAO,OAAS,aAAc,CACnE,IAAM,EAAkB,EAAiB,IAAI,EAAY,CAErD,IAAoB,IAAA,GAIlB,EAAO,OAAS,UAAY,EAAO,cAAgB,KACrD,EAAY,KAAK,EAAa,EAAO,aAAa,QAAQ,CAE1D,EAAY,KAAK;EAAK,CANxB,EAAY,KAAK,EAAgB,GAWrC,CAEK,EAAY,KAAK,GAAG"}
1
+ {"version":3,"file":"rebuildDocument.mjs","names":[],"sources":["../../../src/translation-alignment/rebuildDocument.ts"],"sourcesContent":["import type { AlignmentPlan, FingerprintedBlock } from './types';\n\nexport type SegmentToReview = {\n englishBlock: FingerprintedBlock;\n frenchBlockText: string | null;\n actionIndex: number;\n};\n\nexport type RebuildInput = {\n englishBlocks: FingerprintedBlock[];\n frenchBlocks: FingerprintedBlock[];\n plan: AlignmentPlan;\n};\n\nexport type RebuildResult = {\n segmentsToReview: SegmentToReview[];\n};\n\n/**\n * Analyzes the alignment plan and returns only the segments that need review/translation.\n * Does not generate output text - that's done by mergeReviewedSegments after translation.\n */\nexport const identifySegmentsToReview = ({\n englishBlocks,\n frenchBlocks,\n plan,\n}: RebuildInput): RebuildResult => {\n const segmentsToReview: SegmentToReview[] = [];\n\n plan.actions.forEach((action, actionIndex) => {\n if (action.kind === 'review') {\n const englishBlock = englishBlocks[action.englishIndex];\n const frenchBlockText =\n action.frenchIndex !== null\n ? frenchBlocks[action.frenchIndex].content\n : null;\n\n segmentsToReview.push({ englishBlock, frenchBlockText, actionIndex });\n } else if (action.kind === 'insert_new') {\n const englishBlock = englishBlocks[action.englishIndex];\n\n segmentsToReview.push({\n englishBlock,\n frenchBlockText: null,\n actionIndex,\n });\n }\n });\n\n return { segmentsToReview };\n};\n\n/**\n * Merges reviewed translations back into the final document following the alignment plan.\n */\nexport const mergeReviewedSegments = (\n plan: AlignmentPlan,\n frenchBlocks: FingerprintedBlock[],\n reviewedSegments: Map<number, string>\n): string => {\n const outputParts: string[] = [];\n\n plan.actions.forEach((action, actionIndex) => {\n if (action.kind === 'reuse') {\n outputParts.push(frenchBlocks[action.frenchIndex].content);\n } else if (action.kind === 'review' || action.kind === 'insert_new') {\n const reviewedContent = reviewedSegments.get(actionIndex);\n\n if (reviewedContent !== undefined) {\n outputParts.push(reviewedContent);\n } else {\n // Fallback: if review failed, use existing or blank\n if (action.kind === 'review' && action.frenchIndex !== null) {\n outputParts.push(frenchBlocks[action.frenchIndex].content);\n } else {\n outputParts.push('\\n');\n }\n }\n }\n // \"delete\" actions are simply skipped - no output\n });\n\n return outputParts.join('');\n};\n"],"mappings":";;;;;AAsBA,MAAa,4BAA4B,EACvC,eACA,cACA,WACiC;CACjC,MAAM,mBAAsC,EAAE;AAE9C,MAAK,QAAQ,SAAS,QAAQ,gBAAgB;AAC5C,MAAI,OAAO,SAAS,UAAU;GAC5B,MAAM,eAAe,cAAc,OAAO;GAC1C,MAAM,kBACJ,OAAO,gBAAgB,OACnB,aAAa,OAAO,aAAa,UACjC;AAEN,oBAAiB,KAAK;IAAE;IAAc;IAAiB;IAAa,CAAC;aAC5D,OAAO,SAAS,cAAc;GACvC,MAAM,eAAe,cAAc,OAAO;AAE1C,oBAAiB,KAAK;IACpB;IACA,iBAAiB;IACjB;IACD,CAAC;;GAEJ;AAEF,QAAO,EAAE,kBAAkB;;;;;AAM7B,MAAa,yBACX,MACA,cACA,qBACW;CACX,MAAM,cAAwB,EAAE;AAEhC,MAAK,QAAQ,SAAS,QAAQ,gBAAgB;AAC5C,MAAI,OAAO,SAAS,QAClB,aAAY,KAAK,aAAa,OAAO,aAAa,QAAQ;WACjD,OAAO,SAAS,YAAY,OAAO,SAAS,cAAc;GACnE,MAAM,kBAAkB,iBAAiB,IAAI,YAAY;AAEzD,OAAI,oBAAoB,OACtB,aAAY,KAAK,gBAAgB;YAG7B,OAAO,SAAS,YAAY,OAAO,gBAAgB,KACrD,aAAY,KAAK,aAAa,OAAO,aAAa,QAAQ;OAE1D,aAAY,KAAK,KAAK;;GAK5B;AAEF,QAAO,YAAY,KAAK,GAAG"}
@@ -1,6 +1,65 @@
1
- const e=e=>e.trim().length===0,t=e=>/^\s*```/.test(e),n=e=>/^\s*#{1,6}\s+/.test(e),r=e=>/^\s*---\s*$/.test(e),i=e=>e.replace(/\n+$/g,`
2
- `),a=a=>{let o=a.split(`
3
- `),s=[],c=0,l=!1,u=[],d=1,f=e=>{if(u.length>0){let t=u.join(`
4
- `);t.trim().length>0&&s.push({type:`paragraph`,content:`${i(t)}\n`,lineStart:d,lineEnd:e}),u=[]}};for(;c<o.length;){let a=o[c];if(s.length===0&&r(a)){let e=c+1,t=[a];for(c++;c<o.length&&!r(o[c]);)t.push(o[c]),c++;c<o.length&&r(o[c])&&(t.push(o[c]),c++),s.push({type:`paragraph`,content:`${i(t.join(`
5
- `))}\n`,lineStart:e,lineEnd:c});continue}t(a)&&(l=!l),!l&&n(a)?(u.length>0&&f(c),d=c+1,u=[a]):(u.length===0&&!e(a)&&(d=c+1),u.push(a)),c++}return f(c),s};export{a as segmentDocument};
1
+ //#region src/translation-alignment/segmentDocument.ts
2
+ const isBlankLine = (line) => line.trim().length === 0;
3
+ const isFencedCodeDelimiter = (line) => /^\s*```/.test(line);
4
+ const isHeading = (line) => /^\s*#{1,6}\s+/.test(line);
5
+ const isFrontmatterDelimiter = (line) => /^\s*---\s*$/.test(line);
6
+ const trimTrailingNewlines = (text) => text.replace(/\n+$/g, "\n");
7
+ const segmentDocument = (text) => {
8
+ const lines = text.split("\n");
9
+ const blocks = [];
10
+ let index = 0;
11
+ let insideCodeBlock = false;
12
+ let currentSectionLines = [];
13
+ let currentSectionStartLine = 1;
14
+ const flushCurrentSection = (endIndex) => {
15
+ if (currentSectionLines.length > 0) {
16
+ const rawContent = currentSectionLines.join("\n");
17
+ if (rawContent.trim().length > 0) blocks.push({
18
+ type: "paragraph",
19
+ content: `${trimTrailingNewlines(rawContent)}\n`,
20
+ lineStart: currentSectionStartLine,
21
+ lineEnd: endIndex
22
+ });
23
+ currentSectionLines = [];
24
+ }
25
+ };
26
+ while (index < lines.length) {
27
+ const currentLine = lines[index];
28
+ if (blocks.length === 0 && isFrontmatterDelimiter(currentLine)) {
29
+ const startLine = index + 1;
30
+ const contentLines = [currentLine];
31
+ index++;
32
+ while (index < lines.length && !isFrontmatterDelimiter(lines[index])) {
33
+ contentLines.push(lines[index]);
34
+ index++;
35
+ }
36
+ if (index < lines.length && isFrontmatterDelimiter(lines[index])) {
37
+ contentLines.push(lines[index]);
38
+ index++;
39
+ }
40
+ blocks.push({
41
+ type: "paragraph",
42
+ content: `${trimTrailingNewlines(contentLines.join("\n"))}\n`,
43
+ lineStart: startLine,
44
+ lineEnd: index
45
+ });
46
+ continue;
47
+ }
48
+ if (isFencedCodeDelimiter(currentLine)) insideCodeBlock = !insideCodeBlock;
49
+ if (!insideCodeBlock && isHeading(currentLine)) {
50
+ if (currentSectionLines.length > 0) flushCurrentSection(index);
51
+ currentSectionStartLine = index + 1;
52
+ currentSectionLines = [currentLine];
53
+ } else {
54
+ if (currentSectionLines.length === 0 && !isBlankLine(currentLine)) currentSectionStartLine = index + 1;
55
+ currentSectionLines.push(currentLine);
56
+ }
57
+ index++;
58
+ }
59
+ flushCurrentSection(index);
60
+ return blocks;
61
+ };
62
+
63
+ //#endregion
64
+ export { segmentDocument };
6
65
  //# sourceMappingURL=segmentDocument.mjs.map
@@ -1 +1 @@
1
- {"version":3,"file":"segmentDocument.mjs","names":[],"sources":["../../../src/translation-alignment/segmentDocument.ts"],"sourcesContent":["import type { Block } from './types';\n\nconst isBlankLine = (line: string): boolean => line.trim().length === 0;\nconst isFencedCodeDelimiter = (line: string): boolean => /^\\s*```/.test(line);\nconst isHeading = (line: string): boolean => /^\\s*#{1,6}\\s+/.test(line);\nconst isFrontmatterDelimiter = (line: string): boolean =>\n /^\\s*---\\s*$/.test(line);\nconst trimTrailingNewlines = (text: string): string =>\n text.replace(/\\n+$/g, '\\n');\n\nexport const segmentDocument = (text: string): Block[] => {\n const lines = text.split('\\n');\n const blocks: Block[] = [];\n\n let index = 0;\n let insideCodeBlock = false;\n\n // Buffers\n let currentSectionLines: string[] = [];\n let currentSectionStartLine = 1;\n\n const flushCurrentSection = (endIndex: number) => {\n if (currentSectionLines.length > 0) {\n // Filter out leading blank lines from the block content to keep it clean,\n // but strictly speaking, we just want to ensure non-empty content.\n const rawContent = currentSectionLines.join('\\n');\n\n if (rawContent.trim().length > 0) {\n blocks.push({\n type: 'paragraph', // Generic type\n content: `${trimTrailingNewlines(rawContent)}\\n`,\n lineStart: currentSectionStartLine,\n lineEnd: endIndex,\n });\n }\n currentSectionLines = [];\n }\n };\n\n while (index < lines.length) {\n const currentLine = lines[index];\n\n // 1. Handle Frontmatter (Must be at start of file)\n if (blocks.length === 0 && isFrontmatterDelimiter(currentLine)) {\n const startLine = index + 1;\n const contentLines: string[] = [currentLine];\n index++;\n\n while (index < lines.length && !isFrontmatterDelimiter(lines[index])) {\n contentLines.push(lines[index]);\n index++;\n }\n\n if (index < lines.length && isFrontmatterDelimiter(lines[index])) {\n contentLines.push(lines[index]);\n index++;\n }\n\n blocks.push({\n type: 'paragraph',\n content: `${trimTrailingNewlines(contentLines.join('\\n'))}\\n`,\n lineStart: startLine,\n lineEnd: index,\n });\n continue;\n }\n\n // 2. Track Code Blocks (Headers inside code blocks are ignored)\n if (isFencedCodeDelimiter(currentLine)) {\n insideCodeBlock = !insideCodeBlock;\n }\n\n const isHeader = !insideCodeBlock && isHeading(currentLine);\n\n // 3. Split on Headers\n if (isHeader) {\n // If we have accumulated content, flush it as the previous block\n if (currentSectionLines.length > 0) {\n flushCurrentSection(index);\n }\n // Start a new section with this header\n currentSectionStartLine = index + 1;\n currentSectionLines = [currentLine];\n } else {\n // Accumulate content\n if (currentSectionLines.length === 0 && !isBlankLine(currentLine)) {\n currentSectionStartLine = index + 1;\n }\n currentSectionLines.push(currentLine);\n }\n\n index++;\n }\n\n // Flush remaining content\n flushCurrentSection(index);\n\n return blocks;\n};\n"],"mappings":"AAEA,MAAM,EAAe,GAA0B,EAAK,MAAM,CAAC,SAAW,EAChE,EAAyB,GAA0B,UAAU,KAAK,EAAK,CACvE,EAAa,GAA0B,gBAAgB,KAAK,EAAK,CACjE,EAA0B,GAC9B,cAAc,KAAK,EAAK,CACpB,EAAwB,GAC5B,EAAK,QAAQ,QAAS;EAAK,CAEhB,EAAmB,GAA0B,CACxD,IAAM,EAAQ,EAAK,MAAM;EAAK,CACxB,EAAkB,EAAE,CAEtB,EAAQ,EACR,EAAkB,GAGlB,EAAgC,EAAE,CAClC,EAA0B,EAExB,EAAuB,GAAqB,CAChD,GAAI,EAAoB,OAAS,EAAG,CAGlC,IAAM,EAAa,EAAoB,KAAK;EAAK,CAE7C,EAAW,MAAM,CAAC,OAAS,GAC7B,EAAO,KAAK,CACV,KAAM,YACN,QAAS,GAAG,EAAqB,EAAW,CAAC,IAC7C,UAAW,EACX,QAAS,EACV,CAAC,CAEJ,EAAsB,EAAE,GAI5B,KAAO,EAAQ,EAAM,QAAQ,CAC3B,IAAM,EAAc,EAAM,GAG1B,GAAI,EAAO,SAAW,GAAK,EAAuB,EAAY,CAAE,CAC9D,IAAM,EAAY,EAAQ,EACpB,EAAyB,CAAC,EAAY,CAG5C,IAFA,IAEO,EAAQ,EAAM,QAAU,CAAC,EAAuB,EAAM,GAAO,EAClE,EAAa,KAAK,EAAM,GAAO,CAC/B,IAGE,EAAQ,EAAM,QAAU,EAAuB,EAAM,GAAO,GAC9D,EAAa,KAAK,EAAM,GAAO,CAC/B,KAGF,EAAO,KAAK,CACV,KAAM,YACN,QAAS,GAAG,EAAqB,EAAa,KAAK;EAAK,CAAC,CAAC,IAC1D,UAAW,EACX,QAAS,EACV,CAAC,CACF,SAIE,EAAsB,EAAY,GACpC,EAAkB,CAAC,GAGJ,CAAC,GAAmB,EAAU,EAAY,EAKrD,EAAoB,OAAS,GAC/B,EAAoB,EAAM,CAG5B,EAA0B,EAAQ,EAClC,EAAsB,CAAC,EAAY,GAG/B,EAAoB,SAAW,GAAK,CAAC,EAAY,EAAY,GAC/D,EAA0B,EAAQ,GAEpC,EAAoB,KAAK,EAAY,EAGvC,IAMF,OAFA,EAAoB,EAAM,CAEnB"}
1
+ {"version":3,"file":"segmentDocument.mjs","names":[],"sources":["../../../src/translation-alignment/segmentDocument.ts"],"sourcesContent":["import type { Block } from './types';\n\nconst isBlankLine = (line: string): boolean => line.trim().length === 0;\nconst isFencedCodeDelimiter = (line: string): boolean => /^\\s*```/.test(line);\nconst isHeading = (line: string): boolean => /^\\s*#{1,6}\\s+/.test(line);\nconst isFrontmatterDelimiter = (line: string): boolean =>\n /^\\s*---\\s*$/.test(line);\nconst trimTrailingNewlines = (text: string): string =>\n text.replace(/\\n+$/g, '\\n');\n\nexport const segmentDocument = (text: string): Block[] => {\n const lines = text.split('\\n');\n const blocks: Block[] = [];\n\n let index = 0;\n let insideCodeBlock = false;\n\n // Buffers\n let currentSectionLines: string[] = [];\n let currentSectionStartLine = 1;\n\n const flushCurrentSection = (endIndex: number) => {\n if (currentSectionLines.length > 0) {\n // Filter out leading blank lines from the block content to keep it clean,\n // but strictly speaking, we just want to ensure non-empty content.\n const rawContent = currentSectionLines.join('\\n');\n\n if (rawContent.trim().length > 0) {\n blocks.push({\n type: 'paragraph', // Generic type\n content: `${trimTrailingNewlines(rawContent)}\\n`,\n lineStart: currentSectionStartLine,\n lineEnd: endIndex,\n });\n }\n currentSectionLines = [];\n }\n };\n\n while (index < lines.length) {\n const currentLine = lines[index];\n\n // 1. Handle Frontmatter (Must be at start of file)\n if (blocks.length === 0 && isFrontmatterDelimiter(currentLine)) {\n const startLine = index + 1;\n const contentLines: string[] = [currentLine];\n index++;\n\n while (index < lines.length && !isFrontmatterDelimiter(lines[index])) {\n contentLines.push(lines[index]);\n index++;\n }\n\n if (index < lines.length && isFrontmatterDelimiter(lines[index])) {\n contentLines.push(lines[index]);\n index++;\n }\n\n blocks.push({\n type: 'paragraph',\n content: `${trimTrailingNewlines(contentLines.join('\\n'))}\\n`,\n lineStart: startLine,\n lineEnd: index,\n });\n continue;\n }\n\n // 2. Track Code Blocks (Headers inside code blocks are ignored)\n if (isFencedCodeDelimiter(currentLine)) {\n insideCodeBlock = !insideCodeBlock;\n }\n\n const isHeader = !insideCodeBlock && isHeading(currentLine);\n\n // 3. Split on Headers\n if (isHeader) {\n // If we have accumulated content, flush it as the previous block\n if (currentSectionLines.length > 0) {\n flushCurrentSection(index);\n }\n // Start a new section with this header\n currentSectionStartLine = index + 1;\n currentSectionLines = [currentLine];\n } else {\n // Accumulate content\n if (currentSectionLines.length === 0 && !isBlankLine(currentLine)) {\n currentSectionStartLine = index + 1;\n }\n currentSectionLines.push(currentLine);\n }\n\n index++;\n }\n\n // Flush remaining content\n flushCurrentSection(index);\n\n return blocks;\n};\n"],"mappings":";AAEA,MAAM,eAAe,SAA0B,KAAK,MAAM,CAAC,WAAW;AACtE,MAAM,yBAAyB,SAA0B,UAAU,KAAK,KAAK;AAC7E,MAAM,aAAa,SAA0B,gBAAgB,KAAK,KAAK;AACvE,MAAM,0BAA0B,SAC9B,cAAc,KAAK,KAAK;AAC1B,MAAM,wBAAwB,SAC5B,KAAK,QAAQ,SAAS,KAAK;AAE7B,MAAa,mBAAmB,SAA0B;CACxD,MAAM,QAAQ,KAAK,MAAM,KAAK;CAC9B,MAAM,SAAkB,EAAE;CAE1B,IAAI,QAAQ;CACZ,IAAI,kBAAkB;CAGtB,IAAI,sBAAgC,EAAE;CACtC,IAAI,0BAA0B;CAE9B,MAAM,uBAAuB,aAAqB;AAChD,MAAI,oBAAoB,SAAS,GAAG;GAGlC,MAAM,aAAa,oBAAoB,KAAK,KAAK;AAEjD,OAAI,WAAW,MAAM,CAAC,SAAS,EAC7B,QAAO,KAAK;IACV,MAAM;IACN,SAAS,GAAG,qBAAqB,WAAW,CAAC;IAC7C,WAAW;IACX,SAAS;IACV,CAAC;AAEJ,yBAAsB,EAAE;;;AAI5B,QAAO,QAAQ,MAAM,QAAQ;EAC3B,MAAM,cAAc,MAAM;AAG1B,MAAI,OAAO,WAAW,KAAK,uBAAuB,YAAY,EAAE;GAC9D,MAAM,YAAY,QAAQ;GAC1B,MAAM,eAAyB,CAAC,YAAY;AAC5C;AAEA,UAAO,QAAQ,MAAM,UAAU,CAAC,uBAAuB,MAAM,OAAO,EAAE;AACpE,iBAAa,KAAK,MAAM,OAAO;AAC/B;;AAGF,OAAI,QAAQ,MAAM,UAAU,uBAAuB,MAAM,OAAO,EAAE;AAChE,iBAAa,KAAK,MAAM,OAAO;AAC/B;;AAGF,UAAO,KAAK;IACV,MAAM;IACN,SAAS,GAAG,qBAAqB,aAAa,KAAK,KAAK,CAAC,CAAC;IAC1D,WAAW;IACX,SAAS;IACV,CAAC;AACF;;AAIF,MAAI,sBAAsB,YAAY,CACpC,mBAAkB,CAAC;AAMrB,MAHiB,CAAC,mBAAmB,UAAU,YAAY,EAG7C;AAEZ,OAAI,oBAAoB,SAAS,EAC/B,qBAAoB,MAAM;AAG5B,6BAA0B,QAAQ;AAClC,yBAAsB,CAAC,YAAY;SAC9B;AAEL,OAAI,oBAAoB,WAAW,KAAK,CAAC,YAAY,YAAY,CAC/D,2BAA0B,QAAQ;AAEpC,uBAAoB,KAAK,YAAY;;AAGvC;;AAIF,qBAAoB,MAAM;AAE1B,QAAO"}