@lokascript/semantic 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (435) hide show
  1. package/LICENSE +21 -0
  2. package/README.md +686 -0
  3. package/dist/browser-ar.ar.global.js +2 -0
  4. package/dist/browser-core.core.global.js +2 -0
  5. package/dist/browser-de.de.global.js +2 -0
  6. package/dist/browser-east-asian.east-asian.global.js +2 -0
  7. package/dist/browser-en-tr.en-tr.global.js +2 -0
  8. package/dist/browser-en.en.global.js +2 -0
  9. package/dist/browser-es-en.es-en.global.js +2 -0
  10. package/dist/browser-es.es.global.js +2 -0
  11. package/dist/browser-fr.fr.global.js +2 -0
  12. package/dist/browser-id.id.global.js +2 -0
  13. package/dist/browser-ja.ja.global.js +2 -0
  14. package/dist/browser-ko.ko.global.js +2 -0
  15. package/dist/browser-lazy.lazy.global.js +2 -0
  16. package/dist/browser-priority.priority.global.js +2 -0
  17. package/dist/browser-pt.pt.global.js +2 -0
  18. package/dist/browser-qu.qu.global.js +2 -0
  19. package/dist/browser-sw.sw.global.js +2 -0
  20. package/dist/browser-tr.tr.global.js +2 -0
  21. package/dist/browser-western.western.global.js +2 -0
  22. package/dist/browser-zh.zh.global.js +2 -0
  23. package/dist/browser.global.js +3 -0
  24. package/dist/browser.global.js.map +1 -0
  25. package/dist/index.cjs +35051 -0
  26. package/dist/index.cjs.map +1 -0
  27. package/dist/index.d.cts +3426 -0
  28. package/dist/index.d.ts +3426 -0
  29. package/dist/index.js +34890 -0
  30. package/dist/index.js.map +1 -0
  31. package/dist/languages/ar.d.ts +78 -0
  32. package/dist/languages/ar.js +1622 -0
  33. package/dist/languages/ar.js.map +1 -0
  34. package/dist/languages/de.d.ts +38 -0
  35. package/dist/languages/de.js +1168 -0
  36. package/dist/languages/de.js.map +1 -0
  37. package/dist/languages/en.d.ts +44 -0
  38. package/dist/languages/en.js +3491 -0
  39. package/dist/languages/en.js.map +1 -0
  40. package/dist/languages/es.d.ts +52 -0
  41. package/dist/languages/es.js +1493 -0
  42. package/dist/languages/es.js.map +1 -0
  43. package/dist/languages/fr.d.ts +37 -0
  44. package/dist/languages/fr.js +1159 -0
  45. package/dist/languages/fr.js.map +1 -0
  46. package/dist/languages/id.d.ts +35 -0
  47. package/dist/languages/id.js +1152 -0
  48. package/dist/languages/id.js.map +1 -0
  49. package/dist/languages/ja.d.ts +53 -0
  50. package/dist/languages/ja.js +1430 -0
  51. package/dist/languages/ja.js.map +1 -0
  52. package/dist/languages/ko.d.ts +51 -0
  53. package/dist/languages/ko.js +1729 -0
  54. package/dist/languages/ko.js.map +1 -0
  55. package/dist/languages/pt.d.ts +37 -0
  56. package/dist/languages/pt.js +1127 -0
  57. package/dist/languages/pt.js.map +1 -0
  58. package/dist/languages/qu.d.ts +36 -0
  59. package/dist/languages/qu.js +1143 -0
  60. package/dist/languages/qu.js.map +1 -0
  61. package/dist/languages/sw.d.ts +35 -0
  62. package/dist/languages/sw.js +1147 -0
  63. package/dist/languages/sw.js.map +1 -0
  64. package/dist/languages/tr.d.ts +45 -0
  65. package/dist/languages/tr.js +1529 -0
  66. package/dist/languages/tr.js.map +1 -0
  67. package/dist/languages/zh.d.ts +58 -0
  68. package/dist/languages/zh.js +1257 -0
  69. package/dist/languages/zh.js.map +1 -0
  70. package/dist/types-C4dcj53L.d.ts +600 -0
  71. package/package.json +202 -0
  72. package/src/__test-utils__/index.ts +7 -0
  73. package/src/__test-utils__/test-helpers.ts +8 -0
  74. package/src/__types__/test-helpers.ts +122 -0
  75. package/src/analysis/index.ts +479 -0
  76. package/src/ast-builder/command-mappers.ts +1133 -0
  77. package/src/ast-builder/expression-parser/index.ts +41 -0
  78. package/src/ast-builder/expression-parser/parser.ts +563 -0
  79. package/src/ast-builder/expression-parser/tokenizer.ts +394 -0
  80. package/src/ast-builder/expression-parser/types.ts +208 -0
  81. package/src/ast-builder/index.ts +536 -0
  82. package/src/ast-builder/value-converters.ts +172 -0
  83. package/src/bridge.ts +275 -0
  84. package/src/browser-ar.ts +162 -0
  85. package/src/browser-core.ts +231 -0
  86. package/src/browser-de.ts +162 -0
  87. package/src/browser-east-asian.ts +173 -0
  88. package/src/browser-en-tr.ts +165 -0
  89. package/src/browser-en.ts +157 -0
  90. package/src/browser-es-en.ts +200 -0
  91. package/src/browser-es.ts +170 -0
  92. package/src/browser-fr.ts +162 -0
  93. package/src/browser-id.ts +162 -0
  94. package/src/browser-ja.ts +162 -0
  95. package/src/browser-ko.ts +162 -0
  96. package/src/browser-lazy.ts +189 -0
  97. package/src/browser-priority.ts +214 -0
  98. package/src/browser-pt.ts +162 -0
  99. package/src/browser-qu.ts +162 -0
  100. package/src/browser-sw.ts +162 -0
  101. package/src/browser-tr.ts +162 -0
  102. package/src/browser-western.ts +181 -0
  103. package/src/browser-zh.ts +162 -0
  104. package/src/browser.ts +268 -0
  105. package/src/cache/index.ts +14 -0
  106. package/src/cache/semantic-cache.ts +344 -0
  107. package/src/core-bridge.ts +372 -0
  108. package/src/explicit/converter.ts +258 -0
  109. package/src/explicit/index.ts +18 -0
  110. package/src/explicit/parser.ts +236 -0
  111. package/src/explicit/renderer.ts +424 -0
  112. package/src/generators/command-schemas.ts +1636 -0
  113. package/src/generators/event-handler-generator.ts +109 -0
  114. package/src/generators/index.ts +117 -0
  115. package/src/generators/language-profiles.ts +139 -0
  116. package/src/generators/pattern-generator.ts +537 -0
  117. package/src/generators/profiles/arabic.ts +131 -0
  118. package/src/generators/profiles/bengali.ts +132 -0
  119. package/src/generators/profiles/chinese.ts +124 -0
  120. package/src/generators/profiles/english.ts +113 -0
  121. package/src/generators/profiles/french.ts +125 -0
  122. package/src/generators/profiles/german.ts +126 -0
  123. package/src/generators/profiles/hindi.ts +146 -0
  124. package/src/generators/profiles/index.ts +46 -0
  125. package/src/generators/profiles/indonesian.ts +125 -0
  126. package/src/generators/profiles/italian.ts +139 -0
  127. package/src/generators/profiles/japanese.ts +149 -0
  128. package/src/generators/profiles/korean.ts +127 -0
  129. package/src/generators/profiles/marker-templates.ts +288 -0
  130. package/src/generators/profiles/ms.ts +130 -0
  131. package/src/generators/profiles/polish.ts +249 -0
  132. package/src/generators/profiles/portuguese.ts +115 -0
  133. package/src/generators/profiles/quechua.ts +113 -0
  134. package/src/generators/profiles/russian.ts +260 -0
  135. package/src/generators/profiles/spanish.ts +130 -0
  136. package/src/generators/profiles/swahili.ts +129 -0
  137. package/src/generators/profiles/thai.ts +132 -0
  138. package/src/generators/profiles/tl.ts +128 -0
  139. package/src/generators/profiles/turkish.ts +124 -0
  140. package/src/generators/profiles/types.ts +165 -0
  141. package/src/generators/profiles/ukrainian.ts +270 -0
  142. package/src/generators/profiles/vietnamese.ts +133 -0
  143. package/src/generators/schema-error-codes.ts +160 -0
  144. package/src/generators/schema-validator.ts +391 -0
  145. package/src/index.ts +429 -0
  146. package/src/language-building-schema.ts +3170 -0
  147. package/src/language-loader.ts +394 -0
  148. package/src/languages/_all.ts +65 -0
  149. package/src/languages/ar.ts +15 -0
  150. package/src/languages/bn.ts +16 -0
  151. package/src/languages/de.ts +15 -0
  152. package/src/languages/en.ts +29 -0
  153. package/src/languages/es.ts +15 -0
  154. package/src/languages/fr.ts +15 -0
  155. package/src/languages/hi.ts +26 -0
  156. package/src/languages/id.ts +15 -0
  157. package/src/languages/index.ts +18 -0
  158. package/src/languages/it.ts +15 -0
  159. package/src/languages/ja.ts +15 -0
  160. package/src/languages/ko.ts +15 -0
  161. package/src/languages/ms.ts +16 -0
  162. package/src/languages/pl.ts +18 -0
  163. package/src/languages/pt.ts +15 -0
  164. package/src/languages/qu.ts +15 -0
  165. package/src/languages/ru.ts +26 -0
  166. package/src/languages/sw.ts +15 -0
  167. package/src/languages/th.ts +16 -0
  168. package/src/languages/tl.ts +16 -0
  169. package/src/languages/tr.ts +15 -0
  170. package/src/languages/uk.ts +26 -0
  171. package/src/languages/vi.ts +16 -0
  172. package/src/languages/zh.ts +15 -0
  173. package/src/parser/index.ts +15 -0
  174. package/src/parser/pattern-matcher.ts +1181 -0
  175. package/src/parser/semantic-parser.ts +573 -0
  176. package/src/parser/utils/index.ts +35 -0
  177. package/src/parser/utils/marker-resolution.ts +111 -0
  178. package/src/parser/utils/possessive-keywords.ts +43 -0
  179. package/src/parser/utils/role-positioning.ts +70 -0
  180. package/src/parser/utils/type-validation.ts +134 -0
  181. package/src/patterns/add/ar.ts +71 -0
  182. package/src/patterns/add/bn.ts +70 -0
  183. package/src/patterns/add/hi.ts +69 -0
  184. package/src/patterns/add/index.ts +87 -0
  185. package/src/patterns/add/it.ts +61 -0
  186. package/src/patterns/add/ja.ts +93 -0
  187. package/src/patterns/add/ko.ts +74 -0
  188. package/src/patterns/add/ms.ts +30 -0
  189. package/src/patterns/add/pl.ts +62 -0
  190. package/src/patterns/add/ru.ts +62 -0
  191. package/src/patterns/add/th.ts +49 -0
  192. package/src/patterns/add/tl.ts +30 -0
  193. package/src/patterns/add/tr.ts +71 -0
  194. package/src/patterns/add/uk.ts +62 -0
  195. package/src/patterns/add/vi.ts +61 -0
  196. package/src/patterns/add/zh.ts +71 -0
  197. package/src/patterns/builders.ts +207 -0
  198. package/src/patterns/decrement/bn.ts +70 -0
  199. package/src/patterns/decrement/de.ts +42 -0
  200. package/src/patterns/decrement/hi.ts +68 -0
  201. package/src/patterns/decrement/index.ts +79 -0
  202. package/src/patterns/decrement/it.ts +69 -0
  203. package/src/patterns/decrement/ms.ts +30 -0
  204. package/src/patterns/decrement/pl.ts +58 -0
  205. package/src/patterns/decrement/ru.ts +58 -0
  206. package/src/patterns/decrement/th.ts +49 -0
  207. package/src/patterns/decrement/tl.ts +30 -0
  208. package/src/patterns/decrement/tr.ts +48 -0
  209. package/src/patterns/decrement/uk.ts +58 -0
  210. package/src/patterns/decrement/vi.ts +61 -0
  211. package/src/patterns/decrement/zh.ts +32 -0
  212. package/src/patterns/en.ts +302 -0
  213. package/src/patterns/event-handler/ar.ts +151 -0
  214. package/src/patterns/event-handler/bn.ts +72 -0
  215. package/src/patterns/event-handler/de.ts +117 -0
  216. package/src/patterns/event-handler/en.ts +117 -0
  217. package/src/patterns/event-handler/es.ts +136 -0
  218. package/src/patterns/event-handler/fr.ts +117 -0
  219. package/src/patterns/event-handler/hi.ts +64 -0
  220. package/src/patterns/event-handler/id.ts +117 -0
  221. package/src/patterns/event-handler/index.ts +119 -0
  222. package/src/patterns/event-handler/it.ts +54 -0
  223. package/src/patterns/event-handler/ja.ts +118 -0
  224. package/src/patterns/event-handler/ko.ts +133 -0
  225. package/src/patterns/event-handler/ms.ts +30 -0
  226. package/src/patterns/event-handler/pl.ts +62 -0
  227. package/src/patterns/event-handler/pt.ts +117 -0
  228. package/src/patterns/event-handler/qu.ts +66 -0
  229. package/src/patterns/event-handler/ru.ts +62 -0
  230. package/src/patterns/event-handler/shared.ts +270 -0
  231. package/src/patterns/event-handler/sw.ts +117 -0
  232. package/src/patterns/event-handler/th.ts +53 -0
  233. package/src/patterns/event-handler/tl.ts +30 -0
  234. package/src/patterns/event-handler/tr.ts +170 -0
  235. package/src/patterns/event-handler/uk.ts +62 -0
  236. package/src/patterns/event-handler/vi.ts +61 -0
  237. package/src/patterns/event-handler/zh.ts +150 -0
  238. package/src/patterns/get/ar.ts +49 -0
  239. package/src/patterns/get/bn.ts +47 -0
  240. package/src/patterns/get/de.ts +32 -0
  241. package/src/patterns/get/hi.ts +52 -0
  242. package/src/patterns/get/index.ts +83 -0
  243. package/src/patterns/get/it.ts +56 -0
  244. package/src/patterns/get/ja.ts +53 -0
  245. package/src/patterns/get/ko.ts +53 -0
  246. package/src/patterns/get/ms.ts +30 -0
  247. package/src/patterns/get/pl.ts +57 -0
  248. package/src/patterns/get/ru.ts +57 -0
  249. package/src/patterns/get/th.ts +29 -0
  250. package/src/patterns/get/tl.ts +30 -0
  251. package/src/patterns/get/uk.ts +57 -0
  252. package/src/patterns/get/vi.ts +48 -0
  253. package/src/patterns/grammar-transformed/index.ts +39 -0
  254. package/src/patterns/grammar-transformed/ja.ts +1713 -0
  255. package/src/patterns/grammar-transformed/ko.ts +1311 -0
  256. package/src/patterns/grammar-transformed/tr.ts +1067 -0
  257. package/src/patterns/hide/ar.ts +67 -0
  258. package/src/patterns/hide/bn.ts +47 -0
  259. package/src/patterns/hide/de.ts +36 -0
  260. package/src/patterns/hide/hi.ts +61 -0
  261. package/src/patterns/hide/index.ts +91 -0
  262. package/src/patterns/hide/it.ts +56 -0
  263. package/src/patterns/hide/ja.ts +69 -0
  264. package/src/patterns/hide/ko.ts +69 -0
  265. package/src/patterns/hide/ms.ts +30 -0
  266. package/src/patterns/hide/pl.ts +57 -0
  267. package/src/patterns/hide/ru.ts +57 -0
  268. package/src/patterns/hide/th.ts +29 -0
  269. package/src/patterns/hide/tl.ts +30 -0
  270. package/src/patterns/hide/tr.ts +65 -0
  271. package/src/patterns/hide/uk.ts +57 -0
  272. package/src/patterns/hide/vi.ts +56 -0
  273. package/src/patterns/hide/zh.ts +68 -0
  274. package/src/patterns/increment/bn.ts +70 -0
  275. package/src/patterns/increment/de.ts +36 -0
  276. package/src/patterns/increment/hi.ts +68 -0
  277. package/src/patterns/increment/index.ts +79 -0
  278. package/src/patterns/increment/it.ts +69 -0
  279. package/src/patterns/increment/ms.ts +30 -0
  280. package/src/patterns/increment/pl.ts +58 -0
  281. package/src/patterns/increment/ru.ts +58 -0
  282. package/src/patterns/increment/th.ts +49 -0
  283. package/src/patterns/increment/tl.ts +30 -0
  284. package/src/patterns/increment/tr.ts +52 -0
  285. package/src/patterns/increment/uk.ts +58 -0
  286. package/src/patterns/increment/vi.ts +61 -0
  287. package/src/patterns/increment/zh.ts +32 -0
  288. package/src/patterns/index.ts +84 -0
  289. package/src/patterns/languages/en/control-flow.ts +93 -0
  290. package/src/patterns/languages/en/fetch.ts +62 -0
  291. package/src/patterns/languages/en/index.ts +42 -0
  292. package/src/patterns/languages/en/repeat.ts +67 -0
  293. package/src/patterns/languages/en/set.ts +48 -0
  294. package/src/patterns/languages/en/swap.ts +38 -0
  295. package/src/patterns/languages/en/temporal.ts +57 -0
  296. package/src/patterns/put/ar.ts +74 -0
  297. package/src/patterns/put/bn.ts +53 -0
  298. package/src/patterns/put/en.ts +74 -0
  299. package/src/patterns/put/es.ts +74 -0
  300. package/src/patterns/put/hi.ts +69 -0
  301. package/src/patterns/put/id.ts +96 -0
  302. package/src/patterns/put/index.ts +99 -0
  303. package/src/patterns/put/it.ts +56 -0
  304. package/src/patterns/put/ja.ts +75 -0
  305. package/src/patterns/put/ko.ts +67 -0
  306. package/src/patterns/put/ms.ts +30 -0
  307. package/src/patterns/put/pl.ts +81 -0
  308. package/src/patterns/put/ru.ts +85 -0
  309. package/src/patterns/put/th.ts +32 -0
  310. package/src/patterns/put/tl.ts +30 -0
  311. package/src/patterns/put/tr.ts +67 -0
  312. package/src/patterns/put/uk.ts +85 -0
  313. package/src/patterns/put/vi.ts +72 -0
  314. package/src/patterns/put/zh.ts +62 -0
  315. package/src/patterns/registry.ts +163 -0
  316. package/src/patterns/remove/ar.ts +71 -0
  317. package/src/patterns/remove/bn.ts +68 -0
  318. package/src/patterns/remove/hi.ts +69 -0
  319. package/src/patterns/remove/index.ts +87 -0
  320. package/src/patterns/remove/it.ts +69 -0
  321. package/src/patterns/remove/ja.ts +74 -0
  322. package/src/patterns/remove/ko.ts +78 -0
  323. package/src/patterns/remove/ms.ts +30 -0
  324. package/src/patterns/remove/pl.ts +62 -0
  325. package/src/patterns/remove/ru.ts +62 -0
  326. package/src/patterns/remove/th.ts +49 -0
  327. package/src/patterns/remove/tl.ts +30 -0
  328. package/src/patterns/remove/tr.ts +78 -0
  329. package/src/patterns/remove/uk.ts +62 -0
  330. package/src/patterns/remove/vi.ts +61 -0
  331. package/src/patterns/remove/zh.ts +72 -0
  332. package/src/patterns/set/ar.ts +84 -0
  333. package/src/patterns/set/bn.ts +53 -0
  334. package/src/patterns/set/de.ts +84 -0
  335. package/src/patterns/set/es.ts +92 -0
  336. package/src/patterns/set/fr.ts +88 -0
  337. package/src/patterns/set/hi.ts +56 -0
  338. package/src/patterns/set/id.ts +84 -0
  339. package/src/patterns/set/index.ts +107 -0
  340. package/src/patterns/set/it.ts +56 -0
  341. package/src/patterns/set/ja.ts +86 -0
  342. package/src/patterns/set/ko.ts +85 -0
  343. package/src/patterns/set/ms.ts +30 -0
  344. package/src/patterns/set/pl.ts +57 -0
  345. package/src/patterns/set/pt.ts +84 -0
  346. package/src/patterns/set/ru.ts +57 -0
  347. package/src/patterns/set/th.ts +31 -0
  348. package/src/patterns/set/tl.ts +30 -0
  349. package/src/patterns/set/tr.ts +107 -0
  350. package/src/patterns/set/uk.ts +57 -0
  351. package/src/patterns/set/vi.ts +53 -0
  352. package/src/patterns/set/zh.ts +84 -0
  353. package/src/patterns/show/ar.ts +67 -0
  354. package/src/patterns/show/bn.ts +47 -0
  355. package/src/patterns/show/de.ts +32 -0
  356. package/src/patterns/show/fr.ts +32 -0
  357. package/src/patterns/show/hi.ts +61 -0
  358. package/src/patterns/show/index.ts +95 -0
  359. package/src/patterns/show/it.ts +56 -0
  360. package/src/patterns/show/ja.ts +69 -0
  361. package/src/patterns/show/ko.ts +73 -0
  362. package/src/patterns/show/ms.ts +30 -0
  363. package/src/patterns/show/pl.ts +57 -0
  364. package/src/patterns/show/ru.ts +57 -0
  365. package/src/patterns/show/th.ts +29 -0
  366. package/src/patterns/show/tl.ts +30 -0
  367. package/src/patterns/show/tr.ts +65 -0
  368. package/src/patterns/show/uk.ts +57 -0
  369. package/src/patterns/show/vi.ts +56 -0
  370. package/src/patterns/show/zh.ts +68 -0
  371. package/src/patterns/take/ar.ts +51 -0
  372. package/src/patterns/take/index.ts +31 -0
  373. package/src/patterns/toggle/ar.ts +61 -0
  374. package/src/patterns/toggle/bn.ts +70 -0
  375. package/src/patterns/toggle/en.ts +61 -0
  376. package/src/patterns/toggle/es.ts +61 -0
  377. package/src/patterns/toggle/hi.ts +80 -0
  378. package/src/patterns/toggle/index.ts +95 -0
  379. package/src/patterns/toggle/it.ts +69 -0
  380. package/src/patterns/toggle/ja.ts +156 -0
  381. package/src/patterns/toggle/ko.ts +113 -0
  382. package/src/patterns/toggle/ms.ts +30 -0
  383. package/src/patterns/toggle/pl.ts +62 -0
  384. package/src/patterns/toggle/ru.ts +62 -0
  385. package/src/patterns/toggle/th.ts +50 -0
  386. package/src/patterns/toggle/tl.ts +30 -0
  387. package/src/patterns/toggle/tr.ts +88 -0
  388. package/src/patterns/toggle/uk.ts +62 -0
  389. package/src/patterns/toggle/vi.ts +61 -0
  390. package/src/patterns/toggle/zh.ts +99 -0
  391. package/src/public-api.ts +286 -0
  392. package/src/registry.ts +441 -0
  393. package/src/tokenizers/arabic.ts +723 -0
  394. package/src/tokenizers/base.ts +1300 -0
  395. package/src/tokenizers/bengali.ts +289 -0
  396. package/src/tokenizers/chinese.ts +481 -0
  397. package/src/tokenizers/english.ts +416 -0
  398. package/src/tokenizers/french.ts +326 -0
  399. package/src/tokenizers/german.ts +324 -0
  400. package/src/tokenizers/hindi.ts +319 -0
  401. package/src/tokenizers/index.ts +127 -0
  402. package/src/tokenizers/indonesian.ts +306 -0
  403. package/src/tokenizers/italian.ts +458 -0
  404. package/src/tokenizers/japanese.ts +447 -0
  405. package/src/tokenizers/korean.ts +642 -0
  406. package/src/tokenizers/morphology/arabic-normalizer.ts +242 -0
  407. package/src/tokenizers/morphology/french-normalizer.ts +268 -0
  408. package/src/tokenizers/morphology/german-normalizer.ts +256 -0
  409. package/src/tokenizers/morphology/index.ts +46 -0
  410. package/src/tokenizers/morphology/italian-normalizer.ts +329 -0
  411. package/src/tokenizers/morphology/japanese-normalizer.ts +288 -0
  412. package/src/tokenizers/morphology/korean-normalizer.ts +428 -0
  413. package/src/tokenizers/morphology/polish-normalizer.ts +264 -0
  414. package/src/tokenizers/morphology/portuguese-normalizer.ts +310 -0
  415. package/src/tokenizers/morphology/spanish-normalizer.ts +327 -0
  416. package/src/tokenizers/morphology/turkish-normalizer.ts +412 -0
  417. package/src/tokenizers/morphology/types.ts +211 -0
  418. package/src/tokenizers/ms.ts +198 -0
  419. package/src/tokenizers/polish.ts +354 -0
  420. package/src/tokenizers/portuguese.ts +304 -0
  421. package/src/tokenizers/quechua.ts +339 -0
  422. package/src/tokenizers/russian.ts +375 -0
  423. package/src/tokenizers/spanish.ts +403 -0
  424. package/src/tokenizers/swahili.ts +303 -0
  425. package/src/tokenizers/thai.ts +236 -0
  426. package/src/tokenizers/tl.ts +198 -0
  427. package/src/tokenizers/turkish.ts +411 -0
  428. package/src/tokenizers/ukrainian.ts +369 -0
  429. package/src/tokenizers/vietnamese.ts +410 -0
  430. package/src/types/grammar-types.ts +617 -0
  431. package/src/types/unified-profile.ts +267 -0
  432. package/src/types.ts +709 -0
  433. package/src/utils/confidence-calculator.ts +147 -0
  434. package/src/validators/command-validator.ts +380 -0
  435. package/src/validators/index.ts +15 -0
@@ -0,0 +1,62 @@
1
+ /**
2
+ * Chinese Put Patterns
3
+ *
4
+ * Hand-crafted patterns for "put" command.
5
+ * Chinese: 放置 "你好" 到 #output
6
+ */
7
+
8
+ import type { LanguagePattern } from '../../types';
9
+
10
/**
 * Build the hand-crafted Chinese (zh) patterns for the "put" command.
 *
 * Two word orders are covered:
 *   - verb first:       放置 {patient} 到 {destination}
 *   - 把-construction:  把 {patient} 放到 {destination}
 *
 * Every call creates a new array holding new pattern objects.
 *
 * @returns The verb-first pattern followed by the 把-construction pattern.
 */
export function getPutPatternsZh(): LanguagePattern[] {
  // Verb-first form. The English keyword "put" is listed among the verb alternatives.
  const verbFirst: LanguagePattern = {
    id: 'put-zh-full',
    language: 'zh',
    command: 'put',
    priority: 100,
    template: {
      format: '放置 {patient} 到 {destination}',
      tokens: [
        { type: 'literal', value: '放置', alternatives: ['放', '放入', '置入', 'put'] },
        {
          type: 'role',
          role: 'patient',
          expectedTypes: ['literal', 'selector', 'reference', 'expression'],
        },
        { type: 'literal', value: '到', alternatives: ['在', '于', '入'] },
        { type: 'role', role: 'destination', expectedTypes: ['selector', 'reference'] },
      ],
    },
    extraction: {
      patient: { position: 1 },
      destination: { position: 3 },
    },
  };

  // 把-construction: the object marker 把 comes first and the verb follows the patient.
  const baConstruction: LanguagePattern = {
    id: 'put-zh-ba',
    language: 'zh',
    command: 'put',
    priority: 95,
    template: {
      format: '把 {patient} 放到 {destination}',
      tokens: [
        { type: 'literal', value: '把' },
        {
          type: 'role',
          role: 'patient',
          expectedTypes: ['literal', 'selector', 'reference', 'expression'],
        },
        { type: 'literal', value: '放到', alternatives: ['放在', '放入'] },
        { type: 'role', role: 'destination', expectedTypes: ['selector', 'reference'] },
      ],
    },
    extraction: {
      patient: { position: 1 },
      destination: { position: 3 },
    },
  };

  return [verbFirst, baConstruction];
}
@@ -0,0 +1,163 @@
1
+ /**
2
+ * Pattern Registry
3
+ *
4
+ * Pattern cache and lookup functions for the semantic parser.
5
+ */
6
+
7
+ import type { LanguagePattern, ActionType } from '../types';
8
+ import { buildPatternsForLanguage, buildAllPatterns } from './builders';
9
+
10
+ // =============================================================================
11
+ // Pattern Cache
12
+ // =============================================================================
13
+
14
/**
 * Per-language pattern cache.
 * Keys are language codes; each value is the pattern list built for that language.
 */
const patternCache: Map<string, LanguagePattern[]> = new Map();

/**
 * Combined pattern list for every language.
 * Starts as `null` and is only filled in when something first asks for it.
 */
let _allPatterns: LanguagePattern[] | null = null;
22
+
23
/**
 * Return the combined pattern list, building it on the first call.
 *
 * @returns The array produced by `buildAllPatterns()`, stored in `_allPatterns`
 *          so later calls reuse it.
 */
function ensureAllPatterns(): LanguagePattern[] {
  // Already built: hand back the stored array.
  if (_allPatterns !== null) {
    return _allPatterns;
  }

  const built = buildAllPatterns();
  _allPatterns = built;
  return built;
}
32
+
33
+ // =============================================================================
34
+ // All Patterns (Lazy Getter - for backwards compatibility)
35
+ // =============================================================================
36
+
37
/**
 * All registered patterns across all languages.
 *
 * The exported value is a Proxy wrapped around an empty placeholder array.
 * Each trap forwards to the array returned by ensureAllPatterns(), so the
 * patterns are built on first access instead of at module load.
 *
 * @deprecated Use getPatternsForLanguage() for tree-shaking.
 */
export const allPatterns: LanguagePattern[] = new Proxy([] as LanguagePattern[], {
  // Property reads: indices, `length`, array methods and Symbol.iterator.
  // for...of and spread are served by this trap because they look up
  // Symbol.iterator on the proxy.
  get(_target, prop) {
    const arr = ensureAllPatterns();
    const value = Reflect.get(arr, prop);
    // Bind methods to the real array so they operate on it directly.
    if (typeof value === 'function') {
      return value.bind(arr);
    }
    return value;
  },
  // `in` checks (e.g. `0 in allPatterns`). Without this trap the question is
  // answered by the empty placeholder, which reports every index as missing.
  has(_target, prop) {
    return Reflect.has(ensureAllPatterns(), prop);
  },
  // Key enumeration (Object.keys, Object.entries, for...in).
  ownKeys() {
    return Reflect.ownKeys(ensureAllPatterns());
  },
  // Needed alongside ownKeys so enumerated keys resolve to the real array's descriptors.
  getOwnPropertyDescriptor(_target, prop) {
    return Reflect.getOwnPropertyDescriptor(ensureAllPatterns(), prop);
  },
});
60
+
61
+ // =============================================================================
62
+ // Pattern Lookup
63
+ // =============================================================================
64
+
65
/**
 * Get all patterns across all languages, building them on first use.
 *
 * @deprecated Use getPatternsForLanguage() for tree-shaking.
 * @returns The combined pattern array held in the module-level cache.
 */
export function getAllPatterns(): LanguagePattern[] {
  // Delegate to the single lazy initializer instead of repeating its logic here.
  return ensureAllPatterns();
}
75
+
76
/**
 * Get every pattern registered for one language.
 *
 * The list is built with `buildPatternsForLanguage()` the first time a language
 * is requested and served from `patternCache` afterwards.
 *
 * @param language Language code to look up.
 * @returns The pattern list for that language (the cached array itself, not a copy).
 */
export function getPatternsForLanguage(language: string): LanguagePattern[] {
  // Cache miss: build once and remember the result under this language code.
  if (!patternCache.has(language)) {
    const built = buildPatternsForLanguage(language);
    patternCache.set(language, built);
    return built;
  }

  return patternCache.get(language)!;
}
91
+
92
/**
 * Get the patterns of one language that belong to one command.
 *
 * @param language Language code to look up.
 * @param command  Command whose patterns are wanted.
 * @returns A new array of matching patterns, highest `priority` first.
 */
export function getPatternsForLanguageAndCommand(
  language: string,
  command: ActionType
): LanguagePattern[] {
  const forCommand = getPatternsForLanguage(language).filter(
    candidate => candidate.command === command
  );
  // filter() returned a fresh array, so sorting in place leaves the cached list untouched.
  forCommand.sort((first, second) => second.priority - first.priority);
  return forCommand;
}
103
+
104
/**
 * List the distinct language codes that appear in the registered patterns.
 *
 * @returns Language codes in order of first appearance in `allPatterns`.
 */
export function getSupportedLanguages(): string[] {
  const seen = new Set<string>();
  for (const { language } of allPatterns) {
    seen.add(language);
  }
  return Array.from(seen);
}
111
+
112
/**
 * List the distinct commands that appear in the registered patterns.
 *
 * @returns Commands in order of first appearance in `allPatterns`.
 */
export function getSupportedCommands(): ActionType[] {
  const seen = new Set<LanguagePattern['command']>();
  allPatterns.forEach(pattern => {
    seen.add(pattern.command);
  });
  return Array.from(seen) as ActionType[];
}
119
+
120
/**
 * Look up a single pattern by its `id`.
 *
 * @param id Pattern identifier to search for.
 * @returns The first pattern in `allPatterns` with that id, or `undefined` if none matches.
 */
export function getPatternById(id: string): LanguagePattern | undefined {
  for (const candidate of allPatterns) {
    if (candidate.id === id) {
      return candidate;
    }
  }
  return undefined;
}
126
+
127
+ // =============================================================================
128
+ // Pattern Statistics (for debugging/tooling)
129
+ // =============================================================================
130
+
131
/**
 * Summary counts over the registered patterns.
 */
export interface PatternStats {
  /** Number of registered patterns. */
  totalPatterns: number;
  /** Pattern count keyed by language. */
  byLanguage: { [language: string]: number };
  /** Pattern count keyed by command. */
  byCommand: { [command: string]: number };
}
136
+
137
/**
 * Count the registered patterns overall, per language and per command.
 *
 * @returns Totals computed from `allPatterns` at the time of the call.
 */
export function getPatternStats(): PatternStats {
  const languageCounts: Record<string, number> = {};
  const commandCounts: Record<string, number> = {};

  // Add one to the tally stored under `key`, starting from zero on first sight.
  const tally = (counts: Record<string, number>, key: string): void => {
    counts[key] = (counts[key] || 0) + 1;
  };

  for (const { language, command } of allPatterns) {
    tally(languageCounts, language);
    tally(commandCounts, command);
  }

  const totalPatterns = allPatterns.length;
  return {
    totalPatterns,
    byLanguage: languageCounts,
    byCommand: commandCounts,
  };
}
155
+
156
/**
 * Reset all cached pattern data.
 * Intended for tests, or for when language profiles change.
 */
export function clearPatternCache(): void {
  // Forget the combined list; it is rebuilt the next time it is requested.
  _allPatterns = null;
  // Drop every per-language entry as well.
  patternCache.clear();
}
@@ -0,0 +1,71 @@
1
+ /**
2
+ * Arabic Remove Patterns
3
+ *
4
+ * Hand-crafted patterns for "remove" command.
5
+ * Arabic uses VSO order: احذف {patient} من {destination}
6
+ */
7
+
8
+ import type { LanguagePattern } from '../../types';
9
+
10
/**
 * Build the hand-crafted Arabic (ar) patterns for the "remove" command.
 *
 * Three shapes are covered:
 *   - احذف {patient} من {destination}
 *   - احذف {patient}                    (destination defaults to the `me` reference)
 *   - احذف {patient} عن {destination}
 *
 * Every call creates a new array holding new pattern objects.
 *
 * NOTE(review): the three patterns accept different sets of verb spellings
 * (only the من pattern accepts 'إزالة'; the عن pattern accepts only 'أحذف').
 * Confirm this is intentional.
 *
 * @returns The من pattern, the bare pattern and the عن pattern, in that order.
 */
export function getRemovePatternsAr(): LanguagePattern[] {
  // Verb + patient + من + destination.
  const withMin: LanguagePattern = {
    id: 'remove-ar-full',
    language: 'ar',
    command: 'remove',
    priority: 100,
    template: {
      format: 'احذف {patient} من {destination}',
      tokens: [
        { type: 'literal', value: 'احذف', alternatives: ['أحذف', 'أزل', 'ازل', 'إزالة'] },
        { type: 'role', role: 'patient' },
        { type: 'literal', value: 'من' },
        { type: 'role', role: 'destination' },
      ],
    },
    extraction: {
      patient: { position: 1 },
      destination: { marker: 'من' },
    },
  };

  // Verb + patient only; the destination falls back to the `me` reference.
  const bare: LanguagePattern = {
    id: 'remove-ar-simple',
    language: 'ar',
    command: 'remove',
    priority: 90,
    template: {
      format: 'احذف {patient}',
      tokens: [
        { type: 'literal', value: 'احذف', alternatives: ['أحذف', 'أزل', 'ازل'] },
        { type: 'role', role: 'patient' },
      ],
    },
    extraction: {
      patient: { position: 1 },
      destination: { default: { type: 'reference', value: 'me' } },
    },
  };

  // Verb + patient + عن + destination.
  const withAn: LanguagePattern = {
    id: 'remove-ar-with-عن',
    language: 'ar',
    command: 'remove',
    priority: 95,
    template: {
      format: 'احذف {patient} عن {destination}',
      tokens: [
        { type: 'literal', value: 'احذف', alternatives: ['أحذف'] },
        { type: 'role', role: 'patient' },
        { type: 'literal', value: 'عن' },
        { type: 'role', role: 'destination' },
      ],
    },
    extraction: {
      patient: { position: 1 },
      destination: { marker: 'عن' },
    },
  };

  return [withMin, bare, withAn];
}
@@ -0,0 +1,68 @@
1
+ /**
2
+ * Bengali Remove Patterns
3
+ *
4
+ * Patterns for parsing "remove" command in Bengali.
5
+ */
6
+
7
+ import type { LanguagePattern } from '../../types';
8
+
9
/**
 * Build the Bengali (bn) patterns for the "remove" command.
 *
 * Three shapes are covered:
 *   - {patient} কে সরান                  e.g. .active কে সরান
 *   - সরান {patient}                     e.g. সরান .active
 *   - {source} থেকে {patient} কে সরান    e.g. #button থেকে .active কে সরান
 *
 * Every call creates a new array holding new pattern objects.
 *
 * @returns The postposition pattern, the verb-first pattern and the
 *          with-source pattern, in that order.
 */
export function getRemovePatternsBn(): LanguagePattern[] {
  // Patient, object marker কে, then the verb.
  const withMarker: LanguagePattern = {
    id: 'remove-bn-full',
    language: 'bn',
    command: 'remove',
    priority: 100,
    template: {
      format: '{patient} কে সরান',
      tokens: [
        { type: 'role', role: 'patient' },
        { type: 'literal', value: 'কে' },
        { type: 'literal', value: 'সরান', alternatives: ['মুছুন'] },
      ],
    },
    extraction: {
      patient: { position: 0 },
    },
  };

  // Verb first, then the patient.
  const verbFirst: LanguagePattern = {
    id: 'remove-bn-simple',
    language: 'bn',
    command: 'remove',
    priority: 90,
    template: {
      format: 'সরান {patient}',
      tokens: [
        { type: 'literal', value: 'সরান', alternatives: ['মুছুন'] },
        { type: 'role', role: 'patient' },
      ],
    },
    extraction: {
      patient: { position: 1 },
    },
  };

  // Source marked with থেকে, followed by the marked patient and the verb.
  const withSource: LanguagePattern = {
    id: 'remove-bn-with-source',
    language: 'bn',
    command: 'remove',
    priority: 95,
    template: {
      format: '{source} থেকে {patient} কে সরান',
      tokens: [
        { type: 'role', role: 'source' },
        { type: 'literal', value: 'থেকে' },
        { type: 'role', role: 'patient' },
        { type: 'literal', value: 'কে' },
        { type: 'literal', value: 'সরান', alternatives: ['মুছুন'] },
      ],
    },
    extraction: {
      source: { position: 0 },
      patient: { position: 2 },
    },
  };

  return [withMarker, verbFirst, withSource];
}
@@ -0,0 +1,69 @@
1
+ /**
2
+ * Hindi Remove Patterns
3
+ *
4
+ * Patterns for parsing "remove" command in Hindi.
5
+ */
6
+
7
+ import type { LanguagePattern } from '../../types';
8
+
9
/**
 * Build the Hindi patterns for the "remove" command.
 *
 * Three patterns are returned, in this order:
 *   1. `remove-hi-full`   — `{patient} को {source} से हटाएं` (priority 100)
 *   2. `remove-hi-simple` — `{patient} हटाएं`               (priority 90)
 *   3. `remove-hi-bare`   — `हटाएं {patient}`               (priority 80)
 *
 * The two shorter patterns carry a default `source` of the `me` reference.
 * Every call builds fresh objects and arrays.
 *
 * @returns The Hindi remove patterns.
 */
export function getRemovePatternsHi(): LanguagePattern[] {
  // Verb literal and its accepted alternatives, shared by all three templates.
  const removeVerb = 'हटाएं';
  const removeVerbSynonyms = ['हटा', 'मिटाएं'];

  // Example: .class को #element से हटाएं
  const withSource: LanguagePattern = {
    id: 'remove-hi-full',
    language: 'hi',
    command: 'remove',
    priority: 100,
    template: {
      format: '{patient} को {source} से हटाएं',
      tokens: [
        { type: 'role', role: 'patient' },
        { type: 'literal', value: 'को' },
        { type: 'role', role: 'source' },
        { type: 'literal', value: 'से' },
        { type: 'literal', value: removeVerb, alternatives: [...removeVerbSynonyms] },
      ],
    },
    extraction: {
      patient: { position: 0 },
      source: { marker: 'से', position: 3 },
    },
  };

  // Example: .class हटाएं
  const patientFirst: LanguagePattern = {
    id: 'remove-hi-simple',
    language: 'hi',
    command: 'remove',
    priority: 90,
    template: {
      format: '{patient} हटाएं',
      tokens: [
        { type: 'role', role: 'patient' },
        { type: 'literal', value: removeVerb, alternatives: [...removeVerbSynonyms] },
      ],
    },
    extraction: {
      patient: { position: 0 },
      source: { default: { type: 'reference', value: 'me' } },
    },
  };

  // Example: हटाएं .class
  const verbFirst: LanguagePattern = {
    id: 'remove-hi-bare',
    language: 'hi',
    command: 'remove',
    priority: 80,
    template: {
      format: 'हटाएं {patient}',
      tokens: [
        { type: 'literal', value: removeVerb, alternatives: [...removeVerbSynonyms] },
        { type: 'role', role: 'patient' },
      ],
    },
    extraction: {
      patient: { position: 1 },
      source: { default: { type: 'reference', value: 'me' } },
    },
  };

  return [withSource, patientFirst, verbFirst];
}
@@ -0,0 +1,87 @@
1
+ /**
2
+ * Remove Command Patterns
3
+ *
4
+ * Hand-crafted patterns for "remove" command across languages.
5
+ *
6
+ * @generated This file is auto-generated. Do not edit manually.
7
+ */
8
+
9
+ import type { LanguagePattern } from '../../types';
10
+
11
+ import { getRemovePatternsAr } from './ar';
12
+ import { getRemovePatternsBn } from './bn';
13
+ import { getRemovePatternsHi } from './hi';
14
+ import { getRemovePatternsIt } from './it';
15
+ import { getRemovePatternsJa } from './ja';
16
+ import { getRemovePatternsKo } from './ko';
17
+ import { getRemovePatternsMs } from './ms';
18
+ import { getRemovePatternsPl } from './pl';
19
+ import { getRemovePatternsRu } from './ru';
20
+ import { getRemovePatternsTh } from './th';
21
+ import { getRemovePatternsTl } from './tl';
22
+ import { getRemovePatternsTr } from './tr';
23
+ import { getRemovePatternsUk } from './uk';
24
+ import { getRemovePatternsVi } from './vi';
25
+ import { getRemovePatternsZh } from './zh';
26
+
27
/**
 * Look up the hand-crafted "remove" patterns for a language code.
 *
 * @param language - Language code such as 'ja' or 'tr'; matched exactly.
 * @returns Whatever that language's getter returns, or an empty array when
 *   the code is not one of the codes listed below.
 */
export function getRemovePatternsForLanguage(language: string): LanguagePattern[] {
  // Built inside the function so the module gains no new top-level side effect.
  const gettersByLanguage = new Map<string, () => LanguagePattern[]>([
    ['ar', getRemovePatternsAr],
    ['bn', getRemovePatternsBn],
    ['hi', getRemovePatternsHi],
    ['it', getRemovePatternsIt],
    ['ja', getRemovePatternsJa],
    ['ko', getRemovePatternsKo],
    ['ms', getRemovePatternsMs],
    ['pl', getRemovePatternsPl],
    ['ru', getRemovePatternsRu],
    ['th', getRemovePatternsTh],
    ['tl', getRemovePatternsTl],
    ['tr', getRemovePatternsTr],
    ['uk', getRemovePatternsUk],
    ['vi', getRemovePatternsVi],
    ['zh', getRemovePatternsZh],
  ]);

  const getPatterns = gettersByLanguage.get(language);
  return getPatterns === undefined ? [] : getPatterns();
}
66
+
67
+ // Re-export language-specific getters for tree-shaking
68
+ export { getRemovePatternsAr } from './ar';
69
+ export { getRemovePatternsBn } from './bn';
70
+ export { getRemovePatternsHi } from './hi';
71
+ export { getRemovePatternsIt } from './it';
72
+ export { getRemovePatternsJa } from './ja';
73
+ export { getRemovePatternsKo } from './ko';
74
+ export { getRemovePatternsMs } from './ms';
75
+ export { getRemovePatternsPl } from './pl';
76
+ export { getRemovePatternsRu } from './ru';
77
+ export { getRemovePatternsTh } from './th';
78
+ export { getRemovePatternsTl } from './tl';
79
+ export { getRemovePatternsTr } from './tr';
80
+ export { getRemovePatternsUk } from './uk';
81
+ export { getRemovePatternsVi } from './vi';
82
+ export { getRemovePatternsZh } from './zh';
83
+
84
/**
 * Codes of the languages for which hand-crafted remove patterns exist.
 */
export const removePatternLanguages = [
  'ar',
  'bn',
  'hi',
  'it',
  'ja',
  'ko',
  'ms',
  'pl',
  'ru',
  'th',
  'tl',
  'tr',
  'uk',
  'vi',
  'zh',
];
@@ -0,0 +1,69 @@
1
+ /**
2
+ * Italian Remove Patterns
3
+ *
4
+ * Tree-shakeable: Only included when Italian is imported.
5
+ */
6
+
7
+ import type { LanguagePattern } from '../../types';
8
+
9
/**
 * Get Italian remove patterns.
 *
 * Two patterns are returned, in this order:
 *   1. `remove-it-full`   — verb, patient, then an optional `da`/`di` group
 *      naming the destination (priority 100)
 *   2. `remove-it-simple` — verb and patient only (priority 90)
 *
 * Both patterns default `destination` to the `me` reference.
 *
 * @returns The Italian remove patterns; fresh objects on every call.
 */
export function getRemovePatternsIt(): LanguagePattern[] {
  return [
    {
      id: 'remove-it-full',
      language: 'it',
      command: 'remove',
      priority: 100,
      template: {
        // The placeholder must name the role used by the tokens and the
        // extraction rules below, which is `destination` (it previously read
        // `{target}`, a role this pattern never defines).
        format: 'rimuovere {patient} da {destination}',
        tokens: [
          {
            type: 'literal',
            value: 'rimuovere',
            alternatives: ['rimuovi', 'eliminare', 'togliere', 'remove'],
          },
          { type: 'role', role: 'patient' },
          {
            // The whole "da <destination>" tail may be omitted.
            type: 'group',
            optional: true,
            tokens: [
              { type: 'literal', value: 'da', alternatives: ['di'] },
              { type: 'role', role: 'destination' },
            ],
          },
        ],
      },
      extraction: {
        patient: { position: 1 },
        destination: {
          marker: 'da',
          markerAlternatives: ['di'],
          default: { type: 'reference', value: 'me' },
        },
      },
    },
    {
      id: 'remove-it-simple',
      language: 'it',
      command: 'remove',
      priority: 90,
      template: {
        format: 'rimuovere {patient}',
        tokens: [
          {
            type: 'literal',
            value: 'rimuovere',
            alternatives: ['rimuovi', 'eliminare', 'togliere', 'remove'],
          },
          { type: 'role', role: 'patient' },
        ],
      },
      extraction: {
        patient: { position: 1 },
        destination: { default: { type: 'reference', value: 'me' } },
      },
    },
  ];
}
@@ -0,0 +1,74 @@
1
+ /**
2
+ * Japanese Remove Patterns
3
+ *
4
+ * Hand-crafted patterns for "remove" command.
5
+ * Japanese uses SOV order: {destination} から {patient} を 削除
6
+ */
7
+
8
+ import type { LanguagePattern } from '../../types';
9
+
10
/**
 * Build the Japanese patterns for the "remove" command.
 *
 * Three patterns are returned, in this order:
 *   1. `remove-ja-full`       — `{destination} から {patient} を 削除` (priority 100)
 *   2. `remove-ja-simple`     — `{patient} を 削除`                   (priority 90)
 *   3. `remove-ja-possessive` — `{destination} の {patient} を 削除`   (priority 95)
 *
 * The possessive pattern accepts a shorter list of verb alternatives than the
 * other two. Every call builds fresh objects and arrays.
 *
 * @returns The Japanese remove patterns.
 */
export function getRemovePatternsJa(): LanguagePattern[] {
  // Literal pieces that recur in the templates below.
  const removeVerb = '削除';
  const removeVerbSynonyms = ['削除する', '除去', '取り除く'];
  const patientMarker = 'を';

  const fromDestination: LanguagePattern = {
    id: 'remove-ja-full',
    language: 'ja',
    command: 'remove',
    priority: 100,
    template: {
      format: '{destination} から {patient} を 削除',
      tokens: [
        { type: 'role', role: 'destination' },
        { type: 'literal', value: 'から' },
        { type: 'role', role: 'patient' },
        { type: 'literal', value: patientMarker },
        { type: 'literal', value: removeVerb, alternatives: [...removeVerbSynonyms] },
      ],
    },
    extraction: {
      destination: { position: 0 },
      patient: { marker: patientMarker },
    },
  };

  const patientOnly: LanguagePattern = {
    id: 'remove-ja-simple',
    language: 'ja',
    command: 'remove',
    priority: 90,
    template: {
      format: '{patient} を 削除',
      tokens: [
        { type: 'role', role: 'patient' },
        { type: 'literal', value: patientMarker },
        { type: 'literal', value: removeVerb, alternatives: [...removeVerbSynonyms] },
      ],
    },
    extraction: {
      patient: { position: 0 },
      destination: { default: { type: 'reference', value: 'me' } },
    },
  };

  const possessive: LanguagePattern = {
    id: 'remove-ja-possessive',
    language: 'ja',
    command: 'remove',
    priority: 95,
    template: {
      format: '{destination} の {patient} を 削除',
      tokens: [
        { type: 'role', role: 'destination' },
        { type: 'literal', value: 'の' },
        { type: 'role', role: 'patient' },
        { type: 'literal', value: patientMarker },
        // Only the する form is listed as an alternative for this pattern.
        { type: 'literal', value: removeVerb, alternatives: ['削除する'] },
      ],
    },
    extraction: {
      destination: { position: 0 },
      patient: { marker: patientMarker },
    },
  };

  return [fromDestination, patientOnly, possessive];
}