@genai-fi/nanogpt 0.20.0 → 0.20.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (433) hide show
  1. package/dist/BaseTokeniser-DSg9zcYq.js +221 -0
  2. package/dist/DatasetBuilder-DgURD85T.js +712 -0
  3. package/dist/Generator.d.ts +82 -0
  4. package/dist/Generator.js +2 -0
  5. package/dist/RealDiv-DBu0FQqT.js +362 -0
  6. package/dist/Reshape-CABOPB9d.js +94 -0
  7. package/dist/Reshape-DqO3r8BC.js +17 -0
  8. package/dist/TeachableLLM.d.ts +70 -0
  9. package/dist/TeachableLLM.js +2 -0
  10. package/dist/Trainer.d.ts +43 -0
  11. package/dist/Trainer.js +2 -0
  12. package/dist/backend.d.ts +2 -0
  13. package/dist/backend.js +13 -0
  14. package/dist/backend_util-Cg-roD1p.js +399 -0
  15. package/dist/binary_op_util-CrYk9LXL.js +103 -0
  16. package/dist/checks/appendCache.d.ts +1 -0
  17. package/dist/checks/appendCache.js +55 -0
  18. package/dist/checks/attentionMask.d.ts +1 -0
  19. package/dist/checks/attentionMask.js +56 -0
  20. package/dist/checks/check.d.ts +9 -0
  21. package/dist/checks/check.js +32 -0
  22. package/dist/checks/gelu.d.ts +1 -0
  23. package/dist/checks/gelu.js +46 -0
  24. package/dist/checks/index.d.ts +26 -0
  25. package/dist/checks/index.js +28 -0
  26. package/dist/checks/matMulGelu.d.ts +1 -0
  27. package/dist/checks/matMulGelu.js +84 -0
  28. package/dist/checks/normRMS.d.ts +1 -0
  29. package/dist/checks/normRMS.js +28 -0
  30. package/dist/checks/normRMSGrad.d.ts +1 -0
  31. package/dist/checks/normRMSGrad.js +22 -0
  32. package/dist/checks/packUnpack.d.ts +1 -0
  33. package/dist/checks/packUnpack.js +46 -0
  34. package/dist/checks/qkv.d.ts +1 -0
  35. package/dist/checks/qkv.js +34 -0
  36. package/dist/checks/rope.d.ts +1 -0
  37. package/dist/checks/rope.js +30 -0
  38. package/dist/checks/weights.d.ts +14 -0
  39. package/dist/checks/weights.js +27 -0
  40. package/dist/chunk-BPntVaq0.js +23 -0
  41. package/dist/complex_util-CkazZsaH.js +60 -0
  42. package/dist/concat_util-CWDZCBlA.js +19 -0
  43. package/dist/data/docx.d.ts +2 -0
  44. package/dist/data/docx.js +3046 -0
  45. package/dist/data/pdf.d.ts +2 -0
  46. package/dist/data/pdf.js +17 -0
  47. package/dist/data/textLoader.d.ts +7 -0
  48. package/dist/data/textLoader.js +613 -0
  49. package/dist/dist-BewPQWjc.js +7572 -0
  50. package/dist/dist-DVmq73nz.js +8775 -0
  51. package/dist/dist-DXwIvKxl.js +896 -0
  52. package/dist/dist-VEU5mfO0.js +7545 -0
  53. package/dist/gelu-Bf1HW1RY.js +27 -0
  54. package/dist/gpgpu_math-DvLcCH6u.js +1612 -0
  55. package/dist/inference/types.d.ts +16 -0
  56. package/dist/inference/types.js +0 -0
  57. package/dist/kernel_funcs_utils-HiXOOx3f.js +229 -0
  58. package/dist/layers/BaseLayer.d.ts +44 -0
  59. package/dist/layers/BaseLayer.js +76 -0
  60. package/dist/layers/CausalSelfAttention.d.ts +39 -0
  61. package/dist/layers/CausalSelfAttention.js +99 -0
  62. package/dist/layers/LoRA.d.ts +14 -0
  63. package/dist/layers/LoRA.js +48 -0
  64. package/dist/layers/MLP.d.ts +17 -0
  65. package/dist/layers/MLP.js +34 -0
  66. package/dist/layers/PositionEmbedding.d.ts +8 -0
  67. package/dist/layers/PositionEmbedding.js +27 -0
  68. package/dist/layers/RMSNorm.d.ts +12 -0
  69. package/dist/layers/RMSNorm.js +20 -0
  70. package/dist/layers/RoPECache.d.ts +18 -0
  71. package/dist/layers/RoPECache.js +337 -0
  72. package/dist/layers/TiedEmbedding.d.ts +13 -0
  73. package/dist/layers/TiedEmbedding.js +32 -0
  74. package/dist/layers/TransformerBlock.d.ts +27 -0
  75. package/dist/layers/TransformerBlock.js +51 -0
  76. package/dist/layers/WeightStore.d.ts +20 -0
  77. package/dist/layers/WeightStore.js +69 -0
  78. package/dist/loader/load.d.ts +6 -0
  79. package/dist/loader/load.js +2 -0
  80. package/dist/loader/loadHF.d.ts +8 -0
  81. package/dist/loader/loadHF.js +2 -0
  82. package/dist/loader/loadTransformers.d.ts +4 -0
  83. package/dist/loader/loadTransformers.js +2 -0
  84. package/dist/loader/loadZipMeta.d.ts +3 -0
  85. package/dist/loader/loadZipMeta.js +16 -0
  86. package/dist/loader/newZipLoad.d.ts +3 -0
  87. package/dist/loader/newZipLoad.js +2 -0
  88. package/dist/loader/oldZipLoad.d.ts +9 -0
  89. package/dist/loader/oldZipLoad.js +2 -0
  90. package/dist/loader/save.d.ts +16 -0
  91. package/dist/loader/save.js +2 -0
  92. package/dist/loader/types.d.ts +68 -0
  93. package/dist/loader/types.js +0 -0
  94. package/dist/main-CPjeMv0G.js +13500 -0
  95. package/dist/main.d.ts +50 -0
  96. package/dist/main.js +16 -0
  97. package/dist/matMul16-BNfZSnNM.js +81 -0
  98. package/dist/matMulGelu-CPTntosE.js +162 -0
  99. package/dist/models/NanoGPTV1.d.ts +16 -0
  100. package/dist/models/NanoGPTV1.js +2 -0
  101. package/dist/models/NanoGPTV2.d.ts +16 -0
  102. package/dist/models/NanoGPTV2.js +2 -0
  103. package/dist/models/config.d.ts +27 -0
  104. package/dist/models/config.js +37 -0
  105. package/dist/models/factory.d.ts +3 -0
  106. package/dist/models/factory.js +2 -0
  107. package/dist/models/model.d.ts +44 -0
  108. package/dist/models/model.js +2 -0
  109. package/dist/ops/adamAdjust.d.ts +2 -0
  110. package/dist/ops/adamAdjust.js +18 -0
  111. package/dist/ops/adamMoments.d.ts +2 -0
  112. package/dist/ops/adamMoments.js +16 -0
  113. package/dist/ops/add16.d.ts +2 -0
  114. package/dist/ops/add16.js +12 -0
  115. package/dist/ops/appendCache.d.ts +2 -0
  116. package/dist/ops/appendCache.js +25 -0
  117. package/dist/ops/attentionMask.d.ts +2 -0
  118. package/dist/ops/attentionMask.js +16 -0
  119. package/dist/ops/concat16.d.ts +2 -0
  120. package/dist/ops/concat16.js +8 -0
  121. package/dist/ops/cpu/adamAdjust.d.ts +1 -0
  122. package/dist/ops/cpu/adamAdjust.js +16 -0
  123. package/dist/ops/cpu/adamMoments.d.ts +1 -0
  124. package/dist/ops/cpu/adamMoments.js +16 -0
  125. package/dist/ops/cpu/appendCache.d.ts +1 -0
  126. package/dist/ops/cpu/appendCache.js +65 -0
  127. package/dist/ops/cpu/attentionMask.d.ts +1 -0
  128. package/dist/ops/cpu/attentionMask.js +16 -0
  129. package/dist/ops/cpu/fusedSoftmax.d.ts +9 -0
  130. package/dist/ops/cpu/fusedSoftmax.js +22 -0
  131. package/dist/ops/cpu/gatherSub.d.ts +1 -0
  132. package/dist/ops/cpu/gatherSub.js +12 -0
  133. package/dist/ops/cpu/gelu.d.ts +1 -0
  134. package/dist/ops/cpu/gelu.js +36 -0
  135. package/dist/ops/cpu/matMul16.d.ts +1 -0
  136. package/dist/ops/cpu/matMul16.js +14 -0
  137. package/dist/ops/cpu/matMulGelu.d.ts +1 -0
  138. package/dist/ops/cpu/matMulGelu.js +41 -0
  139. package/dist/ops/cpu/matMulMul.d.ts +1 -0
  140. package/dist/ops/cpu/matMulMul.js +20 -0
  141. package/dist/ops/cpu/mulDropout.d.ts +1 -0
  142. package/dist/ops/cpu/mulDropout.js +20 -0
  143. package/dist/ops/cpu/normRMS.d.ts +1 -0
  144. package/dist/ops/cpu/normRMS.js +35 -0
  145. package/dist/ops/cpu/qkv.d.ts +5 -0
  146. package/dist/ops/cpu/qkv.js +73 -0
  147. package/dist/ops/cpu/rope.d.ts +6 -0
  148. package/dist/ops/cpu/rope.js +81 -0
  149. package/dist/ops/cpu/scatterSub.d.ts +1 -0
  150. package/dist/ops/cpu/scatterSub.js +12 -0
  151. package/dist/ops/dot16.d.ts +2 -0
  152. package/dist/ops/dot16.js +29 -0
  153. package/dist/ops/dropout.d.ts +2 -0
  154. package/dist/ops/dropout.js +11 -0
  155. package/dist/ops/dropout16.d.ts +2 -0
  156. package/dist/ops/dropout16.js +22 -0
  157. package/dist/ops/gatherSub.d.ts +2 -0
  158. package/dist/ops/gatherSub.js +13 -0
  159. package/dist/ops/gelu.d.ts +3 -0
  160. package/dist/ops/gelu.js +2 -0
  161. package/dist/ops/globalNorm.d.ts +2 -0
  162. package/dist/ops/globalNorm.js +19 -0
  163. package/dist/ops/grads/add16.d.ts +1 -0
  164. package/dist/ops/grads/add16.js +27 -0
  165. package/dist/ops/grads/attentionMask.d.ts +1 -0
  166. package/dist/ops/grads/attentionMask.js +26 -0
  167. package/dist/ops/grads/dropout16.d.ts +1 -0
  168. package/dist/ops/grads/dropout16.js +1 -0
  169. package/dist/ops/grads/gelu.d.ts +2 -0
  170. package/dist/ops/grads/gelu.js +2 -0
  171. package/dist/ops/grads/matMul16.d.ts +2 -0
  172. package/dist/ops/grads/matMul16.js +2 -0
  173. package/dist/ops/grads/matMulGelu.d.ts +1 -0
  174. package/dist/ops/grads/matMulGelu.js +22 -0
  175. package/dist/ops/grads/mul16.d.ts +1 -0
  176. package/dist/ops/grads/mul16.js +1 -0
  177. package/dist/ops/grads/normRMS.d.ts +3 -0
  178. package/dist/ops/grads/normRMS.js +37 -0
  179. package/dist/ops/grads/pack16.d.ts +2 -0
  180. package/dist/ops/grads/pack16.js +2 -0
  181. package/dist/ops/grads/qkv.d.ts +3 -0
  182. package/dist/ops/grads/qkv.js +46 -0
  183. package/dist/ops/grads/rope.d.ts +2 -0
  184. package/dist/ops/grads/rope.js +2 -0
  185. package/dist/ops/grads/softmax16.d.ts +2 -0
  186. package/dist/ops/grads/softmax16.js +23 -0
  187. package/dist/ops/grads/unpack16.d.ts +2 -0
  188. package/dist/ops/grads/unpack16.js +2 -0
  189. package/dist/ops/grads/utils.d.ts +4 -0
  190. package/dist/ops/grads/utils.js +12 -0
  191. package/dist/ops/log.d.ts +0 -0
  192. package/dist/ops/log.js +1 -0
  193. package/dist/ops/matMul16.d.ts +15 -0
  194. package/dist/ops/matMul16.js +2 -0
  195. package/dist/ops/matMulGelu.d.ts +3 -0
  196. package/dist/ops/matMulGelu.js +20 -0
  197. package/dist/ops/matMulMul.d.ts +2 -0
  198. package/dist/ops/matMulMul.js +16 -0
  199. package/dist/ops/mul16.d.ts +2 -0
  200. package/dist/ops/mul16.js +43 -0
  201. package/dist/ops/mulDrop.d.ts +2 -0
  202. package/dist/ops/mulDrop.js +15 -0
  203. package/dist/ops/normRMS.d.ts +2 -0
  204. package/dist/ops/normRMS.js +22 -0
  205. package/dist/ops/pack16.d.ts +2 -0
  206. package/dist/ops/pack16.js +2 -0
  207. package/dist/ops/qkv.d.ts +2 -0
  208. package/dist/ops/qkv.js +16 -0
  209. package/dist/ops/reshape16.d.ts +2 -0
  210. package/dist/ops/reshape16.js +33 -0
  211. package/dist/ops/rope.d.ts +3 -0
  212. package/dist/ops/rope.js +2 -0
  213. package/dist/ops/scatterSub.d.ts +2 -0
  214. package/dist/ops/scatterSub.js +13 -0
  215. package/dist/ops/slice16.d.ts +2 -0
  216. package/dist/ops/slice16.js +11 -0
  217. package/dist/ops/softmax16.d.ts +2 -0
  218. package/dist/ops/softmax16.js +9 -0
  219. package/dist/ops/sub16.d.ts +2 -0
  220. package/dist/ops/sub16.js +11 -0
  221. package/dist/ops/sum16.d.ts +2 -0
  222. package/dist/ops/sum16.js +13 -0
  223. package/dist/ops/transpose16.d.ts +3 -0
  224. package/dist/ops/transpose16.js +32 -0
  225. package/dist/ops/unpack16.d.ts +2 -0
  226. package/dist/ops/unpack16.js +2 -0
  227. package/dist/ops/webgl/adamAdjust.d.ts +1 -0
  228. package/dist/ops/webgl/adamAdjust.js +82 -0
  229. package/dist/ops/webgl/adamMoments.d.ts +1 -0
  230. package/dist/ops/webgl/adamMoments.js +44 -0
  231. package/dist/ops/webgl/appendCache.d.ts +1 -0
  232. package/dist/ops/webgl/appendCache.js +53 -0
  233. package/dist/ops/webgl/attentionMask.d.ts +1 -0
  234. package/dist/ops/webgl/attentionMask.js +64 -0
  235. package/dist/ops/webgl/dropout16.d.ts +1 -0
  236. package/dist/ops/webgl/dropout16.js +12 -0
  237. package/dist/ops/webgl/fusedSoftmax.d.ts +11 -0
  238. package/dist/ops/webgl/fusedSoftmax.js +70 -0
  239. package/dist/ops/webgl/gatherSub.d.ts +1 -0
  240. package/dist/ops/webgl/gatherSub.js +28 -0
  241. package/dist/ops/webgl/gelu.d.ts +2 -0
  242. package/dist/ops/webgl/gelu.js +48 -0
  243. package/dist/ops/webgl/log.d.ts +17 -0
  244. package/dist/ops/webgl/log.js +14 -0
  245. package/dist/ops/webgl/matMul16.d.ts +1 -0
  246. package/dist/ops/webgl/matMul16.js +37 -0
  247. package/dist/ops/webgl/matMulGelu.d.ts +21 -0
  248. package/dist/ops/webgl/matMulGelu.js +2 -0
  249. package/dist/ops/webgl/matMulMul.d.ts +14 -0
  250. package/dist/ops/webgl/matMulMul.js +24 -0
  251. package/dist/ops/webgl/mulDropout.d.ts +1 -0
  252. package/dist/ops/webgl/mulDropout.js +32 -0
  253. package/dist/ops/webgl/normRMS.d.ts +1 -0
  254. package/dist/ops/webgl/normRMS.js +114 -0
  255. package/dist/ops/webgl/qkv.d.ts +1 -0
  256. package/dist/ops/webgl/qkv.js +54 -0
  257. package/dist/ops/webgl/rope.d.ts +1 -0
  258. package/dist/ops/webgl/rope.js +72 -0
  259. package/dist/ops/webgl/scatterSub.d.ts +1 -0
  260. package/dist/ops/webgl/scatterSub.js +28 -0
  261. package/dist/ops/webgpu/adamAdjust.d.ts +1 -0
  262. package/dist/ops/webgpu/adamAdjust.js +77 -0
  263. package/dist/ops/webgpu/adamMoments.d.ts +1 -0
  264. package/dist/ops/webgpu/adamMoments.js +76 -0
  265. package/dist/ops/webgpu/add16.d.ts +1 -0
  266. package/dist/ops/webgpu/add16.js +14 -0
  267. package/dist/ops/webgpu/appendCache.d.ts +1 -0
  268. package/dist/ops/webgpu/appendCache.js +130 -0
  269. package/dist/ops/webgpu/attentionMask.d.ts +1 -0
  270. package/dist/ops/webgpu/attentionMask.js +42 -0
  271. package/dist/ops/webgpu/attentionMask32_program.d.ts +19 -0
  272. package/dist/ops/webgpu/attentionMask32_program.js +62 -0
  273. package/dist/ops/webgpu/clipScale.d.ts +1 -0
  274. package/dist/ops/webgpu/clipScale.js +45 -0
  275. package/dist/ops/webgpu/concat16.d.ts +19 -0
  276. package/dist/ops/webgpu/concat16.js +111 -0
  277. package/dist/ops/webgpu/dropout16.d.ts +1 -0
  278. package/dist/ops/webgpu/dropout16.js +59 -0
  279. package/dist/ops/webgpu/gatherSub.d.ts +1 -0
  280. package/dist/ops/webgpu/gatherSub.js +52 -0
  281. package/dist/ops/webgpu/gelu.d.ts +14 -0
  282. package/dist/ops/webgpu/gelu.js +147 -0
  283. package/dist/ops/webgpu/index.d.ts +0 -0
  284. package/dist/ops/webgpu/index.js +26 -0
  285. package/dist/ops/webgpu/matMul16.d.ts +1 -0
  286. package/dist/ops/webgpu/matMul16.js +70 -0
  287. package/dist/ops/webgpu/matMul16_program.d.ts +42 -0
  288. package/dist/ops/webgpu/matMul16_program.js +303 -0
  289. package/dist/ops/webgpu/mul16.d.ts +1 -0
  290. package/dist/ops/webgpu/mul16.js +14 -0
  291. package/dist/ops/webgpu/norm2.d.ts +1 -0
  292. package/dist/ops/webgpu/norm2.js +46 -0
  293. package/dist/ops/webgpu/normRMS.d.ts +1 -0
  294. package/dist/ops/webgpu/normRMS.js +26 -0
  295. package/dist/ops/webgpu/normRMS16_program.d.ts +10 -0
  296. package/dist/ops/webgpu/normRMS16_program.js +28 -0
  297. package/dist/ops/webgpu/normRMS32_program.d.ts +10 -0
  298. package/dist/ops/webgpu/normRMS32_program.js +28 -0
  299. package/dist/ops/webgpu/normRMSGrad.d.ts +1 -0
  300. package/dist/ops/webgpu/normRMSGrad.js +225 -0
  301. package/dist/ops/webgpu/pack16.d.ts +1 -0
  302. package/dist/ops/webgpu/pack16.js +21 -0
  303. package/dist/ops/webgpu/pack16_program.d.ts +19 -0
  304. package/dist/ops/webgpu/pack16_program.js +93 -0
  305. package/dist/ops/webgpu/qkv.d.ts +1 -0
  306. package/dist/ops/webgpu/qkv.js +64 -0
  307. package/dist/ops/webgpu/rope.d.ts +1 -0
  308. package/dist/ops/webgpu/rope.js +163 -0
  309. package/dist/ops/webgpu/scatterSub.d.ts +1 -0
  310. package/dist/ops/webgpu/scatterSub.js +53 -0
  311. package/dist/ops/webgpu/slice16.d.ts +7 -0
  312. package/dist/ops/webgpu/slice16.js +74 -0
  313. package/dist/ops/webgpu/softmax16.d.ts +17 -0
  314. package/dist/ops/webgpu/softmax16.js +18 -0
  315. package/dist/ops/webgpu/softmax16_program.d.ts +13 -0
  316. package/dist/ops/webgpu/softmax16_program.js +89 -0
  317. package/dist/ops/webgpu/softmax16_subgroup_program.d.ts +17 -0
  318. package/dist/ops/webgpu/softmax16_subgroup_program.js +70 -0
  319. package/dist/ops/webgpu/softmax16grad.d.ts +1 -0
  320. package/dist/ops/webgpu/softmax16grad.js +31 -0
  321. package/dist/ops/webgpu/sub16.d.ts +1 -0
  322. package/dist/ops/webgpu/sub16.js +14 -0
  323. package/dist/ops/webgpu/sum16.d.ts +1 -0
  324. package/dist/ops/webgpu/sum16.js +29 -0
  325. package/dist/ops/webgpu/transpose16.d.ts +1 -0
  326. package/dist/ops/webgpu/transpose16.js +37 -0
  327. package/dist/ops/webgpu/transpose16_program.d.ts +16 -0
  328. package/dist/ops/webgpu/transpose16_program.js +51 -0
  329. package/dist/ops/webgpu/transpose16_shared_program.d.ts +15 -0
  330. package/dist/ops/webgpu/transpose16_shared_program.js +79 -0
  331. package/dist/ops/webgpu/unpack16.d.ts +1 -0
  332. package/dist/ops/webgpu/unpack16.js +60 -0
  333. package/dist/ops/webgpu/utils/binary_op.d.ts +35 -0
  334. package/dist/ops/webgpu/utils/binary_op.js +141 -0
  335. package/dist/ops/webgpu/utils/deviceInfo.d.ts +7 -0
  336. package/dist/ops/webgpu/utils/deviceInfo.js +11 -0
  337. package/dist/ops/webgpu/utils/reductions.d.ts +43 -0
  338. package/dist/ops/webgpu/utils/reductions.js +263 -0
  339. package/dist/pack16-Ck-spx_F.js +39 -0
  340. package/dist/patches/webgpu_backend.d.ts +18 -0
  341. package/dist/patches/webgpu_backend.js +43 -0
  342. package/dist/patches/webgpu_base.d.ts +21 -0
  343. package/dist/patches/webgpu_base.js +22 -0
  344. package/dist/patches/webgpu_program.d.ts +36 -0
  345. package/dist/patches/webgpu_program.js +293 -0
  346. package/dist/pdf-UoDqCYzz.js +16726 -0
  347. package/dist/picomatch-3tUnMMbd.js +1063 -0
  348. package/dist/rope-CbeGlsV8.js +25 -0
  349. package/dist/selu_util-zkAx5doH.js +24 -0
  350. package/dist/shared-D1coEFea.js +1314 -0
  351. package/dist/shared-DOgWaqvL.js +5 -0
  352. package/dist/slice_util-Dgb3ANWI.js +208 -0
  353. package/dist/tfjs_backend-BjuQ5FqB.js +614 -0
  354. package/dist/tokeniser/BaseTokeniser.d.ts +33 -0
  355. package/dist/tokeniser/BaseTokeniser.js +2 -0
  356. package/dist/tokeniser/CharTokeniser.d.ts +24 -0
  357. package/dist/tokeniser/CharTokeniser.js +92 -0
  358. package/dist/tokeniser/bpe.d.ts +28 -0
  359. package/dist/tokeniser/bpe.js +170 -0
  360. package/dist/tokeniser/messages.d.ts +61 -0
  361. package/dist/tokeniser/messages.js +0 -0
  362. package/dist/tokeniser/type.d.ts +34 -0
  363. package/dist/tokeniser/type.js +0 -0
  364. package/dist/training/AdamW.d.ts +36 -0
  365. package/dist/training/AdamW.js +128 -0
  366. package/dist/training/BasicTrainer.d.ts +63 -0
  367. package/dist/training/BasicTrainer.js +265 -0
  368. package/dist/training/DatasetBuilder.d.ts +26 -0
  369. package/dist/training/DatasetBuilder.js +2 -0
  370. package/dist/training/Evaluator.d.ts +19 -0
  371. package/dist/training/Evaluator.js +48 -0
  372. package/dist/training/LRScheduler.d.ts +12 -0
  373. package/dist/training/LRScheduler.js +38 -0
  374. package/dist/training/PreTrainer.d.ts +11 -0
  375. package/dist/training/PreTrainer.js +22 -0
  376. package/dist/training/SFTTrainer.d.ts +12 -0
  377. package/dist/training/SFTTrainer.js +24 -0
  378. package/dist/training/loss.d.ts +3 -0
  379. package/dist/training/loss.js +19 -0
  380. package/dist/training/orthoGrad.d.ts +2 -0
  381. package/dist/training/orthoGrad.js +10 -0
  382. package/dist/training/sparseCrossEntropy.d.ts +7 -0
  383. package/dist/training/sparseCrossEntropy.js +47 -0
  384. package/dist/training/tasks/ConversationTask.d.ts +18 -0
  385. package/dist/training/tasks/ConversationTask.js +38 -0
  386. package/dist/training/tasks/PretrainingTask.d.ts +17 -0
  387. package/dist/training/tasks/PretrainingTask.js +42 -0
  388. package/dist/training/tasks/StartSentenceTask.d.ts +18 -0
  389. package/dist/training/tasks/StartSentenceTask.js +45 -0
  390. package/dist/training/tasks/Task.d.ts +22 -0
  391. package/dist/training/tasks/Task.js +55 -0
  392. package/dist/training/tasks/splitter.d.ts +5 -0
  393. package/dist/training/tasks/splitter.js +18 -0
  394. package/dist/training/types.d.ts +78 -0
  395. package/dist/training/types.js +0 -0
  396. package/dist/training/validation.d.ts +17 -0
  397. package/dist/training/validation.js +2 -0
  398. package/dist/utilities/arrayClose.d.ts +1 -0
  399. package/dist/utilities/arrayClose.js +16 -0
  400. package/dist/utilities/datasetID.d.ts +2 -0
  401. package/dist/utilities/datasetID.js +18 -0
  402. package/dist/utilities/dummy.d.ts +9 -0
  403. package/dist/utilities/dummy.js +36 -0
  404. package/dist/utilities/multinomialCPU.d.ts +2 -0
  405. package/dist/utilities/multinomialCPU.js +9 -0
  406. package/dist/utilities/naming.d.ts +4 -0
  407. package/dist/utilities/naming.js +0 -0
  408. package/dist/utilities/packed.d.ts +4 -0
  409. package/dist/utilities/packed.js +13 -0
  410. package/dist/utilities/parameters.d.ts +11 -0
  411. package/dist/utilities/parameters.js +38 -0
  412. package/dist/utilities/performance.d.ts +2 -0
  413. package/dist/utilities/performance.js +16 -0
  414. package/dist/utilities/profile.d.ts +17 -0
  415. package/dist/utilities/profile.js +33 -0
  416. package/dist/utilities/safetensors.d.ts +3 -0
  417. package/dist/utilities/safetensors.js +53 -0
  418. package/dist/utilities/sentences.d.ts +5 -0
  419. package/dist/utilities/sentences.js +32 -0
  420. package/dist/utilities/tokenParse.d.ts +1 -0
  421. package/dist/utilities/tokenParse.js +17 -0
  422. package/dist/utilities/topP.d.ts +1 -0
  423. package/dist/utilities/topP.js +12 -0
  424. package/dist/utilities/waitForModel.d.ts +2 -0
  425. package/dist/utilities/waitForModel.js +12 -0
  426. package/dist/utilities/weights.d.ts +12 -0
  427. package/dist/utilities/weights.js +40 -0
  428. package/dist/utilities/yielder.d.ts +1 -0
  429. package/dist/utilities/yielder.js +7 -0
  430. package/dist/webgpu-Dt7BMzWz.js +525 -0
  431. package/dist/webgpu_program-WOyIVMlZ.js +392 -0
  432. package/dist/webgpu_util-B_F3SShA.js +106 -0
  433. package/package.json +1 -1
@@ -0,0 +1,5 @@
1
+ import { t as e } from "./shared-D1coEFea.js";
2
+ //#region node_modules/@tensorflow/tfjs-backend-webgl/dist/kernel_utils/shared.js
3
// Unpack the kernel implementations from the imported `e` object into the
// short local bindings that the export statement of this chunk re-exports.
var {
  addImpl: t,
  bincountImpl: n,
  bincountReduceImpl: r,
  bitwiseAndImpl: i,
  castImpl: a,
  ceilImpl: o,
  concatImpl: s,
  equalImpl: c,
  expImpl: l,
  expm1Impl: u,
  floorImpl: d,
  gatherNdImpl: f,
  gatherV2Impl: p,
  greaterImpl: m,
  greaterEqualImpl: h,
  lessImpl: g,
  lessEqualImpl: _,
  linSpaceImpl: v,
  logImpl: y,
  maxImpl: b,
  maximumImpl: x,
  minimumImpl: S,
  multiplyImpl: C,
  negImpl: w,
  notEqualImpl: T,
  prodImpl: E,
  raggedGatherImpl: D,
  raggedRangeImpl: O,
  raggedTensorToTensorImpl: k,
  rangeImpl: A,
  rsqrtImpl: j,
  scatterImpl: M,
  sigmoidImpl: N,
  simpleAbsImpl: P,
  sliceImpl: F,
  sparseFillEmptyRowsImpl: I,
  sparseReshapeImpl: L,
  sparseSegmentReductionImpl: R,
  sqrtImpl: z,
  staticRegexReplaceImpl: B,
  stridedSliceImpl: V,
  stringNGramsImpl: H,
  stringSplitImpl: U,
  stringToHashBucketFastImpl: W,
  subImpl: G,
  tileImpl: K,
  topKImpl: q,
  transposeImpl: J,
  uniqueImpl: Y,
} = e;
4
+ //#endregion
5
+ export { A, B, C, D, E, F, G, H, I, J, K, L, M, N, O, P, R, S, T, U, V, W, Y, g as _, a, b, c, d, f, _ as g, m as h, i, j, k, l, h as m, n, o, p, q, r, s, t, u, v, w, x, y, z };
@@ -0,0 +1,208 @@
1
+ import { r as e } from "./chunk-BPntVaq0.js";
2
+ import { Ls as t, Ps as n } from "./dist-BewPQWjc.js";
3
+ //#region node_modules/@tensorflow/tfjs-core/dist/ops/slice_util.js
4
// Object built by the imported helper `e` from a map of public helper names
// to arrow functions returning the matching local function. How `e` consumes
// those arrow functions is defined in chunk-BPntVaq0.js, not here.
var r = /* @__PURE__ */ e({
  assertParamsValid: () => o,
  computeFlatOffset: () => y,
  computeOutShape: () => c,
  getNormalizedAxes: () => f,
  isSliceContinous: () => v,
  maskToAxes: () => s,
  parseSliceParams: () => b,
  sliceInfo: () => x,
  startForAxis: () => g,
  startIndicesWithElidedDims: () => p,
  stopForAxis: () => _,
  stopIndicesWithElidedDims: () => m,
  stridesForAxis: () => h,
  stridesWithElidedDims: () => l,
});
// Marker pushed into finalShapeGatherIndices for an axis selected by the
// new-axis mask; sliceInfo emits a size of 1 for it.
var i = -2;
// Marker pushed into finalShapeGatherIndices for an axis selected by the
// shrink-axis mask; sliceInfo emits nothing for it in finalShape.
var a = -1;
20
/**
 * Asserts that a begin/size pair is a valid slice of the input
 * (registered as `assertParamsValid`).
 *
 * All checks go through the imported assertion helper `n`, which receives the
 * condition and a lazy message factory.
 *
 * @param {{shape: number[]}} e - Object whose `shape` is sliced.
 * @param {number[]} t - Begin index per axis.
 * @param {number[]} r - Size per axis.
 */
function o(e, t, r) {
  const rank = e.shape.length;
  n(
    rank === t.length,
    () => `Error in slice${rank}D: Length of begin ${t} must match the rank of the array (${rank}).`
  );
  n(
    rank === r.length,
    () => `Error in slice${rank}D: Length of size ${r} must match the rank of the array (${rank}).`
  );
  for (let axis = 0; axis < rank; ++axis) {
    // begin + size must not run past the end of this axis.
    n(
      t[axis] + r[axis] <= e.shape[axis],
      () => `Error in slice${rank}D: begin[${axis}] + size[${axis}] (${t[axis] + r[axis]}) would overflow input.shape[${axis}] (${e.shape[axis]})`
    );
  }
}
25
/**
 * Lists the positions of the set bits in a bitmask
 * (registered as `maskToAxes`).
 *
 * The mask is halved with `Math.floor` so the loop ends once all set bits
 * are consumed. Plain `/= 2` leaves a fractional remainder that stays
 * positive for roughly a thousand further iterations before underflowing
 * to zero; those iterations never add an axis, so the result is unchanged.
 *
 * @param {number} e - Non-negative bitmask.
 * @returns {number[]} Zero-based bit positions that are set, ascending.
 */
function s(e) {
  const axes = [];
  let remaining = e;
  let axis = 0;
  while (remaining > 0) {
    if (remaining & 1) {
      axes.push(axis);
    }
    remaining = Math.floor(remaining / 2);
    axis++;
  }
  return axes;
}
30
/**
 * Computes the per-axis output length of a strided range
 * (registered as `computeOutShape`).
 *
 * @param {number[]} e - Begin index per axis.
 * @param {number[]} t - End index per axis.
 * @param {number[]} n - Stride per axis.
 * @returns {number[]} `ceil((end - begin) / stride)` for every axis of `e`.
 */
function c(e, t, n) {
  const sizes = [];
  let axis = 0;
  while (axis < e.length) {
    const span = t[axis] - e[axis];
    sizes[axis] = Math.ceil(span / n[axis]);
    axis += 1;
  }
  return sizes;
}
35
/**
 * Expands a strides list around an elided (ellipsis) region
 * (registered as `stridesWithElidedDims`).
 *
 * @param {number[]} e - Original strides; not mutated.
 * @param {number} t - Index at which the elided axes are inserted.
 * @param {number} n - Number of elided axes.
 * @param {number[]} r - Array whose length is the minimum result length.
 * @returns {number[]} Copy of `e`, padded with 1s, with stride 1 at the
 *   elided positions.
 */
function l(e, t, n, r) {
  const strides = [...e];
  // Pad with unit strides up to the length of `r`.
  while (strides.length < r.length) {
    strides.push(1);
  }
  // The first elided axis overwrites the slot at `t`.
  if (n > 0) {
    strides[t] = 1;
  }
  // Each further elided axis inserts a 1 at `t` and drops the last entry,
  // keeping the length constant.
  for (let extra = 1; extra < n; extra++) {
    strides.splice(t, 0, 1);
    strides.pop();
  }
  return strides;
}
41
/**
 * Maps an axis index from the expanded index space back to the original one.
 *
 * @param {number} e - Index at which the elided axes begin.
 * @param {number} t - Number of elided axes.
 * @param {number} n - Axis index in the expanded space.
 * @returns {number} `n` unchanged when it is at or before `e`, otherwise `n`
 *   shifted back by `t - 1`.
 */
function u(e, t, n) {
  if (n <= e) {
    return n;
  }
  return n - (t - 1);
}
44
/**
 * Builds the list of consecutive axis indices covered by an elided region.
 *
 * @param {number} e - How many axes are elided.
 * @param {number} t - Index of the first elided axis.
 * @returns {number[]} `[t, t + 1, ..., t + e - 1]`; empty when `e` is not
 *   positive.
 */
function d(e, t) {
  const axes = [];
  let offset = 0;
  while (offset < e) {
    axes.push(t + offset);
    offset += 1;
  }
  return axes;
}
49
/**
 * Produces per-axis begin, end and strides arrays
 * (registered as `getNormalizedAxes`).
 *
 * When `t` is non-empty and `n` is positive, the three arrays come from the
 * elided-dims helpers, using `t[0]` as the insertion index and `n + 1` as
 * the elided-axis count. Otherwise each axis is resolved on its own through
 * the per-axis helpers.
 *
 * @param {number[]} e - Input shape.
 * @param {number[]} t - Ellipsis axes; only the first entry is read.
 * @param {number} n - Count used to derive the number of elided axes.
 * @param {number[]} r - Begin values.
 * @param {number[]} i - End values.
 * @param {number[]} a - Stride values.
 * @param {number} o - Begin mask.
 * @param {number} s - End mask.
 * @param {number} c - Mask passed to the per-axis helpers as their last
 *   argument.
 * @returns {{begin: number[], end: number[], strides: number[]}}
 */
function f(e, t, n, r, i, a, o, s, c) {
  const rank = e.length;
  let begin = Array(rank);
  let end = Array(rank);
  let strides = Array(rank);

  if (t.length && n > 0) {
    const insertAt = t[0];
    const elidedCount = n + 1;
    begin = p(o, insertAt, elidedCount, r, e);
    end = m(s, insertAt, elidedCount, i, e);
    strides = l(a, insertAt, elidedCount, e);
  } else {
    for (let axis = 0; axis < rank; axis++) {
      begin[axis] = g(o, r, a, e, axis, c);
      end[axis] = _(s, i, a, e, axis, c);
      strides[axis] = h(a, axis, c);
    }
  }

  return { begin, end, strides };
}
61
/**
 * Computes begin indices when some axes are elided
 * (registered as `startIndicesWithElidedDims`).
 *
 * @param {number} e - Begin mask; a set bit forces that axis to start at 0.
 * @param {number} t - Index of the first elided axis.
 * @param {number} n - Number of elided axes.
 * @param {number[]} r - Begin values, indexed in the original axis space.
 * @param {number[]} i - Input shape; only its length shapes the result.
 * @returns {number[]} Begin index per axis of `i`.
 */
function p(e, t, n, r, i) {
  const starts = [...i];
  const elidedAxes = d(n, t);
  for (let axis = 0; axis < starts.length; axis++) {
    if (elidedAxes.includes(axis)) {
      // Elided axes are taken from their start.
      starts[axis] = 0;
      continue;
    }
    const sourceAxis = u(t, n, axis);
    const masked = e & (1 << sourceAxis);
    starts[axis] = masked ? 0 : r[sourceAxis];
  }
  return starts;
}
70
/**
 * Computes end indices when some axes are elided
 * (registered as `stopIndicesWithElidedDims`).
 *
 * @param {number} e - End mask; a set bit makes that axis run to the maximum
 *   safe integer before the final pass.
 * @param {number} n - Index of the first elided axis.
 * @param {number} r - Number of elided axes.
 * @param {number[]} i - End values, indexed in the original axis space.
 * @param {number[]} a - Input shape.
 * @returns {number[]} End index per axis after the final pass through the
 *   imported helper `t` (presumably a clamp to `[0, dim]` - confirm against
 *   its definition).
 */
function m(e, n, r, i, a) {
  const stops = [...a];
  const elidedAxes = d(r, n);

  for (let axis = 0; axis < stops.length; axis++) {
    if (elidedAxes.includes(axis)) {
      stops[axis] = Number.MAX_SAFE_INTEGER;
      continue;
    }
    const sourceAxis = u(n, r, axis);
    const masked = e & (1 << sourceAxis);
    stops[axis] = masked ? Number.MAX_SAFE_INTEGER : i[sourceAxis];
  }

  for (let axis = 0; axis < stops.length; axis++) {
    const dimSize = a[axis];
    // Negative stops count from the end of the axis.
    if (stops[axis] < 0) {
      stops[axis] += dimSize;
    }
    stops[axis] = t(0, stops[axis], dimSize);
  }
  return stops;
}
83
/**
 * Resolves the stride for one axis (registered as `stridesForAxis`).
 *
 * @param {Array<number|null|undefined>} e - Stride values.
 * @param {number} t - Axis index.
 * @param {number} n - Bitmask; a set bit at `t` forces a stride of 1.
 * @returns {number} 1 when the axis is masked or has no stride, otherwise
 *   `e[t]`.
 */
function h(e, t, n) {
  const stride = e[t];
  const masked = (n & (1 << t)) !== 0;
  if (masked || stride == null) {
    return 1;
  }
  return stride;
}
87
/**
 * Resolves the begin index for one axis (registered as `startForAxis`).
 *
 * If the axis bit is set in either mask, or no begin value is present, the
 * start defaults to the most negative safe integer for a positive stride and
 * the most positive one otherwise. A negative start is offset by the axis
 * size, and the result goes through the imported helper `t` with bounds
 * `0` and `dim - 1` (presumably a clamp - confirm against its definition).
 *
 * @param {number} e - Begin mask.
 * @param {Array<number|null|undefined>} n - Begin values.
 * @param {number[]} r - Stride values; a falsy stride is treated as 1.
 * @param {number[]} i - Input shape.
 * @param {number} a - Axis index.
 * @param {number} o - Second mask with the same effect as `e`.
 * @returns {number} Begin index for axis `a`.
 */
function g(e, n, r, i, a, o) {
  const axisBit = 1 << a;
  const stride = r[a] || 1;
  let start = n[a];

  if (e & axisBit || o & axisBit || start == null) {
    start = stride > 0 ? Number.MIN_SAFE_INTEGER : Number.MAX_SAFE_INTEGER;
  }

  const dimSize = i[a];
  if (start < 0) {
    start += dimSize;
  }
  return t(0, start, dimSize - 1);
}
93
/**
 * Resolves the end index for one axis (registered as `stopForAxis`).
 *
 * If the axis bit is set in either mask, or no end value is present, the
 * stop defaults to the most positive safe integer for a positive stride and
 * the most negative one otherwise. A negative stop is offset by the axis
 * size. The result goes through the imported helper `t` with bounds
 * `[0, dim]` for a positive stride and `[-1, dim - 1]` otherwise
 * (presumably a clamp - confirm against its definition).
 *
 * @param {number} e - End mask.
 * @param {Array<number|null|undefined>} n - End values.
 * @param {number[]} r - Stride values; a falsy stride is treated as 1.
 * @param {number[]} i - Input shape.
 * @param {number} a - Axis index.
 * @param {number} o - Second mask with the same effect as `e`.
 * @returns {number} End index for axis `a`.
 */
function _(e, n, r, i, a, o) {
  const axisBit = 1 << a;
  const stride = r[a] || 1;
  let stop = n[a];

  if (e & axisBit || o & axisBit || stop == null) {
    stop = stride > 0 ? Number.MAX_SAFE_INTEGER : Number.MIN_SAFE_INTEGER;
  }

  const dimSize = i[a];
  if (stop < 0) {
    stop += dimSize;
  }
  if (stride > 0) {
    return t(0, stop, dimSize);
  }
  return t(-1, stop, dimSize - 1);
}
99
/**
 * Reports whether a slice satisfies the contiguity condition checked here
 * (registered as `isSliceContinous`).
 *
 * Finds the first axis whose size exceeds 1. Every axis after it must have a
 * non-positive begin and a size equal to the full input dimension.
 *
 * @param {number[]} e - Input shape.
 * @param {number[]} t - Begin index per axis.
 * @param {number[]} n - Size per axis.
 * @returns {boolean} `true` when all later axes are taken whole.
 */
function v(e, t, n) {
  const firstWide = n.findIndex((size) => size > 1);
  const pivot = firstWide === -1 ? n.length : firstWide;
  for (let axis = pivot + 1; axis < n.length; axis++) {
    const takenWhole = !(t[axis] > 0) && n[axis] === e[axis];
    if (!takenWhole) {
      return false;
    }
  }
  return true;
}
108
/**
 * Converts per-axis begin indices into a single flat offset
 * (registered as `computeFlatOffset`).
 *
 * @param {number[]} e - Begin index per axis.
 * @param {number[]} t - Stride for every axis except the last.
 * @returns {number} The last begin index plus `begin[k] * stride[k]` for all
 *   earlier axes; 1 when `e` is empty.
 */
function y(e, t) {
  if (!(e.length > 0)) {
    return 1;
  }
  const lastAxis = e.length - 1;
  let offset = e[lastAxis];
  for (let axis = 0; axis < lastAxis; axis++) {
    offset += e[axis] * t[axis];
  }
  return offset;
}
113
/**
 * Normalizes the begin and size arguments of a slice to full-rank arrays
 * (registered as `parseSliceParams`).
 *
 * A numeric begin becomes `[begin, 0, 0, ...]`, a short begin array is
 * padded with 0, and a full-length one is copied. A missing size becomes all
 * -1, a numeric size becomes `[size, -1, -1, ...]`, and a short size array
 * is padded with -1. Every negative size is then replaced by
 * `shape[axis] - begin[axis]`.
 *
 * Validation goes through the imported assertion helper `n`: a begin entry
 * may not be exactly -1, and a negative size must be exactly -1.
 *
 * @param {{shape: number[]}} e - Object whose `shape` is sliced.
 * @param {number|number[]} t - Begin index or indices.
 * @param {number|number[]|null|undefined} r - Size or sizes.
 * @returns {[number[], number[]]} `[begin, size]`.
 */
function b(e, t, r) {
  const rank = e.shape.length;

  let begin;
  if (typeof t === "number") {
    begin = [t, ...Array(rank - 1).fill(0)];
  } else if (t.length < rank) {
    begin = t.concat(Array(rank - t.length).fill(0));
  } else {
    begin = t.slice();
  }
  begin.forEach((value) => {
    n(value !== -1, () => "slice() does not support negative begin indexing.");
  });

  let size;
  if (r == null) {
    size = Array(rank).fill(-1);
  } else if (typeof r === "number") {
    size = [r, ...Array(rank - 1).fill(-1)];
  } else if (r.length < rank) {
    size = r.concat(Array(rank - r.length).fill(-1));
  } else {
    size = r;
  }

  const resolvedSize = size.map((value, axis) => {
    if (value >= 0) {
      return value;
    }
    n(
      value === -1,
      () => `Negative size values should be exactly -1 but got ${value} for the slice() size at index ${axis}.`
    );
    // -1 means "to the end of this axis".
    return e.shape[axis] - begin[axis];
  });

  return [begin, resolvedSize];
}
121
// sliceInfo (registered under that name in the namespace object `r`).
// Builds a sparse slice spec from the arguments, expands it to one entry per
// input dimension via S(), then resolves begin/end per dimension and derives
// the output shape.
//
// Parameters:
//   e - input shape, indexed per dimension; an entry of -1 is handled as a
//       dimension of unknown size
//   t - begin values (copied with .slice())
//   n - end values (copied with .slice())
//   r - strides; when null/undefined an all-ones array of t.length is used
//   a - beginMask, o - endMask, s - ellipsisMask, c - newAxisMask,
//   l - shrinkAxisMask
//
// Returns { finalShapeSparse, finalShape, isIdentity, sliceDim0,
//           isSimpleSlice, begin, end, strides }.
//
// Throws Error when more than one ellipsis bit is set, when a stride is 0,
// when a shrink axis has a non-positive stride, or when a shrink-axis index
// falls outside its dimension.
+ function x(e, t, n, r, a, o, s, c, l) {
122
+ let u;
123
// `s & s - 1` parses as `s & (s - 1)`: non-zero when more than one bit of a
// non-negative integer mask is set.
+ if (r == null ? (u = Array(t.length), u.fill(1)) : u = r, s != null && s & s - 1) throw Error("Multiple ellipses in slice is not allowed.");
124
// f is the sparse spec: one entry per supplied begin/end/stride.
+ let d = !1, f = {
125
+ dims: u.length,
126
+ numAddAxisAfterEllipsis: 0,
127
+ begin: t.slice(),
128
+ end: n.slice(),
129
+ strides: u.slice(),
130
+ beginMask: a,
131
+ endMask: o,
132
+ ellipsisMask: s,
133
+ newAxisMask: c,
134
+ shrinkAxisMask: l
135
+ };
136
// Count new-axis bits that come after the ellipsis bit; d records whether an
// ellipsis bit was seen.
+ for (let e = 0; e < f.dims; e++) d && 1 << e & c && f.numAddAxisAfterEllipsis++, 1 << e & s && (d = !0);
137
// No ellipsis given: append one as an extra trailing sparse dimension.
+ d || (f.ellipsisMask |= 1 << f.dims, f.dims++);
138
// p is the dense spec: one entry per input dimension, filled in by S().
+ let p = {
139
+ dims: e.length,
140
+ beginMask: 0,
141
+ endMask: 0,
142
+ beginValid: !1,
143
+ endValid: !1
144
+ };
145
+ S(f, p);
146
// m -> isIdentity, h -> sliceDim0, g -> isSimpleSlice, _ -> size per dense
// dimension, v -> final shape.
+ let m = !0, h = !0, g = !0, _ = [], v = [];
147
+ for (let t = 0; t < e.length; ++t) {
148
+ if (p.strides[t] === 0) throw Error(`strides[${t}] must be non-zero`);
149
+ let n = !!(p.shrinkAxisMask & 1 << t), r = e[t];
150
+ if (r === -1) {
151
+ _.push(n ? 1 : -1);
152
+ continue;
153
+ }
154
// NOTE: this `i` (mask pair) and `a` (valid range) shadow the module-level
// constants `i` and `a` for the rest of this loop body.
+ let i = [p.beginMask & 1 << t, p.endMask & 1 << t], a = [p.strides[t] > 0 ? 0 : -1, p.strides[t] > 0 ? r : r - 1];
155
+ if (n && p.strides[t] <= 0) throw Error("only stride 1 allowed on non-range indexing.");
156
+ g &&= p.strides[t] === 1;
157
+ let o = !!(p.beginMask & 1 << t && p.endMask & 1 << t);
158
+ if (p.beginValid && p.endValid) {
159
+ if (n) {
160
// Shrink axis: select exactly one index, counting negatives from the end.
+ let e = p.begin[t] < 0 ? r + p.begin[t] : p.begin[t];
161
+ if (p.begin[t] = e, p.end[t] = p.begin[t] + 1, e < 0 || e >= r) throw Error(`slice index ${p.begin[t]} of dimension ${t} out of bounds.`);
162
+ } else p.begin[t] = C(p.begin[t], 0, p.strides[t], r, i, a), p.end[t] = C(p.end[t], 1, p.strides[t], r, i, a);
163
+ let e = p.strides[t] === 1 && p.begin[t] === 0 && p.end[t] === r;
164
+ m &&= e, h &&= t === 0 && p.strides[t] === 1 || e;
165
+ } else m = m && p.strides[t] === 1 && o, h &&= t === 0 && p.strides[t] === 1 || o;
166
// s is the signed interval length; c records whether it is known.
+ let s, c = !1;
167
+ if (p.beginValid && p.endValid ? (s = p.end[t] - p.begin[t], c = !0) : n ? (s = 1, c = !0) : o && r >= 0 && (s = p.strides[t] < 0 ? -r : r, c = !0), c) {
168
+ let e;
169
// Size is 0 for an empty interval or one whose sign disagrees with the
// stride; otherwise the interval divided by the stride, rounded up.
+ e = s === 0 || s < 0 != p.strides[t] < 0 ? 0 : Math.trunc(s / p.strides[t]) + (s % p.strides[t] === 0 ? 0 : 1), _.push(e);
170
+ } else _.push(-1);
171
+ }
172
// Here `i` is the module-level constant again: entries equal to it add a
// dimension of size 1, non-negative entries index into _.
+ for (let e = 0; e < p.finalShapeGatherIndices.length; ++e) {
173
+ let t = p.finalShapeGatherIndices[e];
174
+ t >= 0 ? v.push(_[t]) : t === i && v.push(1);
175
+ }
176
+ return {
177
+ finalShapeSparse: v.filter((e, t) => p.finalShapeGatherIndices[t] !== i),
178
+ finalShape: v,
179
+ isIdentity: m,
180
+ sliceDim0: h,
181
+ isSimpleSlice: g,
182
+ begin: p.begin,
183
+ end: p.end,
184
+ strides: p.strides
185
+ };
186
+ }
187
/**
 * Expands a sparse slice spec into a dense one with an entry per input
 * dimension. Writes its result into `t`; returns nothing.
 *
 * Each sparse dimension is handled by which mask bit it carries:
 *  - ellipsis: fills dense dimensions with begin 0, end 0, stride 1 and both
 *    begin/end mask bits set, up to the computed stop index;
 *  - new axis: records the module-level marker `i` in
 *    `finalShapeGatherIndices` and consumes no dense dimension;
 *  - otherwise: copies begin/end/stride and mask bits to the next dense
 *    dimension, recording the marker `a` for shrink axes.
 *
 * @param {object} e - Sparse spec (`dims`, `begin`, `end`, `strides`, the
 *   five masks and `numAddAxisAfterEllipsis`).
 * @param {object} t - Dense spec; `t.dims` must already be set.
 * @throws {Error} When a plain sparse dimension has no dense dimension left.
 */
function S(e, t) {
  t.beginMask = 0;
  t.endMask = 0;
  t.shrinkAxisMask = 0;
  t.beginValid = e.begin != null;
  t.endValid = e.end != null;
  t.begin = Array(t.dims);
  t.end = Array(t.dims);
  t.strides = Array(t.dims);
  t.finalShapeGatherIndices = [];
  t.finalShapeGatherIndicesSparse = [];
  t.inputShapeGatherIndicesSparse = Array(t.dims);

  let dense = 0;
  for (let sparse = 0; sparse < e.dims; sparse++) {
    const sparseBit = 1 << sparse;

    if (sparseBit & e.ellipsisMask) {
      // Dense index at which the ellipsis stops.
      const stopDense = Math.min(
        t.dims - (e.dims - sparse) + 1 + e.numAddAxisAfterEllipsis,
        t.dims
      );
      for (; dense < stopDense; dense++) {
        t.begin[dense] = 0;
        t.end[dense] = 0;
        t.strides[dense] = 1;
        t.beginMask |= 1 << dense;
        t.endMask |= 1 << dense;
        t.finalShapeGatherIndices.push(dense);
        t.finalShapeGatherIndicesSparse.push(-1);
        t.inputShapeGatherIndicesSparse[dense] = sparse;
      }
      continue;
    }

    if (sparseBit & e.newAxisMask) {
      t.finalShapeGatherIndices.push(i);
      t.finalShapeGatherIndicesSparse.push(-1);
      continue;
    }

    if (dense === t.begin.length) {
      throw Error(`Index out of range using input dim ${dense}; input has only ${t.dims} dims, ${t.begin.length}.`);
    }

    const denseBit = 1 << dense;
    if (e.begin != null) {
      t.begin[dense] = e.begin[sparse];
    }
    if (e.end != null) {
      t.end[dense] = e.end[sparse];
    }
    t.strides[dense] = e.strides[sparse];
    if (e.beginMask & sparseBit) {
      t.beginMask |= denseBit;
    }
    if (e.endMask & sparseBit) {
      t.endMask |= denseBit;
    }
    if (e.shrinkAxisMask & sparseBit) {
      t.finalShapeGatherIndices.push(a);
      t.finalShapeGatherIndicesSparse.push(-1);
      t.shrinkAxisMask |= denseBit;
    } else {
      t.finalShapeGatherIndices.push(dense);
      t.finalShapeGatherIndicesSparse.push(sparse);
    }
    t.inputShapeGatherIndicesSparse[dense] = sparse;
    dense++;
  }
}
200
/**
 * Resolves one begin or end index into the valid range of a dimension.
 *
 * @param {number} e - Raw index; negative values count from the end.
 * @param {number} t - 0 when resolving a begin index, 1 for an end index.
 * @param {number} n - Stride; its sign selects the range bound used when
 *   the index is masked.
 * @param {number} r - Dimension size.
 * @param {number[]} i - Two-element mask pair; a truthy `i[t]` means the raw
 *   index is ignored.
 * @param {number[]} a - Two-element valid range `[low, high]`.
 * @returns {number} A range bound when masked, otherwise the index limited
 *   to `[a[0], a[1]]`.
 */
function C(e, t, n, r, i, a) {
  if (i[t]) {
    // Masked: positive strides use the bound for this side, other strides
    // use the opposite one.
    const slot = n > 0 ? t : (t + 1) & 1;
    return a[slot];
  }
  const index = e < 0 ? r + e : e;
  if (index < a[0]) {
    return a[0];
  }
  if (index > a[1]) {
    return a[1];
  }
  return index;
}
207
+ //#endregion
208
+ export { b as a, v as i, y as n, x as o, c as r, r as s, o as t };