@genai-fi/nanogpt 0.11.0 → 0.12.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (236) hide show
  1. package/dist/Generator.js +29 -29
  2. package/dist/{RealDiv-Ds-jvL09.js → RealDiv-C8neBwFi.js} +17 -17
  3. package/dist/{Reshape-Cd6e-Otn.js → Reshape-Bd4V_4X7.js} +1 -1
  4. package/dist/{Reshape-Ct266DEk.js → Reshape-Ck29jQSY.js} +7 -7
  5. package/dist/TeachableLLM.d.ts +2 -1
  6. package/dist/TeachableLLM.js +9 -9
  7. package/dist/Trainer.d.ts +4 -2
  8. package/dist/Trainer.js +12 -9
  9. package/dist/{axis_util-DofAuy0p.js → axis_util-DGqbT-FX.js} +1 -1
  10. package/dist/backend.js +2 -2
  11. package/dist/{backend_util-C7NWHpv7.js → backend_util-DC3rBo_H.js} +18 -18
  12. package/dist/{backend_webgpu-B0Vls736.js → backend_webgpu-mbhNnlx9.js} +10 -10
  13. package/dist/{broadcast_to-DDaNMbX7.js → broadcast_to-D1Dmg2Oz.js} +2 -2
  14. package/dist/checks/appendCache.js +2 -2
  15. package/dist/checks/attentionMask.js +3 -3
  16. package/dist/checks/gelu.js +2 -2
  17. package/dist/checks/matMulGelu.js +2 -2
  18. package/dist/checks/normRMS.js +4 -4
  19. package/dist/checks/normRMSGrad.js +3 -3
  20. package/dist/checks/packUnpack.js +2 -2
  21. package/dist/checks/qkv.js +2 -2
  22. package/dist/checks/rope.js +2 -2
  23. package/dist/clip_by_value-fg2aKzUy.js +12 -0
  24. package/dist/{complex-DClmWqJt.js → complex-Cyg-eQeZ.js} +1 -1
  25. package/dist/concat-CSm2rMwe.js +17 -0
  26. package/dist/{concat_util-CHsJFZJJ.js → concat_util-D0je5Ppu.js} +1 -1
  27. package/dist/{dataset-DcjWqUVQ.js → dataset-CVIJu7Xa.js} +3 -3
  28. package/dist/{dropout-OxuaJz6z.js → dropout-DLhSMNTZ.js} +14 -14
  29. package/dist/expand_dims-ChkuOp6I.js +11 -0
  30. package/dist/{exports_initializers-eS9QJ6ut.js → exports_initializers-1KWPiStI.js} +1 -1
  31. package/dist/{floor-DIb-lN_u.js → floor-BRMPgeIs.js} +1 -1
  32. package/dist/gather-BSULDalH.js +9 -0
  33. package/dist/{gelu-DqTbCx5x.js → gelu-BK1k-n1i.js} +1 -1
  34. package/dist/{gpgpu_math-CJcbnKPC.js → gpgpu_math-BJSTk_mW.js} +25 -25
  35. package/dist/{index-Dj5TkmPY.js → index-BBVLAXZD.js} +14 -14
  36. package/dist/{index-D0RBWjq8.js → index-Duu1Lvvv.js} +45 -45
  37. package/dist/{kernel_funcs_utils-CSaumNDs.js → kernel_funcs_utils-BtYrPoJu.js} +8 -8
  38. package/dist/layers/BaseLayer.js +2 -2
  39. package/dist/layers/CausalSelfAttention.js +6 -6
  40. package/dist/layers/MLP.js +4 -4
  41. package/dist/layers/PositionEmbedding.js +5 -5
  42. package/dist/layers/RMSNorm.js +3 -3
  43. package/dist/layers/RoPECache.js +4 -4
  44. package/dist/layers/TiedEmbedding.js +6 -6
  45. package/dist/layers/TransformerBlock.js +1 -1
  46. package/dist/loader/loadTransformers.js +1 -1
  47. package/dist/loader/oldZipLoad.js +17 -17
  48. package/dist/{log_sum_exp-VLZgbFAH.js → log_sum_exp-CVqLsVLl.js} +4 -4
  49. package/dist/main.d.ts +9 -0
  50. package/dist/main.js +69 -58
  51. package/dist/{matMul16-cDxwemKj.js → matMul16-xswmhSuF.js} +7 -7
  52. package/dist/{matMulGelu-B2s_80-H.js → matMulGelu-BpvgnYG8.js} +26 -26
  53. package/dist/mat_mul-Bn2BDpT4.js +11 -0
  54. package/dist/{mod-PrOKlFxH.js → mod-B4AUd1Np.js} +1 -1
  55. package/dist/models/NanoGPTV1.js +2 -2
  56. package/dist/models/model.js +9 -9
  57. package/dist/{ones-BX_wEgzB.js → ones-CBI1AQjb.js} +3 -3
  58. package/dist/ops/adamAdjust.js +1 -1
  59. package/dist/ops/adamMoments.js +1 -1
  60. package/dist/ops/add16.js +1 -1
  61. package/dist/ops/appendCache.js +3 -3
  62. package/dist/ops/attentionMask.js +1 -1
  63. package/dist/ops/concat16.js +2 -2
  64. package/dist/ops/cpu/adamAdjust.js +7 -7
  65. package/dist/ops/cpu/adamMoments.js +5 -5
  66. package/dist/ops/cpu/appendCache.js +6 -6
  67. package/dist/ops/cpu/attentionMask.js +6 -6
  68. package/dist/ops/cpu/fusedSoftmax.js +5 -5
  69. package/dist/ops/cpu/gatherSub.js +7 -7
  70. package/dist/ops/cpu/gelu.js +5 -5
  71. package/dist/ops/cpu/matMul16.js +2 -2
  72. package/dist/ops/cpu/matMulGelu.js +3 -3
  73. package/dist/ops/cpu/matMulMul.js +5 -5
  74. package/dist/ops/cpu/mulDropout.js +1 -1
  75. package/dist/ops/cpu/normRMS.js +5 -5
  76. package/dist/ops/cpu/qkv.js +3 -3
  77. package/dist/ops/cpu/rope.js +9 -9
  78. package/dist/ops/cpu/scatterSub.js +5 -5
  79. package/dist/ops/dot16.js +2 -2
  80. package/dist/ops/gatherSub.js +1 -1
  81. package/dist/ops/gelu.js +2 -2
  82. package/dist/ops/grads/add16.js +1 -1
  83. package/dist/ops/grads/attentionMask.js +2 -2
  84. package/dist/ops/grads/gelu.js +2 -2
  85. package/dist/ops/grads/matMul16.js +3 -3
  86. package/dist/ops/grads/matMulGelu.js +5 -5
  87. package/dist/ops/grads/normRMS.js +6 -6
  88. package/dist/ops/grads/pack16.js +3 -3
  89. package/dist/ops/grads/qkv.js +9 -9
  90. package/dist/ops/grads/rope.js +2 -2
  91. package/dist/ops/grads/softmax16.js +1 -1
  92. package/dist/ops/grads/unpack16.js +2 -2
  93. package/dist/ops/matMul16.js +3 -3
  94. package/dist/ops/matMulGelu.js +2 -2
  95. package/dist/ops/matMulMul.js +1 -1
  96. package/dist/ops/mul16.js +1 -1
  97. package/dist/ops/mulDrop.js +1 -1
  98. package/dist/ops/normRMS.js +1 -1
  99. package/dist/ops/pack16.js +2 -2
  100. package/dist/ops/qkv.js +1 -1
  101. package/dist/ops/reshape16.js +6 -6
  102. package/dist/ops/rope.js +2 -2
  103. package/dist/ops/scatterSub.js +1 -1
  104. package/dist/ops/slice16.js +2 -2
  105. package/dist/ops/softmax16.js +1 -1
  106. package/dist/ops/sub16.js +1 -1
  107. package/dist/ops/sum16.js +2 -2
  108. package/dist/ops/transpose16.js +6 -6
  109. package/dist/ops/unpack16.js +2 -2
  110. package/dist/ops/webgl/adamAdjust.js +2 -2
  111. package/dist/ops/webgl/adamMoments.js +1 -1
  112. package/dist/ops/webgl/appendCache.js +1 -1
  113. package/dist/ops/webgl/attentionMask.js +4 -4
  114. package/dist/ops/webgl/fusedSoftmax.js +6 -6
  115. package/dist/ops/webgl/gatherSub.js +1 -1
  116. package/dist/ops/webgl/gelu.js +2 -2
  117. package/dist/ops/webgl/log.js +3 -3
  118. package/dist/ops/webgl/matMul16.js +10 -10
  119. package/dist/ops/webgl/matMulGelu.js +4 -4
  120. package/dist/ops/webgl/matMulMul.js +2 -2
  121. package/dist/ops/webgl/mulDropout.js +1 -1
  122. package/dist/ops/webgl/normRMS.js +2 -2
  123. package/dist/ops/webgl/qkv.js +1 -1
  124. package/dist/ops/webgl/rope.js +4 -4
  125. package/dist/ops/webgl/scatterSub.js +1 -1
  126. package/dist/ops/webgpu/adamAdjust.js +3 -3
  127. package/dist/ops/webgpu/adamMoments.js +5 -5
  128. package/dist/ops/webgpu/add16.js +1 -1
  129. package/dist/ops/webgpu/appendCache.js +3 -3
  130. package/dist/ops/webgpu/attentionMask.js +5 -5
  131. package/dist/ops/webgpu/attentionMask32_program.js +2 -2
  132. package/dist/ops/webgpu/concat16.js +5 -5
  133. package/dist/ops/webgpu/gatherSub.js +3 -3
  134. package/dist/ops/webgpu/gelu.js +3 -3
  135. package/dist/ops/webgpu/matMul16.js +19 -19
  136. package/dist/ops/webgpu/matMul16_program.js +2 -2
  137. package/dist/ops/webgpu/mul16.js +1 -1
  138. package/dist/ops/webgpu/normRMS.js +2 -2
  139. package/dist/ops/webgpu/normRMSGrad.js +4 -4
  140. package/dist/ops/webgpu/pack16.js +3 -3
  141. package/dist/ops/webgpu/pack16_program.js +2 -2
  142. package/dist/ops/webgpu/qkv.js +4 -4
  143. package/dist/ops/webgpu/rope.js +3 -3
  144. package/dist/ops/webgpu/scatterSub.js +3 -3
  145. package/dist/ops/webgpu/slice16.js +4 -4
  146. package/dist/ops/webgpu/softmax16.js +4 -4
  147. package/dist/ops/webgpu/softmax16_program.js +2 -2
  148. package/dist/ops/webgpu/softmax16_subgroup_program.js +2 -2
  149. package/dist/ops/webgpu/softmax16grad.js +1 -1
  150. package/dist/ops/webgpu/sub16.js +1 -1
  151. package/dist/ops/webgpu/sum16.js +5 -5
  152. package/dist/ops/webgpu/transpose16.js +2 -2
  153. package/dist/ops/webgpu/transpose16_program.js +2 -2
  154. package/dist/ops/webgpu/transpose16_shared_program.js +3 -3
  155. package/dist/ops/webgpu/unpack16.js +5 -5
  156. package/dist/ops/webgpu/utils/binary_op.js +3 -3
  157. package/dist/ops/webgpu/utils/reductions.js +4 -4
  158. package/dist/{ops-FJapAPfm.js → ops-C2_OXuZ4.js} +35 -35
  159. package/dist/{pack16-k4jq6aMX.js → pack16-atD0eYRm.js} +6 -6
  160. package/dist/patches/webgpu_backend.js +8 -8
  161. package/dist/patches/webgpu_base.js +1 -1
  162. package/dist/patches/webgpu_program.js +2 -2
  163. package/dist/{random_width-UGQn4OWb.js → random_width-BN4wGJaW.js} +33 -33
  164. package/dist/{range-CuGvVN2c.js → range-DKmP1-OQ.js} +1 -1
  165. package/dist/relu-BsXmGzzu.js +9 -0
  166. package/dist/{reshape-CkjKPPqB.js → reshape-BI0yzp1T.js} +1 -1
  167. package/dist/{resize_nearest_neighbor-DB8k9KN_.js → resize_nearest_neighbor-BA_BX-ub.js} +25 -25
  168. package/dist/{rope-BmZmp9uP.js → rope-DJ7Y7c-u.js} +1 -1
  169. package/dist/{scatter_nd_util-BY22Cc-C.js → scatter_nd_util-k9MUVUkn.js} +1 -1
  170. package/dist/{selu_util-BuLbmbrl.js → selu_util-DyW0X1WG.js} +5 -5
  171. package/dist/{shared-B7USJZgw.js → shared-Q3BS6T03.js} +1 -1
  172. package/dist/{shared-BQboIImQ.js → shared-nnSWpC3u.js} +6 -6
  173. package/dist/{slice-Aqy7KbJh.js → slice-wBNvzVyz.js} +3 -3
  174. package/dist/{slice_util-D8CQRenR.js → slice_util-zN8KFC5I.js} +7 -7
  175. package/dist/{softmax-faLoUZVT.js → softmax-DfuYyjMh.js} +1 -1
  176. package/dist/split-BYrLboMq.js +9 -0
  177. package/dist/squeeze-Bk8Brcct.js +10 -0
  178. package/dist/{stack-WJK22CFn.js → stack-CDWShFHF.js} +1 -1
  179. package/dist/{step-dXR33iOg.js → step-BS5JXRR6.js} +14 -14
  180. package/dist/sum-BPUfDB2X.js +11 -0
  181. package/dist/{tensor-BQqrDvpx.js → tensor-CEt9Nm2s.js} +1 -1
  182. package/dist/{tensor1d-LxP9asMm.js → tensor1d-Cc_KCIDg.js} +1 -1
  183. package/dist/{tensor2d-BN1sSfQO.js → tensor2d-BN97fF71.js} +1 -1
  184. package/dist/{tensor4d-DVwr7pLF.js → tensor4d-vuDDgdUI.js} +1 -1
  185. package/dist/{tfjs_backend-Vi4JfLzT.js → tfjs_backend-806hyYve.js} +36 -36
  186. package/dist/tile-OWUvpIVt.js +11 -0
  187. package/dist/tokeniser/BaseTokeniser.d.ts +6 -8
  188. package/dist/tokeniser/BaseTokeniser.js +6 -6
  189. package/dist/tokeniser/CharTokeniser.d.ts +6 -6
  190. package/dist/tokeniser/CharTokeniser.js +26 -26
  191. package/dist/tokeniser/bpe.d.ts +6 -6
  192. package/dist/tokeniser/bpe.js +9 -9
  193. package/dist/tokeniser/type.d.ts +6 -8
  194. package/dist/training/Adam.js +2 -2
  195. package/dist/training/AdamExt.js +1 -1
  196. package/dist/training/DatasetBuilder.d.ts +1 -1
  197. package/dist/training/DatasetBuilder.js +29 -29
  198. package/dist/training/FullTrainer.js +1 -1
  199. package/dist/training/Trainer.d.ts +5 -4
  200. package/dist/training/Trainer.js +37 -40
  201. package/dist/training/sparseCrossEntropy.js +3 -3
  202. package/dist/training/tasks/ConversationTask.d.ts +11 -0
  203. package/dist/training/tasks/ConversationTask.js +26 -0
  204. package/dist/training/tasks/PretrainingTask.d.ts +11 -0
  205. package/dist/training/tasks/PretrainingTask.js +34 -0
  206. package/dist/training/tasks/StartSentenceTask.d.ts +12 -0
  207. package/dist/training/tasks/StartSentenceTask.js +42 -0
  208. package/dist/training/tasks/Task.d.ts +8 -0
  209. package/dist/training/tasks/Task.js +44 -0
  210. package/dist/{transpose-JawVKyZy.js → transpose-BUkQCJp9.js} +7 -7
  211. package/dist/{unsorted_segment_sum-LAbmE9G4.js → unsorted_segment_sum-BljxHhCY.js} +78 -78
  212. package/dist/utilities/dummy.js +3 -3
  213. package/dist/utilities/multinomialCPU.js +2 -2
  214. package/dist/utilities/packed.js +1 -1
  215. package/dist/utilities/performance.js +1 -1
  216. package/dist/utilities/profile.js +1 -1
  217. package/dist/utilities/safetensors.js +2 -2
  218. package/dist/utilities/sentences.d.ts +1 -1
  219. package/dist/utilities/sentences.js +11 -11
  220. package/dist/utilities/weights.js +2 -2
  221. package/dist/{variable-DQ9yYgEU.js → variable-DPt_Iuog.js} +1 -1
  222. package/dist/{webgpu_program-CAE4RICo.js → webgpu_program-BpWRlghH.js} +1 -1
  223. package/dist/{webgpu_util-BdovYhXr.js → webgpu_util-DMiKzzQM.js} +7 -7
  224. package/dist/{zeros-DeiE2zTa.js → zeros-5YROwwUH.js} +2 -2
  225. package/dist/{zeros_like-BAz3iKru.js → zeros_like-De4n1C3m.js} +57 -57
  226. package/package.json +1 -1
  227. package/dist/clip_by_value-Dn5tzexi.js +0 -12
  228. package/dist/concat-C6X3AAlQ.js +0 -17
  229. package/dist/expand_dims-BzfJK2uc.js +0 -11
  230. package/dist/gather-BcO5UQNJ.js +0 -9
  231. package/dist/mat_mul-DxpNTCRz.js +0 -11
  232. package/dist/relu-Cf80uA2p.js +0 -9
  233. package/dist/split-BNz5jcGc.js +0 -9
  234. package/dist/squeeze--YMgaAAf.js +0 -10
  235. package/dist/sum-BdplSvq_.js +0 -11
  236. package/dist/tile-CvN_LyVr.js +0 -11
@@ -1,38 +1,38 @@
1
- import { q as u, u as h, E as d, c9 as st, ca as rt, cb as nt, cc as et, cd as it, ce as pt, D as B, cf as at, cg as ht, b_ as ut, y as D, ch as ct, ci as ft, l as H, a3 as C, b$ as lt, cj as dt, ck as mt, cl as Dt, aG as yt, cm as It, a2 as wt, m as M, $ as F, cn as xt, co as gt, N as $, c3 as $t, cp as bt, cq as kt, cr as vt, cs as Nt, b as _t, ct as Tt, cu as Et, cv as St, cw as qt, cx as r, aZ as Kt, n as zt, a4 as W, cy as Pt, cz as Ct, p as Mt, o as Ot, b0 as At, c as Bt } from "./index-D0RBWjq8.js";
2
- import { e as j, a as R, l as G, b as X, d as V, m as Z, f as U, r as E, g as Ht, h as Ft, i as Wt, j as jt, k as Rt, n as Gt, o as Xt, c as Vt, p as Zt, q as Ut, t as Jt, u as Qt, v as Yt, w as Lt, x as to, y as oo, z as so, A as ro, B as no, C as eo, s as io, D as po, E as ao, F as ho } from "./unsorted_segment_sum-LAbmE9G4.js";
3
- import { r as l } from "./reshape-CkjKPPqB.js";
4
- import { b as uo } from "./broadcast_to-DDaNMbX7.js";
5
- import { c as co } from "./clip_by_value-Dn5tzexi.js";
6
- import { c as _ } from "./concat-C6X3AAlQ.js";
7
- import { w as J, n as Q, b as S, c as fo, g as lo, l as mo, a as Do, f as yo, d as Io, j as wo, m as xo, e as go, i as $o, h as bo, r as ko, s as vo, u as No } from "./resize_nearest_neighbor-DB8k9KN_.js";
8
- import { m as v } from "./mat_mul-DxpNTCRz.js";
9
- import { s as Y, k as _o, h as To, e as Eo, l as So, p as qo, r as Ko, a as zo } from "./step-dXR33iOg.js";
10
- import { e as Po, l as Co, a as Mo, m as Oo } from "./log_sum_exp-VLZgbFAH.js";
11
- import { e as Ao } from "./expand_dims-BzfJK2uc.js";
12
- import { f as Bo } from "./floor-DIb-lN_u.js";
13
- import { g as Ho } from "./gather-BcO5UQNJ.js";
14
- import { c as q } from "./complex-DClmWqJt.js";
15
- import { n as N, r as K, i as L, t as Fo } from "./transpose-JawVKyZy.js";
16
- import { s as T } from "./slice-Aqy7KbJh.js";
17
- import { m as Wo } from "./mod-PrOKlFxH.js";
18
- import { r as jo } from "./relu-Cf80uA2p.js";
19
- import { s as z } from "./split-BNz5jcGc.js";
20
- import { z as Ro } from "./zeros-DeiE2zTa.js";
21
- import { s as Go } from "./softmax-faLoUZVT.js";
22
- import { s as Xo } from "./squeeze--YMgaAAf.js";
23
- import { s as Vo } from "./stack-WJK22CFn.js";
24
- import { s as Zo } from "./sum-BdplSvq_.js";
25
- import { t as Uo } from "./tile-CvN_LyVr.js";
1
+ import { o as u, q as h, E as d, c9 as st, ca as rt, cb as nt, cc as et, cd as it, ce as pt, B, cf as at, cg as ht, b_ as ut, x as D, ch as ct, ci as ft, j as H, a2 as C, b$ as lt, cj as dt, ck as mt, cl as Dt, aG as yt, cm as It, a1 as wt, m as M, _ as F, cn as xt, co as gt, L as $, c3 as $t, cp as bt, cq as kt, cr as vt, cs as Nt, b as _t, ct as Tt, cu as Et, cv as St, cw as qt, cx as r, aZ as Kt, l as zt, a3 as j, cy as Pt, cz as Ct, p as Mt, n as Ot, b0 as At, c as Bt } from "./index-Duu1Lvvv.js";
2
+ import { e as W, a as R, l as G, b as X, d as V, m as Z, f as U, r as E, g as Ht, h as Ft, i as jt, j as Wt, k as Rt, n as Gt, o as Xt, c as Vt, p as Zt, q as Ut, t as Jt, u as Lt, v as Qt, w as Yt, x as to, y as oo, z as so, A as ro, B as no, C as eo, s as io, D as po, E as ao, F as ho } from "./unsorted_segment_sum-BljxHhCY.js";
3
+ import { r as l } from "./reshape-BI0yzp1T.js";
4
+ import { b as uo } from "./broadcast_to-D1Dmg2Oz.js";
5
+ import { c as co } from "./clip_by_value-fg2aKzUy.js";
6
+ import { c as _ } from "./concat-CSm2rMwe.js";
7
+ import { w as J, n as L, b as S, c as fo, g as lo, l as mo, a as Do, f as yo, d as Io, j as wo, m as xo, e as go, i as $o, h as bo, r as ko, s as vo, u as No } from "./resize_nearest_neighbor-BA_BX-ub.js";
8
+ import { m as v } from "./mat_mul-Bn2BDpT4.js";
9
+ import { s as Q, k as _o, h as To, e as Eo, l as So, p as qo, r as Ko, a as zo } from "./step-BS5JXRR6.js";
10
+ import { e as Po, l as Co, a as Mo, m as Oo } from "./log_sum_exp-CVqLsVLl.js";
11
+ import { e as Ao } from "./expand_dims-ChkuOp6I.js";
12
+ import { f as Bo } from "./floor-BRMPgeIs.js";
13
+ import { g as Ho } from "./gather-BSULDalH.js";
14
+ import { c as q } from "./complex-Cyg-eQeZ.js";
15
+ import { n as N, r as K, i as Y, t as Fo } from "./transpose-BUkQCJp9.js";
16
+ import { s as T } from "./slice-wBNvzVyz.js";
17
+ import { m as jo } from "./mod-B4AUd1Np.js";
18
+ import { r as Wo } from "./relu-BsXmGzzu.js";
19
+ import { s as z } from "./split-BYrLboMq.js";
20
+ import { z as Ro } from "./zeros-5YROwwUH.js";
21
+ import { s as Go } from "./softmax-DfuYyjMh.js";
22
+ import { s as Xo } from "./squeeze-Bk8Brcct.js";
23
+ import { s as Vo } from "./stack-CDWShFHF.js";
24
+ import { s as Zo } from "./sum-BPUfDB2X.js";
25
+ import { t as Uo } from "./tile-OWUvpIVt.js";
26
26
  function Jo(t) {
27
27
  const s = { x: h(t, "x", "acos") };
28
28
  return d.runKernel(st, s);
29
29
  }
30
- const Qo = /* @__PURE__ */ u({ acos_: Jo });
31
- function Yo(t) {
30
+ const Lo = /* @__PURE__ */ u({ acos_: Jo });
31
+ function Qo(t) {
32
32
  const s = { x: h(t, "x", "acosh") };
33
33
  return d.runKernel(rt, s);
34
34
  }
35
- const Lo = /* @__PURE__ */ u({ acosh_: Yo });
35
+ const Yo = /* @__PURE__ */ u({ acosh_: Qo });
36
36
  function ts(t, o = 0) {
37
37
  const n = { x: h(t, "x", "argMin") }, e = { axis: o };
38
38
  return d.runKernel(nt, n, e);
@@ -93,7 +93,7 @@ const ys = /* @__PURE__ */ u({ dilation2d_: Ds });
93
93
  function Is(t, o) {
94
94
  let s = h(t, "a", "div"), n = h(o, "b", "div");
95
95
  [s, n] = B(s, n);
96
- const e = H(s, n), i = C(e), p = j(n, i);
96
+ const e = H(s, n), i = C(e), p = W(n, i);
97
97
  return J(p, i, e);
98
98
  }
99
99
  const ws = /* @__PURE__ */ u({ divNoNan_: Is });
@@ -117,7 +117,7 @@ function xs(t, o) {
117
117
  }
118
118
  const gs = /* @__PURE__ */ u({ dot_: xs });
119
119
  function $s(t, o = null, s = !1) {
120
- return Q(t, "euclidean", o, s);
120
+ return L(t, "euclidean", o, s);
121
121
  }
122
122
  const bs = /* @__PURE__ */ u({ euclideanNorm_: $s });
123
123
  function ks(t) {
@@ -152,7 +152,7 @@ function Ks(t, o = 5, s = 1, n = 1, e = 0.5) {
152
152
  const zs = /* @__PURE__ */ u({ localResponseNormalization_: Ks });
153
153
  function Ps(t) {
154
154
  const o = h(t, "x", "logSigmoid");
155
- return wt((n) => ({ value: N(R(N(n))), gradFunc: (p) => M(p, Y(N(n))) }))(o);
155
+ return wt((n) => ({ value: N(R(N(n))), gradFunc: (p) => M(p, Q(N(n))) }))(o);
156
156
  }
157
157
  const Cs = /* @__PURE__ */ u({ logSigmoid_: Ps });
158
158
  function Ms(t, o) {
@@ -187,15 +187,15 @@ function Fs(t, o, s, n, e, i, p) {
187
187
  a.rank === 3 && (y = !0, f = l(a, [1, a.shape[0], a.shape[1], a.shape[2]])), D(_o(i, e), () => `Error in pool: Either strides or dilations must be 1. Got strides ${i} and dilations '${e}'`);
188
188
  const c = To(f.shape, o, i, e, n), m = [c.dilationHeight, c.dilationWidth];
189
189
  let I;
190
- n === "same" ? I = js([c.filterHeight, c.filterWidth], m) : I = [[0, 0], [0, 0]];
191
- const w = m[0] === 1 && m[1] === 1, [x, g] = Ws([c.inHeight, c.inWidth], m, I), b = w ? n : "valid", O = w ? f : X(f, m, x), A = (s === "avg" ? () => V(O, o, i, b, p) : () => Z(O, o, i, b, p))(), k = w ? A : U(A, m, g);
190
+ n === "same" ? I = Ws([c.filterHeight, c.filterWidth], m) : I = [[0, 0], [0, 0]];
191
+ const w = m[0] === 1 && m[1] === 1, [x, g] = js([c.inHeight, c.inWidth], m, I), b = w ? n : "valid", O = w ? f : X(f, m, x), A = (s === "avg" ? () => V(O, o, i, b, p) : () => Z(O, o, i, b, p))(), k = w ? A : U(A, m, g);
192
192
  return y ? l(k, [k.shape[1], k.shape[2], k.shape[3]]) : k;
193
193
  }
194
- function Ws(t, o, s) {
194
+ function js(t, o, s) {
195
195
  const n = s.map((c) => c[0]), e = s.map((c) => c[1]), i = t.concat(n, e), p = o.map((c, m) => (c - i[m] % c) % c), a = e.map((c, m) => c + p[m]), f = o.map((c, m) => [n[m], a[m]]), y = o.map((c, m) => [0, p[m]]);
196
196
  return [f, y];
197
197
  }
198
- function js(t, o) {
198
+ function Ws(t, o) {
199
199
  const n = t.map((p, a) => p + (p - 1) * (o[a] - 1)).map((p) => p - 1), e = n.map((p) => Math.floor(p / 2)), i = n.map((p, a) => p - e[a]);
200
200
  return n.map((p, a) => [e[a], i[a]]);
201
201
  }
@@ -217,26 +217,26 @@ function Us(t) {
217
217
  return d.runKernel(kt, s);
218
218
  }
219
219
  const Js = /* @__PURE__ */ u({ sign_: Us });
220
- function Qs(t) {
220
+ function Ls(t) {
221
221
  D(t.dtype === "complex64", () => `The dtype for tf.spectral.fft() must be complex64 but got ${t.dtype}.`);
222
222
  const o = { input: t };
223
223
  return d.runKernel(vt, o);
224
224
  }
225
- const ot = /* @__PURE__ */ u({ fft_: Qs });
226
- function Ys(t) {
225
+ const ot = /* @__PURE__ */ u({ fft_: Ls });
226
+ function Qs(t) {
227
227
  D(t.dtype === "complex64", () => `The dtype for tf.spectral.ifft() must be complex64 but got ${t.dtype}.`);
228
228
  const o = { input: t };
229
229
  return d.runKernel(Nt, o);
230
230
  }
231
- const P = /* @__PURE__ */ u({ ifft_: Ys });
232
- function Ls(t) {
231
+ const P = /* @__PURE__ */ u({ ifft_: Qs });
232
+ function Ys(t) {
233
233
  const o = t.shape[t.shape.length - 1], s = t.size / o;
234
234
  let n;
235
235
  if (o <= 2) {
236
236
  const e = l(t, [s, o]);
237
237
  n = P(e);
238
238
  } else {
239
- const e = [s, 2 * (o - 1)], i = l(K(t), [s, o]), p = l(L(t), [s, o]), a = E(T(i, [0, 1], [s, o - 2]), 1), f = M(E(T(p, [0, 1], [s, o - 2]), 1), _t(-1)), y = _([i, a], 1), c = _([p, f], 1), m = l(q(y, c), [e[0], e[1]]);
239
+ const e = [s, 2 * (o - 1)], i = l(K(t), [s, o]), p = l(Y(t), [s, o]), a = E(T(i, [0, 1], [s, o - 2]), 1), f = M(E(T(p, [0, 1], [s, o - 2]), 1), _t(-1)), y = _([i, a], 1), c = _([p, f], 1), m = l(q(y, c), [e[0], e[1]]);
240
240
  n = P(m);
241
241
  }
242
242
  if (n = K(n), t.rank === 3 && t.shape[0] !== 0) {
@@ -245,7 +245,7 @@ function Ls(t) {
245
245
  }
246
246
  return n;
247
247
  }
248
- const tr = /* @__PURE__ */ u({ irfft_: Ls });
248
+ const tr = /* @__PURE__ */ u({ irfft_: Ys });
249
249
  function or(t, o) {
250
250
  D(t.dtype === "float32", () => `The dtype for rfft() must be real value but got ${t.dtype}`);
251
251
  let s = t.shape[t.shape.length - 1];
@@ -259,7 +259,7 @@ function or(t, o) {
259
259
  x[t.shape.length - 1] = o - s, e = _([t, Ro(x)], t.shape.length - 1), s = o;
260
260
  } else
261
261
  e = t;
262
- const i = C(e), p = l(q(e, i), [n, s]), a = ot(p), f = Math.floor(s / 2) + 1, y = K(a), c = L(a), m = z(y, [f, s - f], y.shape.length - 1), I = z(c, [f, s - f], c.shape.length - 1), w = e.shape.slice();
262
+ const i = C(e), p = l(q(e, i), [n, s]), a = ot(p), f = Math.floor(s / 2) + 1, y = K(a), c = Y(a), m = z(y, [f, s - f], y.shape.length - 1), I = z(c, [f, s - f], c.shape.length - 1), w = e.shape.slice();
263
263
  return w[e.shape.length - 1] = f, l(q(m[0], I[0]), w);
264
264
  }
265
265
  const sr = /* @__PURE__ */ u({ rfft_: or });
@@ -306,10 +306,10 @@ r().prototype.abs = function() {
306
306
  return this.throwIfDisposed(), Kt(this);
307
307
  };
308
308
  r().prototype.acos = function() {
309
- return this.throwIfDisposed(), Qo(this);
309
+ return this.throwIfDisposed(), Lo(this);
310
310
  };
311
311
  r().prototype.acosh = function() {
312
- return this.throwIfDisposed(), Lo(this);
312
+ return this.throwIfDisposed(), Yo(this);
313
313
  };
314
314
  r().prototype.add = function(t) {
315
315
  return this.throwIfDisposed(), zt(this, t);
@@ -321,7 +321,7 @@ r().prototype.any = function(t, o) {
321
321
  return this.throwIfDisposed(), Ft(this, t, o);
322
322
  };
323
323
  r().prototype.argMax = function(t) {
324
- return this.throwIfDisposed(), Wt(this, t);
324
+ return this.throwIfDisposed(), jt(this, t);
325
325
  };
326
326
  r().prototype.argMin = function(t) {
327
327
  return this.throwIfDisposed(), os(this, t);
@@ -369,7 +369,7 @@ r().prototype.batchToSpaceND = function(t, o) {
369
369
  return this.throwIfDisposed(), U(this, t, o);
370
370
  };
371
371
  r().prototype.batchNorm = function(t, o, s, n, e) {
372
- return this.throwIfDisposed(), jt(this, t, o, s, n, e);
372
+ return this.throwIfDisposed(), Wt(this, t, o, s, n, e);
373
373
  };
374
374
  r().prototype.broadcastTo = function(t) {
375
375
  return this.throwIfDisposed(), uo(this, t);
@@ -384,7 +384,7 @@ r().prototype.clipByValue = function(t, o) {
384
384
  return this.throwIfDisposed(), co(this, t, o);
385
385
  };
386
386
  r().prototype.concat = function(t, o) {
387
- return this.throwIfDisposed(), t instanceof W && (t = [t]), _([this, ...t], o);
387
+ return this.throwIfDisposed(), t instanceof j && (t = [t]), _([this, ...t], o);
388
388
  };
389
389
  r().prototype.conv1d = function(t, o, s, n, e, i) {
390
390
  return this.throwIfDisposed(), Rt(this, t, o, s, n, e, i);
@@ -411,7 +411,7 @@ r().prototype.depthToSpace = function(t, o) {
411
411
  return this.throwIfDisposed(), ms(this, t, o);
412
412
  };
413
413
  r().prototype.depthwiseConv2d = function(t, o, s, n, e, i) {
414
- return this.throwIfDisposed(), Qt(this, t, o, s, n, e, i);
414
+ return this.throwIfDisposed(), Lt(this, t, o, s, n, e, i);
415
415
  };
416
416
  r().prototype.dilation2d = function(t, o, s, n, e) {
417
417
  return this.throwIfDisposed(), ys(this, t, o, s, n, e);
@@ -429,10 +429,10 @@ r().prototype.elu = function() {
429
429
  return this.throwIfDisposed(), Eo(this);
430
430
  };
431
431
  r().prototype.equal = function(t) {
432
- return this.throwIfDisposed(), j(this, t);
432
+ return this.throwIfDisposed(), W(this, t);
433
433
  };
434
434
  r().prototype.erf = function() {
435
- return this.throwIfDisposed(), Yt(this);
435
+ return this.throwIfDisposed(), Qt(this);
436
436
  };
437
437
  r().prototype.euclideanNorm = function(t, o) {
438
438
  return this.throwIfDisposed(), bs(this, t, o);
@@ -498,7 +498,7 @@ r().prototype.logSigmoid = function() {
498
498
  return this.throwIfDisposed(), Cs(this);
499
499
  };
500
500
  r().prototype.logSoftmax = function(t) {
501
- return this.throwIfDisposed(), Lt(this, t);
501
+ return this.throwIfDisposed(), Yt(this, t);
502
502
  };
503
503
  r().prototype.logSumExp = function(t, o) {
504
504
  return this.throwIfDisposed(), Co(this, t, o);
@@ -546,7 +546,7 @@ r().prototype.mirrorPad = function(t, o) {
546
546
  return this.throwIfDisposed(), Hs(this, t, o);
547
547
  };
548
548
  r().prototype.mod = function(t) {
549
- return this.throwIfDisposed(), Wo(this, t);
549
+ return this.throwIfDisposed(), jo(this, t);
550
550
  };
551
551
  r().prototype.mul = function(t) {
552
552
  return this.throwIfDisposed(), M(this, t);
@@ -555,7 +555,7 @@ r().prototype.neg = function() {
555
555
  return this.throwIfDisposed(), N(this);
556
556
  };
557
557
  r().prototype.norm = function(t, o, s) {
558
- return this.throwIfDisposed(), Q(this, t, o, s);
558
+ return this.throwIfDisposed(), L(this, t, o, s);
559
559
  };
560
560
  r().prototype.notEqual = function(t) {
561
561
  return this.throwIfDisposed(), go(this, t);
@@ -585,7 +585,7 @@ r().prototype.reciprocal = function() {
585
585
  return this.throwIfDisposed(), Zs(this);
586
586
  };
587
587
  r().prototype.relu = function() {
588
- return this.throwIfDisposed(), jo(this);
588
+ return this.throwIfDisposed(), Wo(this);
589
589
  };
590
590
  r().prototype.relu6 = function() {
591
591
  return this.throwIfDisposed(), Ko(this);
@@ -621,7 +621,7 @@ r().prototype.separableConv2d = function(t, o, s, n, e, i) {
621
621
  return this.throwIfDisposed(), eo(this, t, o, s, n, e, i);
622
622
  };
623
623
  r().prototype.sigmoid = function() {
624
- return this.throwIfDisposed(), Y(this);
624
+ return this.throwIfDisposed(), Q(this);
625
625
  };
626
626
  r().prototype.sign = function() {
627
627
  return this.throwIfDisposed(), Js(this);
@@ -661,7 +661,7 @@ r().prototype.squeeze = function(t) {
661
661
  };
662
662
  r().prototype.stack = function(t, o) {
663
663
  this.throwIfDisposed();
664
- const s = t instanceof W ? [this, t] : [this, ...t];
664
+ const s = t instanceof j ? [this, t] : [this, ...t];
665
665
  return Vo(s, o);
666
666
  };
667
667
  r().prototype.step = function(t) {
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "@genai-fi/nanogpt",
3
- "version": "0.11.0",
3
+ "version": "0.12.1",
4
4
  "type": "module",
5
5
  "main": "dist/main.js",
6
6
  "types": "dist/main.d.ts",
@@ -1,12 +0,0 @@
1
- import { q as a, u as y, y as m, i as u, E as c, C as f } from "./index-D0RBWjq8.js";
2
- function p(o, s, t) {
3
- const r = y(o, "x", "clipByValue");
4
- if (m(s <= t, () => `Error in clip: min (${s}) must be less than or equal to max (${t}).`), s === t)
5
- return u(r.shape, s, r.dtype);
6
- const n = { x: r }, e = { clipValueMin: s, clipValueMax: t };
7
- return c.runKernel(f, n, e);
8
- }
9
- const E = /* @__PURE__ */ a({ clipByValue_: p });
10
- export {
11
- E as c
12
- };
@@ -1,17 +0,0 @@
1
- import { q as s, y as a, z as p, x as i, E as l, A as f } from "./index-D0RBWjq8.js";
2
- function h(n, e = 0) {
3
- a(n.length >= 1, () => "Pass at least one tensor to concat");
4
- const t = p(n, "tensors", "concat", "string_or_numeric");
5
- if (t[0].dtype === "complex64" && t.forEach((o) => {
6
- if (o.dtype !== "complex64")
7
- throw new Error(`Cannot concatenate complex64 tensors with a tensor
8
- with dtype ${o.dtype}. `);
9
- }), t.length === 1)
10
- return i(t[0]);
11
- const r = t, c = { axis: e };
12
- return l.runKernel(f, r, c);
13
- }
14
- const u = /* @__PURE__ */ s({ concat_: h });
15
- export {
16
- u as c
17
- };
@@ -1,11 +0,0 @@
1
- import { q as o, u as a, y as i, E as m, B as p } from "./index-D0RBWjq8.js";
2
- function u(t, n = 0) {
3
- const s = a(t, "x", "expandDims", "string_or_numeric");
4
- i(n <= s.rank, () => "Axis must be <= rank of the tensor");
5
- const r = { input: s }, e = { dim: n };
6
- return m.runKernel(p, r, e);
7
- }
8
- const x = /* @__PURE__ */ o({ expandDims_: u });
9
- export {
10
- x as e
11
- };
@@ -1,9 +0,0 @@
1
- import { q as g, u as t, E as h, G as u } from "./index-D0RBWjq8.js";
2
- function p(n, s, r = 0, e = 0) {
3
- const o = t(n, "x", "gather"), a = t(s, "indices", "gather", "int32"), c = { x: o, indices: a }, i = { axis: r, batchDims: e };
4
- return h.runKernel(u, c, i);
5
- }
6
- const d = /* @__PURE__ */ g({ gather_: p });
7
- export {
8
- d as g
9
- };
@@ -1,11 +0,0 @@
1
- import { q as m, u as s, D as c, E as M, H as p } from "./index-D0RBWjq8.js";
2
- function f(e, n, o = !1, l = !1) {
3
- let a = s(e, "a", "matMul"), t = s(n, "b", "matMul");
4
- [a, t] = c(a, t);
5
- const r = { a, b: t }, u = { transposeA: o, transposeB: l };
6
- return M.runKernel(p, r, u);
7
- }
8
- const i = /* @__PURE__ */ m({ matMul_: f });
9
- export {
10
- i as m
11
- };
@@ -1,9 +0,0 @@
1
- import { q as o, u as e, E as s, I as t } from "./index-D0RBWjq8.js";
2
- function u(r) {
3
- const n = { x: e(r, "x", "relu") };
4
- return s.runKernel(t, n);
5
- }
6
- const l = /* @__PURE__ */ o({ relu_: u });
7
- export {
8
- l as r
9
- };
@@ -1,9 +0,0 @@
1
- import { q as p, u as i, E as a, K as c } from "./index-D0RBWjq8.js";
2
- function e(t, s, n = 0) {
3
- const o = { x: i(t, "x", "split") }, r = { numOrSizeSplits: s, axis: n };
4
- return a.runKernel(c, o, r);
5
- }
6
- const x = /* @__PURE__ */ p({ split_: e });
7
- export {
8
- x as s
9
- };
@@ -1,10 +0,0 @@
1
- import { q as o, u as n, L as a } from "./index-D0RBWjq8.js";
2
- import { r as t } from "./reshape-CkjKPPqB.js";
3
- function p(s, r) {
4
- const e = n(s, "x", "squeeze", "string_or_numeric");
5
- return t(e, a(e.shape, r).newShape);
6
- }
7
- const i = /* @__PURE__ */ o({ squeeze_: p });
8
- export {
9
- i as s
10
- };
@@ -1,11 +0,0 @@
1
- import { q as a, u as e, N as c, E as l, Q as m } from "./index-D0RBWjq8.js";
2
- function i(t, n = null, o = !1) {
3
- let s = e(t, "x", "sum");
4
- s.dtype === "bool" && (s = c(s, "int32"));
5
- const r = { x: s }, u = { axis: n, keepDims: o };
6
- return l.runKernel(m, r, u);
7
- }
8
- const f = /* @__PURE__ */ a({ sum_: i });
9
- export {
10
- f as s
11
- };
@@ -1,11 +0,0 @@
1
- import { q as e, u as a, y as i, E as c, T as u } from "./index-D0RBWjq8.js";
2
- function l(r, t) {
3
- const n = a(r, "x", "tile", "string_or_numeric");
4
- i(n.rank === t.length, () => `Error in transpose: rank of input ${n.rank} must match length of reps ${t}.`);
5
- const s = { x: n }, o = { reps: t };
6
- return c.runKernel(u, s, o);
7
- }
8
- const p = /* @__PURE__ */ e({ tile_: l });
9
- export {
10
- p as t
11
- };