@genai-fi/nanogpt 0.7.0 → 0.7.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (152) hide show
  1. package/dist/Generator.js +13 -9
  2. package/dist/NanoGPTModel.js +10 -10
  3. package/dist/{RealDiv-C4hOvYOZ.js → RealDiv-CVYNbZxu.js} +11 -11
  4. package/dist/{Reshape-BLijOA8h.js → Reshape-CEsEp0AI.js} +2 -2
  5. package/dist/Reshape-Do18N3gO.js +30 -0
  6. package/dist/TeachableLLM.js +9 -5
  7. package/dist/{TiedEmbedding-BLltddza.js → TiedEmbedding-ccLBFiZi.js} +4 -4
  8. package/dist/{axis_util-DaAl5MER.js → axis_util-5DTW2tFV.js} +1 -1
  9. package/dist/backend.js +2 -2
  10. package/dist/{backend_util-DWiwsi2N.js → backend_util-C9Ut8n0Q.js} +40 -40
  11. package/dist/{broadcast_to-C4v-j9yA.js → broadcast_to-Ba9h_8DO.js} +2 -2
  12. package/dist/{concat-CsHeR4zV.js → concat-CbXTetof.js} +1 -1
  13. package/dist/{dataset-JDyjG3QR.js → dataset-U3PrjwgU.js} +7 -7
  14. package/dist/{dropout-hpDwECTe.js → dropout-DPfPgWWe.js} +11 -11
  15. package/dist/{gather-D0_gPiBz.js → gather-Bbh8DHhM.js} +4 -4
  16. package/dist/{gelu-uyHP1x1f.js → gelu-BFwVnd1r.js} +1 -1
  17. package/dist/{gpgpu_math-DJm3ZTAf.js → gpgpu_math-DffelNS-.js} +2 -2
  18. package/dist/{index-BPPzKVdR.js → index-DYD_yPa-.js} +1083 -1106
  19. package/dist/{index-C0dhsYom.js → index-UdZhlibC.js} +126 -126
  20. package/dist/{kernel_funcs_utils-CwRTFqrc.js → kernel_funcs_utils-CXDy3EN7.js} +3 -3
  21. package/dist/layers/BaseLayer.js +2 -2
  22. package/dist/layers/CausalSelfAttention.js +8 -8
  23. package/dist/layers/MLP.js +5 -5
  24. package/dist/layers/RMSNorm.js +3 -3
  25. package/dist/layers/RoPECache.js +4 -4
  26. package/dist/layers/TiedEmbedding.js +5 -5
  27. package/dist/layers/TransformerBlock.js +1 -1
  28. package/dist/loader/loadTransformers.js +1 -1
  29. package/dist/loader/oldZipLoad.js +11 -7
  30. package/dist/{log_sum_exp-D086OgZJ.js → log_sum_exp-BnmCkHWl.js} +8 -8
  31. package/dist/main.d.ts +11 -0
  32. package/dist/main.js +44 -27
  33. package/dist/{mat_mul-1nwdPkQ_.js → mat_mul-dwmZz69e.js} +1 -1
  34. package/dist/{max-BQc2Aj-I.js → max-ByjEGoFx.js} +3 -3
  35. package/dist/{mulmat_packed_gpu-Gzf3I9UV.js → mulmat_packed_gpu-IGPBp6h9.js} +1 -1
  36. package/dist/{ones-D63HpSF_.js → ones-C8Mfln6-.js} +2 -2
  37. package/dist/ops/adamAdjust.d.ts +2 -0
  38. package/dist/ops/adamAdjust.js +9 -0
  39. package/dist/ops/adamMoments.d.ts +2 -0
  40. package/dist/ops/adamMoments.js +9 -0
  41. package/dist/ops/appendCache.js +3 -3
  42. package/dist/ops/attentionMask.js +1 -1
  43. package/dist/ops/cpu/adamAdjust.d.ts +1 -0
  44. package/dist/ops/cpu/adamAdjust.js +18 -0
  45. package/dist/ops/cpu/adamMoments.d.ts +1 -0
  46. package/dist/ops/cpu/adamMoments.js +16 -0
  47. package/dist/ops/cpu/appendCache.js +2 -2
  48. package/dist/ops/cpu/attentionMask.js +5 -5
  49. package/dist/ops/cpu/fusedSoftmax.js +2 -2
  50. package/dist/ops/cpu/gatherSub.js +3 -3
  51. package/dist/ops/cpu/gelu.js +1 -1
  52. package/dist/ops/cpu/matMulGelu.js +2 -2
  53. package/dist/ops/cpu/matMulMul.js +1 -1
  54. package/dist/ops/cpu/mulDropout.js +1 -1
  55. package/dist/ops/cpu/normRMS.js +1 -1
  56. package/dist/ops/cpu/qkv.js +3 -3
  57. package/dist/ops/cpu/rope.js +5 -5
  58. package/dist/ops/cpu/scatterSub.js +11 -11
  59. package/dist/ops/fusedSoftmax.js +1 -1
  60. package/dist/ops/gatherSub.js +1 -1
  61. package/dist/ops/gelu.js +2 -2
  62. package/dist/ops/grads/attentionMask.js +1 -1
  63. package/dist/ops/grads/fusedSoftmax.js +2 -2
  64. package/dist/ops/grads/gelu.js +2 -2
  65. package/dist/ops/grads/matMulGelu.js +1 -1
  66. package/dist/ops/grads/normRMS.js +1 -1
  67. package/dist/ops/grads/qkv.js +1 -1
  68. package/dist/ops/grads/rope.js +1 -1
  69. package/dist/ops/matMulGelu.js +1 -1
  70. package/dist/ops/matMulMul.js +1 -1
  71. package/dist/ops/mulDrop.js +1 -1
  72. package/dist/ops/normRMS.js +1 -1
  73. package/dist/ops/qkv.js +1 -1
  74. package/dist/ops/rope.js +4 -4
  75. package/dist/ops/scatterSub.js +1 -1
  76. package/dist/ops/webgl/adamAdjust.d.ts +1 -0
  77. package/dist/ops/webgl/adamAdjust.js +50 -0
  78. package/dist/ops/webgl/adamMoments.d.ts +1 -0
  79. package/dist/ops/webgl/adamMoments.js +38 -0
  80. package/dist/ops/webgl/appendCache.js +1 -1
  81. package/dist/ops/webgl/attentionMask.js +1 -1
  82. package/dist/ops/webgl/fusedSoftmax.js +4 -4
  83. package/dist/ops/webgl/gatherSub.js +8 -8
  84. package/dist/ops/webgl/gelu.js +2 -2
  85. package/dist/ops/webgl/log.js +3 -3
  86. package/dist/ops/webgl/matMulGelu.js +4 -4
  87. package/dist/ops/webgl/matMulMul.js +1 -1
  88. package/dist/ops/webgl/mulDropout.js +1 -1
  89. package/dist/ops/webgl/normRMS.js +2 -2
  90. package/dist/ops/webgl/qkv.js +1 -1
  91. package/dist/ops/webgl/rope.js +1 -1
  92. package/dist/ops/webgl/scatterSub.js +1 -1
  93. package/dist/ops/webgpu/adamAdjust.d.ts +1 -0
  94. package/dist/ops/webgpu/adamAdjust.js +52 -0
  95. package/dist/ops/webgpu/adamMoments.d.ts +1 -0
  96. package/dist/ops/webgpu/adamMoments.js +51 -0
  97. package/dist/ops/webgpu/appendCache.js +13 -12
  98. package/dist/ops/webgpu/attentionMask.js +11 -10
  99. package/dist/ops/webgpu/gatherSub.js +26 -11
  100. package/dist/ops/webgpu/gelu.js +7 -6
  101. package/dist/ops/webgpu/index.js +3 -0
  102. package/dist/ops/webgpu/normRMS.js +27 -101
  103. package/dist/ops/webgpu/normRMSGrad.d.ts +1 -0
  104. package/dist/ops/webgpu/normRMSGrad.js +128 -0
  105. package/dist/ops/webgpu/qkv.js +9 -8
  106. package/dist/ops/webgpu/rope.js +8 -7
  107. package/dist/ops/webgpu/scatterSub.js +8 -7
  108. package/dist/ops/webgpu/utils/reductions.d.ts +9 -0
  109. package/dist/ops/webgpu/utils/reductions.js +68 -0
  110. package/dist/{ops-CIQLNshk.js → ops-aRTXR2Sr.js} +195 -219
  111. package/dist/{random_width-DkYP8W8N.js → random_width-DbSpgl4o.js} +22 -21
  112. package/dist/{range-CYzpQY53.js → range-D9CZhVlR.js} +1 -1
  113. package/dist/{reciprocal-_A9yv27J.js → reciprocal-CGB48wZB.js} +1 -1
  114. package/dist/{register_all_kernels-guvSxp7M.js → register_all_kernels-DnbAyBXt.js} +30 -29
  115. package/dist/{reshape-BMUzc1UY.js → reshape-BR0eoLYN.js} +3 -3
  116. package/dist/{scatter_nd_util-IRBqKz_b.js → scatter_nd_util-OjyAxku2.js} +1 -1
  117. package/dist/{selu_util-Dt_iuXaq.js → selu_util-Ce6pu9IM.js} +41 -41
  118. package/dist/{shared-CDu9S76h.js → shared-Czipaeb6.js} +6 -6
  119. package/dist/{shared-BNa2q6jD.js → shared-DS5waSIY.js} +1 -1
  120. package/dist/{sin-Cocju-BY.js → sin-CiBxrDqX.js} +6 -6
  121. package/dist/slice-BHbDHObE.js +28 -0
  122. package/dist/{softmax-GPNK3o-U.js → softmax-JMEIUo2J.js} +3 -3
  123. package/dist/{split-CHzJjxDv.js → split-CRU0PjVV.js} +1 -1
  124. package/dist/{stack-Dpgg_1W1.js → stack-ikk2Y8_P.js} +1 -1
  125. package/dist/{sum-B8wEpKsg.js → sum-NLYbiDag.js} +3 -3
  126. package/dist/{tensor-RvZVNmg0.js → tensor-Do9PKbIE.js} +1 -1
  127. package/dist/{tensor2d-B_kyod7_.js → tensor2d-CWHxHpLh.js} +1 -1
  128. package/dist/training/Adam.d.ts +22 -0
  129. package/dist/training/Adam.js +93 -0
  130. package/dist/training/AdamExt.d.ts +1 -1
  131. package/dist/training/AdamExt.js +13 -12
  132. package/dist/training/DatasetBuilder.js +2 -2
  133. package/dist/training/FullTrainer.js +22 -22
  134. package/dist/training/Trainer.d.ts +1 -1
  135. package/dist/training/Trainer.js +32 -32
  136. package/dist/training/sparseCrossEntropy.d.ts +0 -4
  137. package/dist/training/sparseCrossEntropy.js +7 -7
  138. package/dist/utilities/arrayClose.d.ts +1 -0
  139. package/dist/utilities/arrayClose.js +11 -0
  140. package/dist/utilities/dummy.js +2 -2
  141. package/dist/utilities/generate.js +3 -3
  142. package/dist/utilities/multinomialCPU.js +2 -2
  143. package/dist/utilities/performance.d.ts +1 -1
  144. package/dist/utilities/performance.js +11 -11
  145. package/dist/utilities/profile.js +1 -1
  146. package/dist/utilities/safetensors.js +2 -2
  147. package/dist/utilities/weights.js +2 -2
  148. package/dist/{variable-DXEUOwew.js → variable-BTBkayv_.js} +1 -1
  149. package/dist/{webgpu_util-g13LvDIv.js → webgpu_program-WaoMq-WD.js} +138 -215
  150. package/dist/webgpu_util-DhSeP4b6.js +80 -0
  151. package/dist/{zeros-DCPCdFGq.js → zeros-DnPT2nD4.js} +4 -4
  152. package/package.json +1 -1
@@ -4152,66 +4152,66 @@ function Bs() {
4152
4152
  */
4153
4153
  Bs();
4154
4154
  export {
4155
- ea as $,
4156
- Is as A,
4157
- Tn as B,
4158
- Ct as C,
4159
- Ge as D,
4155
+ Ps as $,
4156
+ bi as A,
4157
+ D as B,
4158
+ T as C,
4159
+ Tn as D,
4160
4160
  f as E,
4161
- K as F,
4161
+ Ct as F,
4162
4162
  ta as G,
4163
- hr as H,
4164
- Ya as I,
4165
- So as J,
4166
- Xn as K,
4167
- Po as L,
4168
- Sr as M,
4169
- ka as N,
4170
- Xa as O,
4163
+ Ge as H,
4164
+ K as I,
4165
+ hr as J,
4166
+ Ya as K,
4167
+ So as L,
4168
+ Xn as M,
4169
+ Po as N,
4170
+ H as O,
4171
4171
  Ga as P,
4172
- Rt as Q,
4172
+ Sr as Q,
4173
4173
  Ka as R,
4174
4174
  ko as S,
4175
4175
  x as T,
4176
- bo as U,
4177
- In as V,
4178
- An as W,
4179
- Ps as X,
4180
- ni as Y,
4181
- $t as Z,
4182
- oo as _,
4176
+ ka as U,
4177
+ Xa as V,
4178
+ ho as W,
4179
+ Rt as X,
4180
+ bo as Y,
4181
+ In as Z,
4182
+ An as _,
4183
4183
  b as a,
4184
4184
  Na as a$,
4185
- xe as a0,
4186
- wr as a1,
4187
- ne as a2,
4188
- Br as a3,
4189
- fo as a4,
4190
- xa as a5,
4191
- k as a6,
4192
- Kr as a7,
4193
- fa as a8,
4194
- Gs as a9,
4195
- di as aA,
4196
- Se as aB,
4197
- fi as aC,
4198
- gi as aD,
4199
- Us as aE,
4200
- _s as aF,
4201
- $s as aG,
4202
- ut as aH,
4203
- Ws as aI,
4204
- jt as aJ,
4205
- ue as aK,
4206
- Xo as aL,
4207
- O as aM,
4208
- ho as aN,
4209
- fr as aO,
4210
- lo as aP,
4211
- zr as aQ,
4212
- Ma as aR,
4213
- rs as aS,
4214
- nt as aT,
4185
+ ni as a0,
4186
+ $t as a1,
4187
+ Gs as a2,
4188
+ oo as a3,
4189
+ ea as a4,
4190
+ xe as a5,
4191
+ wr as a6,
4192
+ ne as a7,
4193
+ Br as a8,
4194
+ fo as a9,
4195
+ A as aA,
4196
+ st as aB,
4197
+ di as aC,
4198
+ Se as aD,
4199
+ fi as aE,
4200
+ gi as aF,
4201
+ Us as aG,
4202
+ _s as aH,
4203
+ $s as aI,
4204
+ ut as aJ,
4205
+ Ws as aK,
4206
+ jt as aL,
4207
+ ue as aM,
4208
+ Xo as aN,
4209
+ O as aO,
4210
+ fr as aP,
4211
+ lo as aQ,
4212
+ zr as aR,
4213
+ Ma as aS,
4214
+ rs as aT,
4215
4215
  V as aU,
4216
4216
  Hr as aV,
4217
4217
  na as aW,
@@ -4222,29 +4222,29 @@ export {
4222
4222
  pi as aa,
4223
4223
  xt as ab,
4224
4224
  S as ac,
4225
- F as ad,
4226
- pe as ae,
4227
- ti as af,
4228
- gt as ag,
4229
- Zr as ah,
4230
- qn as ai,
4231
- $ as aj,
4232
- ie as ak,
4233
- la as al,
4234
- Zo as am,
4235
- za as an,
4236
- Ne as ao,
4237
- po as ap,
4238
- Vr as aq,
4239
- Ja as ar,
4240
- no as as,
4241
- Vo as at,
4242
- yi as au,
4243
- Ns as av,
4244
- Qo as aw,
4245
- Xe as ax,
4246
- A as ay,
4247
- st as az,
4225
+ xa as ad,
4226
+ Kr as ae,
4227
+ fa as af,
4228
+ F as ag,
4229
+ pe as ah,
4230
+ ti as ai,
4231
+ gt as aj,
4232
+ Zr as ak,
4233
+ qn as al,
4234
+ ie as am,
4235
+ la as an,
4236
+ Zo as ao,
4237
+ za as ap,
4238
+ Ne as aq,
4239
+ po as ar,
4240
+ Vr as as,
4241
+ Ja as at,
4242
+ no as au,
4243
+ Vo as av,
4244
+ yi as aw,
4245
+ Ns as ax,
4246
+ Qo as ay,
4247
+ Xe as az,
4248
4248
  q as b,
4249
4249
  Ea as b$,
4250
4250
  ma as b0,
@@ -4322,32 +4322,32 @@ export {
4322
4322
  go as c7,
4323
4323
  zo as c8,
4324
4324
  Ir as c9,
4325
- Or as cA,
4326
- Wr as cB,
4327
- oa as cC,
4328
- ia as cD,
4329
- ca as cE,
4330
- ba as cF,
4331
- Sa as cG,
4332
- wa as cH,
4333
- Aa as cI,
4334
- Ta as cJ,
4335
- Fa as cK,
4336
- Ra as cL,
4337
- tn as cM,
4338
- eo as cN,
4339
- Qa as cO,
4340
- mo as cP,
4341
- Mo as cQ,
4342
- $o as cR,
4343
- ms as cS,
4344
- sn as cT,
4345
- li as cU,
4346
- ws as cV,
4347
- bs as cW,
4348
- G as cX,
4349
- Oe as cY,
4350
- H as cZ,
4325
+ Gr as cA,
4326
+ Or as cB,
4327
+ Wr as cC,
4328
+ oa as cD,
4329
+ ia as cE,
4330
+ ca as cF,
4331
+ ba as cG,
4332
+ Sa as cH,
4333
+ wa as cI,
4334
+ Aa as cJ,
4335
+ Ta as cK,
4336
+ Fa as cL,
4337
+ Ra as cM,
4338
+ tn as cN,
4339
+ eo as cO,
4340
+ Qa as cP,
4341
+ mo as cQ,
4342
+ Mo as cR,
4343
+ $o as cS,
4344
+ ms as cT,
4345
+ sn as cU,
4346
+ li as cV,
4347
+ ws as cW,
4348
+ bs as cX,
4349
+ G as cY,
4350
+ Oe as cZ,
4351
4351
  xs as c_,
4352
4352
  Ko as ca,
4353
4353
  Cr as cb,
@@ -4356,25 +4356,25 @@ export {
4356
4356
  Be as ce,
4357
4357
  Es as cf,
4358
4358
  As as cg,
4359
- Ss as ch,
4360
- Ts as ci,
4361
- ks as cj,
4362
- Xs as ck,
4363
- Js as cl,
4364
- Ys as cm,
4365
- er as cn,
4366
- nr as co,
4367
- sr as cp,
4368
- or as cq,
4369
- rr as cr,
4370
- ar as cs,
4371
- ur as ct,
4372
- cr as cu,
4373
- mr as cv,
4374
- He as cw,
4375
- Ar as cx,
4376
- _r as cy,
4377
- Gr as cz,
4359
+ Is as ch,
4360
+ Ss as ci,
4361
+ Ts as cj,
4362
+ ks as ck,
4363
+ Xs as cl,
4364
+ Js as cm,
4365
+ Ys as cn,
4366
+ er as co,
4367
+ nr as cp,
4368
+ sr as cq,
4369
+ or as cr,
4370
+ rr as cs,
4371
+ ar as ct,
4372
+ ur as cu,
4373
+ cr as cv,
4374
+ mr as cw,
4375
+ He as cx,
4376
+ Ar as cy,
4377
+ _r as cz,
4378
4378
  M as d,
4379
4379
  ui as d0,
4380
4380
  hi as d1,
@@ -4432,17 +4432,17 @@ export {
4432
4432
  os as k,
4433
4433
  y as l,
4434
4434
  ri as m,
4435
- Qt as n,
4436
- Bn as o,
4435
+ $ as n,
4436
+ k as o,
4437
4437
  $e as p,
4438
- wi as q,
4438
+ nt as q,
4439
4439
  oi as r,
4440
4440
  ai as s,
4441
4441
  E as t,
4442
4442
  fe as u,
4443
4443
  hs as v,
4444
- bi as w,
4445
- D as x,
4446
- T as y,
4444
+ Bn as w,
4445
+ Qt as x,
4446
+ wi as y,
4447
4447
  C as z
4448
4448
  };
@@ -1,6 +1,6 @@
1
- import { k as B, j as G, ak as K, a1 as W, al as z, am as V, ac as N, an as F, u as S } from "./index-C0dhsYom.js";
2
- import { u as O, f as Y } from "./gpgpu_math-DJm3ZTAf.js";
3
- import { f as v } from "./backend_util-DWiwsi2N.js";
1
+ import { k as B, j as G, am as K, a6 as W, an as z, ao as V, ac as N, ap as F, u as S } from "./index-UdZhlibC.js";
2
+ import { u as O, f as Y } from "./gpgpu_math-DffelNS-.js";
3
+ import { f as v } from "./backend_util-C9Ut8n0Q.js";
4
4
  /**
5
5
  * @license
6
6
  * Copyright 2018 Google LLC. All Rights Reserved.
@@ -1,5 +1,5 @@
1
- import { T as g, q as p, e as o, w as v } from "../index-C0dhsYom.js";
2
- import { v as _ } from "../variable-DXEUOwew.js";
1
+ import { T as g, y as p, e as o, A as v } from "../index-UdZhlibC.js";
2
+ import { v as _ } from "../variable-BTBkayv_.js";
3
3
  class M {
4
4
  parent;
5
5
  config;
@@ -3,14 +3,14 @@ import O from "./BaseLayer.js";
3
3
  import { qkv as P } from "../ops/qkv.js";
4
4
  import { rope as v } from "../ops/rope.js";
5
5
  import { appendCache as V } from "../ops/appendCache.js";
6
- import { o as c, t as C } from "../index-C0dhsYom.js";
6
+ import { w as c, t as C } from "../index-UdZhlibC.js";
7
7
  import { fusedSoftmax as T } from "../ops/fusedSoftmax.js";
8
- import { d as y } from "../random_width-DkYP8W8N.js";
9
- import { v as b } from "../variable-DXEUOwew.js";
10
- import { r as k, d as L } from "../dropout-hpDwECTe.js";
11
- import { r as N } from "../reshape-BMUzc1UY.js";
12
- import { m as R } from "../mat_mul-1nwdPkQ_.js";
13
- class $ extends O {
8
+ import { d as y } from "../random_width-DbSpgl4o.js";
9
+ import { v as b } from "../variable-BTBkayv_.js";
10
+ import { r as k, d as L } from "../dropout-DPfPgWWe.js";
11
+ import { r as N } from "../reshape-BR0eoLYN.js";
12
+ import { m as R } from "../mat_mul-dwmZz69e.js";
13
+ class W extends O {
14
14
  divisor;
15
15
  index;
16
16
  units;
@@ -92,5 +92,5 @@ class $ extends O {
92
92
  }
93
93
  }
94
94
  export {
95
- $ as default
95
+ W as default
96
96
  };
@@ -1,10 +1,10 @@
1
- import { t as l } from "../index-C0dhsYom.js";
1
+ import { t as l } from "../index-UdZhlibC.js";
2
2
  import u from "./BaseLayer.js";
3
3
  import { matMulGelu as M } from "../ops/matMulGelu.js";
4
- import { v as o } from "../variable-DXEUOwew.js";
5
- import { r as h, d as f } from "../dropout-hpDwECTe.js";
6
- import { r as d } from "../reshape-BMUzc1UY.js";
7
- import { m as c } from "../mat_mul-1nwdPkQ_.js";
4
+ import { v as o } from "../variable-BTBkayv_.js";
5
+ import { r as h, d as f } from "../dropout-DPfPgWWe.js";
6
+ import { r as d } from "../reshape-BR0eoLYN.js";
7
+ import { m as c } from "../mat_mul-dwmZz69e.js";
8
8
  class V extends u {
9
9
  index;
10
10
  hiddenUnits;
@@ -1,8 +1,8 @@
1
- import { t as s } from "../index-C0dhsYom.js";
1
+ import { t as s } from "../index-UdZhlibC.js";
2
2
  import e from "./BaseLayer.js";
3
3
  import { normRMS as a } from "../ops/normRMS.js";
4
- import { v as i } from "../variable-DXEUOwew.js";
5
- import { o as m } from "../ones-D63HpSF_.js";
4
+ import { v as i } from "../variable-BTBkayv_.js";
5
+ import { o as m } from "../ones-C8Mfln6-.js";
6
6
  class f extends e {
7
7
  GAMMA;
8
8
  constructor(r, t = "", o) {
@@ -1,7 +1,7 @@
1
- import { b as t, n as h, t as n, o as p } from "../index-C0dhsYom.js";
2
- import { r as c } from "../reciprocal-_A9yv27J.js";
3
- import { c as f, s as m } from "../sin-Cocju-BY.js";
4
- import { r as a } from "../range-CYzpQY53.js";
1
+ import { b as t, x as h, t as n, w as p } from "../index-UdZhlibC.js";
2
+ import { r as c } from "../reciprocal-CGB48wZB.js";
3
+ import { c as f, s as m } from "../sin-CiBxrDqX.js";
4
+ import { r as a } from "../range-D9CZhVlR.js";
5
5
  class D {
6
6
  constructor(o) {
7
7
  this.config = o;
@@ -1,9 +1,9 @@
1
- import "../random_width-DkYP8W8N.js";
2
- import "../index-C0dhsYom.js";
3
- import { T as e } from "../TiedEmbedding-BLltddza.js";
1
+ import "../random_width-DbSpgl4o.js";
2
+ import "../index-UdZhlibC.js";
3
+ import { T as e } from "../TiedEmbedding-ccLBFiZi.js";
4
4
  import "./BaseLayer.js";
5
- import "../variable-DXEUOwew.js";
6
- import "../gather-D0_gPiBz.js";
5
+ import "../variable-BTBkayv_.js";
6
+ import "../gather-Bbh8DHhM.js";
7
7
  export {
8
8
  e as default
9
9
  };
@@ -2,7 +2,7 @@ import l from "./CausalSelfAttention.js";
2
2
  import r from "./MLP.js";
3
3
  import o from "./RMSNorm.js";
4
4
  import d from "./BaseLayer.js";
5
- import { t as p } from "../index-C0dhsYom.js";
5
+ import { t as p } from "../index-UdZhlibC.js";
6
6
  class k extends d {
7
7
  ln1;
8
8
  attn;
@@ -2,7 +2,7 @@ import b from "../NanoGPTModel.js";
2
2
  import c from "../tokeniser/CharTokeniser.js";
3
3
  import l from "../tokeniser/bpe.js";
4
4
  import { load_safetensors as u } from "../utilities/safetensors.js";
5
- import { Y as y } from "../index-C0dhsYom.js";
5
+ import { a0 as y } from "../index-UdZhlibC.js";
6
6
  import { dummyPassAsync as h } from "../utilities/dummy.js";
7
7
  async function L(e, a, r, t) {
8
8
  const n = {
@@ -1,13 +1,17 @@
1
1
  import d from "../NanoGPTModel.js";
2
2
  import "../jszip.min-CjP2V1VV.js";
3
3
  import h from "../tokeniser/CharTokeniser.js";
4
- import { Y as k } from "../index-C0dhsYom.js";
4
+ import { a0 as k } from "../index-UdZhlibC.js";
5
5
  import b from "../tokeniser/bpe.js";
6
6
  import { dummyPassAsync as u } from "../utilities/dummy.js";
7
7
  import "../Generator.js";
8
8
  import "../index-Dwqa6Zy2.js";
9
- import "../dataset-JDyjG3QR.js";
9
+ import "../dataset-U3PrjwgU.js";
10
10
  import "../index-Tf7vU29b.js";
11
+ import "../ops/cpu/adamAdjust.js";
12
+ import "../ops/webgl/adamAdjust.js";
13
+ import "../ops/cpu/adamMoments.js";
14
+ import "../ops/webgl/adamMoments.js";
11
15
  import "../papaparse.min-C8l2Kvo1.js";
12
16
  import "../ops/cpu/scatterSub.js";
13
17
  import "../ops/webgl/scatterSub.js";
@@ -19,8 +23,8 @@ import "../ops/grads/attentionMask.js";
19
23
  import "../ops/cpu/qkv.js";
20
24
  import "../ops/webgl/qkv.js";
21
25
  import "../ops/grads/qkv.js";
22
- import "../random_width-DkYP8W8N.js";
23
- import "../register_all_kernels-guvSxp7M.js";
26
+ import "../random_width-DbSpgl4o.js";
27
+ import "../register_all_kernels-DnbAyBXt.js";
24
28
  import "../ops/cpu/rope.js";
25
29
  import "../ops/webgl/rope.js";
26
30
  import "../ops/grads/rope.js";
@@ -34,13 +38,13 @@ import "../ops/webgl/matMulGelu.js";
34
38
  import "../ops/grads/matMulGelu.js";
35
39
  import "../ops/cpu/gelu.js";
36
40
  import "../ops/webgl/gelu.js";
37
- import "../gelu-uyHP1x1f.js";
41
+ import "../gelu-BFwVnd1r.js";
38
42
  import "../ops/cpu/normRMS.js";
39
43
  import "../ops/webgl/normRMS.js";
40
44
  import "../ops/grads/normRMS.js";
41
45
  import "../ops/webgl/log.js";
42
46
  import { importWeights as O } from "../utilities/weights.js";
43
- async function ft(o) {
47
+ async function yt(o) {
44
48
  const n = /* @__PURE__ */ new Map(), s = await o.file("manifest.json")?.async("string");
45
49
  if (!s)
46
50
  throw new Error("Manifest file not found in the zip archive");
@@ -72,5 +76,5 @@ async function ft(o) {
72
76
  return { model: e, tokeniser: l };
73
77
  }
74
78
  export {
75
- ft as default
79
+ yt as default
76
80
  };
@@ -1,8 +1,8 @@
1
- import { x as r, y as p, E as u, a7 as E, a8 as h, p as S, c as $, a6 as d } from "./index-C0dhsYom.js";
2
- import { e as K } from "./axis_util-DaAl5MER.js";
3
- import { m as T } from "./max-BQc2Aj-I.js";
4
- import { r as m } from "./reshape-BMUzc1UY.js";
5
- import { s as _ } from "./sum-B8wEpKsg.js";
1
+ import { B as r, C as p, E as u, ae as E, af as h, p as S, c as $, o as d } from "./index-UdZhlibC.js";
2
+ import { e as K } from "./axis_util-5DTW2tFV.js";
3
+ import { m as T } from "./max-ByjEGoFx.js";
4
+ import { r as m } from "./reshape-BR0eoLYN.js";
5
+ import { s as _ } from "./sum-NLYbiDag.js";
6
6
  /**
7
7
  * @license
8
8
  * Copyright 2018 Google LLC. All Rights Reserved.
@@ -61,7 +61,7 @@ const w = /* @__PURE__ */ r({ log_: v });
61
61
  * limitations under the License.
62
62
  * =============================================================================
63
63
  */
64
- function y(s, n = null, o = !1) {
64
+ function A(s, n = null, o = !1) {
65
65
  const a = p(s, "x", "logSumExp"), t = S(n, a.shape), x = T(
66
66
  a,
67
67
  t,
@@ -74,9 +74,9 @@ function y(s, n = null, o = !1) {
74
74
  }
75
75
  return e;
76
76
  }
77
- const M = /* @__PURE__ */ r({ logSumExp_: y });
77
+ const L = /* @__PURE__ */ r({ logSumExp_: A });
78
78
  export {
79
79
  w as a,
80
80
  N as e,
81
- M as l
81
+ L as l
82
82
  };
package/dist/main.d.ts CHANGED
@@ -1,3 +1,7 @@
1
+ import { default as CausalSelfAttention } from './layers/CausalSelfAttention';
2
+ import { default as MLP } from './layers/MLP';
3
+ import { default as TransformerBlock } from './layers/TransformerBlock';
4
+ import { default as RoPECache } from './layers/RoPECache';
1
5
  export { default as NanoGPT } from './NanoGPTModel';
2
6
  export { default as TeachableLLM } from './TeachableLLM';
3
7
  export { default as CharTokeniser } from './tokeniser/CharTokeniser';
@@ -13,3 +17,10 @@ export type { GPTConfig } from './config';
13
17
  export { estimateParameterCount, estimateMemoryUsage, estimateTrainingMemoryUsage, estimateResources, validateConfig, } from './utilities/parameters';
14
18
  export { selectBackend } from './backend';
15
19
  export { default as performanceTest } from './utilities/performance';
20
+ export declare const layers: {
21
+ CausalSelfAttention: typeof CausalSelfAttention;
22
+ MLP: typeof MLP;
23
+ TransformerBlock: typeof TransformerBlock;
24
+ RoPECache: typeof RoPECache;
25
+ };
26
+ export { default as AdamExt } from './training/AdamExt';
package/dist/main.js CHANGED
@@ -1,11 +1,11 @@
1
- import { default as R } from "./NanoGPTModel.js";
2
- import { default as q } from "./TeachableLLM.js";
3
- import { default as A } from "./tokeniser/CharTokeniser.js";
4
- import { default as I } from "./tokeniser/bpe.js";
5
- import { default as K } from "./utilities/waitForModel.js";
6
- import { default as Q } from "./data/textLoader.js";
7
- import { estimateMemoryUsage as V, estimateParameterCount as W, estimateResources as X, estimateTrainingMemoryUsage as Y, validateConfig as Z } from "./utilities/parameters.js";
8
- import "./index-C0dhsYom.js";
1
+ import { default as W } from "./NanoGPTModel.js";
2
+ import { default as Y } from "./TeachableLLM.js";
3
+ import { default as _ } from "./tokeniser/CharTokeniser.js";
4
+ import { default as oo } from "./tokeniser/bpe.js";
5
+ import { default as to } from "./utilities/waitForModel.js";
6
+ import { default as eo } from "./data/textLoader.js";
7
+ import { estimateMemoryUsage as po, estimateParameterCount as ao, estimateResources as fo, estimateTrainingMemoryUsage as so, validateConfig as lo } from "./utilities/parameters.js";
8
+ import "./index-UdZhlibC.js";
9
9
  import "./ops/cpu/scatterSub.js";
10
10
  import "./ops/webgl/scatterSub.js";
11
11
  import "./ops/cpu/gatherSub.js";
@@ -16,10 +16,10 @@ import "./ops/grads/attentionMask.js";
16
16
  import "./ops/cpu/qkv.js";
17
17
  import "./ops/webgl/qkv.js";
18
18
  import "./ops/grads/qkv.js";
19
- import "./random_width-DkYP8W8N.js";
20
- import "./register_all_kernels-guvSxp7M.js";
19
+ import "./random_width-DbSpgl4o.js";
20
+ import "./register_all_kernels-DnbAyBXt.js";
21
21
  import "./index-Tf7vU29b.js";
22
- import "./dataset-JDyjG3QR.js";
22
+ import "./dataset-U3PrjwgU.js";
23
23
  import "./ops/cpu/rope.js";
24
24
  import "./ops/webgl/rope.js";
25
25
  import "./ops/grads/rope.js";
@@ -33,25 +33,42 @@ import "./ops/webgl/matMulGelu.js";
33
33
  import "./ops/grads/matMulGelu.js";
34
34
  import "./ops/cpu/gelu.js";
35
35
  import "./ops/webgl/gelu.js";
36
- import "./gelu-uyHP1x1f.js";
36
+ import "./gelu-BFwVnd1r.js";
37
37
  import "./ops/cpu/normRMS.js";
38
38
  import "./ops/webgl/normRMS.js";
39
39
  import "./ops/grads/normRMS.js";
40
40
  import "./ops/webgl/log.js";
41
- import { selectBackend as $ } from "./backend.js";
42
- import { default as ot } from "./utilities/performance.js";
41
+ import "./ops/cpu/adamMoments.js";
42
+ import "./ops/webgl/adamMoments.js";
43
+ import "./ops/cpu/adamAdjust.js";
44
+ import "./ops/webgl/adamAdjust.js";
45
+ import { selectBackend as xo } from "./backend.js";
46
+ import { default as co } from "./utilities/performance.js";
47
+ import o from "./layers/CausalSelfAttention.js";
48
+ import r from "./layers/MLP.js";
49
+ import t from "./layers/TransformerBlock.js";
50
+ import m from "./layers/RoPECache.js";
51
+ import { default as ko } from "./training/AdamExt.js";
52
+ const O = {
53
+ CausalSelfAttention: o,
54
+ MLP: r,
55
+ TransformerBlock: t,
56
+ RoPECache: m
57
+ };
43
58
  export {
44
- I as BPETokeniser,
45
- A as CharTokeniser,
46
- R as NanoGPT,
47
- q as TeachableLLM,
48
- V as estimateMemoryUsage,
49
- W as estimateParameterCount,
50
- X as estimateResources,
51
- Y as estimateTrainingMemoryUsage,
52
- Q as loadTextData,
53
- ot as performanceTest,
54
- $ as selectBackend,
55
- Z as validateConfig,
56
- K as waitForModel
59
+ ko as AdamExt,
60
+ oo as BPETokeniser,
61
+ _ as CharTokeniser,
62
+ W as NanoGPT,
63
+ Y as TeachableLLM,
64
+ po as estimateMemoryUsage,
65
+ ao as estimateParameterCount,
66
+ fo as estimateResources,
67
+ so as estimateTrainingMemoryUsage,
68
+ O as layers,
69
+ eo as loadTextData,
70
+ co as performanceTest,
71
+ xo as selectBackend,
72
+ lo as validateConfig,
73
+ to as waitForModel
57
74
  };
@@ -1,4 +1,4 @@
1
- import { x as m, y as s, F as c, E as M, H as p } from "./index-C0dhsYom.js";
1
+ import { B as m, C as s, I as c, E as M, J as p } from "./index-UdZhlibC.js";
2
2
  /**
3
3
  * @license
4
4
  * Copyright 2020 Google LLC. All Rights Reserved.
@@ -1,4 +1,4 @@
1
- import { x as r, y as x, E as e, N as c } from "./index-C0dhsYom.js";
1
+ import { B as r, C as e, E as x, U as c } from "./index-UdZhlibC.js";
2
2
  /**
3
3
  * @license
4
4
  * Copyright 2020 Google LLC. All Rights Reserved.
@@ -16,8 +16,8 @@ import { x as r, y as x, E as e, N as c } from "./index-C0dhsYom.js";
16
16
  * =============================================================================
17
17
  */
18
18
  function m(n, s = null, o = !1) {
19
- const t = { x: x(n, "x", "max") }, a = { reductionIndices: s, keepDims: o };
20
- return e.runKernel(c, t, a);
19
+ const t = { x: e(n, "x", "max") }, a = { reductionIndices: s, keepDims: o };
20
+ return x.runKernel(c, t, a);
21
21
  }
22
22
  const l = /* @__PURE__ */ r({ max_: m });
23
23
  export {
@@ -1,4 +1,4 @@
1
- import { u as z } from "./gpgpu_math-DJm3ZTAf.js";
1
+ import { u as z } from "./gpgpu_math-DffelNS-.js";
2
2
  /**
3
3
  * @license
4
4
  * Copyright 2018 Google LLC. All Rights Reserved.