@genai-fi/nanogpt 0.8.5 → 0.9.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (153)
  1. package/dist/Generator.d.ts +4 -1
  2. package/dist/Generator.js +144 -124
  3. package/dist/{RealDiv-D_q39E3A.js → RealDiv-D4EzDsC0.js} +7 -7
  4. package/dist/{Reshape-Bh_jzKzV.js → Reshape-Bowtk9BP.js} +2 -2
  5. package/dist/{Reshape-41YpQqEo.js → Reshape-DUqYftGC.js} +1 -1
  6. package/dist/TeachableLLM.js +5 -5
  7. package/dist/Trainer.d.ts +1 -0
  8. package/dist/Trainer.js +3 -0
  9. package/dist/{axis_util-Did9235A.js → axis_util-TbGYJ208.js} +1 -1
  10. package/dist/backend.js +2 -2
  11. package/dist/{backend_util-yC3YH1jo.js → backend_util-CJIiDoV1.js} +4 -4
  12. package/dist/{broadcast_to-CUvOdOT5.js → broadcast_to-DzlNweb8.js} +2 -2
  13. package/dist/checks/appendCache.js +2 -2
  14. package/dist/checks/attentionMask.js +3 -3
  15. package/dist/checks/gelu.js +2 -2
  16. package/dist/checks/matMulGelu.js +5 -5
  17. package/dist/checks/normRMS.js +4 -4
  18. package/dist/checks/normRMSGrad.js +3 -3
  19. package/dist/checks/qkv.js +2 -2
  20. package/dist/checks/rope.js +2 -2
  21. package/dist/{concat-pHiVqR3L.js → concat-B912vBbo.js} +1 -1
  22. package/dist/{dataset-DPPl-iLT.js → dataset-DlZtKmBq.js} +3 -3
  23. package/dist/{dropout-CcKSfOYE.js → dropout-C-csYCLj.js} +6 -6
  24. package/dist/{exports_initializers-DKk7-bsx.js → exports_initializers-B8iZMgQ0.js} +1 -1
  25. package/dist/{gather-CPg6ZlQA.js → gather-Dnpgw-YQ.js} +1 -1
  26. package/dist/{gelu-BkcmEEyD.js → gelu-Bp_-935b.js} +1 -1
  27. package/dist/{gpgpu_math-D_ODOLix.js → gpgpu_math-CDaYiyE_.js} +2 -2
  28. package/dist/{index-DdmHGZjq.js → index-BzFyqcy-.js} +13 -13
  29. package/dist/{index-evZ57wr4.js → index-C1rx_Ajs.js} +10 -10
  30. package/dist/{kernel_funcs_utils-CDfFpUab.js → kernel_funcs_utils-DKLK0Mg3.js} +3 -3
  31. package/dist/layers/BaseLayer.js +2 -2
  32. package/dist/layers/CausalSelfAttention.js +6 -6
  33. package/dist/layers/MLP.js +5 -5
  34. package/dist/layers/PositionEmbedding.js +5 -5
  35. package/dist/layers/RMSNorm.js +3 -3
  36. package/dist/layers/RoPECache.js +4 -4
  37. package/dist/layers/TiedEmbedding.js +5 -5
  38. package/dist/layers/TransformerBlock.js +1 -1
  39. package/dist/loader/loadTransformers.js +1 -1
  40. package/dist/loader/oldZipLoad.js +5 -5
  41. package/dist/{log_sum_exp-C8yFJfZz.js → log_sum_exp-DO6z8tSE.js} +9 -9
  42. package/dist/main.d.ts +1 -0
  43. package/dist/main.js +18 -16
  44. package/dist/{mat_mul-Dpy2mMRu.js → mat_mul-DzjTFx-u.js} +1 -1
  45. package/dist/{mod-CbibJi3D.js → mod-Dobti4j4.js} +1 -1
  46. package/dist/models/NanoGPTV1.d.ts +1 -0
  47. package/dist/models/NanoGPTV1.js +12 -9
  48. package/dist/models/model.d.ts +1 -0
  49. package/dist/models/model.js +5 -5
  50. package/dist/{mulmat_packed_gpu-q_Gmwyld.js → mulmat_packed_gpu-BT60jmzP.js} +1 -1
  51. package/dist/{ones-BAqVh-eA.js → ones-tIJeHlq-.js} +2 -2
  52. package/dist/ops/adamAdjust.js +1 -1
  53. package/dist/ops/adamMoments.js +1 -1
  54. package/dist/ops/appendCache.js +3 -3
  55. package/dist/ops/attentionMask.js +1 -1
  56. package/dist/ops/cpu/adamAdjust.js +1 -1
  57. package/dist/ops/cpu/adamMoments.js +2 -2
  58. package/dist/ops/cpu/appendCache.js +2 -2
  59. package/dist/ops/cpu/attentionMask.js +5 -5
  60. package/dist/ops/cpu/fusedSoftmax.js +2 -2
  61. package/dist/ops/cpu/gatherSub.js +5 -5
  62. package/dist/ops/cpu/gelu.js +1 -1
  63. package/dist/ops/cpu/matMulGelu.js +2 -2
  64. package/dist/ops/cpu/matMulMul.js +1 -1
  65. package/dist/ops/cpu/mulDropout.js +1 -1
  66. package/dist/ops/cpu/normRMS.js +1 -1
  67. package/dist/ops/cpu/qkv.js +3 -3
  68. package/dist/ops/cpu/rope.js +5 -5
  69. package/dist/ops/cpu/scatterSub.js +13 -13
  70. package/dist/ops/fusedSoftmax.js +1 -1
  71. package/dist/ops/gatherSub.js +1 -1
  72. package/dist/ops/gelu.js +2 -2
  73. package/dist/ops/grads/attentionMask.js +1 -1
  74. package/dist/ops/grads/fusedSoftmax.js +2 -2
  75. package/dist/ops/grads/gelu.js +2 -2
  76. package/dist/ops/grads/matMulGelu.js +1 -1
  77. package/dist/ops/grads/normRMS.js +1 -1
  78. package/dist/ops/grads/qkv.js +1 -1
  79. package/dist/ops/grads/rope.js +1 -1
  80. package/dist/ops/matMulGelu.js +1 -1
  81. package/dist/ops/matMulMul.js +1 -1
  82. package/dist/ops/mulDrop.js +1 -1
  83. package/dist/ops/normRMS.js +1 -1
  84. package/dist/ops/qkv.js +1 -1
  85. package/dist/ops/rope.js +4 -4
  86. package/dist/ops/scatterSub.js +1 -1
  87. package/dist/ops/webgl/adamAdjust.js +2 -2
  88. package/dist/ops/webgl/adamMoments.js +1 -1
  89. package/dist/ops/webgl/appendCache.js +1 -1
  90. package/dist/ops/webgl/attentionMask.js +1 -1
  91. package/dist/ops/webgl/fusedSoftmax.js +4 -4
  92. package/dist/ops/webgl/gatherSub.js +1 -1
  93. package/dist/ops/webgl/gelu.js +2 -2
  94. package/dist/ops/webgl/log.js +3 -3
  95. package/dist/ops/webgl/matMulGelu.js +4 -4
  96. package/dist/ops/webgl/matMulMul.js +1 -1
  97. package/dist/ops/webgl/mulDropout.js +1 -1
  98. package/dist/ops/webgl/normRMS.js +2 -2
  99. package/dist/ops/webgl/qkv.js +1 -1
  100. package/dist/ops/webgl/rope.js +1 -1
  101. package/dist/ops/webgl/scatterSub.js +1 -1
  102. package/dist/ops/webgpu/adamAdjust.js +3 -3
  103. package/dist/ops/webgpu/adamMoments.js +3 -3
  104. package/dist/ops/webgpu/appendCache.js +3 -3
  105. package/dist/ops/webgpu/attentionMask.js +3 -3
  106. package/dist/ops/webgpu/gatherSub.js +3 -3
  107. package/dist/ops/webgpu/gelu.js +37 -35
  108. package/dist/ops/webgpu/normRMS.js +2 -2
  109. package/dist/ops/webgpu/normRMSGrad.js +5 -5
  110. package/dist/ops/webgpu/qkv.js +3 -3
  111. package/dist/ops/webgpu/rope.js +3 -3
  112. package/dist/ops/webgpu/scatterSub.js +3 -3
  113. package/dist/ops/webgpu/utils/reductions.js +4 -4
  114. package/dist/{ops-542ai2vG.js → ops-LuCMAnmM.js} +65 -65
  115. package/dist/{random_width-DKGeiFuR.js → random_width-CXVRloNK.js} +23 -23
  116. package/dist/{range-BcUvLuf5.js → range-CWcz7xFA.js} +3 -3
  117. package/dist/{reciprocal-DhDWSKiD.js → reciprocal-C4rNcM-S.js} +1 -1
  118. package/dist/{register_all_kernels-Do9VvZmo.js → register_all_kernels-DIGpEwcf.js} +31 -31
  119. package/dist/{relu-B1AXs7p5.js → relu-BjCh_SYb.js} +1 -1
  120. package/dist/{reshape-WeJkT3ja.js → reshape-CnIwVG1c.js} +1 -1
  121. package/dist/{scatter_nd_util-B7yDhiQr.js → scatter_nd_util-BQdz--Gn.js} +1 -1
  122. package/dist/{selu_util-BgUO9gHY.js → selu_util-OtRzVwW5.js} +23 -23
  123. package/dist/{shared-V6D_md-c.js → shared-DmRsFyaJ.js} +6 -6
  124. package/dist/{shared-CZiWmQCI.js → shared-DuP7ue-R.js} +1 -1
  125. package/dist/{sin-CPxad7Am.js → sin-gpDNRxE0.js} +1 -1
  126. package/dist/{slice-B7jXtPnp.js → slice-d0Vo9XTN.js} +1 -1
  127. package/dist/{softmax-BfsyI4As.js → softmax-D7Jj3p_P.js} +1 -1
  128. package/dist/{split-BPxr8_8m.js → split-DK2k5eHf.js} +1 -1
  129. package/dist/{stack-BNwLzE43.js → stack-DFatutCx.js} +1 -1
  130. package/dist/{sum-ByFINZgi.js → sum-CJ0ULhmt.js} +1 -1
  131. package/dist/{tensor-DbqgIV9B.js → tensor-CZr4dh61.js} +1 -1
  132. package/dist/{tensor1d-CtJq5BOv.js → tensor1d-vML0r3q6.js} +1 -1
  133. package/dist/{tensor2d-CObBWBkW.js → tensor2d-D76QGjF3.js} +1 -1
  134. package/dist/{tensor4d-DLtk7Nxh.js → tensor4d-Df1WlVDY.js} +1 -1
  135. package/dist/training/Adam.js +2 -2
  136. package/dist/training/AdamExt.js +1 -1
  137. package/dist/training/DatasetBuilder.js +2 -2
  138. package/dist/training/FullTrainer.js +72 -61
  139. package/dist/training/Trainer.js +2 -2
  140. package/dist/training/sparseCrossEntropy.js +3 -3
  141. package/dist/utilities/dummy.js +2 -2
  142. package/dist/utilities/multinomialCPU.js +2 -2
  143. package/dist/utilities/performance.js +1 -1
  144. package/dist/utilities/profile.js +1 -1
  145. package/dist/utilities/safetensors.js +2 -2
  146. package/dist/utilities/topP.d.ts +1 -0
  147. package/dist/utilities/topP.js +13 -0
  148. package/dist/utilities/weights.js +2 -2
  149. package/dist/{variable-DPFOJyRG.js → variable-Bm2OFwGI.js} +1 -1
  150. package/dist/{webgpu_program-Dhk9R5aG.js → webgpu_program-DkQJOJSd.js} +1 -1
  151. package/dist/{webgpu_util-BqGnZg8t.js → webgpu_util-pLEV9tks.js} +1 -1
  152. package/dist/{zeros-Dnwix0p4.js → zeros-Bj5rMYA7.js} +1 -1
  153. package/package.json +1 -1
@@ -1,5 +1,5 @@
1
- import "../index-DdmHGZjq.js";
2
- import { t as e } from "../tensor2d-CObBWBkW.js";
1
+ import "../index-BzFyqcy-.js";
2
+ import { t as e } from "../tensor2d-D76QGjF3.js";
3
3
  function l(n) {
4
4
  let r = 0;
5
5
  const i = Math.random();
@@ -1,4 +1,4 @@
1
- import { t as s } from "../index-DdmHGZjq.js";
1
+ import { t as s } from "../index-BzFyqcy-.js";
2
2
  async function f(e, o = 10, r = !1) {
3
3
  for (let t = 0; t < 100; t++) {
4
4
  const a = r ? await e() : s(e);
@@ -1,4 +1,4 @@
1
- import { m as a } from "../index-DdmHGZjq.js";
1
+ import { m as a } from "../index-BzFyqcy-.js";
2
2
  const s = 1024 * 1024;
3
3
  class l {
4
4
  log = /* @__PURE__ */ new Map();
@@ -1,5 +1,5 @@
1
- import "../index-DdmHGZjq.js";
2
- import { t as y } from "../tensor-DbqgIV9B.js";
1
+ import "../index-BzFyqcy-.js";
2
+ import { t as y } from "../tensor-CZr4dh61.js";
3
3
  function l(t) {
4
4
  if (t === "float32") return "F32";
5
5
  if (t === "int32") return "I32";
@@ -0,0 +1 @@
1
+ export default function topP(probs: number[][], tP: number): number[];
@@ -0,0 +1,13 @@
1
+ function c(s, a) {
2
+ const t = s[0].map((o, r) => ({ prob: o, index: r })).sort((o, r) => r.prob - o.prob);
3
+ let n = 0;
4
+ const e = new Array(t.length).fill(0);
5
+ for (const o of t)
6
+ if (n += o.prob, e[o.index] = o.prob, n >= a)
7
+ break;
8
+ const b = e.reduce((o, r) => o + r, 0);
9
+ return e.map((o) => o / b);
10
+ }
11
+ export {
12
+ c as default
13
+ };
@@ -1,5 +1,5 @@
1
- import "../index-DdmHGZjq.js";
2
- import { t as p } from "../tensor-DbqgIV9B.js";
1
+ import "../index-BzFyqcy-.js";
2
+ import { t as p } from "../tensor-CZr4dh61.js";
3
3
  function h(n) {
4
4
  const e = n.reduce((s, o) => s + o.length, 0), a = new Float32Array(e);
5
5
  let t = 0;
@@ -1,4 +1,4 @@
1
- import { E as i } from "./index-DdmHGZjq.js";
1
+ import { G as i } from "./index-BzFyqcy-.js";
2
2
  /**
3
3
  * @license
4
4
  * Copyright 2018 Google LLC. All Rights Reserved.
@@ -1,4 +1,4 @@
1
- import { ae as k, af as z, ag as E, a3 as j, n as A } from "./index-DdmHGZjq.js";
1
+ import { ae as k, af as z, ag as E, a3 as j, n as A } from "./index-BzFyqcy-.js";
2
2
  /**
3
3
  * @license
4
4
  * Copyright 2019 Google LLC. All Rights Reserved.
@@ -1,4 +1,4 @@
1
- import { n as u } from "./index-DdmHGZjq.js";
1
+ import { n as u } from "./index-BzFyqcy-.js";
2
2
  /**
3
3
  * @license
4
4
  * Copyright 2019 Google LLC. All Rights Reserved.
@@ -1,4 +1,4 @@
1
- import { C as m, D as r, a4 as l, E as c, aa as i, M as p, ab as u, j as f } from "./index-DdmHGZjq.js";
1
+ import { E as m, F as r, a4 as l, G as c, aa as i, M as p, ab as u, j as f } from "./index-BzFyqcy-.js";
2
2
  /**
3
3
  * @license
4
4
  * Copyright 2020 Google LLC. All Rights Reserved.
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "@genai-fi/nanogpt",
3
- "version": "0.8.5",
3
+ "version": "0.9.1",
4
4
  "type": "module",
5
5
  "main": "dist/main.js",
6
6
  "types": "dist/main.d.ts",