npm - @genai-fi/nanogpt - Versions diffs - 0.7.3 → 0.8.1 - Mend

@genai-fi/nanogpt 0.7.3 → 0.8.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (197) hide show

package/dist/Generator.d.ts +25 -2
package/dist/Generator.js +152 -49
package/dist/{RealDiv-Dy0p8Bvo.js → RealDiv-D_q39E3A.js} +13 -13
package/dist/{Reshape-DvudQDvJ.js → Reshape-41YpQqEo.js} +1 -1
package/dist/{Reshape-DH5srBP0.js → Reshape-Bh_jzKzV.js} +5 -5
package/dist/TeachableLLM.d.ts +6 -6
package/dist/TeachableLLM.js +33 -31
package/dist/Trainer.d.ts +13 -2
package/dist/Trainer.js +21 -12
package/dist/{axis_util-BzbKo31C.js → axis_util-Did9235A.js} +3 -3
package/dist/backend.js +2 -2
package/dist/{backend_util-TE7aTPhZ.js → backend_util-yC3YH1jo.js} +58 -58
package/dist/{broadcast_to-CdbwV-Dj.js → broadcast_to-CUvOdOT5.js} +2 -2
package/dist/checks/appendCache.d.ts +1 -0
package/dist/checks/appendCache.js +22 -0
package/dist/checks/attentionMask.d.ts +1 -0
package/dist/checks/attentionMask.js +37 -0
package/dist/checks/check.d.ts +9 -0
package/dist/checks/check.js +20 -0
package/dist/checks/gelu.d.ts +1 -0
package/dist/checks/gelu.js +18 -0
package/dist/checks/index.d.ts +19 -0
package/dist/checks/index.js +21 -0
package/dist/checks/normRMS.d.ts +1 -0
package/dist/checks/normRMS.js +16 -0
package/dist/checks/normRMSGrad.d.ts +1 -0
package/dist/checks/normRMSGrad.js +12 -0
package/dist/checks/qkv.d.ts +1 -0
package/dist/checks/qkv.js +25 -0
package/dist/checks/rope.d.ts +1 -0
package/dist/checks/rope.js +21 -0
package/dist/{concat-CsxrgovM.js → concat-pHiVqR3L.js} +1 -1
package/dist/{dataset-CtdBYwjo.js → dataset-DPPl-iLT.js} +9 -9
package/dist/{dropout-DYs5QFGQ.js → dropout-CcKSfOYE.js} +18 -18
package/dist/exports_initializers-DKk7-bsx.js +16 -0
package/dist/{gather-CMMy2KEG.js → gather-CPg6ZlQA.js} +1 -1
package/dist/{gelu-C-dPj6Ku.js → gelu-BkcmEEyD.js} +1 -1
package/dist/{gpgpu_math-DGNLNL4I.js → gpgpu_math-D_ODOLix.js} +26 -26
package/dist/{index-BoWRt-10.js → index-DdmHGZjq.js} +659 -650
package/dist/{index-CLthM0TO.js → index-evZ57wr4.js} +185 -185
package/dist/{kernel_funcs_utils-BYKWV8Aa.js → kernel_funcs_utils-CDfFpUab.js} +21 -21
package/dist/layers/BaseLayer.d.ts +8 -13
package/dist/layers/BaseLayer.js +25 -13
package/dist/layers/CausalSelfAttention.d.ts +3 -2
package/dist/layers/CausalSelfAttention.js +28 -28
package/dist/layers/MLP.d.ts +3 -2
package/dist/layers/MLP.js +16 -20
package/dist/layers/PositionEmbedding.d.ts +9 -0
package/dist/layers/PositionEmbedding.js +45 -0
package/dist/layers/RMSNorm.d.ts +3 -2
package/dist/layers/RMSNorm.js +6 -6
package/dist/layers/RoPECache.d.ts +1 -1
package/dist/layers/RoPECache.js +4 -4
package/dist/layers/TiedEmbedding.d.ts +3 -2
package/dist/layers/TiedEmbedding.js +29 -7
package/dist/layers/TransformerBlock.d.ts +3 -2
package/dist/layers/TransformerBlock.js +1 -1
package/dist/loader/load.d.ts +2 -2
package/dist/loader/loadHF.d.ts +2 -2
package/dist/loader/loadTransformers.d.ts +4 -2
package/dist/loader/loadTransformers.js +10 -9
package/dist/loader/newZipLoad.d.ts +2 -2
package/dist/loader/oldZipLoad.d.ts +2 -2
package/dist/loader/oldZipLoad.js +44 -51
package/dist/loader/save.d.ts +8 -0
package/dist/loader/save.js +62 -0
package/dist/{log_sum_exp-DbjkV734.js → log_sum_exp-C8yFJfZz.js} +45 -24
package/dist/main.d.ts +6 -4
package/dist/main.js +24 -18
package/dist/{mat_mul-8m8pfdcx.js → mat_mul-Dpy2mMRu.js} +1 -1
package/dist/mod-CbibJi3D.js +27 -0
package/dist/models/NanoGPTV1.d.ts +15 -0
package/dist/models/NanoGPTV1.js +71 -0
package/dist/{config.d.ts → models/config.d.ts} +1 -0
package/dist/{config.js → models/config.js} +1 -0
package/dist/models/factory.d.ts +3 -0
package/dist/models/factory.js +14 -0
package/dist/models/model.d.ts +26 -0
package/dist/models/model.js +70 -0
package/dist/{mulmat_packed_gpu-VSekgsNv.js → mulmat_packed_gpu-q_Gmwyld.js} +1 -1
package/dist/{ones-Dj0SDhHf.js → ones-BAqVh-eA.js} +2 -2
package/dist/ops/adamAdjust.js +1 -1
package/dist/ops/adamMoments.js +1 -1
package/dist/ops/appendCache.js +3 -3
package/dist/ops/attentionMask.js +1 -1
package/dist/ops/cpu/adamAdjust.js +9 -9
package/dist/ops/cpu/adamMoments.js +2 -2
package/dist/ops/cpu/appendCache.js +2 -2
package/dist/ops/cpu/attentionMask.js +5 -5
package/dist/ops/cpu/fusedSoftmax.js +2 -2
package/dist/ops/cpu/gatherSub.js +5 -5
package/dist/ops/cpu/gelu.js +1 -1
package/dist/ops/cpu/matMulGelu.js +2 -2
package/dist/ops/cpu/matMulMul.js +1 -1
package/dist/ops/cpu/mulDropout.js +1 -1
package/dist/ops/cpu/normRMS.js +1 -1
package/dist/ops/cpu/qkv.js +3 -3
package/dist/ops/cpu/rope.js +5 -5
package/dist/ops/cpu/scatterSub.js +7 -7
package/dist/ops/fusedSoftmax.js +1 -1
package/dist/ops/gatherSub.js +1 -1
package/dist/ops/gelu.js +2 -2
package/dist/ops/grads/attentionMask.js +1 -1
package/dist/ops/grads/fusedSoftmax.js +2 -2
package/dist/ops/grads/gelu.js +2 -2
package/dist/ops/grads/matMulGelu.js +1 -1
package/dist/ops/grads/normRMS.js +1 -1
package/dist/ops/grads/qkv.js +1 -1
package/dist/ops/grads/rope.js +1 -1
package/dist/ops/matMulGelu.js +1 -1
package/dist/ops/matMulMul.js +1 -1
package/dist/ops/mulDrop.js +1 -1
package/dist/ops/normRMS.js +1 -1
package/dist/ops/qkv.js +1 -1
package/dist/ops/rope.js +4 -4
package/dist/ops/scatterSub.js +1 -1
package/dist/ops/webgl/adamAdjust.js +2 -2
package/dist/ops/webgl/adamMoments.js +1 -1
package/dist/ops/webgl/appendCache.js +1 -1
package/dist/ops/webgl/attentionMask.js +1 -1
package/dist/ops/webgl/fusedSoftmax.js +4 -4
package/dist/ops/webgl/gatherSub.js +1 -1
package/dist/ops/webgl/gelu.js +2 -2
package/dist/ops/webgl/log.js +3 -3
package/dist/ops/webgl/matMulGelu.js +10 -10
package/dist/ops/webgl/matMulMul.js +1 -1
package/dist/ops/webgl/mulDropout.js +1 -1
package/dist/ops/webgl/normRMS.js +2 -2
package/dist/ops/webgl/qkv.js +1 -1
package/dist/ops/webgl/rope.js +1 -1
package/dist/ops/webgl/scatterSub.js +1 -1
package/dist/ops/webgpu/adamAdjust.js +3 -3
package/dist/ops/webgpu/adamMoments.js +3 -3
package/dist/ops/webgpu/appendCache.js +3 -3
package/dist/ops/webgpu/attentionMask.js +3 -3
package/dist/ops/webgpu/gatherSub.js +3 -3
package/dist/ops/webgpu/gelu.js +3 -3
package/dist/ops/webgpu/normRMS.js +2 -2
package/dist/ops/webgpu/normRMSGrad.js +5 -5
package/dist/ops/webgpu/qkv.js +3 -3
package/dist/ops/webgpu/rope.js +3 -3
package/dist/ops/webgpu/scatterSub.js +3 -3
package/dist/ops/webgpu/utils/reductions.js +4 -4
package/dist/ops-542ai2vG.js +1525 -0
package/dist/{random_width-sZORGo5k.js → random_width-DKGeiFuR.js} +1471 -1538
package/dist/{range-CRuAh-gd.js → range-BcUvLuf5.js} +1 -1
package/dist/{reciprocal-BvGAyKyu.js → reciprocal-DhDWSKiD.js} +1 -1
package/dist/{register_all_kernels-BwDSRN-f.js → register_all_kernels-Do9VvZmo.js} +2488 -2534
package/dist/{max-Ddnnb5xe.js → relu-B1AXs7p5.js} +6 -6
package/dist/{reshape-CdBq1WJ6.js → reshape-WeJkT3ja.js} +1 -1
package/dist/{scatter_nd_util-DUstGbU1.js → scatter_nd_util-B7yDhiQr.js} +1 -1
package/dist/{selu_util-BJEXVvjX.js → selu_util-BgUO9gHY.js} +125 -146
package/dist/{shared-wS99K7_n.js → shared-CZiWmQCI.js} +1 -1
package/dist/{shared-B8ztnyEk.js → shared-V6D_md-c.js} +72 -72
package/dist/{sin-BeA3tsEd.js → sin-CPxad7Am.js} +1 -1
package/dist/{slice-BiOsknYS.js → slice-B7jXtPnp.js} +1 -1
package/dist/{softmax-Bv_6lyMX.js → softmax-BfsyI4As.js} +1 -1
package/dist/{split-B-dikLRw.js → split-BPxr8_8m.js} +1 -1
package/dist/{stack-B17UN2nn.js → stack-BNwLzE43.js} +1 -1
package/dist/{sum-66ew2byf.js → sum-ByFINZgi.js} +3 -3
package/dist/{tensor-JwS7ZYY6.js → tensor-DbqgIV9B.js} +1 -1
package/dist/tensor1d-CtJq5BOv.js +27 -0
package/dist/{tensor2d-wxPAnDQy.js → tensor2d-CObBWBkW.js} +1 -1
package/dist/tensor3d-BOukqWwr.js +30 -0
package/dist/tensor4d-DLtk7Nxh.js +30 -0
package/dist/training/Adam.js +2 -2
package/dist/training/AdamExt.js +1 -1
package/dist/training/DatasetBuilder.js +2 -2
package/dist/training/Evaluator.d.ts +2 -2
package/dist/training/FullTrainer.d.ts +3 -3
package/dist/training/FullTrainer.js +61 -69
package/dist/training/Trainer.d.ts +15 -3
package/dist/training/Trainer.js +39 -47
package/dist/training/sparseCrossEntropy.js +12 -13
package/dist/utilities/arrayClose.d.ts +1 -1
package/dist/utilities/arrayClose.js +16 -7
package/dist/utilities/dummy.d.ts +4 -4
package/dist/utilities/dummy.js +13 -13
package/dist/utilities/multinomialCPU.js +2 -2
package/dist/utilities/parameters.d.ts +1 -1
package/dist/utilities/performance.js +1 -1
package/dist/utilities/profile.js +1 -1
package/dist/utilities/safetensors.js +2 -2
package/dist/utilities/weights.js +2 -2
package/dist/{variable-BuddVFLa.js → variable-DPFOJyRG.js} +1 -1
package/dist/{webgpu_program-PFzf1hAQ.js → webgpu_program-Dhk9R5aG.js} +1 -1
package/dist/{webgpu_util-D____QpY.js → webgpu_util-BqGnZg8t.js} +27 -27
package/dist/{zeros--BdLQ3oG.js → zeros-Dnwix0p4.js} +1 -1
package/package.json +2 -3
package/dist/NanoGPTModel.d.ts +0 -52
package/dist/NanoGPTModel.js +0 -203
package/dist/TiedEmbedding-BxOerUmB.js +0 -43
package/dist/ops-BFGCx8Ri.js +0 -1202
package/dist/utilities/generate.d.ts +0 -3
package/dist/utilities/generate.js +0 -22
package/dist/utilities/save.d.ts +0 -9
package/dist/utilities/save.js +0 -61

package/dist/Trainer.js CHANGED Viewed

@@ -1,11 +1,13 @@
 import { E as l } from "./index-Dwqa6Zy2.js";
 import h from "./training/FullTrainer.js";
-class p extends l {
+class m extends l {
   trainer;
   hasTrained = !1;
   trainDataset;
   validationDataset;
   totalSamples = 0;
+  log = [];
+  progress = null;
   constructor(t, e) {
     super(), this.trainer = new h(t, e, 1e-3);
   }
@@ -13,7 +15,7 @@ class p extends l {
     this.trainer.stop();
   }
   reset() {
-    this.hasTrained = !1, this.trainer.reset();
+    this.hasTrained = !1, this.log = [], this.trainer.reset();
   }
   async prepare(t, e) {
     const { trainDataset: a, validationDataset: s } = await this.trainer.createTrainValidationSplit(
@@ -26,7 +28,7 @@ class p extends l {
   async train(t) {
     if (!this.trainDataset || !this.validationDataset)
       throw new Error("Datasets not prepared");
-    this.hasTrained || this.trainer.setLearningRate(t?.learningRate || 1e-3), this.hasTrained = !0, this.emit("start"), await this.trainer.trainOnDataset(
+    this.hasTrained || this.trainer.setLearningRate(t?.learningRate || 1e-3), this.hasTrained = !0, this.emit("start"), this.trainer.setGradientCheckpointing(t?.gradientCheckpointing || !1), await this.trainer.trainOnDataset(
       this.trainDataset,
       {
         prompt: t?.prompt,
@@ -35,16 +37,17 @@ class p extends l {
         maxSteps: t?.maxSteps || 1e3,
         advancedMetrics: t?.advancedMetrics || !1,
         onStep: async (e, a) => {
+          this.log.push(e), this.progress = {
+            ...a,
+            progress: a.totalSamples / this.totalSamples,
+            remaining: Math.max(
+              0,
+              (this.totalSamples - a.totalSamples) / a.totalSamples * a.duration
+            )
+          };
           const s = this.listeners("log");
           for (const i of s)
-            await i(e, {
-              ...a,
-              progress: a.totalSamples / this.totalSamples,
-              remaining: Math.max(
-                0,
-                (this.totalSamples - a.totalSamples) / a.totalSamples * a.duration
-              )
-            });
+            await i(e, this.progress);
         }
       },
       this.validationDataset
@@ -76,7 +79,13 @@ class p extends l {
       });
     this.emit("stop");
   }
+  getLog() {
+    return this.log;
+  }
+  getProgress() {
+    return this.progress;
+  }
 }
 export {
-  p as default
+  m as default
 };

package/dist/{axis_util-BzbKo31C.js → axis_util-Did9235A.js} RENAMED Viewed

@@ -1,4 +1,4 @@
-import { l as c } from "./index-BoWRt-10.js";
+import { n as c } from "./index-DdmHGZjq.js";
 /**
  * @license
  * Copyright 2017 Google LLC. All Rights Reserved.
@@ -28,7 +28,7 @@ function a(e, n, t) {
     t.indexOf(u) === -1 ? s.push(e[o++]) : s.push(n[f++]);
   return s;
 }
-function p(e, n) {
+function l(e, n) {
   const t = [], r = e.length;
   for (let o = 0; o < r; o++)
     n.indexOf(o) === -1 && t.push(e[o]);
@@ -62,7 +62,7 @@ function x(e, n) {
 export {
   x as a,
   m as b,
-  p as c,
+  l as c,
   i as d,
   h as e,
   a as f,

package/dist/backend.js CHANGED Viewed

@@ -1,6 +1,6 @@
-import { g as a, s as i, r as o } from "./index-BoWRt-10.js";
+import { g as a, s as i, r as o } from "./index-DdmHGZjq.js";
 async function e(t) {
-  a() !== t && (t === "webgpu" && (await import("./index-CLthM0TO.js"), await import("./ops/webgpu/index.js")), await i(t), await o(), console.log(`Backend set to ${t}`));
+  a() !== t && (t === "webgpu" && (await import("./index-evZ57wr4.js"), await import("./ops/webgpu/index.js")), await i(t), await o(), console.log(`Backend set to ${t}`));
 }
 export {
   e as selectBackend

package/dist/{backend_util-TE7aTPhZ.js → backend_util-yC3YH1jo.js} RENAMED Viewed

@@ -1,7 +1,7 @@
-import { j as m, a1 as O, l as g, aK as $, aL as R, aM as M, k as _, aa as y, aw as D, aN as T, u as b, aO as F } from "./index-BoWRt-10.js";
-import { b as L, d as W, f as v, c as N, e as x, g as P, a as C, h as z } from "./axis_util-BzbKo31C.js";
-import { S as U, a as B, b as V, c as j, d as k, e as G, f as H, g as q, h as Z, i as K, j as X, k as J, l as Y, m as Q, s as ee, n as te, o as ne, t as se } from "./selu_util-BJEXVvjX.js";
-import { c as re, v as oe, a as ae } from "./scatter_nd_util-DUstGbU1.js";
+import { j as m, a3 as R, n as g, aN as $, aO as O, aP as _, l as M, ae as y, ax as D, aQ as T, u as b, aR as F } from "./index-DdmHGZjq.js";
+import { b as L, d as W, f as v, c as N, e as x, g as P, a as C, h as z } from "./axis_util-Did9235A.js";
+import { S as U, a as B, b as V, c as j, d as G, e as H, f as k, g as q, h as Z, i as X, j as J, k as K, l as Q, m as Y, s as ee, n as te, o as ne, t as se } from "./selu_util-BgUO9gHY.js";
+import { c as re, v as oe, a as ae } from "./scatter_nd_util-B7yDhiQr.js";
 function ie(e, n) {
   const r = e.shape.length, t = n.shape.length;
   if (r < 1)
@@ -24,7 +24,7 @@ function ie(e, n) {
   for (let i = o; i < r; ++i)
     h *= u[i], c.push(u[i]);
   const d = [
-    ...O(e.shape).map((i) => i / h),
+    ...R(e.shape).map((i) => i / h),
     1
   ].slice(0, o);
   return [c, a, h, d];
@@ -233,7 +233,7 @@ function Ie(e, n) {
     r.push(e[t][0]);
   return r;
 }
-function we(e, n, r) {
+function Se(e, n, r) {
   const t = e.slice(0, 1);
   for (let s = 0; s < r; ++s)
     t.push(e[s + 1] - n[s][0] - n[s][1]);
@@ -255,7 +255,7 @@ function we(e, n, r) {
  * limitations under the License.
  * =============================================================================
  */
-const Se = 0.3275911, Ae = 0.254829592, Oe = -0.284496736, Re = 1.421413741, Me = -1.453152027, _e = 1.061405429;
+const we = 0.3275911, Ae = 0.254829592, Re = -0.284496736, Oe = 1.421413741, _e = -1.453152027, Me = 1.061405429;
 /**
  * @license
  * Copyright 2018 Google LLC. All Rights Reserved.
@@ -333,7 +333,7 @@ function ve(e, n, r) {
  * limitations under the License.
  * =============================================================================
  */
-const E = "->", Ne = /->/g, w = ",", S = "...";
+const E = "->", Ne = /->/g, S = ",", w = "...";
 function xe(e, n) {
   e = e.replace(/\s/g, "");
   const r = (e.length - e.replace(Ne, "").length) / E.length;
@@ -342,8 +342,8 @@ function xe(e, n) {
   if (r > 1)
     throw new Error(`Equation must contain exactly one arrow ("${E}").`);
   const [t, s] = e.split(E);
-  g(t.indexOf(S) === -1, () => `The ellipsis notation ("${S}") is not supported yet.`);
-  const o = t.split(w), a = o.length;
+  g(t.indexOf(w) === -1, () => `The ellipsis notation ("${w}") is not supported yet.`);
+  const o = t.split(S), a = o.length;
   if (n !== a)
     throw new Error(`Expected ${a} input tensors, received ${n}`);
   if (a > 2)
@@ -357,7 +357,7 @@ function xe(e, n) {
   }
   for (let l = 0; l < t.length; ++l) {
     const f = t[l];
-    u.indexOf(f) === -1 && f !== w && u.push(f);
+    u.indexOf(f) === -1 && f !== S && u.push(f);
   }
   const c = new Array(o.length);
   for (let l = 0; l < a; ++l) {
@@ -449,10 +449,10 @@ function je(e) {
   return `Received SparseTensor with denseShape[0] = 0 but
   indices.shape[0] = ${e}`;
 }
-function ke(e, n) {
+function Ge(e, n) {
   return `indices(${e}, 0) is invalid: ${n} < 0`;
 }
-function Ge(e, n, r) {
+function He(e, n, r) {
   return `indices(${e}, 0) is invalid: ${n} >= ${r}`;
 }
 /**
@@ -471,7 +471,7 @@ function Ge(e, n, r) {
  * limitations under the License.
  * =============================================================================
  */
-function He(e, n) {
+function ke(e, n) {
   return `only one output dimension may be -1, not both ${e} and ${n}`;
 }
 function qe(e, n) {
@@ -480,12 +480,12 @@ function qe(e, n) {
 function Ze() {
   return "reshape cannot infer the missing input size for an empty tensor unless all specified input sizes are non-zero";
 }
-function Ke(e, n) {
+function Xe(e, n) {
   const r = m(e), t = m(n);
   return `Input to reshape is a SparseTensor with ${r}
   dense values, but the requested shape requires a multiple of ${t}. inputShape=${e} outputShape= ${n}`;
 }
-function Xe(e, n) {
+function Je(e, n) {
   const r = m(e), t = m(n);
   return `Input to reshape is a tensor with ${r} dense values, but the requested shape has ${t}. inputShape=${e} outputShape=${n}`;
 }
@@ -505,13 +505,13 @@ function Xe(e, n) {
  * limitations under the License.
  * =============================================================================
  */
-function Je() {
+function Ke() {
   return "segment ids must be >= 0";
 }
-function Ye() {
+function Qe() {
   return "segment ids are not increasing";
 }
-function Qe(e, n) {
+function Ye(e, n) {
   return `Segment id ${e} out of range [0, ${n}), possibly because segmentIds input is not sorted.`;
 }
 function et(e, n, r) {
@@ -593,22 +593,22 @@ const rt = /* @__PURE__ */ Object.freeze(/* @__PURE__ */ Object.defineProperty({
  */
 function ot(e) {
   try {
-    return e.map((n) => R(n));
+    return e.map((n) => O(n));
   } catch (n) {
     throw new Error(`Failed to decode encoded string bytes into utf-8, error: ${n}`);
   }
 }
 function at(e) {
-  return e.map((n) => M(n));
+  return e.map((n) => _(n));
 }
 const ht = /* @__PURE__ */ Object.freeze(/* @__PURE__ */ Object.defineProperty({
   __proto__: null,
   ERF_A1: Ae,
-  ERF_A2: Oe,
-  ERF_A3: Re,
-  ERF_A4: Me,
-  ERF_A5: _e,
-  ERF_P: Se,
+  ERF_A2: Re,
+  ERF_A3: Oe,
+  ERF_A4: _e,
+  ERF_A5: Me,
+  ERF_P: we,
   PARALLELIZE_THRESHOLD: I,
   get RowPartitionType() {
     return p;
@@ -616,7 +616,7 @@ const ht = /* @__PURE__ */ Object.freeze(/* @__PURE__ */ Object.defineProperty({
   SELU_SCALE: U,
   SELU_SCALEALPHA: B,
   applyActivation: V,
-  assertAndGetBroadcastShape: _,
+  assertAndGetBroadcastShape: M,
   assertAxesAreInnerMostDims: L,
   assertParamsConsistent: ue,
   assignToTypedArray: Le,
@@ -628,18 +628,18 @@ const ht = /* @__PURE__ */ Object.freeze(/* @__PURE__ */ Object.defineProperty({
   combineRaggedTensorToTensorShapes: ce,
   complexWithEvenIndex: Te,
   complexWithOddIndex: be,
-  computeConv2DInfo: k,
-  computeConv3DInfo: G,
-  computeDefaultPad: H,
+  computeConv2DInfo: G,
+  computeConv3DInfo: H,
+  computeDefaultPad: k,
   computeDilation2DInfo: q,
   computeOptimalWindowSize: ge,
   computeOutAndReduceShapes: N,
   computeOutShape: le,
   computePool2DInfo: Z,
-  computePool3DInfo: K,
-  convertConv2DDataFormat: X,
+  computePool3DInfo: X,
+  convertConv2DDataFormat: J,
   decodeEinsumEquation: xe,
-  eitherStridesOrDilationsAreOne: J,
+  eitherStridesOrDilationsAreOne: K,
   expandShapeToKeepDim: x,
   exponent: ve,
   exponents: We,
@@ -650,8 +650,8 @@ const ht = /* @__PURE__ */ Object.freeze(/* @__PURE__ */ Object.defineProperty({
   getComplexWithIndex: Fe,
   getEinsumComputePath: ze,
   getEinsumPermutation: Pe,
-  getFusedBiasGradient: Y,
-  getFusedDyActivation: Q,
+  getFusedBiasGradient: Q,
+  getFusedDyActivation: Y,
   getImageCenter: de,
   getInnerMostAxes: C,
   getPermuted: Ee,
@@ -661,19 +661,19 @@ const ht = /* @__PURE__ */ Object.freeze(/* @__PURE__ */ Object.defineProperty({
   getReshapedPermuted: $e,
   getRowPartitionTypesHelper: he,
   getSliceBeginCoords: Ie,
-  getSliceSize: we,
+  getSliceSize: Se,
   getSparseFillEmptyRowsIndicesDenseShapeMismatch: je,
-  getSparseFillEmptyRowsNegativeIndexErrorMessage: ke,
-  getSparseFillEmptyRowsOutOfRangeIndexErrorMessage: Ge,
+  getSparseFillEmptyRowsNegativeIndexErrorMessage: Ge,
+  getSparseFillEmptyRowsOutOfRangeIndexErrorMessage: He,
   getSparseReshapeEmptyTensorZeroOutputDimErrorMessage: Ze,
-  getSparseReshapeInputOutputMismatchErrorMessage: Xe,
-  getSparseReshapeInputOutputMultipleErrorMessage: Ke,
-  getSparseReshapeMultipleNegativeOneOutputDimErrorMessage: He,
+  getSparseReshapeInputOutputMismatchErrorMessage: Je,
+  getSparseReshapeInputOutputMultipleErrorMessage: Xe,
+  getSparseReshapeMultipleNegativeOneOutputDimErrorMessage: ke,
   getSparseReshapeNegativeOutputDimErrorMessage: qe,
   getSparseSegmentReductionIndicesOutOfRangeErrorMessage: et,
-  getSparseSegmentReductionNegativeSegmentIdsErrorMessage: Je,
-  getSparseSegmentReductionNonIncreasingSegmentIdsErrorMessage: Ye,
-  getSparseSegmentReductionSegmentIdOutOfRangeErrorMessage: Qe,
+  getSparseSegmentReductionNegativeSegmentIdsErrorMessage: Ke,
+  getSparseSegmentReductionNonIncreasingSegmentIdsErrorMessage: Qe,
+  getSparseSegmentReductionSegmentIdOutOfRangeErrorMessage: Ye,
   getUndoAxesPermutation: z,
   isIdentityPermutation: Ue,
   log: T,
@@ -697,8 +697,8 @@ export {
   Ee as B,
   $e as C,
   Ie as D,
-  Se as E,
-  we as F,
+  we as E,
+  Se as F,
   le as G,
   ue as H,
   xe as I,
@@ -728,22 +728,22 @@ export {
   ot as f,
   he as g,
   je as h,
-  ke as i,
-  Ge as j,
-  He as k,
+  Ge as i,
+  He as j,
+  ke as k,
   qe as l,
   ye as m,
   Ze as n,
-  Ke as o,
-  Xe as p,
-  Je as q,
-  Ye as r,
-  Qe as s,
+  Xe as o,
+  Je as p,
+  Ke as q,
+  Qe as r,
+  Ye as s,
   et as t,
   Ae as u,
   pe as v,
-  Oe as w,
-  Re as x,
-  Me as y,
-  _e as z
+  Re as w,
+  Oe as x,
+  _e as y,
+  Me as z
 };

package/dist/{broadcast_to-CdbwV-Dj.js → broadcast_to-CUvOdOT5.js} RENAMED Viewed

@@ -1,5 +1,5 @@
-import { B as h, C as f, F as p, M as g, E as u, N as b } from "./index-BoWRt-10.js";
-import { r as T } from "./reshape-CdBq1WJ6.js";
+import { C as h, D as f, M as p, H as g, E as u, X as b } from "./index-DdmHGZjq.js";
+import { r as T } from "./reshape-WeJkT3ja.js";
 /**
  * @license
  * Copyright 2020 Google LLC. All Rights Reserved.

package/dist/checks/appendCache.d.ts ADDED Viewed

@@ -0,0 +1 @@
+export declare function execute(backend: string): Promise<number | number[] | number[][] | number[][][] | number[][][][] | number[][][][][] | number[][][][][][]>;

package/dist/checks/appendCache.js ADDED Viewed

@@ -0,0 +1,22 @@
+import { s, e as a } from "../index-DdmHGZjq.js";
+import { t } from "../tensor4d-DLtk7Nxh.js";
+async function u(e) {
+  await s(e);
+  const n = t(
+    [
+      [
+        [
+          [0.1, 0.2, 0, 0],
+          [0.1, 0.2, 0, 0],
+          [0, 0, 0, 0],
+          [0, 0, 0, 0]
+        ]
+      ]
+    ],
+    [1, 1, 4, 4]
+  ), r = t([[[[0.1, 0.2, 0.3, 0.4]]]], [1, 1, 1, 4]);
+  return await a().runKernel("AppendCache", { cache: n, item: r }, { maxSize: 4, pastLen: 2 }).array();
+}
+export {
+  u as execute
+};

package/dist/checks/attentionMask.d.ts ADDED Viewed

@@ -0,0 +1 @@
+export declare function execute(backend: string): Promise<number | number[] | number[][] | number[][][] | number[][][][] | number[][][][][] | number[][][][][][]>;

package/dist/checks/attentionMask.js ADDED Viewed

@@ -0,0 +1,37 @@
+import { s as i, e } from "../index-DdmHGZjq.js";
+import { t } from "../tensor4d-DLtk7Nxh.js";
+import { t as a } from "../tensor2d-CObBWBkW.js";
+async function k(n) {
+  await i(n);
+  const s = t(
+    [
+      [
+        [
+          [0.1, 0.2, 0.3, 0.4],
+          [0.3, 0.4, 0.5, 0.6]
+        ]
+      ]
+    ],
+    [1, 1, 2, 4]
+  ), o = t(
+    [
+      [
+        [
+          [0.5, 0.6, 0.5, 0.6],
+          [0.7, 0.8, 0.7, 0.8]
+        ]
+      ]
+    ],
+    [1, 1, 2, 4]
+  ), r = a(
+    [
+      [0, -1 / 0, -1 / 0, -1 / 0],
+      [0, 0, 0, -1 / 0]
+    ],
+    [2, 4]
+  );
+  return await e().runKernel("AttentionMask", { q: s, k: o, mask: r }, { divisor: 0.5, pastLen: 0 }).array();
+}
+export {
+  k as execute
+};

package/dist/checks/check.d.ts ADDED Viewed

@@ -0,0 +1,9 @@
+interface Result {
+    backend: string;
+    result: unknown;
+    error?: string;
+    passed: boolean;
+    maxError?: number;
+}
+export default function runCheck(check: (backend: string) => Promise<unknown>, epsilon?: number): Promise<Result[]>;
+export {};

package/dist/checks/check.js ADDED Viewed

@@ -0,0 +1,20 @@
+import { arraysClose as l } from "../utilities/arrayClose.js";
+async function f(c, a) {
+  const n = ["cpu", "webgl", "webgpu"], t = [];
+  for (const e of n)
+    try {
+      const r = await c(e);
+      t.push({ backend: e, result: r, passed: !0 });
+    } catch (r) {
+      t.push({ backend: e, error: r.message, result: [], passed: !1 });
+    }
+  const s = await Promise.all(t), u = s[0].result;
+  for (let e = 1; e < s.length; e++) {
+    const r = s[e].result, o = l(u, r);
+    s[e].passed = o <= (a ?? 1e-6), s[e].maxError = o;
+  }
+  return s;
+}
+export {
+  f as default
+};

package/dist/checks/gelu.d.ts ADDED Viewed

@@ -0,0 +1 @@
+export declare function execute(backend: string): Promise<number | number[] | number[][] | number[][][] | number[][][][] | number[][][][][] | number[][][][][][]>;

package/dist/checks/gelu.js ADDED Viewed

@@ -0,0 +1,18 @@
+import { s as e, e as o } from "../index-DdmHGZjq.js";
+import { t as s } from "../tensor2d-CObBWBkW.js";
+async function m(t) {
+  await e(t);
+  const r = s(
+    [
+      [0.1, 0.2, 0, 0],
+      [0.1, 0.2, 0, 0],
+      [0, 0, 0, 0],
+      [0, 0, 0, 0]
+    ],
+    [4, 4]
+  );
+  return await o().runKernel("Gelu", { x: r }).array();
+}
+export {
+  m as execute
+};

package/dist/checks/index.d.ts ADDED Viewed

@@ -0,0 +1,19 @@
+import { execute as rope } from './rope';
+import { execute as normRMS } from './normRMS';
+import { execute as qkv } from './qkv';
+import { execute as gelu } from './gelu';
+import { execute as normRMSGrad } from './normRMSGrad';
+import { execute as appendCache } from './appendCache';
+import { execute as attentionMask } from './attentionMask';
+import { default as runCheck } from './check';
+declare const checks: {
+    rope: typeof rope;
+    qkv: typeof qkv;
+    gelu: typeof gelu;
+    normRMS: typeof normRMS;
+    normRMSGrad: typeof normRMSGrad;
+    appendCache: typeof appendCache;
+    attentionMask: typeof attentionMask;
+    runCheck: typeof runCheck;
+};
+export default checks;

package/dist/checks/index.js ADDED Viewed

@@ -0,0 +1,21 @@
+import { execute as e } from "./rope.js";
+import { execute as t } from "./normRMS.js";
+import { execute as o } from "./qkv.js";
+import { execute as r } from "./gelu.js";
+import { execute as c } from "./normRMSGrad.js";
+import { execute as m } from "./appendCache.js";
+import { execute as u } from "./attentionMask.js";
+import x from "./check.js";
+const d = {
+  rope: e,
+  qkv: o,
+  gelu: r,
+  normRMS: t,
+  normRMSGrad: c,
+  appendCache: m,
+  attentionMask: u,
+  runCheck: x
+};
+export {
+  d as default
+};

package/dist/checks/normRMS.d.ts ADDED Viewed

@@ -0,0 +1 @@
+export declare function execute(backend: string): Promise<(number | number[] | number[][] | number[][][] | number[][][][] | number[][][][][] | number[][][][][][])[]>;

package/dist/checks/normRMS.js ADDED Viewed

@@ -0,0 +1,16 @@
+import { s as u, y as A, e as y } from "../index-DdmHGZjq.js";
+import { a as h } from "../ops-542ai2vG.js";
+import { t as p } from "../tensor1d-CtJq5BOv.js";
+import { t as a } from "../tensor-DbqgIV9B.js";
+const w = Array.from({ length: 2048 * 192 }, () => Math.random()), x = Array.from({ length: 192 }, () => Math.random()), M = Array.from({ length: 2048 * 192 }, () => Math.random());
+async function k(t) {
+  await u(t);
+  const o = p(x, "float32"), n = a(w, [16, 128, 192], "float32"), s = a(M, [16, 128, 192], "float32"), e = (d, g) => {
+    const i = y().runKernel("RMSNorm", { x: d, gamma: g });
+    return h.meanSquaredError(i, s);
+  }, { value: m, grads: r } = A(e)([n, o]), c = await m.array(), f = await r[0].array(), l = await r[1].array();
+  return [c, f, l];
+}
+export {
+  k as execute
+};

package/dist/checks/normRMSGrad.d.ts ADDED Viewed

@@ -0,0 +1 @@
+export declare function execute(backend: string): Promise<(number | number[] | number[][] | number[][][] | number[][][][] | number[][][][][] | number[][][][][][])[]>;

package/dist/checks/normRMSGrad.js ADDED Viewed

@@ -0,0 +1,12 @@
+import { s as c, e as d } from "../index-DdmHGZjq.js";
+import { t as f } from "../tensor1d-CtJq5BOv.js";
+import { t as r } from "../tensor-DbqgIV9B.js";
+const y = Array.from({ length: 2048 * 192 }, () => Math.random()), i = Array.from({ length: 192 }, () => Math.random()), l = Array.from({ length: 2048 * 192 }, () => Math.random());
+async function x(t) {
+  await c(t);
+  const o = f(i, "float32"), n = r(y, [16, 128, 192], "float32"), m = r(l, [16, 128, 192], "float32"), a = d().runKernel("RMSNormGrad", { x: n, gamma: o, dy: m }), s = await a[0].array(), e = await a[1].array();
+  return [s, e];
+}
+export {
+  x as execute
+};

package/dist/checks/qkv.d.ts ADDED Viewed

@@ -0,0 +1 @@
+export declare function execute(backend: string): Promise<(number | number[] | number[][] | number[][][] | number[][][][] | number[][][][][] | number[][][][][][])[]>;

package/dist/checks/qkv.js ADDED Viewed

@@ -0,0 +1,25 @@
+import { s as c, e as m } from "../index-DdmHGZjq.js";
+import { t as i } from "../tensor3d-BOukqWwr.js";
+import { t as u } from "../tensor2d-CObBWBkW.js";
+async function w(a) {
+  await c(a);
+  const o = i(
+    [
+      [
+        [0.1, 0.2],
+        [0.3, 0.4]
+      ]
+    ],
+    [1, 2, 2]
+  ), r = u(
+    [
+      [0.5, 0.6, 0.9, 1, 1.3, 1.4],
+      [0.7, 0.8, 1.1, 1.2, 1.5, 1.6]
+    ],
+    [2, 6]
+  ), t = m().runKernel("QKV", { x: o, kernel: r }, { heads: 1 }), s = await t[0].array(), n = await t[1].array(), e = await t[2].array();
+  return [s, n, e];
+}
+export {
+  w as execute
+};

package/dist/checks/rope.d.ts ADDED Viewed

@@ -0,0 +1 @@
+export declare function execute(backend: string): Promise<number | number[] | number[][] | number[][][] | number[][][][] | number[][][][][] | number[][][][][][] | Promise<number | number[] | number[][] | number[][][] | number[][][][] | number[][][][][] | number[][][][][][]>[]>;

package/dist/checks/rope.js ADDED Viewed

@@ -0,0 +1,21 @@
+import { s as c, e as i } from "../index-DdmHGZjq.js";
+import { t as m } from "../tensor4d-DLtk7Nxh.js";
+import { t } from "../tensor3d-BOukqWwr.js";
+async function y(n) {
+  await c(n);
+  const s = m(
+    [
+      [
+        [
+          [0.1, 0.2],
+          [0.3, 0.4]
+        ]
+      ]
+    ],
+    [1, 1, 2, 2]
+  ), e = t([0.5, 0.6], [2, 1, 1]), o = t([0.9, 1], [2, 1, 1]), r = i().runKernel("Rope", { x: s, sin: e, cos: o }, { pastLen: 0 });
+  return Array.isArray(r) ? r.map((a) => a.array()) : r.array();
+}
+export {
+  y as execute
+};

package/dist/{concat-CsxrgovM.js → concat-pHiVqR3L.js} RENAMED Viewed

@@ -1,4 +1,4 @@
-import { B as s, l as a, D as p, M as i, E as l, Q as f } from "./index-BoWRt-10.js";
+import { C as s, n as a, F as p, H as i, E as l, I as f } from "./index-DdmHGZjq.js";
 /**
  * @license
  * Copyright 2020 Google LLC. All Rights Reserved.