npm - @genai-fi/nanogpt - Versions diffs - 0.8.0 → 0.8.2 - Mend

@genai-fi/nanogpt 0.8.0 → 0.8.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (162) hide show

package/dist/Generator.d.ts +2 -1
package/dist/Generator.js +44 -37
package/dist/{RealDiv-N8TpOMYv.js → RealDiv-D_q39E3A.js} +14 -14
package/dist/{Reshape-B-lWQRnF.js → Reshape-41YpQqEo.js} +1 -1
package/dist/{Reshape-Bo8HzP8V.js → Reshape-Bh_jzKzV.js} +2 -2
package/dist/TeachableLLM.js +7 -5
package/dist/{axis_util-DubwyOhW.js → axis_util-Did9235A.js} +1 -1
package/dist/backend.js +2 -2
package/dist/{backend_util-BJ-_jSeK.js → backend_util-yC3YH1jo.js} +17 -17
package/dist/{broadcast_to-BYfCp5iL.js → broadcast_to-CUvOdOT5.js} +2 -2
package/dist/checks/appendCache.d.ts +1 -0
package/dist/checks/appendCache.js +22 -0
package/dist/checks/attentionMask.d.ts +1 -0
package/dist/checks/attentionMask.js +37 -0
package/dist/checks/check.d.ts +9 -0
package/dist/checks/check.js +20 -0
package/dist/checks/gelu.d.ts +1 -0
package/dist/checks/gelu.js +18 -0
package/dist/checks/index.d.ts +22 -0
package/dist/checks/index.js +24 -0
package/dist/checks/normRMS.d.ts +1 -0
package/dist/checks/normRMS.js +16 -0
package/dist/checks/normRMSGrad.d.ts +1 -0
package/dist/checks/normRMSGrad.js +12 -0
package/dist/checks/qkv.d.ts +1 -0
package/dist/checks/qkv.js +50 -0
package/dist/checks/rope.d.ts +1 -0
package/dist/checks/rope.js +38 -0
package/dist/checks/weights.d.ts +16 -0
package/dist/checks/weights.js +29 -0
package/dist/{concat-BmDqqFsa.js → concat-pHiVqR3L.js} +1 -1
package/dist/{dataset-CJmEGu6D.js → dataset-DPPl-iLT.js} +7 -7
package/dist/{dropout-sx0sjVAT.js → dropout-CcKSfOYE.js} +11 -11
package/dist/{exports_initializers-DAKM8UO9.js → exports_initializers-DKk7-bsx.js} +1 -1
package/dist/{gather-C1siEkdp.js → gather-CPg6ZlQA.js} +1 -1
package/dist/{gelu-Bd3UBBxg.js → gelu-BkcmEEyD.js} +1 -1
package/dist/{gpgpu_math-TFLxaLkw.js → gpgpu_math-D_ODOLix.js} +2 -2
package/dist/{index-CUQrfsw_.js → index-DdmHGZjq.js} +655 -647
package/dist/{index-BaPo_0H8.js → index-evZ57wr4.js} +10 -10
package/dist/{kernel_funcs_utils-P9aFa232.js → kernel_funcs_utils-CDfFpUab.js} +15 -15
package/dist/layers/BaseLayer.js +2 -2
package/dist/layers/CausalSelfAttention.js +29 -29
package/dist/layers/MLP.js +18 -18
package/dist/layers/PositionEmbedding.js +5 -5
package/dist/layers/RMSNorm.js +3 -3
package/dist/layers/RoPECache.js +4 -4
package/dist/layers/TiedEmbedding.js +11 -11
package/dist/layers/TransformerBlock.js +1 -1
package/dist/loader/loadTransformers.js +1 -1
package/dist/loader/oldZipLoad.js +9 -7
package/dist/{log_sum_exp-C142qZqY.js → log_sum_exp-C8yFJfZz.js} +45 -24
package/dist/main.d.ts +2 -0
package/dist/main.js +9 -7
package/dist/{mat_mul-DMkduNJu.js → mat_mul-Dpy2mMRu.js} +1 -1
package/dist/{mod-uUuj4gSb.js → mod-CbibJi3D.js} +1 -1
package/dist/models/NanoGPTV1.js +1 -1
package/dist/models/model.js +9 -7
package/dist/{mulmat_packed_gpu-Cm2gw-c8.js → mulmat_packed_gpu-q_Gmwyld.js} +1 -1
package/dist/{ones-ZdgQGBCP.js → ones-BAqVh-eA.js} +2 -2
package/dist/ops/adamAdjust.js +1 -1
package/dist/ops/adamMoments.js +1 -1
package/dist/ops/appendCache.js +3 -3
package/dist/ops/attentionMask.js +1 -1
package/dist/ops/cpu/adamAdjust.js +1 -1
package/dist/ops/cpu/adamMoments.js +2 -2
package/dist/ops/cpu/appendCache.js +2 -2
package/dist/ops/cpu/attentionMask.js +5 -5
package/dist/ops/cpu/fusedSoftmax.js +2 -2
package/dist/ops/cpu/gatherSub.js +5 -5
package/dist/ops/cpu/gelu.js +1 -1
package/dist/ops/cpu/matMulGelu.js +2 -2
package/dist/ops/cpu/matMulMul.js +1 -1
package/dist/ops/cpu/mulDropout.js +1 -1
package/dist/ops/cpu/normRMS.js +1 -1
package/dist/ops/cpu/qkv.js +3 -3
package/dist/ops/cpu/rope.js +5 -5
package/dist/ops/cpu/scatterSub.js +13 -13
package/dist/ops/fusedSoftmax.js +1 -1
package/dist/ops/gatherSub.js +1 -1
package/dist/ops/gelu.js +2 -2
package/dist/ops/grads/attentionMask.js +1 -1
package/dist/ops/grads/fusedSoftmax.js +2 -2
package/dist/ops/grads/gelu.js +2 -2
package/dist/ops/grads/matMulGelu.js +1 -1
package/dist/ops/grads/normRMS.js +1 -1
package/dist/ops/grads/qkv.js +1 -1
package/dist/ops/grads/rope.js +1 -1
package/dist/ops/matMulGelu.js +1 -1
package/dist/ops/matMulMul.js +1 -1
package/dist/ops/mulDrop.js +1 -1
package/dist/ops/normRMS.js +1 -1
package/dist/ops/qkv.js +1 -1
package/dist/ops/rope.js +4 -4
package/dist/ops/scatterSub.js +1 -1
package/dist/ops/webgl/adamAdjust.js +2 -2
package/dist/ops/webgl/adamMoments.js +1 -1
package/dist/ops/webgl/appendCache.js +1 -1
package/dist/ops/webgl/attentionMask.js +1 -1
package/dist/ops/webgl/fusedSoftmax.js +4 -4
package/dist/ops/webgl/gatherSub.js +1 -1
package/dist/ops/webgl/gelu.js +2 -2
package/dist/ops/webgl/log.js +3 -3
package/dist/ops/webgl/matMulGelu.js +4 -4
package/dist/ops/webgl/matMulMul.js +1 -1
package/dist/ops/webgl/mulDropout.js +1 -1
package/dist/ops/webgl/normRMS.js +2 -2
package/dist/ops/webgl/qkv.js +1 -1
package/dist/ops/webgl/rope.js +1 -1
package/dist/ops/webgl/scatterSub.js +1 -1
package/dist/ops/webgpu/adamAdjust.js +3 -3
package/dist/ops/webgpu/adamMoments.js +3 -3
package/dist/ops/webgpu/appendCache.js +3 -3
package/dist/ops/webgpu/attentionMask.js +3 -3
package/dist/ops/webgpu/gatherSub.js +3 -3
package/dist/ops/webgpu/gelu.js +3 -3
package/dist/ops/webgpu/normRMS.js +2 -2
package/dist/ops/webgpu/normRMSGrad.js +5 -5
package/dist/ops/webgpu/qkv.js +3 -3
package/dist/ops/webgpu/rope.js +3 -3
package/dist/ops/webgpu/scatterSub.js +3 -3
package/dist/ops/webgpu/utils/reductions.js +4 -4
package/dist/ops-542ai2vG.js +1525 -0
package/dist/{random_width-D8Pwy_na.js → random_width-DKGeiFuR.js} +1514 -1581
package/dist/{range-LVHrSLdi.js → range-BcUvLuf5.js} +1 -1
package/dist/{reciprocal-CaR9e67G.js → reciprocal-DhDWSKiD.js} +1 -1
package/dist/{register_all_kernels-DUshvVWP.js → register_all_kernels-Do9VvZmo.js} +2312 -2335
package/dist/{max-B3JOcNGb.js → relu-B1AXs7p5.js} +6 -6
package/dist/{reshape-DEfQGSin.js → reshape-WeJkT3ja.js} +1 -1
package/dist/{scatter_nd_util-CUPPNLaA.js → scatter_nd_util-B7yDhiQr.js} +1 -1
package/dist/{selu_util-8vv5JxQV.js → selu_util-BgUO9gHY.js} +125 -146
package/dist/{shared-D1elLckx.js → shared-CZiWmQCI.js} +1 -1
package/dist/{shared-CkNorDcU.js → shared-V6D_md-c.js} +120 -120
package/dist/{sin-D2CKKmyR.js → sin-CPxad7Am.js} +1 -1
package/dist/{slice-BnyE-M_7.js → slice-B7jXtPnp.js} +1 -1
package/dist/{softmax-DLoZWYBx.js → softmax-BfsyI4As.js} +1 -1
package/dist/{split-By_n4TKP.js → split-BPxr8_8m.js} +1 -1
package/dist/{stack-DkdFLq37.js → stack-BNwLzE43.js} +1 -1
package/dist/{sum-l_0SqM4h.js → sum-ByFINZgi.js} +1 -1
package/dist/{tensor-BAQdLqoU.js → tensor-DbqgIV9B.js} +1 -1
package/dist/tensor1d-CtJq5BOv.js +27 -0
package/dist/{tensor2d-BHy261cI.js → tensor2d-CObBWBkW.js} +1 -1
package/dist/tensor4d-DLtk7Nxh.js +30 -0
package/dist/training/Adam.js +2 -2
package/dist/training/AdamExt.js +1 -1
package/dist/training/DatasetBuilder.js +2 -2
package/dist/training/FullTrainer.js +1 -1
package/dist/training/Trainer.js +2 -2
package/dist/training/sparseCrossEntropy.js +8 -9
package/dist/utilities/arrayClose.d.ts +1 -1
package/dist/utilities/arrayClose.js +16 -7
package/dist/utilities/dummy.js +2 -2
package/dist/utilities/multinomialCPU.js +2 -2
package/dist/utilities/performance.js +1 -1
package/dist/utilities/profile.js +1 -1
package/dist/utilities/safetensors.js +2 -2
package/dist/utilities/weights.js +2 -2
package/dist/{variable-C9hihzDB.js → variable-DPFOJyRG.js} +1 -1
package/dist/{webgpu_program-dFEVbDPL.js → webgpu_program-Dhk9R5aG.js} +1 -1
package/dist/{webgpu_util-DLImlSc6.js → webgpu_util-BqGnZg8t.js} +1 -1
package/dist/{zeros-VZ72lWXM.js → zeros-Dnwix0p4.js} +1 -1
package/package.json +1 -1
package/dist/ops-C_1K_-35.js +0 -1202

package/dist/Generator.d.ts CHANGED Viewed

@@ -45,7 +45,8 @@ export default class Generator extends EE<'start' | 'stop' | 'tokens'> {
     generate(prompt?: string, options?: IGenerateOptions): Promise<string>;
     stop(): void;
     getText(): string;
-    getAttentionData(): number[][][][];
+    getAttentionData(): number[][][][][];
     getProbabilitiesData(): number[][][];
+    getEmbeddingsData(): number[][][][];
     getTokens(): number[];
 }

package/dist/Generator.js CHANGED Viewed

@@ -1,15 +1,15 @@
 import { E as z } from "./index-Dwqa6Zy2.js";
-import { B as A, C as L, E as C, a5 as I, t as O, k as R } from "./index-CUQrfsw_.js";
+import { C as A, D as L, E as C, a6 as I, t as O, k as R } from "./index-DdmHGZjq.js";
 import "./ops/cpu/attentionMask.js";
 import "./ops/webgl/attentionMask.js";
 import "./ops/grads/attentionMask.js";
 import "./ops/cpu/qkv.js";
 import "./ops/webgl/qkv.js";
 import "./ops/grads/qkv.js";
-import { p as _ } from "./random_width-D8Pwy_na.js";
-import { t as K } from "./register_all_kernels-DUshvVWP.js";
+import { p as _ } from "./random_width-DKGeiFuR.js";
+import { t as K } from "./register_all_kernels-Do9VvZmo.js";
 import "./index-Tf7vU29b.js";
-import "./dataset-CJmEGu6D.js";
+import "./dataset-DPPl-iLT.js";
 import "./ops/cpu/rope.js";
 import "./ops/webgl/rope.js";
 import "./ops/grads/rope.js";
@@ -37,14 +37,16 @@ import "./ops/webgl/adamMoments.js";
 import "./papaparse.min-C8l2Kvo1.js";
 import "./ops/cpu/gelu.js";
 import "./ops/webgl/gelu.js";
-import "./gelu-Bd3UBBxg.js";
+import "./gelu-BkcmEEyD.js";
 import "./ops/webgl/log.js";
+import "./checks/normRMS.js";
+import "./checks/normRMSGrad.js";
 import $ from "./utilities/multinomialCPU.js";
-import { r as x } from "./reshape-DEfQGSin.js";
-import { t as P } from "./tensor2d-BHy261cI.js";
-import { s as v } from "./softmax-DLoZWYBx.js";
-import { g as q } from "./gather-C1siEkdp.js";
-import { c as G } from "./concat-BmDqqFsa.js";
+import { r as x } from "./reshape-WeJkT3ja.js";
+import { t as P } from "./tensor2d-CObBWBkW.js";
+import { s as v } from "./softmax-BfsyI4As.js";
+import { g as q } from "./gather-CPg6ZlQA.js";
+import { c as G } from "./concat-pHiVqR3L.js";
 /**
  * @license
  * Copyright 2020 Google LLC. All Rights Reserved.
@@ -61,8 +63,8 @@ import { c as G } from "./concat-BmDqqFsa.js";
  * limitations under the License.
  * =============================================================================
  */
-function N(h, t, e, i = !1) {
-  const o = L(h, "logits", "multinomial"), s = o.size, n = o.rank;
+function N(m, t, e, i = !1) {
+  const o = L(m, "logits", "multinomial"), s = o.size, n = o.rank;
   if (s < 2)
     throw new Error(`Error in multinomial: you need at least 2 outcomes, but got ${s}.`);
   if (n > 2)
@@ -71,8 +73,8 @@ function N(h, t, e, i = !1) {
   const a = { logits: n === 1 ? x(o, [1, -1]) : o }, p = { numSamples: t, seed: e, normalized: i }, l = C.runKernel(I, a, p);
   return n === 1 ? x(l, [l.size]) : l;
 }
-const S = /* @__PURE__ */ A({ multinomial_: N }), B = [
-  ...Array.from({ length: 95 }, (h, t) => String.fromCharCode(t + 32)),
+const D = /* @__PURE__ */ A({ multinomial_: N }), H = [
+  ...Array.from({ length: 95 }, (m, t) => String.fromCharCode(t + 32)),
   // ASCII
   // Spanish accented letters and punctuation
   ..."áéíóúüñ¿¡",
@@ -83,10 +85,10 @@ const S = /* @__PURE__ */ A({ multinomial_: N }), B = [
   // Cyrillic letters
   ..."абвгдеёжзийклмнопрстуфхцчшщъыьэюяАБВГДЕЁЖЗИЙКЛМНОПРСТУФХЦЧШЩЪЫЬЭЮЯ"
 ];
-function H(h, t) {
-  return h.length === t ? h : h.length > t ? h.slice(0, t) : h.concat(Array(t - h.length).fill(""));
+function U(m, t) {
+  return m.length === t ? m : m.length > t ? m.slice(0, t) : m.concat(Array(t - m.length).fill(""));
 }
-class Mt extends z {
+class qt extends z {
   constructor(t, e) {
     super(), this.model = t, this.tokeniser = e, this.actualTokeniser = e;
   }
@@ -110,7 +112,9 @@ class Mt extends z {
       return null;
     const n = await t.decode([s]);
     if (i) {
-      const d = await Promise.all(i.map((a) => a.array().then((p) => p)));
+      const d = await Promise.all(
+        i.map((a) => a.array().then((p) => p))
+      );
       i.forEach((a) => a.dispose()), this.attentionData.push(d);
     }
     if (o) {
@@ -129,13 +133,13 @@ class Mt extends z {
       cache: e,
       outputEmbeddings: i?.embeddings ?? !1
     }, p = O(() => {
-      const r = t, m = r.shape[1], u = m <= this.model.config.blockSize ? r : r.slice(
-        [0, m - this.model.config.blockSize],
+      const r = t, h = r.shape[1], u = h <= this.model.config.blockSize ? r : r.slice(
+        [0, h - this.model.config.blockSize],
         [r.shape[0], this.model.config.blockSize]
-      ), k = d ? this.model.config.blockSize - u.shape[1] : 0, b = k > 0 ? _(u, [
+      ), g = d ? this.model.config.blockSize - u.shape[1] : 0, b = g > 0 ? _(u, [
         [0, 0],
-        [0, k]
-      ]) : u, [f] = this.model.forward(a, b), y = f.shape[1] - 1 - k, c = f.slice([0, y, 0], [f.shape[0], 1, f.shape[2]]);
+        [0, g]
+      ]) : u, [f] = this.model.forward(a, b), y = f.shape[1] - 1 - g, c = f.slice([0, y, 0], [f.shape[0], 1, f.shape[2]]);
       return a.attentionScores?.attentionOut && a.attentionScores.attentionOut.forEach((T, E) => {
         T.shape[1] !== 1 && (a.attentionScores.attentionOut[E] = R(
           T.slice([0, y, 0], [T.shape[0], 1, T.shape[2]])
@@ -144,32 +148,32 @@ class Mt extends z {
     });
     let l;
     if (n) {
-      const r = v(p), m = await r.array();
+      const r = v(p), h = await r.array();
       r.dispose();
-      const u = m[0].map((c, g) => ({ prob: c, index: g })).sort((c, g) => g.prob - c.prob);
-      let k = 0;
+      const u = h[0].map((c, k) => ({ prob: c, index: k })).sort((c, k) => k.prob - c.prob);
+      let g = 0;
       const b = new Array(u.length).fill(0);
       for (const c of u)
-        if (k += c.prob, b[c.index] = c.prob, k >= n)
+        if (g += c.prob, b[c.index] = c.prob, g >= n)
           break;
-      const f = b.reduce((c, g) => c + g, 0), y = b.map((c) => c / f);
+      const f = b.reduce((c, k) => c + k, 0), y = b.map((c) => c / f);
       l = $(y);
     } else if (s) {
-      const { values: r, indices: m } = K(p, s), u = S(r, 1);
-      l = q(m, u, 1), r.dispose(), m.dispose(), u.dispose();
+      const { values: r, indices: h } = K(p, s), u = D(r, 1);
+      l = q(h, u, 1), r.dispose(), h.dispose(), u.dispose();
     } else
-      l = S(p, 1);
+      l = D(p, 1);
     let w;
     i?.includeProbabilities && (w = v(p)), a.embeddings && this.embeddingsData.push(
       await Promise.all(
         a.embeddings.map(async (r) => {
-          const m = await r.array();
-          return r.dispose(), m;
+          const h = await r.array();
+          return r.dispose(), h;
         })
       )
     );
-    const D = l.reshape([1, 1]);
-    return l.dispose(), l = D, p.dispose(), { output: l, probabilities: w, attention: a.attentionScores?.attentionOut };
+    const S = l.reshape([1, 1]);
+    return l.dispose(), l = S, p.dispose(), { output: l, probabilities: w, attention: a.attentionScores?.attentionOut };
   }
   /** Generate multiple tokens in a loop and produce text */
   async _generate(t) {
@@ -213,7 +217,7 @@ class Mt extends z {
         s[n] = { k: void 0, v: void 0, length: 0, cumulativeLength: 0 };
       this.cache = s, this.lastToken = -1;
     }
-    const o = this.tokeniser.trained ? this.tokeniser : new M(H(B, this.tokeniser.vocabSize));
+    const o = this.tokeniser.trained ? this.tokeniser : new M(U(H, this.tokeniser.vocabSize));
     this.actualTokeniser = o;
   }
   async step(t, e) {
@@ -237,10 +241,13 @@ class Mt extends z {
   getProbabilitiesData() {
     return this.probabilitiesData;
   }
+  getEmbeddingsData() {
+    return this.embeddingsData;
+  }
   getTokens() {
     return this.tokens;
   }
 }
 export {
-  Mt as default
+  qt as default
 };

package/dist/{RealDiv-N8TpOMYv.js → RealDiv-D_q39E3A.js} RENAMED Viewed

@@ -1,10 +1,10 @@
-import { as as T, af as E, p as O, j as V, aA as B, a0 as F, X as j, aB as K } from "./index-CUQrfsw_.js";
-import { r as $ } from "./Reshape-Bo8HzP8V.js";
-import { g as A, a as k, b as C, c as N, e as R } from "./axis_util-DubwyOhW.js";
-import { t as U, m as W } from "./shared-D1elLckx.js";
-import { c as _ } from "./backend_util-BJ-_jSeK.js";
-import { f as y } from "./gpgpu_math-TFLxaLkw.js";
-import { g as G, b as L } from "./kernel_funcs_utils-P9aFa232.js";
+import { aq as T, ag as E, p as O, j as V, aB as B, a1 as F, ah as j, aC as K } from "./index-DdmHGZjq.js";
+import { r as $ } from "./Reshape-Bh_jzKzV.js";
+import { g as A, a as C, b as k, c as N, e as R } from "./axis_util-Did9235A.js";
+import { t as U, m as W } from "./shared-CZiWmQCI.js";
+import { c as _ } from "./backend_util-yC3YH1jo.js";
+import { f as y } from "./gpgpu_math-D_ODOLix.js";
+import { g as G, b as L } from "./kernel_funcs_utils-CDfFpUab.js";
 /**
  * @license
  * Copyright 2020 Google LLC. All Rights Reserved.
@@ -105,7 +105,7 @@ class w {
  * limitations under the License.
  * =============================================================================
  */
-class X {
+class q {
   constructor(s, e) {
     this.variableNames = ["x"];
     const { windowSize: t, batchSize: n, inSize: l, outSize: r } = s;
@@ -229,7 +229,7 @@ class X {
  * limitations under the License.
  * =============================================================================
  */
-function q(a) {
+function X(a) {
   const s = [];
   for (; s.length === 0 || s[s.length - 1].outSize !== 1; ) {
     const e = s.length ? s[s.length - 1].outSize : a[1], t = _(e);
@@ -242,12 +242,12 @@ function q(a) {
   return s;
 }
 function P(a, s, e, t) {
-  const n = q(a.shape);
+  const n = X(a.shape);
   let l = a;
   for (let r = 0; r < n.length; r++) {
     const { inSize: i, windowSize: c, outSize: o } = n[r];
     let u, p;
-    e === "mean" ? u = r === 0 ? new w({ windowSize: c, inSize: i, batchSize: a.shape[0], outSize: o }, i) : new w({ windowSize: c, inSize: i, batchSize: a.shape[0], outSize: o }) : u = new X({ windowSize: c, inSize: i, batchSize: a.shape[0], outSize: o }, e), p = l, l = t.runWebGLProgram(u, [l], s), p.dataId !== a.dataId && t.disposeIntermediateTensorInfo(p);
+    e === "mean" ? u = r === 0 ? new w({ windowSize: c, inSize: i, batchSize: a.shape[0], outSize: o }, i) : new w({ windowSize: c, inSize: i, batchSize: a.shape[0], outSize: o }) : u = new q({ windowSize: c, inSize: i, batchSize: a.shape[0], outSize: o }, e), p = l, l = t.runWebGLProgram(u, [l], s), p.dataId !== a.dataId && t.disposeIntermediateTensorInfo(p);
   }
   return l;
 }
@@ -381,7 +381,7 @@ function Q(a, s, e, t) {
   let i = r;
   const c = A(i, l), o = c != null;
   let u = a;
-  o && (u = D(a, c, t), i = k(i.length, l)), C("sum", i, l);
+  o && (u = D(a, c, t), i = C(i.length, l)), k("sum", i, l);
   const [p, h] = N(u.shape, i);
   let d = p;
   e && (d = R(p, r));
@@ -465,9 +465,9 @@ function te(a) {
       M.values = z;
     } else
       d = D(n, u, e);
-    o = k(o.length, i);
+    o = C(o.length, i);
   }
-  C("max", o, i);
+  k("max", o, i);
   const [f, S] = N(d.shape, o);
   let g = f;
   r && (g = R(f, c));

package/dist/{Reshape-B-lWQRnF.js → Reshape-41YpQqEo.js} RENAMED Viewed

@@ -1,4 +1,4 @@
-import { j as h, a4 as d, n as c, U as m } from "./index-CUQrfsw_.js";
+import { j as h, a5 as d, n as c, V as m } from "./index-DdmHGZjq.js";
 /**
  * @license
  * Copyright 2021 Google LLC. All Rights Reserved.

package/dist/{Reshape-Bo8HzP8V.js → Reshape-Bh_jzKzV.js} RENAMED Viewed

@@ -1,5 +1,5 @@
-import { j as c, a4 as C, n as f, U as R } from "./index-CUQrfsw_.js";
-import { u as g, g as I, a as x, b as F, c as $, d as u, e as m, i as l } from "./gpgpu_math-TFLxaLkw.js";
+import { j as c, a5 as C, n as f, V as R } from "./index-DdmHGZjq.js";
+import { u as g, g as I, a as x, b as F, c as $, d as u, e as m, i as l } from "./gpgpu_math-D_ODOLix.js";
 /**
  * @license
  * Copyright 2018 Google LLC. All Rights Reserved.

package/dist/TeachableLLM.js CHANGED Viewed

@@ -5,17 +5,17 @@ import u from "./Generator.js";
 import f from "./Trainer.js";
 import { E as p } from "./index-Dwqa6Zy2.js";
 import { dummyPassTrainAsync as m } from "./utilities/dummy.js";
-import "./index-CUQrfsw_.js";
+import "./index-DdmHGZjq.js";
 import "./ops/cpu/attentionMask.js";
 import "./ops/webgl/attentionMask.js";
 import "./ops/grads/attentionMask.js";
 import "./ops/cpu/qkv.js";
 import "./ops/webgl/qkv.js";
 import "./ops/grads/qkv.js";
-import "./random_width-D8Pwy_na.js";
-import "./register_all_kernels-DUshvVWP.js";
+import "./random_width-DKGeiFuR.js";
+import "./register_all_kernels-Do9VvZmo.js";
 import "./index-Tf7vU29b.js";
-import "./dataset-CJmEGu6D.js";
+import "./dataset-DPPl-iLT.js";
 import "./ops/cpu/rope.js";
 import "./ops/webgl/rope.js";
 import "./ops/grads/rope.js";
@@ -40,12 +40,14 @@ import "./papaparse.min-C8l2Kvo1.js";
 import "./jszip.min-CjP2V1VV.js";
 import "./ops/cpu/gelu.js";
 import "./ops/webgl/gelu.js";
-import "./gelu-Bd3UBBxg.js";
+import "./gelu-BkcmEEyD.js";
 import "./ops/webgl/log.js";
 import "./ops/cpu/adamMoments.js";
 import "./ops/webgl/adamMoments.js";
 import "./ops/cpu/adamAdjust.js";
 import "./ops/webgl/adamAdjust.js";
+import "./checks/normRMS.js";
+import "./checks/normRMSGrad.js";
 import k from "./utilities/profile.js";
 import w from "./models/factory.js";
 class a {

package/dist/{axis_util-DubwyOhW.js → axis_util-Did9235A.js} RENAMED Viewed

@@ -1,4 +1,4 @@
-import { n as c } from "./index-CUQrfsw_.js";
+import { n as c } from "./index-DdmHGZjq.js";
 /**
  * @license
  * Copyright 2017 Google LLC. All Rights Reserved.

package/dist/backend.js CHANGED Viewed

@@ -1,6 +1,6 @@
-import { g as a, s as i, r as o } from "./index-CUQrfsw_.js";
+import { g as a, s as i, r as o } from "./index-DdmHGZjq.js";
 async function e(t) {
-  a() !== t && (t === "webgpu" && (await import("./index-BaPo_0H8.js"), await import("./ops/webgpu/index.js")), await i(t), await o(), console.log(`Backend set to ${t}`));
+  a() !== t && (t === "webgpu" && (await import("./index-evZ57wr4.js"), await import("./ops/webgpu/index.js")), await i(t), await o(), console.log(`Backend set to ${t}`));
 }
 export {
   e as selectBackend

package/dist/{backend_util-BJ-_jSeK.js → backend_util-yC3YH1jo.js} RENAMED Viewed

@@ -1,7 +1,7 @@
-import { j as m, a2 as O, n as g, aM as $, aN as R, aO as M, l as _, ad as y, ay as D, aP as T, u as b, aQ as F } from "./index-CUQrfsw_.js";
-import { b as L, d as W, f as v, c as N, e as x, g as P, a as C, h as z } from "./axis_util-DubwyOhW.js";
-import { S as U, a as B, b as V, c as j, d as G, e as H, f as k, g as q, h as Z, i as X, j as J, k as K, l as Q, m as Y, s as ee, n as te, o as ne, t as se } from "./selu_util-8vv5JxQV.js";
-import { c as re, v as oe, a as ae } from "./scatter_nd_util-CUPPNLaA.js";
+import { j as m, a3 as R, n as g, aN as $, aO as O, aP as _, l as M, ae as y, ax as D, aQ as T, u as b, aR as F } from "./index-DdmHGZjq.js";
+import { b as L, d as W, f as v, c as N, e as x, g as P, a as C, h as z } from "./axis_util-Did9235A.js";
+import { S as U, a as B, b as V, c as j, d as G, e as H, f as k, g as q, h as Z, i as X, j as J, k as K, l as Q, m as Y, s as ee, n as te, o as ne, t as se } from "./selu_util-BgUO9gHY.js";
+import { c as re, v as oe, a as ae } from "./scatter_nd_util-B7yDhiQr.js";
 function ie(e, n) {
   const r = e.shape.length, t = n.shape.length;
   if (r < 1)
@@ -24,7 +24,7 @@ function ie(e, n) {
   for (let i = o; i < r; ++i)
     h *= u[i], c.push(u[i]);
   const d = [
-    ...O(e.shape).map((i) => i / h),
+    ...R(e.shape).map((i) => i / h),
     1
   ].slice(0, o);
   return [c, a, h, d];
@@ -255,7 +255,7 @@ function Se(e, n, r) {
  * limitations under the License.
  * =============================================================================
  */
-const we = 0.3275911, Ae = 0.254829592, Oe = -0.284496736, Re = 1.421413741, Me = -1.453152027, _e = 1.061405429;
+const we = 0.3275911, Ae = 0.254829592, Re = -0.284496736, Oe = 1.421413741, _e = -1.453152027, Me = 1.061405429;
 /**
  * @license
  * Copyright 2018 Google LLC. All Rights Reserved.
@@ -593,21 +593,21 @@ const rt = /* @__PURE__ */ Object.freeze(/* @__PURE__ */ Object.defineProperty({
  */
 function ot(e) {
   try {
-    return e.map((n) => R(n));
+    return e.map((n) => O(n));
   } catch (n) {
     throw new Error(`Failed to decode encoded string bytes into utf-8, error: ${n}`);
   }
 }
 function at(e) {
-  return e.map((n) => M(n));
+  return e.map((n) => _(n));
 }
 const ht = /* @__PURE__ */ Object.freeze(/* @__PURE__ */ Object.defineProperty({
   __proto__: null,
   ERF_A1: Ae,
-  ERF_A2: Oe,
-  ERF_A3: Re,
-  ERF_A4: Me,
-  ERF_A5: _e,
+  ERF_A2: Re,
+  ERF_A3: Oe,
+  ERF_A4: _e,
+  ERF_A5: Me,
   ERF_P: we,
   PARALLELIZE_THRESHOLD: I,
   get RowPartitionType() {
@@ -616,7 +616,7 @@ const ht = /* @__PURE__ */ Object.freeze(/* @__PURE__ */ Object.defineProperty({
   SELU_SCALE: U,
   SELU_SCALEALPHA: B,
   applyActivation: V,
-  assertAndGetBroadcastShape: _,
+  assertAndGetBroadcastShape: M,
   assertAxesAreInnerMostDims: L,
   assertParamsConsistent: ue,
   assignToTypedArray: Le,
@@ -742,8 +742,8 @@ export {
   et as t,
   Ae as u,
   pe as v,
-  Oe as w,
-  Re as x,
-  Me as y,
-  _e as z
+  Re as w,
+  Oe as x,
+  _e as y,
+  Me as z
 };

package/dist/{broadcast_to-BYfCp5iL.js → broadcast_to-CUvOdOT5.js} RENAMED Viewed

@@ -1,5 +1,5 @@
-import { B as h, C as f, L as p, F as g, E as u, W as b } from "./index-CUQrfsw_.js";
-import { r as T } from "./reshape-DEfQGSin.js";
+import { C as h, D as f, M as p, H as g, E as u, X as b } from "./index-DdmHGZjq.js";
+import { r as T } from "./reshape-WeJkT3ja.js";
 /**
  * @license
  * Copyright 2020 Google LLC. All Rights Reserved.

package/dist/checks/appendCache.d.ts ADDED Viewed

@@ -0,0 +1 @@
+export declare function execute(backend: string): Promise<number | number[] | number[][] | number[][][] | number[][][][] | number[][][][][] | number[][][][][][]>;

package/dist/checks/appendCache.js ADDED Viewed

@@ -0,0 +1,22 @@
+import { s, e as a } from "../index-DdmHGZjq.js";
+import { t } from "../tensor4d-DLtk7Nxh.js";
+async function u(e) {
+  await s(e);
+  const n = t(
+    [
+      [
+        [
+          [0.1, 0.2, 0, 0],
+          [0.1, 0.2, 0, 0],
+          [0, 0, 0, 0],
+          [0, 0, 0, 0]
+        ]
+      ]
+    ],
+    [1, 1, 4, 4]
+  ), r = t([[[[0.1, 0.2, 0.3, 0.4]]]], [1, 1, 1, 4]);
+  return await a().runKernel("AppendCache", { cache: n, item: r }, { maxSize: 4, pastLen: 2 }).array();
+}
+export {
+  u as execute
+};

package/dist/checks/attentionMask.d.ts ADDED Viewed

@@ -0,0 +1 @@
+export declare function execute(backend: string): Promise<number | number[] | number[][] | number[][][] | number[][][][] | number[][][][][] | number[][][][][][]>;

package/dist/checks/attentionMask.js ADDED Viewed

@@ -0,0 +1,37 @@
+import { s as i, e } from "../index-DdmHGZjq.js";
+import { t } from "../tensor4d-DLtk7Nxh.js";
+import { t as a } from "../tensor2d-CObBWBkW.js";
+async function k(n) {
+  await i(n);
+  const s = t(
+    [
+      [
+        [
+          [0.1, 0.2, 0.3, 0.4],
+          [0.3, 0.4, 0.5, 0.6]
+        ]
+      ]
+    ],
+    [1, 1, 2, 4]
+  ), o = t(
+    [
+      [
+        [
+          [0.5, 0.6, 0.5, 0.6],
+          [0.7, 0.8, 0.7, 0.8]
+        ]
+      ]
+    ],
+    [1, 1, 2, 4]
+  ), r = a(
+    [
+      [0, -1 / 0, -1 / 0, -1 / 0],
+      [0, 0, 0, -1 / 0]
+    ],
+    [2, 4]
+  );
+  return await e().runKernel("AttentionMask", { q: s, k: o, mask: r }, { divisor: 0.5, pastLen: 0 }).array();
+}
+export {
+  k as execute
+};

package/dist/checks/check.d.ts ADDED Viewed

@@ -0,0 +1,9 @@
+interface Result {
+    backend: string;
+    result: unknown;
+    error?: string;
+    passed: boolean;
+    maxError?: number;
+}
+export default function runCheck(check: (backend: string) => Promise<unknown>, epsilon?: number): Promise<Result[]>;
+export {};

package/dist/checks/check.js ADDED Viewed

@@ -0,0 +1,20 @@
+import { arraysClose as l } from "../utilities/arrayClose.js";
+async function f(c, a) {
+  const n = ["cpu", "webgl", "webgpu"], t = [];
+  for (const e of n)
+    try {
+      const r = await c(e);
+      t.push({ backend: e, result: r, passed: !0 });
+    } catch (r) {
+      t.push({ backend: e, error: r.message, result: [], passed: !1 });
+    }
+  const s = await Promise.all(t), u = s[0].result;
+  for (let e = 1; e < s.length; e++) {
+    const r = s[e].result, o = l(u, r);
+    s[e].passed = o <= (a ?? 1e-6), s[e].maxError = o;
+  }
+  return s;
+}
+export {
+  f as default
+};

package/dist/checks/gelu.d.ts ADDED Viewed

@@ -0,0 +1 @@
+export declare function execute(backend: string): Promise<number | number[] | number[][] | number[][][] | number[][][][] | number[][][][][] | number[][][][][][]>;

package/dist/checks/gelu.js ADDED Viewed

@@ -0,0 +1,18 @@
+import { s as e, e as o } from "../index-DdmHGZjq.js";
+import { t as s } from "../tensor2d-CObBWBkW.js";
+async function m(t) {
+  await e(t);
+  const r = s(
+    [
+      [0.1, 0.2, 0, 0],
+      [0.1, 0.2, 0, 0],
+      [0, 0, 0, 0],
+      [0, 0, 0, 0]
+    ],
+    [4, 4]
+  );
+  return await o().runKernel("Gelu", { x: r }).array();
+}
+export {
+  m as execute
+};

package/dist/checks/index.d.ts ADDED Viewed

@@ -0,0 +1,22 @@
+import { execute as rope } from './rope';
+import { execute as normRMS } from './normRMS';
+import { execute as qkv } from './qkv';
+import { execute as gelu } from './gelu';
+import { execute as normRMSGrad } from './normRMSGrad';
+import { execute as appendCache } from './appendCache';
+import { execute as attentionMask } from './attentionMask';
+import { default as runCheck } from './check';
+import { createWeightStatistics, createTensorStatistics } from './weights';
+declare const checks: {
+    rope: typeof rope;
+    qkv: typeof qkv;
+    gelu: typeof gelu;
+    normRMS: typeof normRMS;
+    normRMSGrad: typeof normRMSGrad;
+    appendCache: typeof appendCache;
+    attentionMask: typeof attentionMask;
+    runCheck: typeof runCheck;
+    createLayerWeightStatistics: typeof createWeightStatistics;
+    createWeightStatistics: typeof createTensorStatistics;
+};
+export default checks;

package/dist/checks/index.js ADDED Viewed

@@ -0,0 +1,24 @@
+import { execute as e } from "./rope.js";
+import { execute as t } from "./normRMS.js";
+import { execute as r } from "./qkv.js";
+import { execute as c } from "./gelu.js";
+import { execute as o } from "./normRMSGrad.js";
+import { execute as a } from "./appendCache.js";
+import { execute as i } from "./attentionMask.js";
+import m from "./check.js";
+import { createTensorStatistics as s, createWeightStatistics as u } from "./weights.js";
+const d = {
+  rope: e,
+  qkv: r,
+  gelu: c,
+  normRMS: t,
+  normRMSGrad: o,
+  appendCache: a,
+  attentionMask: i,
+  runCheck: m,
+  createLayerWeightStatistics: u,
+  createWeightStatistics: s
+};
+export {
+  d as default
+};

package/dist/checks/normRMS.d.ts ADDED Viewed

@@ -0,0 +1 @@
+export declare function execute(backend: string): Promise<(number | number[] | number[][] | number[][][] | number[][][][] | number[][][][][] | number[][][][][][])[]>;

package/dist/checks/normRMS.js ADDED Viewed

@@ -0,0 +1,16 @@
+import { s as u, y as A, e as y } from "../index-DdmHGZjq.js";
+import { a as h } from "../ops-542ai2vG.js";
+import { t as p } from "../tensor1d-CtJq5BOv.js";
+import { t as a } from "../tensor-DbqgIV9B.js";
+const w = Array.from({ length: 2048 * 192 }, () => Math.random()), x = Array.from({ length: 192 }, () => Math.random()), M = Array.from({ length: 2048 * 192 }, () => Math.random());
+async function k(t) {
+  await u(t);
+  const o = p(x, "float32"), n = a(w, [16, 128, 192], "float32"), s = a(M, [16, 128, 192], "float32"), e = (d, g) => {
+    const i = y().runKernel("RMSNorm", { x: d, gamma: g });
+    return h.meanSquaredError(i, s);
+  }, { value: m, grads: r } = A(e)([n, o]), c = await m.array(), f = await r[0].array(), l = await r[1].array();
+  return [c, f, l];
+}
+export {
+  k as execute
+};

package/dist/checks/normRMSGrad.d.ts ADDED Viewed

@@ -0,0 +1 @@
+export declare function execute(backend: string): Promise<(number | number[] | number[][] | number[][][] | number[][][][] | number[][][][][] | number[][][][][][])[]>;

package/dist/checks/normRMSGrad.js ADDED Viewed

@@ -0,0 +1,12 @@
+import { s as c, e as d } from "../index-DdmHGZjq.js";
+import { t as f } from "../tensor1d-CtJq5BOv.js";
+import { t as r } from "../tensor-DbqgIV9B.js";
+const y = Array.from({ length: 2048 * 192 }, () => Math.random()), i = Array.from({ length: 192 }, () => Math.random()), l = Array.from({ length: 2048 * 192 }, () => Math.random());
+async function x(t) {
+  await c(t);
+  const o = f(i, "float32"), n = r(y, [16, 128, 192], "float32"), m = r(l, [16, 128, 192], "float32"), a = d().runKernel("RMSNormGrad", { x: n, gamma: o, dy: m }), s = await a[0].array(), e = await a[1].array();
+  return [s, e];
+}
+export {
+  x as execute
+};

package/dist/checks/qkv.d.ts ADDED Viewed

@@ -0,0 +1 @@
+export declare function execute(backend: string): Promise<(number | number[] | number[][] | number[][][] | number[][][][] | number[][][][][] | number[][][][][][])[]>;