npm - @genai-fi/nanogpt - Versions diffs - 0.6.1 → 0.6.2 - Mend

@genai-fi/nanogpt 0.6.1 → 0.6.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (115) hide show

package/dist/Generator.js +6 -6
package/dist/NanoGPTModel.js +9 -9
package/dist/{RealDiv-7xu-pkZN.js → RealDiv-BYViZwhN.js} +6 -6
package/dist/{Reshape-BYC1oUku.js → Reshape-t7Kcikjk.js} +2 -2
package/dist/TeachableLLM.js +5 -5
package/dist/{TiedEmbedding-C1HBot-5.js → TiedEmbedding-9WeDwvjO.js} +4 -4
package/dist/{axis_util-CCNL7jea.js → axis_util-Bu4h7XWV.js} +1 -1
package/dist/{broadcast_to-CddAF879.js → broadcast_to-DARN-DBD.js} +2 -2
package/dist/{concat-XOK9ANZu.js → concat-5aPGqw3Z.js} +8 -8
package/dist/{dataset-BFFipD1c.js → dataset-pgqp-YfL.js} +5 -5
package/dist/{dropout-xlKRoJyU.js → dropout-Bciw46HT.js} +10 -10
package/dist/{gather-DKtUaTtA.js → gather-DjyCjmOD.js} +1 -1
package/dist/{gpgpu_math-B_ycgZ4W.js → gpgpu_math-CNslybmD.js} +31 -31
package/dist/{index-CamYe_M8.js → index-BAzbokzv.js} +31 -31
package/dist/{kernel_funcs_utils-D5MS0JFg.js → kernel_funcs_utils-CUxJCg0g.js} +5 -5
package/dist/layers/BaseLayer.js +2 -2
package/dist/layers/CausalSelfAttention.js +6 -6
package/dist/layers/MLP.js +5 -5
package/dist/layers/RMSNorm.js +3 -3
package/dist/layers/RoPECache.js +4 -4
package/dist/layers/TiedEmbedding.js +5 -5
package/dist/layers/TransformerBlock.js +1 -1
package/dist/loader/load.d.ts +13 -0
package/dist/loader/load.js +27 -0
package/dist/loader/loadHF.d.ts +7 -0
package/dist/loader/loadHF.js +22 -0
package/dist/{utilities/load.d.ts → loader/loadTransformers.d.ts} +11 -11
package/dist/loader/loadTransformers.js +28 -0
package/dist/loader/newZipLoad.d.ts +8 -0
package/dist/loader/newZipLoad.js +21 -0
package/dist/loader/oldZipLoad.d.ts +7 -0
package/dist/loader/oldZipLoad.js +76 -0
package/dist/{log_sum_exp-CV_5-TTu.js → log_sum_exp-YEo2h3gb.js} +16 -16
package/dist/main.js +4 -4
package/dist/{mat_mul-CAbRFWUj.js → mat_mul-7121rsJk.js} +4 -4
package/dist/{max-JBBv7aUf.js → max-DtlIuVeW.js} +3 -3
package/dist/{mulmat_packed_gpu-DW4doKL_.js → mulmat_packed_gpu-D4nKF7Je.js} +1 -1
package/dist/{norm-B9dQTFYn.js → norm-CzltS9Fz.js} +10 -10
package/dist/{ones-CMHNqMr6.js → ones-BBlSRqn1.js} +2 -2
package/dist/ops/appendCache.js +3 -3
package/dist/ops/attentionMask.js +1 -1
package/dist/ops/cpu/appendCache.js +2 -2
package/dist/ops/cpu/attentionMask.js +6 -6
package/dist/ops/cpu/fusedSoftmax.js +2 -2
package/dist/ops/cpu/gatherSub.js +9 -9
package/dist/ops/cpu/gelu.js +1 -1
package/dist/ops/cpu/matMulGelu.js +1 -1
package/dist/ops/cpu/matMulMul.js +1 -1
package/dist/ops/cpu/mulDropout.js +1 -1
package/dist/ops/cpu/normRMS.js +1 -1
package/dist/ops/cpu/qkv.js +3 -3
package/dist/ops/cpu/rope.js +5 -5
package/dist/ops/cpu/scatterSub.js +14 -14
package/dist/ops/fusedSoftmax.js +1 -1
package/dist/ops/gatherSub.js +1 -1
package/dist/ops/gelu.js +1 -1
package/dist/ops/grads/attentionMask.js +1 -1
package/dist/ops/grads/fusedSoftmax.js +4 -4
package/dist/ops/grads/gelu.js +1 -1
package/dist/ops/grads/matMulGelu.js +1 -1
package/dist/ops/grads/normRMS.js +1 -1
package/dist/ops/grads/qkv.js +1 -1
package/dist/ops/grads/rope.js +1 -1
package/dist/ops/matMulGelu.js +1 -1
package/dist/ops/matMulMul.js +1 -1
package/dist/ops/mulDrop.js +1 -1
package/dist/ops/node/sparseCrossEntropy.js +1 -1
package/dist/ops/normRMS.js +1 -1
package/dist/ops/qkv.js +1 -1
package/dist/ops/rope.js +4 -4
package/dist/ops/scatterSub.js +1 -1
package/dist/ops/webgl/appendCache.js +1 -1
package/dist/ops/webgl/attentionMask.js +1 -1
package/dist/ops/webgl/fusedSoftmax.js +4 -4
package/dist/ops/webgl/gatherSub.js +1 -1
package/dist/ops/webgl/gelu.js +2 -2
package/dist/ops/webgl/log.js +3 -3
package/dist/ops/webgl/matMulGelu.js +17 -17
package/dist/ops/webgl/matMulMul.js +1 -1
package/dist/ops/webgl/mulDropout.js +1 -1
package/dist/ops/webgl/normRMS.js +2 -2
package/dist/ops/webgl/qkv.js +1 -1
package/dist/ops/webgl/rope.js +1 -1
package/dist/ops/webgl/scatterSub.js +1 -1
package/dist/{ops-DqtYemmV.js → ops-C0sQEcPw.js} +78 -78
package/dist/{random_width-CLMQG5Jn.js → random_width-DWzaOgrn.js} +22 -22
package/dist/{range-DqYjKnuG.js → range-DYsrnfiy.js} +1 -1
package/dist/{reciprocal-z49filta.js → reciprocal-CJQeasVa.js} +1 -1
package/dist/{register_all_kernels-COt6wLD0.js → register_all_kernels-BfFCQAqs.js} +28 -28
package/dist/{reshape-C45vIIRU.js → reshape-krWGKraP.js} +1 -1
package/dist/{scatter_nd_util-qgtnviTE.js → scatter_nd_util-93ln7Hut.js} +3 -3
package/dist/{selu_util-4QV_GXTB.js → selu_util-sntGesxr.js} +41 -41
package/dist/{shared-ByfrGA97.js → shared-Ca6iDobD.js} +6 -6
package/dist/{sin-9JBrfVaB.js → sin-D_h-qCSx.js} +1 -1
package/dist/{softmax-DvMvui-_.js → softmax-fsdtf6JC.js} +1 -1
package/dist/{split-DxrHrPFK.js → split-eiktj-6L.js} +4 -4
package/dist/{stack-DgaoDmnF.js → stack-dfEEz2OY.js} +2 -2
package/dist/{sum-BpcpxNEh.js → sum-BE_Irnim.js} +3 -3
package/dist/{tensor-CDz5x1mP.js → tensor-Xyi595sG.js} +1 -1
package/dist/{tensor2d-jO8JY5Jd.js → tensor2d-CPEkynbH.js} +1 -1
package/dist/training/AdamExt.js +1 -1
package/dist/training/DatasetBuilder.js +2 -2
package/dist/training/FullTrainer.js +1 -1
package/dist/training/Trainer.js +3 -3
package/dist/training/sparseCrossEntropy.js +5 -5
package/dist/utilities/dummy.js +2 -2
package/dist/utilities/generate.js +3 -3
package/dist/utilities/profile.js +1 -1
package/dist/utilities/safetensors.js +2 -2
package/dist/utilities/save.js +1 -1
package/dist/utilities/weights.js +2 -2
package/dist/{variable-CLVXjN7F.js → variable-wSS22xj5.js} +1 -1
package/dist/{zeros-DUkkVccu.js → zeros-YJDE7oRb.js} +10 -10
package/package.json +3 -3
package/dist/utilities/load.js +0 -99

package/dist/{selu_util-4QV_GXTB.js → selu_util-sntGesxr.js} RENAMED Viewed

@@ -1,6 +1,6 @@
-import { k as N, ao as H, q as _, w as S, E as L, ap as te, aq as ne, al as se, an as re, ar as ie, as as oe, at as le, b as ue, au as fe, av as O } from "./index-CamYe_M8.js";
-import { r as ce } from "./reshape-C45vIIRU.js";
-import { s as ae } from "./sum-BpcpxNEh.js";
+import { i as N, ao as H, o as _, q as S, E as L, ap as te, aq as ne, al as se, an as re, ar as ie, as as oe, at as le, a as ue, au as fe, av as O } from "./index-BAzbokzv.js";
+import { r as ce } from "./reshape-krWGKraP.js";
+import { s as ae } from "./sum-BE_Irnim.js";
 /**
  * @license
  * Copyright 2020 Google LLC. All Rights Reserved.
@@ -51,7 +51,7 @@ function X(e, t, n, s, r, u, i = !1, o = "channelsLast") {
     [c, g, a, p] = e;
   else
     throw new Error(`Unknown dataFormat ${o}`);
-  const [l, h, , d] = t, [A, m] = T(n), [b, M] = T(s), f = G(l, b), w = G(h, M), { padInfo: E, outHeight: I, outWidth: x } = de(r, a, p, A, m, f, w, u, o), y = i ? d * g : d;
+  const [l, h, , d] = t, [A, m] = T(n), [b, k] = T(s), f = G(l, b), E = G(h, k), { padInfo: w, outHeight: I, outWidth: x } = de(r, a, p, A, m, f, E, u, o), y = i ? d * g : d;
   let $;
   return o === "channelsFirst" ? $ = [c, y, I, x] : o === "channelsLast" && ($ = [c, I, x, y]), {
     batchSize: c,
@@ -62,15 +62,15 @@ function X(e, t, n, s, r, u, i = !1, o = "channelsLast") {
     outHeight: I,
     outWidth: x,
     outChannels: y,
-    padInfo: E,
+    padInfo: w,
     strideHeight: A,
     strideWidth: m,
     filterHeight: l,
     filterWidth: h,
     effectiveFilterHeight: f,
-    effectiveFilterWidth: w,
+    effectiveFilterWidth: E,
     dilationHeight: b,
-    dilationWidth: M,
+    dilationWidth: k,
     inShape: e,
     outShape: $,
     filterShape: t
@@ -84,22 +84,22 @@ function he(e, t, n, s, r, u = !1, i = "channelsLast", o) {
     [c, l, a, p, g] = e;
   else
     throw new Error(`Unknown dataFormat ${i}`);
-  const [h, d, A, , m] = t, [b, M, f] = W(n), [w, E, I] = W(s), x = G(h, w), y = G(d, E), $ = G(A, I), { padInfo: C, outDepth: k, outHeight: D, outWidth: F } = me(r, a, p, g, b, M, f, x, y, $, o), V = u ? m * l : m;
+  const [h, d, A, , m] = t, [b, k, f] = W(n), [E, w, I] = W(s), x = G(h, E), y = G(d, w), $ = G(A, I), { padInfo: C, outDepth: M, outHeight: D, outWidth: F } = me(r, a, p, g, b, k, f, x, y, $, o), V = u ? m * l : m;
   let U;
-  return i === "channelsFirst" ? U = [c, V, k, D, F] : i === "channelsLast" && (U = [c, k, D, F, V]), {
+  return i === "channelsFirst" ? U = [c, V, M, D, F] : i === "channelsLast" && (U = [c, M, D, F, V]), {
     batchSize: c,
     dataFormat: i,
     inDepth: a,
     inHeight: p,
     inWidth: g,
     inChannels: l,
-    outDepth: k,
+    outDepth: M,
     outHeight: D,
     outWidth: F,
     outChannels: V,
     padInfo: C,
     strideDepth: b,
-    strideHeight: M,
+    strideHeight: k,
     strideWidth: f,
     filterDepth: h,
     filterHeight: d,
@@ -107,8 +107,8 @@ function he(e, t, n, s, r, u = !1, i = "channelsLast", o) {
     effectiveFilterDepth: x,
     effectiveFilterHeight: y,
     effectiveFilterWidth: $,
-    dilationDepth: w,
-    dilationHeight: E,
+    dilationDepth: E,
+    dilationHeight: w,
     dilationWidth: I,
     inShape: e,
     outShape: U,
@@ -175,8 +175,8 @@ function me(e, t, n, s, r, u, i, o, c, a, p) {
     l = m[0], h = m[1], d = m[2];
   } else if (e === "same") {
     l = Math.ceil(t / r), h = Math.ceil(n / u), d = Math.ceil(s / i);
-    const A = (l - 1) * r + o - t, m = (h - 1) * u + c - n, b = (d - 1) * i + a - s, M = Math.floor(A / 2), f = A - M, w = Math.floor(m / 2), E = m - w, I = Math.floor(b / 2), x = b - I;
-    g = { top: w, bottom: E, left: I, right: x, front: M, back: f, type: "SAME" };
+    const A = (l - 1) * r + o - t, m = (h - 1) * u + c - n, b = (d - 1) * i + a - s, k = Math.floor(A / 2), f = A - k, E = Math.floor(m / 2), w = m - E, I = Math.floor(b / 2), x = b - I;
+    g = { top: E, bottom: w, left: I, right: x, front: k, back: f, type: "SAME" };
   } else
     throw Error(`Unknown padding parameter: ${e}`);
   return { padInfo: g, outDepth: l, outHeight: h, outWidth: d };
@@ -244,11 +244,11 @@ function Qe(e, t, n) {
  * limitations under the License.
  * =============================================================================
  */
-function we(e) {
+function Ee(e) {
   const n = { x: S(e, "x", "sigmoid", "float32") };
   return L.runKernel(te, n);
 }
-const Ee = /* @__PURE__ */ _({ sigmoid_: we });
+const we = /* @__PURE__ */ _({ sigmoid_: Ee });
 /**
  * @license
  * Copyright 2020 Google LLC. All Rights Reserved.
@@ -311,7 +311,7 @@ function ye(e, t) {
   const n = S(e, "x", "prelu"), s = S(t, "alpha", "prelu"), r = { x: n, alpha: s };
   return L.runKernel(re, r);
 }
-const ke = /* @__PURE__ */ _({ prelu_: ye });
+const Me = /* @__PURE__ */ _({ prelu_: ye });
 /**
  * @license
  * Copyright 2020 Google LLC. All Rights Reserved.
@@ -328,11 +328,11 @@ const ke = /* @__PURE__ */ _({ prelu_: ye });
  * limitations under the License.
  * =============================================================================
  */
-function Me(e) {
+function ke(e) {
   const n = { x: S(e, "x", "relu") };
   return L.runKernel(ie, n);
 }
-const Se = /* @__PURE__ */ _({ relu_: Me });
+const Se = /* @__PURE__ */ _({ relu_: ke });
 /**
  * @license
  * Copyright 2020 Google LLC. All Rights Reserved.
@@ -413,11 +413,11 @@ function ze(e, t, n, s) {
   if (t === "relu6")
     return Ne(e);
   if (t === "prelu")
-    return ke(e, n);
+    return Me(e, n);
   if (t === "leakyrelu")
     return xe(e, s);
   if (t === "sigmoid")
-    return Ee(e);
+    return we(e);
   throw new Error(`Unknown fused activation ${t}.`);
 }
 const et = (e, t) => !(e > 0) || t === "linear";
@@ -600,43 +600,43 @@ function We(e, t, n, s, r, u, i, o, c) {
   for (let f = 0; f < e.length; ++f) {
     if (l.strides[f] === 0)
       throw Error(`strides[${f}] must be non-zero`);
-    const w = !!(l.shrinkAxisMask & 1 << f), E = e[f];
-    if (E === -1) {
-      m.push(w ? 1 : -1);
+    const E = !!(l.shrinkAxisMask & 1 << f), w = e[f];
+    if (w === -1) {
+      m.push(E ? 1 : -1);
       continue;
     }
     const I = [l.beginMask & 1 << f, l.endMask & 1 << f], x = [
       l.strides[f] > 0 ? 0 : -1,
-      l.strides[f] > 0 ? E : E - 1
+      l.strides[f] > 0 ? w : w - 1
     ];
-    if (w && l.strides[f] <= 0)
+    if (E && l.strides[f] <= 0)
       throw Error("only stride 1 allowed on non-range indexing.");
     A = A && l.strides[f] === 1;
     const y = !!(l.beginMask & 1 << f && l.endMask & 1 << f);
     if (l.beginValid && l.endValid) {
-      if (w) {
-        const D = l.begin[f] < 0 ? E + l.begin[f] : l.begin[f];
-        if (l.begin[f] = D, l.end[f] = l.begin[f] + 1, D < 0 || D >= E)
+      if (E) {
+        const D = l.begin[f] < 0 ? w + l.begin[f] : l.begin[f];
+        if (l.begin[f] = D, l.end[f] = l.begin[f] + 1, D < 0 || D >= w)
           throw Error(`slice index ${l.begin[f]} of dimension ${f} out of bounds.`);
       } else
-        l.begin[f] = K(l.begin[f], 0, l.strides[f], E, I, x), l.end[f] = K(l.end[f], 1, l.strides[f], E, I, x);
-      const k = l.strides[f] === 1 && l.begin[f] === 0 && l.end[f] === E;
-      h = h && k, d = d && (f === 0 && l.strides[f] === 1 || k);
+        l.begin[f] = K(l.begin[f], 0, l.strides[f], w, I, x), l.end[f] = K(l.end[f], 1, l.strides[f], w, I, x);
+      const M = l.strides[f] === 1 && l.begin[f] === 0 && l.end[f] === w;
+      h = h && M, d = d && (f === 0 && l.strides[f] === 1 || M);
     } else
       h = h && l.strides[f] === 1 && y, d = d && (f === 0 && l.strides[f] === 1 || y);
     let $, C = !1;
-    if (l.beginValid && l.endValid ? ($ = l.end[f] - l.begin[f], C = !0) : w ? ($ = 1, C = !0) : y && E >= 0 && (l.strides[f] < 0 ? $ = -E : $ = E, C = !0), C) {
-      let k;
-      $ === 0 || $ < 0 != l.strides[f] < 0 ? k = 0 : k = Math.trunc($ / l.strides[f]) + ($ % l.strides[f] !== 0 ? 1 : 0), m.push(k);
+    if (l.beginValid && l.endValid ? ($ = l.end[f] - l.begin[f], C = !0) : E ? ($ = 1, C = !0) : y && w >= 0 && (l.strides[f] < 0 ? $ = -w : $ = w, C = !0), C) {
+      let M;
+      $ === 0 || $ < 0 != l.strides[f] < 0 ? M = 0 : M = Math.trunc($ / l.strides[f]) + ($ % l.strides[f] !== 0 ? 1 : 0), m.push(M);
     } else
       m.push(-1);
   }
   for (let f = 0; f < l.finalShapeGatherIndices.length; ++f) {
-    const w = l.finalShapeGatherIndices[f];
-    w >= 0 ? b.push(m[w]) : w === v && b.push(1);
+    const E = l.finalShapeGatherIndices[f];
+    E >= 0 ? b.push(m[E]) : E === v && b.push(1);
   }
   return {
-    finalShapeSparse: b.filter((f, w) => l.finalShapeGatherIndices[w] !== v),
+    finalShapeSparse: b.filter((f, E) => l.finalShapeGatherIndices[E] !== v),
     finalShape: b,
     isIdentity: h,
     sliceDim0: d,
@@ -706,7 +706,7 @@ const tt = /* @__PURE__ */ Object.freeze(/* @__PURE__ */ Object.defineProperty({
  */
 const nt = 1.7580993408473768, st = 1.0507009873554805;
 export {
-  ke as A,
+  Me as A,
   Ne as B,
   We as C,
   Re as D,
@@ -733,7 +733,7 @@ export {
   P as t,
   Ve as u,
   Le as v,
-  Ee as w,
+  we as w,
   $e as x,
   Se as y,
   xe as z

package/dist/{shared-ByfrGA97.js → shared-Ca6iDobD.js} RENAMED Viewed

@@ -1,9 +1,9 @@
-import { k as qt, bc as _e, i as A, j as Ut, W as K, bd as et, aH as ht, be as gt, bf as at, _ as Ve, $ as st, ak as De, a$ as We, bg as $e, bh as ze, bi as Be, bj as Mt, ah as H, bk as Ot, bl as D, bm as Lt, bn as At, a8 as _t, bo as Vt, ag as Dt, bp as Wt, aT as $t, aU as zt, aW as Bt, aX as Gt, a9 as jt, bq as Zt, a_ as Ht, br as Kt, aY as Ge, am as je, bs as Xt, b2 as Ze, bt as He, p as Yt, u as Ke, t as Xe, bu as Jt, bv as wt, ap as Qt, aO as Ye, bw as te, bx as ee, by as ne, aG as pt, bz as se, bA as ot } from "./index-CamYe_M8.js";
-import { h as it, m as kt, k as Je, l as Qe, R as tn, v as en, n as nn, o as sn, p as on, q as rn, r as an, s as ln, t as cn, w as un, x as hn, y as fn, z as Nt, A as gn, B as dn, C as mn } from "./gpgpu_math-B_ycgZ4W.js";
-import { g as pn, a as In, e as wn, c as bn } from "./axis_util-CCNL7jea.js";
-import { b as xn } from "./broadcast_to-CddAF879.js";
-import { r as En } from "./reshape-C45vIIRU.js";
-import { p as Fn, q as yn, r as kn, u as Nn } from "./selu_util-4QV_GXTB.js";
+import { i as qt, bc as _e, g as A, h as Ut, W as K, bd as et, aH as ht, be as gt, bf as at, _ as Ve, $ as st, ak as De, a$ as We, bg as $e, bh as ze, bi as Be, bj as Mt, ah as H, bk as Ot, bl as D, bm as Lt, bn as At, a8 as _t, bo as Vt, ag as Dt, bp as Wt, aT as $t, aU as zt, aW as Bt, aX as Gt, a9 as jt, bq as Zt, a_ as Ht, br as Kt, aY as Ge, am as je, bs as Xt, b2 as Ze, bt as He, p as Yt, u as Ke, t as Xe, bu as Jt, bv as wt, ap as Qt, aO as Ye, bw as te, bx as ee, by as ne, aG as pt, bz as se, bA as ot } from "./index-BAzbokzv.js";
+import { h as it, m as kt, k as Je, l as Qe, R as tn, v as en, n as nn, o as sn, p as on, q as rn, r as an, s as ln, t as cn, w as un, x as hn, y as fn, z as Nt, A as gn, B as dn, C as mn } from "./gpgpu_math-CNslybmD.js";
+import { g as pn, a as In, e as wn, c as bn } from "./axis_util-Bu4h7XWV.js";
+import { b as xn } from "./broadcast_to-DARN-DBD.js";
+import { r as En } from "./reshape-krWGKraP.js";
+import { p as Fn, q as yn, r as kn, u as Nn } from "./selu_util-sntGesxr.js";
 import { g as Sn } from "./_commonjsHelpers-ByX85dGu.js";
 function vn(e, t) {
   for (var n = 0; n < t.length; n++) {

package/dist/{sin-9JBrfVaB.js → sin-D_h-qCSx.js} RENAMED Viewed

@@ -1,4 +1,4 @@
-import { q as o, w as t, E as c, a0 as a, a1 as e } from "./index-CamYe_M8.js";
+import { o, q as t, E as c, a0 as a, a1 as e } from "./index-BAzbokzv.js";
 /**
  * @license
  * Copyright 2018 Google LLC. All Rights Reserved.

package/dist/{softmax-DvMvui-_.js → softmax-fsdtf6JC.js} RENAMED Viewed

@@ -1,4 +1,4 @@
-import { q as r, w as f, E as e, S as i } from "./index-CamYe_M8.js";
+import { o as r, q as f, E as e, S as i } from "./index-BAzbokzv.js";
 /**
  * @license
  * Copyright 2018 Google LLC. All Rights Reserved.

package/dist/{split-DxrHrPFK.js → split-eiktj-6L.js} RENAMED Viewed

@@ -1,4 +1,4 @@
-import { q as p, w as i, E as a, H as c } from "./index-CamYe_M8.js";
+import { o as p, q as i, E as a, F as c } from "./index-BAzbokzv.js";
 /**
  * @license
  * Copyright 2020 Google LLC. All Rights Reserved.
@@ -15,9 +15,9 @@ import { q as p, w as i, E as a, H as c } from "./index-CamYe_M8.js";
  * limitations under the License.
  * =============================================================================
  */
-function e(t, s, n = 0) {
-  const o = { x: i(t, "x", "split") }, r = { numOrSizeSplits: s, axis: n };
-  return a.runKernel(c, o, r);
+function e(t, s, o = 0) {
+  const n = { x: i(t, "x", "split") }, r = { numOrSizeSplits: s, axis: o };
+  return a.runKernel(c, n, r);
 }
 const u = /* @__PURE__ */ p({ split_: e });
 export {

package/dist/{stack-DgaoDmnF.js → stack-dfEEz2OY.js} RENAMED Viewed

@@ -1,4 +1,4 @@
-import { q as e, x as c, k as n, E as k, P as i } from "./index-CamYe_M8.js";
+import { o as e, w as c, i as n, E as i, P as k } from "./index-BAzbokzv.js";
 /**
  * @license
  * Copyright 2020 Google LLC. All Rights Reserved.
@@ -19,7 +19,7 @@ function u(r, t = 0) {
   const s = c(r, "tensors", "stack", "string_or_numeric");
   n(s.length >= 1, () => "Pass at least one tensor to tf.stack"), s.length > 0 && n(t <= s[0].rank, () => "Axis must be <= rank of the tensor");
   const o = s, a = { axis: t };
-  return k.runKernel(i, o, a);
+  return i.runKernel(k, o, a);
 }
 const l = /* @__PURE__ */ e({ stack_: u });
 export {

package/dist/{sum-BpcpxNEh.js → sum-BE_Irnim.js} RENAMED Viewed

@@ -1,4 +1,4 @@
-import { q as e, w as u, N as c, E as l, O as m } from "./index-CamYe_M8.js";
+import { o as e, q as u, L as c, E as l, N as m } from "./index-BAzbokzv.js";
 /**
  * @license
  * Copyright 2018 Google LLC. All Rights Reserved.
@@ -15,10 +15,10 @@ import { q as e, w as u, N as c, E as l, O as m } from "./index-CamYe_M8.js";
  * limitations under the License.
  * =============================================================================
  */
-function i(t, n = null, o = !1) {
+function i(t, o = null, n = !1) {
   let s = u(t, "x", "sum");
   s.dtype === "bool" && (s = c(s, "int32"));
-  const r = { x: s }, a = { axis: n, keepDims: o };
+  const r = { x: s }, a = { axis: o, keepDims: n };
   return l.runKernel(m, r, a);
 }
 const f = /* @__PURE__ */ e({ sum_: i });

package/dist/{tensor-CDz5x1mP.js → tensor-Xyi595sG.js} RENAMED Viewed

@@ -1,4 +1,4 @@
-import { Q as t, U as a } from "./index-CamYe_M8.js";
+import { O as t, Q as a } from "./index-BAzbokzv.js";
 /**
  * @license
  * Copyright 2018 Google LLC. All Rights Reserved.

package/dist/{tensor2d-jO8JY5Jd.js → tensor2d-CPEkynbH.js} RENAMED Viewed

@@ -1,4 +1,4 @@
-import { V as t, Q as s, U as a } from "./index-CamYe_M8.js";
+import { V as t, O as s, Q as a } from "./index-BAzbokzv.js";
 /**
  * @license
  * Copyright 2018 Google LLC. All Rights Reserved.

package/dist/training/AdamExt.js CHANGED Viewed

@@ -1,4 +1,4 @@
-import { A as r, b as c, f as h, s as g, e as o } from "../index-CamYe_M8.js";
+import { A as r, a as c, s as h, b as g, e as o } from "../index-BAzbokzv.js";
 class u extends r {
   constructor(t, e, s, a, i) {
     super(t, e, s, a), this.config = i, this.startLearningRate = t;

package/dist/training/DatasetBuilder.js CHANGED Viewed

@@ -1,5 +1,5 @@
-import { t as u } from "../index-CamYe_M8.js";
-import { d as z, i as f } from "../dataset-BFFipD1c.js";
+import { t as u } from "../index-BAzbokzv.js";
+import { d as z, i as f } from "../dataset-pgqp-YfL.js";
 import "../index-Tf7vU29b.js";
 /**
  * @license

package/dist/training/FullTrainer.js CHANGED Viewed

@@ -1,7 +1,7 @@
 import { generateText as T } from "../utilities/generate.js";
 import L from "./Trainer.js";
 import x from "./Evaluator.js";
-import { a as h } from "../index-CamYe_M8.js";
+import { d as h } from "../index-BAzbokzv.js";
 import y from "../utilities/profile.js";
 const D = {
   desiredLoss: 0.01,

package/dist/training/Trainer.js CHANGED Viewed

@@ -1,8 +1,8 @@
 import { DatasetBuilder as g, flattenTokens as m, PAGE_FACTOR as u } from "./DatasetBuilder.js";
 import f from "./AdamExt.js";
-import { t as y, v as z, a as c } from "../index-CamYe_M8.js";
-import { n as S } from "../norm-B9dQTFYn.js";
-import { z as p } from "../zeros-DUkkVccu.js";
+import { t as y, v as z, d as c } from "../index-BAzbokzv.js";
+import { n as S } from "../norm-CzltS9Fz.js";
+import { z as p } from "../zeros-YJDE7oRb.js";
 class R {
   constructor(t, e, s = 1e-3) {
     this.tokenizer = e, this.model = t, this.learningRate = s, this.resetOptimizer(), this.datasetBuilder = new g(e, t.config.gpt.blockSize);

package/dist/training/sparseCrossEntropy.js CHANGED Viewed

@@ -1,9 +1,9 @@
 import { gatherSub as L } from "../ops/gatherSub.js";
 import { scatterSub as y } from "../ops/scatterSub.js";
-import { e as u, c as i, z as S, t as f, s as G } from "../index-CamYe_M8.js";
-import { s as v } from "../softmax-DvMvui-_.js";
-import { m as z } from "../max-JBBv7aUf.js";
-import { l as k } from "../log_sum_exp-CV_5-TTu.js";
+import { e as u, l as i, z as S, t as f, b as G } from "../index-BAzbokzv.js";
+import { s as v } from "../softmax-fsdtf6JC.js";
+import { m as z } from "../max-DtlIuVeW.js";
+import { l as k } from "../log_sum_exp-YEo2h3gb.js";
 function F(a, s) {
   return f(() => {
     const e = a.shape[a.shape.length - 1], o = a.shape.slice(0, -1).reduce((d, c) => d * c, 1), p = a.shape.length > 2 ? a.reshape([o, e]) : a, n = s.shape.length > 1 ? s.reshape([o]).cast("int32") : s.cast("int32"), t = z(p, -1, !0), r = G(p, t), h = k(r, -1);
@@ -23,7 +23,7 @@ function j() {
     (s, e, m) => {
       const o = s.shape[s.shape.length - 1], n = s.shape.slice(0, -1).reduce((d, c) => d * c, 1), t = s.reshape([n, o]), r = e.reshape([n]).cast("int32"), h = F(t, r);
       return m([t, r]), t.dispose(), r.dispose(), { value: h, gradFunc: (d, c) => f(() => {
-        const l = c[0], b = c[1], x = v(l), C = y(x, b, d), E = S(e);
+        const g = c[0], b = c[1], x = v(g), C = y(x, b, d), E = S(e);
         return [C.reshape(s.shape), E];
       }) };
     }

package/dist/utilities/dummy.js CHANGED Viewed

@@ -1,5 +1,5 @@
-import { m as f, v as S, e as w } from "../index-CamYe_M8.js";
-import { z as i } from "../zeros-DUkkVccu.js";
+import { m as f, v as S, e as w } from "../index-BAzbokzv.js";
+import { z as i } from "../zeros-YJDE7oRb.js";
 async function P(s) {
   const t = i([1, s.config.gpt.blockSize], "int32"), [e, n] = s.forward({ training: !1 }, t);
   await e.data(), e.dispose(), n && n.dispose(), t.dispose();

package/dist/utilities/generate.js CHANGED Viewed

@@ -1,6 +1,6 @@
-import { t as y } from "../index-CamYe_M8.js";
-import { t as x } from "../tensor2d-jO8JY5Jd.js";
-import { c as f } from "../concat-XOK9ANZu.js";
+import { t as y } from "../index-BAzbokzv.js";
+import { t as x } from "../tensor2d-CPEkynbH.js";
+import { c as f } from "../concat-5aPGqw3Z.js";
 async function A(o, r, a, c, T) {
   if (c <= 0)
     throw new Error("Length must be a positive integer");

package/dist/utilities/profile.js CHANGED Viewed

@@ -1,4 +1,4 @@
-import { m as a } from "../index-CamYe_M8.js";
+import { m as a } from "../index-BAzbokzv.js";
 const m = 1024 * 1024;
 class l {
   log = /* @__PURE__ */ new Map();

package/dist/utilities/safetensors.js CHANGED Viewed

@@ -1,5 +1,5 @@
-import "../index-CamYe_M8.js";
-import { t as y } from "../tensor-CDz5x1mP.js";
+import "../index-BAzbokzv.js";
+import { t as y } from "../tensor-Xyi595sG.js";
 function l(t) {
   if (t === "float32") return "F32";
   if (t === "int32") return "I32";

package/dist/utilities/save.js CHANGED Viewed

@@ -1,7 +1,7 @@
 import { j as p } from "../jszip.min-CjP2V1VV.js";
 import b from "../tokeniser/CharTokeniser.js";
 import { save_safetensors as l } from "./safetensors.js";
-import { VERSION as y } from "./load.js";
+import { VERSION as y } from "../loader/load.js";
 async function N(e, a, n) {
   const f = n?.includeLog ?? !0, s = /* @__PURE__ */ new Map();
   e.saveWeights(s);

package/dist/utilities/weights.js CHANGED Viewed

@@ -1,5 +1,5 @@
-import "../index-CamYe_M8.js";
-import { t as p } from "../tensor-CDz5x1mP.js";
+import "../index-BAzbokzv.js";
+import { t as p } from "../tensor-Xyi595sG.js";
 function h(n) {
   const e = n.reduce((s, o) => s + o.length, 0), a = new Float32Array(e);
   let t = 0;

package/dist/{variable-CLVXjN7F.js → variable-wSS22xj5.js} RENAMED Viewed

@@ -1,4 +1,4 @@
-import { E as i } from "./index-CamYe_M8.js";
+import { E as i } from "./index-BAzbokzv.js";
 /**
  * @license
  * Copyright 2018 Google LLC. All Rights Reserved.

package/dist/{zeros-DUkkVccu.js → zeros-YJDE7oRb.js} RENAMED Viewed

@@ -1,4 +1,4 @@
-import { q as m, w as r, Z as l, E as c, _ as i, y as p, $ as u, i as f } from "./index-CamYe_M8.js";
+import { o as m, q as r, Z as l, E as c, _ as i, x as p, $ as u, g as x } from "./index-BAzbokzv.js";
 /**
  * @license
  * Copyright 2020 Google LLC. All Rights Reserved.
@@ -15,13 +15,13 @@ import { q as m, w as r, Z as l, E as c, _ as i, y as p, $ as u, i as f } from "
  * limitations under the License.
  * =============================================================================
  */
-function x(a, e) {
-  const s = r(a, "real", "complex"), o = r(e, "imag", "complex");
-  l(s.shape, o.shape, `real and imag shapes, ${s.shape} and ${o.shape}, must match in call to tf.complex().`);
-  const n = { real: s, imag: o };
+function f(a, e) {
+  const o = r(a, "real", "complex"), s = r(e, "imag", "complex");
+  l(o.shape, s.shape, `real and imag shapes, ${o.shape} and ${s.shape}, must match in call to tf.complex().`);
+  const n = { real: o, imag: s };
   return c.runKernel(i, n);
 }
-const g = /* @__PURE__ */ m({ complex_: x });
+const g = /* @__PURE__ */ m({ complex_: f });
 /**
  * @license
  * Copyright 2018 Google LLC. All Rights Reserved.
@@ -40,11 +40,11 @@ const g = /* @__PURE__ */ m({ complex_: x });
  */
 function t(a, e = "float32") {
   if (p(a), e === "complex64") {
-    const o = t(a, "float32"), n = t(a, "float32");
-    return g(o, n);
+    const s = t(a, "float32"), n = t(a, "float32");
+    return g(s, n);
   }
-  const s = u(f(a), e);
-  return c.makeTensor(s, a, e);
+  const o = u(x(a), e);
+  return c.makeTensor(o, a, e);
 }
 export {
   g as c,

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
     "name": "@genai-fi/nanogpt",
-    "version": "0.6.1",
+    "version": "0.6.2",
     "type": "module",
     "main": "dist/main.js",
     "types": "dist/main.d.ts",
@@ -49,10 +49,10 @@
     },
     "dependencies": {
         "@dsnp/parquetjs": "^1.8.7",
+        "@tensorflow/tfjs": "^4.22.0",
         "eventemitter3": "^5.0.1",
         "jszip": "^3.10.1",
         "papaparse": "^5.5.3",
-        "pdfjs-dist": "^5.4.149",
-        "@tensorflow/tfjs": "^4.22.0"
+        "pdfjs-dist": "^5.4.149"
     }
 }

package/dist/utilities/load.js DELETED Viewed

@@ -1,99 +0,0 @@
-import { j as v } from "../jszip.min-CjP2V1VV.js";
-import { importWeights as F } from "./weights.js";
-import h from "../tokeniser/CharTokeniser.js";
-import b from "../NanoGPTModel.js";
-import { dummyPassAsync as u } from "./dummy.js";
-import { d as k } from "../index-CamYe_M8.js";
-import j from "../tokeniser/bpe.js";
-import { load_safetensors as N } from "./safetensors.js";
-const I = 2;
-async function O(t) {
-  const s = await fetch(t);
-  if (!s.ok)
-    throw new Error(`Failed to fetch ${t}: ${s.statusText}`);
-  return s.arrayBuffer();
-}
-async function S(t) {
-  const s = /* @__PURE__ */ new Map(), r = await t.file("manifest.json")?.async("string");
-  if (!r)
-    throw new Error("Manifest file not found in the zip archive");
-  const p = JSON.parse(r);
-  for (const [o, a] of Object.entries(p.weightSpec))
-    s.set(o, { spec: a, data: new Float32Array() });
-  const e = await t.file("tokeniser.json")?.async("string");
-  if (!e)
-    throw new Error("Tokeniser file not found in the zip archive");
-  const i = JSON.parse(e), c = (i.type ?? "char") === "char" ? new h(i.vocab) : new j(i.vocab, i.merges), d = /* @__PURE__ */ new Map();
-  for (const o of Object.keys(t.files))
-    if (o.endsWith(".bin")) {
-      const a = o.replace(".bin", ""), w = await t.file(o).async("arraybuffer"), g = new Float32Array(w), l = s.get(a) || { spec: [], data: new Float32Array() };
-      l.data = g, s.set(a, l);
-      const n = await F(l);
-      d.set(a, n);
-    }
-  k();
-  const f = new b(p.config);
-  await u(f), f.loadWeights(d);
-  const m = await t.file("log.json")?.async("string");
-  if (m)
-    try {
-      const o = JSON.parse(m);
-      f.log = o;
-    } catch (o) {
-      throw console.error("Error parsing training log:", o), new Error(`Failed to parse training log: ${o}`);
-    }
-  return { model: f, tokeniser: c };
-}
-async function R(t) {
-  const s = typeof t == "string" ? await O(t) : t, r = await v.loadAsync(s);
-  if (r.file("manifest.json"))
-    return S(r);
-  {
-    const p = await r.file("config.json")?.async("string");
-    if (!p)
-      throw new Error("Config file not found in the zip archive");
-    const e = JSON.parse(p), i = {
-      vocabSize: e.vocab_size,
-      blockSize: e.block_size,
-      nLayer: e.num_hidden_layers,
-      nHead: e.num_attention_heads,
-      nEmbed: e.hidden_size,
-      dropout: e.dropout,
-      biasInLinear: e.biasInLinear,
-      biasInLayerNorm: e.biasInLayerNorm,
-      mlpFactor: e.mlpFactor,
-      useRope: e.useRope
-    }, y = await r.file("tokeniser.json")?.async("string");
-    if (!y)
-      throw new Error("Tokeniser file not found in the zip archive");
-    const c = JSON.parse(y), f = (c.type ?? "char") === "char" ? new h(c.vocab) : new j(c.vocab, c.merges), m = await N(await r.file("model.safetensors").async("arraybuffer")), o = /* @__PURE__ */ new Map();
-    for (const [n, E] of Object.entries(m))
-      o.set(n, [E]);
-    k();
-    const a = new b(i);
-    await u(a), a.loadWeights(o);
-    const w = await r.file("meta.json")?.async("string");
-    let g;
-    if (w)
-      try {
-        const n = JSON.parse(w);
-        n.name && (g = n.name);
-      } catch (n) {
-        console.error("Error parsing meta file:", n);
-      }
-    const l = await r.file("log.json")?.async("string");
-    if (l)
-      try {
-        const n = JSON.parse(l);
-        a.log = n;
-      } catch (n) {
-        throw console.error("Error parsing training log:", n), new Error(`Failed to parse training log: ${n}`);
-      }
-    return { model: a, tokeniser: f, name: g };
-  }
-}
-export {
-  I as VERSION,
-  R as loadModel,
-  S as loadOldModel
-};