@genai-fi/nanogpt 0.8.5 → 0.9.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/Generator.d.ts +4 -1
- package/dist/Generator.js +144 -124
- package/dist/{RealDiv-D_q39E3A.js → RealDiv-D4EzDsC0.js} +7 -7
- package/dist/{Reshape-Bh_jzKzV.js → Reshape-Bowtk9BP.js} +2 -2
- package/dist/{Reshape-41YpQqEo.js → Reshape-DUqYftGC.js} +1 -1
- package/dist/TeachableLLM.js +5 -5
- package/dist/Trainer.d.ts +1 -0
- package/dist/Trainer.js +3 -0
- package/dist/{axis_util-Did9235A.js → axis_util-TbGYJ208.js} +1 -1
- package/dist/backend.js +2 -2
- package/dist/{backend_util-yC3YH1jo.js → backend_util-CJIiDoV1.js} +4 -4
- package/dist/{broadcast_to-CUvOdOT5.js → broadcast_to-DzlNweb8.js} +2 -2
- package/dist/checks/appendCache.js +2 -2
- package/dist/checks/attentionMask.js +3 -3
- package/dist/checks/gelu.js +2 -2
- package/dist/checks/matMulGelu.js +5 -5
- package/dist/checks/normRMS.js +4 -4
- package/dist/checks/normRMSGrad.js +3 -3
- package/dist/checks/qkv.js +2 -2
- package/dist/checks/rope.js +2 -2
- package/dist/{concat-pHiVqR3L.js → concat-B912vBbo.js} +1 -1
- package/dist/{dataset-DPPl-iLT.js → dataset-DlZtKmBq.js} +3 -3
- package/dist/{dropout-CcKSfOYE.js → dropout-C-csYCLj.js} +6 -6
- package/dist/{exports_initializers-DKk7-bsx.js → exports_initializers-B8iZMgQ0.js} +1 -1
- package/dist/{gather-CPg6ZlQA.js → gather-Dnpgw-YQ.js} +1 -1
- package/dist/{gelu-BkcmEEyD.js → gelu-Bp_-935b.js} +1 -1
- package/dist/{gpgpu_math-D_ODOLix.js → gpgpu_math-CDaYiyE_.js} +2 -2
- package/dist/{index-DdmHGZjq.js → index-BzFyqcy-.js} +13 -13
- package/dist/{index-evZ57wr4.js → index-C1rx_Ajs.js} +10 -10
- package/dist/{kernel_funcs_utils-CDfFpUab.js → kernel_funcs_utils-DKLK0Mg3.js} +3 -3
- package/dist/layers/BaseLayer.js +2 -2
- package/dist/layers/CausalSelfAttention.js +6 -6
- package/dist/layers/MLP.js +5 -5
- package/dist/layers/PositionEmbedding.js +5 -5
- package/dist/layers/RMSNorm.js +3 -3
- package/dist/layers/RoPECache.js +4 -4
- package/dist/layers/TiedEmbedding.js +5 -5
- package/dist/layers/TransformerBlock.js +1 -1
- package/dist/loader/loadTransformers.js +1 -1
- package/dist/loader/oldZipLoad.js +5 -5
- package/dist/{log_sum_exp-C8yFJfZz.js → log_sum_exp-DO6z8tSE.js} +9 -9
- package/dist/main.d.ts +1 -0
- package/dist/main.js +18 -16
- package/dist/{mat_mul-Dpy2mMRu.js → mat_mul-DzjTFx-u.js} +1 -1
- package/dist/{mod-CbibJi3D.js → mod-Dobti4j4.js} +1 -1
- package/dist/models/NanoGPTV1.d.ts +1 -0
- package/dist/models/NanoGPTV1.js +12 -9
- package/dist/models/model.d.ts +1 -0
- package/dist/models/model.js +5 -5
- package/dist/{mulmat_packed_gpu-q_Gmwyld.js → mulmat_packed_gpu-BT60jmzP.js} +1 -1
- package/dist/{ones-BAqVh-eA.js → ones-tIJeHlq-.js} +2 -2
- package/dist/ops/adamAdjust.js +1 -1
- package/dist/ops/adamMoments.js +1 -1
- package/dist/ops/appendCache.js +3 -3
- package/dist/ops/attentionMask.js +1 -1
- package/dist/ops/cpu/adamAdjust.js +1 -1
- package/dist/ops/cpu/adamMoments.js +2 -2
- package/dist/ops/cpu/appendCache.js +2 -2
- package/dist/ops/cpu/attentionMask.js +5 -5
- package/dist/ops/cpu/fusedSoftmax.js +2 -2
- package/dist/ops/cpu/gatherSub.js +5 -5
- package/dist/ops/cpu/gelu.js +1 -1
- package/dist/ops/cpu/matMulGelu.js +2 -2
- package/dist/ops/cpu/matMulMul.js +1 -1
- package/dist/ops/cpu/mulDropout.js +1 -1
- package/dist/ops/cpu/normRMS.js +1 -1
- package/dist/ops/cpu/qkv.js +3 -3
- package/dist/ops/cpu/rope.js +5 -5
- package/dist/ops/cpu/scatterSub.js +13 -13
- package/dist/ops/fusedSoftmax.js +1 -1
- package/dist/ops/gatherSub.js +1 -1
- package/dist/ops/gelu.js +2 -2
- package/dist/ops/grads/attentionMask.js +1 -1
- package/dist/ops/grads/fusedSoftmax.js +2 -2
- package/dist/ops/grads/gelu.js +2 -2
- package/dist/ops/grads/matMulGelu.js +1 -1
- package/dist/ops/grads/normRMS.js +1 -1
- package/dist/ops/grads/qkv.js +1 -1
- package/dist/ops/grads/rope.js +1 -1
- package/dist/ops/matMulGelu.js +1 -1
- package/dist/ops/matMulMul.js +1 -1
- package/dist/ops/mulDrop.js +1 -1
- package/dist/ops/normRMS.js +1 -1
- package/dist/ops/qkv.js +1 -1
- package/dist/ops/rope.js +4 -4
- package/dist/ops/scatterSub.js +1 -1
- package/dist/ops/webgl/adamAdjust.js +2 -2
- package/dist/ops/webgl/adamMoments.js +1 -1
- package/dist/ops/webgl/appendCache.js +1 -1
- package/dist/ops/webgl/attentionMask.js +1 -1
- package/dist/ops/webgl/fusedSoftmax.js +4 -4
- package/dist/ops/webgl/gatherSub.js +1 -1
- package/dist/ops/webgl/gelu.js +2 -2
- package/dist/ops/webgl/log.js +3 -3
- package/dist/ops/webgl/matMulGelu.js +4 -4
- package/dist/ops/webgl/matMulMul.js +1 -1
- package/dist/ops/webgl/mulDropout.js +1 -1
- package/dist/ops/webgl/normRMS.js +2 -2
- package/dist/ops/webgl/qkv.js +1 -1
- package/dist/ops/webgl/rope.js +1 -1
- package/dist/ops/webgl/scatterSub.js +1 -1
- package/dist/ops/webgpu/adamAdjust.js +3 -3
- package/dist/ops/webgpu/adamMoments.js +3 -3
- package/dist/ops/webgpu/appendCache.js +3 -3
- package/dist/ops/webgpu/attentionMask.js +3 -3
- package/dist/ops/webgpu/gatherSub.js +3 -3
- package/dist/ops/webgpu/gelu.js +37 -35
- package/dist/ops/webgpu/normRMS.js +2 -2
- package/dist/ops/webgpu/normRMSGrad.js +5 -5
- package/dist/ops/webgpu/qkv.js +3 -3
- package/dist/ops/webgpu/rope.js +3 -3
- package/dist/ops/webgpu/scatterSub.js +3 -3
- package/dist/ops/webgpu/utils/reductions.js +4 -4
- package/dist/{ops-542ai2vG.js → ops-LuCMAnmM.js} +65 -65
- package/dist/{random_width-DKGeiFuR.js → random_width-CXVRloNK.js} +23 -23
- package/dist/{range-BcUvLuf5.js → range-CWcz7xFA.js} +3 -3
- package/dist/{reciprocal-DhDWSKiD.js → reciprocal-C4rNcM-S.js} +1 -1
- package/dist/{register_all_kernels-Do9VvZmo.js → register_all_kernels-DIGpEwcf.js} +31 -31
- package/dist/{relu-B1AXs7p5.js → relu-BjCh_SYb.js} +1 -1
- package/dist/{reshape-WeJkT3ja.js → reshape-CnIwVG1c.js} +1 -1
- package/dist/{scatter_nd_util-B7yDhiQr.js → scatter_nd_util-BQdz--Gn.js} +1 -1
- package/dist/{selu_util-BgUO9gHY.js → selu_util-OtRzVwW5.js} +23 -23
- package/dist/{shared-V6D_md-c.js → shared-DmRsFyaJ.js} +6 -6
- package/dist/{shared-CZiWmQCI.js → shared-DuP7ue-R.js} +1 -1
- package/dist/{sin-CPxad7Am.js → sin-gpDNRxE0.js} +1 -1
- package/dist/{slice-B7jXtPnp.js → slice-d0Vo9XTN.js} +1 -1
- package/dist/{softmax-BfsyI4As.js → softmax-D7Jj3p_P.js} +1 -1
- package/dist/{split-BPxr8_8m.js → split-DK2k5eHf.js} +1 -1
- package/dist/{stack-BNwLzE43.js → stack-DFatutCx.js} +1 -1
- package/dist/{sum-ByFINZgi.js → sum-CJ0ULhmt.js} +1 -1
- package/dist/{tensor-DbqgIV9B.js → tensor-CZr4dh61.js} +1 -1
- package/dist/{tensor1d-CtJq5BOv.js → tensor1d-vML0r3q6.js} +1 -1
- package/dist/{tensor2d-CObBWBkW.js → tensor2d-D76QGjF3.js} +1 -1
- package/dist/{tensor4d-DLtk7Nxh.js → tensor4d-Df1WlVDY.js} +1 -1
- package/dist/training/Adam.js +2 -2
- package/dist/training/AdamExt.js +1 -1
- package/dist/training/DatasetBuilder.js +2 -2
- package/dist/training/FullTrainer.js +1 -1
- package/dist/training/Trainer.js +2 -2
- package/dist/training/sparseCrossEntropy.js +3 -3
- package/dist/utilities/dummy.js +2 -2
- package/dist/utilities/multinomialCPU.js +2 -2
- package/dist/utilities/performance.js +1 -1
- package/dist/utilities/profile.js +1 -1
- package/dist/utilities/safetensors.js +2 -2
- package/dist/utilities/topP.d.ts +1 -0
- package/dist/utilities/topP.js +13 -0
- package/dist/utilities/weights.js +2 -2
- package/dist/{variable-DPFOJyRG.js → variable-Bm2OFwGI.js} +1 -1
- package/dist/{webgpu_program-Dhk9R5aG.js → webgpu_program-DkQJOJSd.js} +1 -1
- package/dist/{webgpu_util-BqGnZg8t.js → webgpu_util-pLEV9tks.js} +1 -1
- package/dist/{zeros-Dnwix0p4.js → zeros-Bj5rMYA7.js} +1 -1
- package/package.json +1 -1
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
import {
|
|
1
|
+
import { E as l, F as h, G as m, ao as p, M as c, ap as f, af as g, n as u, T as V, o as v, q as N, a as w } from "./index-BzFyqcy-.js";
|
|
2
2
|
import { s as d } from "./index-C4L8Cm77.js";
|
|
3
3
|
/**
|
|
4
4
|
* @license
|
|
@@ -106,7 +106,7 @@ function $(r, t = 0, e = 1, s, n) {
|
|
|
106
106
|
a.values[i] = o.nextValue();
|
|
107
107
|
return a.toTensor();
|
|
108
108
|
}
|
|
109
|
-
const
|
|
109
|
+
const U = /* @__PURE__ */ l({ randomNormal_: $ });
|
|
110
110
|
/**
|
|
111
111
|
* @license
|
|
112
112
|
* Copyright 2020 Google LLC. All Rights Reserved.
|
|
@@ -176,18 +176,18 @@ function E(r, t) {
|
|
|
176
176
|
* limitations under the License.
|
|
177
177
|
* =============================================================================
|
|
178
178
|
*/
|
|
179
|
-
function
|
|
179
|
+
function F(r, t, e, s) {
|
|
180
180
|
const n = h(r, "x", "dropout");
|
|
181
181
|
if (u(n.dtype === "float32", () => `x has to be a floating point tensor since it's going to be scaled, but got a ${n.dtype} tensor instead.`), u(t >= 0 && t < 1, () => `rate must be a float in the range [0, 1), but got ${t}.`), t === 0)
|
|
182
182
|
return r instanceof V ? n.clone() : n;
|
|
183
183
|
const o = E(n, e), a = 1 - t, i = v(b(N(D(o, 0, 1, "float32", s), a)), a);
|
|
184
184
|
return w(n, i);
|
|
185
185
|
}
|
|
186
|
-
const
|
|
186
|
+
const _ = /* @__PURE__ */ l({ dropout_: F });
|
|
187
187
|
export {
|
|
188
188
|
T as M,
|
|
189
189
|
D as a,
|
|
190
|
-
|
|
190
|
+
_ as d,
|
|
191
191
|
b as f,
|
|
192
|
-
|
|
192
|
+
U as r
|
|
193
193
|
};
|
|
@@ -1,6 +1,6 @@
|
|
|
1
|
-
import { aD as z, ag as v, aE as oe, aF as ie, aG as ae, n as F, aH as me, aI as J, a3 as B, aJ as I, af as T, j as E, aK as H, aL as $e, aM as Y, ae as Te } from "./index-
|
|
1
|
+
import { aD as z, ag as v, aE as oe, aF as ie, aG as ae, n as F, aH as me, aI as J, a3 as B, aJ as I, af as T, j as E, aK as H, aL as $e, aM as Y, ae as Te } from "./index-BzFyqcy-.js";
|
|
2
2
|
import "./index-Tf7vU29b.js";
|
|
3
|
-
import { b as Se } from "./backend_util-
|
|
3
|
+
import { b as Se } from "./backend_util-CJIiDoV1.js";
|
|
4
4
|
/**
|
|
5
5
|
* @license
|
|
6
6
|
* Copyright 2018 Google LLC. All Rights Reserved.
|
|
@@ -4160,18 +4160,18 @@ function Bs() {
|
|
|
4160
4160
|
Bs();
|
|
4161
4161
|
export {
|
|
4162
4162
|
ho as $,
|
|
4163
|
-
|
|
4164
|
-
|
|
4165
|
-
|
|
4166
|
-
|
|
4167
|
-
|
|
4168
|
-
|
|
4169
|
-
|
|
4170
|
-
|
|
4171
|
-
|
|
4172
|
-
|
|
4173
|
-
|
|
4174
|
-
|
|
4163
|
+
C as A,
|
|
4164
|
+
Ps as B,
|
|
4165
|
+
Tn as C,
|
|
4166
|
+
vn as D,
|
|
4167
|
+
F as E,
|
|
4168
|
+
T as F,
|
|
4169
|
+
f as G,
|
|
4170
|
+
ta as H,
|
|
4171
|
+
An as I,
|
|
4172
|
+
Jn as J,
|
|
4173
|
+
Sr as K,
|
|
4174
|
+
bi as L,
|
|
4175
4175
|
Ct as M,
|
|
4176
4176
|
Ue as N,
|
|
4177
4177
|
H as O,
|
|
@@ -4453,5 +4453,5 @@ export {
|
|
|
4453
4453
|
nt as w,
|
|
4454
4454
|
Qt as x,
|
|
4455
4455
|
wi as y,
|
|
4456
|
-
|
|
4456
|
+
Si as z
|
|
4457
4457
|
};
|
|
@@ -1,14 +1,14 @@
|
|
|
1
|
-
import { ag as U, d4 as Jt, d5 as es, e as We, n as L, d6 as _e, j as $, aO as Ge, ap as de, d7 as st, d8 as ts, d9 as ss, aP as os, bn as Ct, a3 as Re, da as is, db as rs, dc as as, bv as ns, l as Z, cg as us, dd as ot, az as ds, aa as ls, u as ge, bm as cs, co as hs, cp as ps, bt as fs, cq as ms, bc as gs, af as ze, p as se, aB as xs, bJ as Cs, bK as ws, bL as bs, cr as ys, cs as Ss, ct as vs, cv as Is, cu as ks, cw as Rs, ah as Ps, b5 as Ds, bM as Ns, bN as $s, cx as zs, cy as As, U as Fs, $ as Ls, bP as Bs, aS as Es, de as Ts, b7 as Ws, b8 as _s, bq as Vs, br as Us, bw as Ms, bR as Os, cA as Gs, a$ as Hs,
|
|
2
|
-
import { m as hr, c as pr, P as He, t as B, g as y, a as J, b as q, d as Pe, e as fr, f as mr } from "./webgpu_program-
|
|
3
|
-
import { i as wt, G as it, a as gr, c as S, f as I, M as j, b as bt, d as yt, e as St } from "./webgpu_util-
|
|
4
|
-
import { m as rt, E as xr, u as Cr, w as wr, x as br, y as yr, z as Sr, f as at, A as vt, B as It, C as kt, D as vr, F as Ir, G as xe, H as kr, I as Rr, J as Pr, K as Dr, L as Nr, M as $r, N as zr, O as Ar, P as Fr, Q as Lr, S as Br } from "./backend_util-
|
|
5
|
-
import { S as Er, a as Tr, h as be, i as Ae, p as Wr, q as _r, j as ye, d as ee, e as Xe, g as Ke, k as Rt, A as Vr, B as Ur } from "./selu_util-
|
|
6
|
-
import { r as R, a as Mr } from "./Reshape-
|
|
7
|
-
import { s as Or } from "./shared-
|
|
8
|
-
import { c as qe, g as Se, a as ve, b as Ye, e as Gr, h as Pt } from "./axis_util-
|
|
9
|
-
import { z as Hr } from "./zeros-
|
|
1
|
+
import { ag as U, d4 as Jt, d5 as es, e as We, n as L, d6 as _e, j as $, aO as Ge, ap as de, d7 as st, d8 as ts, d9 as ss, aP as os, bn as Ct, a3 as Re, da as is, db as rs, dc as as, bv as ns, l as Z, cg as us, dd as ot, az as ds, aa as ls, u as ge, bm as cs, co as hs, cp as ps, bt as fs, cq as ms, bc as gs, af as ze, p as se, aB as xs, bJ as Cs, bK as ws, bL as bs, cr as ys, cs as Ss, ct as vs, cv as Is, cu as ks, cw as Rs, ah as Ps, b5 as Ds, bM as Ns, bN as $s, cx as zs, cy as As, U as Fs, $ as Ls, bP as Bs, aS as Es, de as Ts, b7 as Ws, b8 as _s, bq as Vs, br as Us, bw as Ms, bR as Os, cA as Gs, a$ as Hs, K as Xs, bS as Ks, cc as qs, bT as Ys, bU as Qs, cB as js, bV as Zs, ac as Js, bW as eo, bd as to, bX as so, bY as oo, bZ as io, df as ro, b_ as ao, ce as no, cf as uo, dg as lo, cC as co, cD as ho, cE as po, dh as fo, bB as mo, a1 as go, aU as xo, as as Co, cF as wo, bx as bo, b$ as yo, ai as So, aY as vo, by as Io, di as ko, be as Ro, ao as Po, bz as Do, dj as No, bQ as $o, cd as zo, dk as Ao, a8 as Fo, H as Lo, aZ as Bo, a_ as Eo, dl as To, cG as Wo, cH as _o, cI as Vo, at as Uo, b0 as Mo, b1 as Oo, dm as Go, aj as Ho, b2 as Xo, b4 as Ko, c1 as qo, dn as Yo, cL as Qo, cK as jo, bA as Zo, c2 as Jo, c3 as ei, cM as ti, cN as si, dp as oi, aV as ii, b6 as ri, cO as ai, Y as ni, S as ui, a6 as di, b3 as li, bg as ci, bh as hi, c4 as pi, cW as fi, c5 as mi, P as gi, a4 as xi, c6 as Ci, cP as wi, au as bi, bC as yi, R as Si, aC as vi, Z as Ii, _ as ki, av as Ri, bj as Pi, cQ as Di, bk as Ni, cR as $i, c8 as zi, bf as Ai, b9 as Fi, bD as Li, a7 as Bi, dq as Ei, aT as Ti, c9 as Wi, ar as _i, cS as Vi, ad as Ui, ca as Mi, c0 as Oi, c7 as Gi, dr as Hi, ds as Xi, X as Ki, dt as qi, ab as Yi, W as Qi, bF as ji, cT as Zi, ba as Ji, aw as er, du as tr, dv as sr, bH as or, cU as ir, bO as rr, dw as ar, dx as nr, bl as ur, bb as dr, cb as lr, f as cr } from "./index-BzFyqcy-.js";
|
|
2
|
+
import { m as hr, c as pr, P as He, t as B, g as y, a as J, b as q, d as Pe, e as fr, f as mr } from "./webgpu_program-DkQJOJSd.js";
|
|
3
|
+
import { i as wt, G as it, a as gr, c as S, f as I, M as j, b as bt, d as yt, e as St } from "./webgpu_util-pLEV9tks.js";
|
|
4
|
+
import { m as rt, E as xr, u as Cr, w as wr, x as br, y as yr, z as Sr, f as at, A as vt, B as It, C as kt, D as vr, F as Ir, G as xe, H as kr, I as Rr, J as Pr, K as Dr, L as Nr, M as $r, N as zr, O as Ar, P as Fr, Q as Lr, S as Br } from "./backend_util-CJIiDoV1.js";
|
|
5
|
+
import { S as Er, a as Tr, h as be, i as Ae, p as Wr, q as _r, j as ye, d as ee, e as Xe, g as Ke, k as Rt, A as Vr, B as Ur } from "./selu_util-OtRzVwW5.js";
|
|
6
|
+
import { r as R, a as Mr } from "./Reshape-DUqYftGC.js";
|
|
7
|
+
import { s as Or } from "./shared-DmRsFyaJ.js";
|
|
8
|
+
import { c as qe, g as Se, a as ve, b as Ye, e as Gr, h as Pt } from "./axis_util-TbGYJ208.js";
|
|
9
|
+
import { z as Hr } from "./zeros-Bj5rMYA7.js";
|
|
10
10
|
import { n as Xr, a as Kr } from "./non_max_suppression_impl-CsEgBuMA.js";
|
|
11
|
-
import { c as Qe } from "./scatter_nd_util-
|
|
11
|
+
import { c as Qe } from "./scatter_nd_util-BQdz--Gn.js";
|
|
12
12
|
/**
|
|
13
13
|
* @license
|
|
14
14
|
* Copyright 2019 Google LLC. All Rights Reserved.
|
|
@@ -1,6 +1,6 @@
|
|
|
1
|
-
import { l as B, j as G, az as K, aa as z, at as W, aA as V, ag as N, au as F, u as S } from "./index-
|
|
2
|
-
import { u as O, f as Y } from "./gpgpu_math-
|
|
3
|
-
import { f as v } from "./backend_util-
|
|
1
|
+
import { l as B, j as G, az as K, aa as z, at as W, aA as V, ag as N, au as F, u as S } from "./index-BzFyqcy-.js";
|
|
2
|
+
import { u as O, f as Y } from "./gpgpu_math-CDaYiyE_.js";
|
|
3
|
+
import { f as v } from "./backend_util-CJIiDoV1.js";
|
|
4
4
|
/**
|
|
5
5
|
* @license
|
|
6
6
|
* Copyright 2018 Google LLC. All Rights Reserved.
|
package/dist/layers/BaseLayer.js
CHANGED
|
@@ -1,5 +1,5 @@
|
|
|
1
|
-
import { T as p,
|
|
2
|
-
import { v as _ } from "../variable-
|
|
1
|
+
import { T as p, z as g, e as o, L as v } from "../index-BzFyqcy-.js";
|
|
2
|
+
import { v as _ } from "../variable-Bm2OFwGI.js";
|
|
3
3
|
class T {
|
|
4
4
|
parent;
|
|
5
5
|
config;
|
|
@@ -3,13 +3,13 @@ import O from "./BaseLayer.js";
|
|
|
3
3
|
import { qkv as _ } from "../ops/qkv.js";
|
|
4
4
|
import { rope as v } from "../ops/rope.js";
|
|
5
5
|
import { appendCache as V } from "../ops/appendCache.js";
|
|
6
|
-
import { k as c, t as P } from "../index-
|
|
6
|
+
import { k as c, t as P } from "../index-BzFyqcy-.js";
|
|
7
7
|
import { fusedSoftmax as b } from "../ops/fusedSoftmax.js";
|
|
8
|
-
import { d as C } from "../random_width-
|
|
9
|
-
import { v as k } from "../variable-
|
|
10
|
-
import { r as T, d as L } from "../dropout-
|
|
11
|
-
import { r as j } from "../reshape-
|
|
12
|
-
import { m as x } from "../mat_mul-
|
|
8
|
+
import { d as C } from "../random_width-CXVRloNK.js";
|
|
9
|
+
import { v as k } from "../variable-Bm2OFwGI.js";
|
|
10
|
+
import { r as T, d as L } from "../dropout-C-csYCLj.js";
|
|
11
|
+
import { r as j } from "../reshape-CnIwVG1c.js";
|
|
12
|
+
import { m as x } from "../mat_mul-DzjTFx-u.js";
|
|
13
13
|
class W extends O {
|
|
14
14
|
divisor;
|
|
15
15
|
index;
|
package/dist/layers/MLP.js
CHANGED
|
@@ -1,10 +1,10 @@
|
|
|
1
|
-
import { t as p } from "../index-
|
|
1
|
+
import { t as p } from "../index-BzFyqcy-.js";
|
|
2
2
|
import u from "./BaseLayer.js";
|
|
3
3
|
import { matMulGelu as M } from "../ops/matMulGelu.js";
|
|
4
|
-
import { v as a } from "../variable-
|
|
5
|
-
import { r as d, d as c } from "../dropout-
|
|
6
|
-
import { r as h } from "../reshape-
|
|
7
|
-
import { m as b } from "../mat_mul-
|
|
4
|
+
import { v as a } from "../variable-Bm2OFwGI.js";
|
|
5
|
+
import { r as d, d as c } from "../dropout-C-csYCLj.js";
|
|
6
|
+
import { r as h } from "../reshape-CnIwVG1c.js";
|
|
7
|
+
import { m as b } from "../mat_mul-DzjTFx-u.js";
|
|
8
8
|
class H extends u {
|
|
9
9
|
index;
|
|
10
10
|
hiddenUnits;
|
|
@@ -1,9 +1,9 @@
|
|
|
1
|
-
import { t as c, a9 as u, b as i } from "../index-
|
|
1
|
+
import { t as c, a9 as u, b as i } from "../index-BzFyqcy-.js";
|
|
2
2
|
import f from "./BaseLayer.js";
|
|
3
|
-
import { E as g, D as h } from "../random_width-
|
|
4
|
-
import { r as b } from "../exports_initializers-
|
|
5
|
-
import { m as l } from "../mod-
|
|
6
|
-
import { r as w } from "../range-
|
|
3
|
+
import { E as g, D as h } from "../random_width-CXVRloNK.js";
|
|
4
|
+
import { r as b } from "../exports_initializers-B8iZMgQ0.js";
|
|
5
|
+
import { m as l } from "../mod-Dobti4j4.js";
|
|
6
|
+
import { r as w } from "../range-CWcz7xFA.js";
|
|
7
7
|
/**
|
|
8
8
|
* @license
|
|
9
9
|
* Copyright 2018 Google LLC
|
package/dist/layers/RMSNorm.js
CHANGED
|
@@ -1,8 +1,8 @@
|
|
|
1
|
-
import { t as s } from "../index-
|
|
1
|
+
import { t as s } from "../index-BzFyqcy-.js";
|
|
2
2
|
import e from "./BaseLayer.js";
|
|
3
3
|
import { normRMS as a } from "../ops/normRMS.js";
|
|
4
|
-
import { v as i } from "../variable-
|
|
5
|
-
import { o as m } from "../ones-
|
|
4
|
+
import { v as i } from "../variable-Bm2OFwGI.js";
|
|
5
|
+
import { o as m } from "../ones-tIJeHlq-.js";
|
|
6
6
|
class l extends e {
|
|
7
7
|
GAMMA;
|
|
8
8
|
constructor(r, t = "", o) {
|
package/dist/layers/RoPECache.js
CHANGED
|
@@ -1,7 +1,7 @@
|
|
|
1
|
-
import { b as t, x as h, t as n, k as p } from "../index-
|
|
2
|
-
import { r as c } from "../reciprocal-
|
|
3
|
-
import { c as f, s as m } from "../sin-
|
|
4
|
-
import { r as a } from "../range-
|
|
1
|
+
import { b as t, x as h, t as n, k as p } from "../index-BzFyqcy-.js";
|
|
2
|
+
import { r as c } from "../reciprocal-C4rNcM-S.js";
|
|
3
|
+
import { c as f, s as m } from "../sin-gpDNRxE0.js";
|
|
4
|
+
import { r as a } from "../range-CWcz7xFA.js";
|
|
5
5
|
class D {
|
|
6
6
|
constructor(o) {
|
|
7
7
|
this.config = o;
|
|
@@ -1,9 +1,9 @@
|
|
|
1
|
-
import { d as r } from "../random_width-
|
|
2
|
-
import "../index-
|
|
3
|
-
import { r as a } from "../exports_initializers-
|
|
1
|
+
import { d as r } from "../random_width-CXVRloNK.js";
|
|
2
|
+
import "../index-BzFyqcy-.js";
|
|
3
|
+
import { r as a } from "../exports_initializers-B8iZMgQ0.js";
|
|
4
4
|
import s from "./BaseLayer.js";
|
|
5
|
-
import { v as o } from "../variable-
|
|
6
|
-
import { g as m } from "../gather-
|
|
5
|
+
import { v as o } from "../variable-Bm2OFwGI.js";
|
|
6
|
+
import { g as m } from "../gather-Dnpgw-YQ.js";
|
|
7
7
|
class S extends s {
|
|
8
8
|
vocabSize;
|
|
9
9
|
embedDim;
|
|
@@ -2,7 +2,7 @@ import l from "./CausalSelfAttention.js";
|
|
|
2
2
|
import p from "./MLP.js";
|
|
3
3
|
import o from "./RMSNorm.js";
|
|
4
4
|
import m from "./BaseLayer.js";
|
|
5
|
-
import { k as n, t as h } from "../index-
|
|
5
|
+
import { k as n, t as h } from "../index-BzFyqcy-.js";
|
|
6
6
|
class k extends m {
|
|
7
7
|
ln1;
|
|
8
8
|
attn;
|
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
import l from "../tokeniser/CharTokeniser.js";
|
|
2
2
|
import c from "../tokeniser/bpe.js";
|
|
3
3
|
import { load_safetensors as b } from "../utilities/safetensors.js";
|
|
4
|
-
import { a2 as y } from "../index-
|
|
4
|
+
import { a2 as y } from "../index-BzFyqcy-.js";
|
|
5
5
|
import { dummyPassAsync as u } from "../utilities/dummy.js";
|
|
6
6
|
import _ from "../models/factory.js";
|
|
7
7
|
async function L(e, a, r, t) {
|
|
@@ -1,14 +1,14 @@
|
|
|
1
|
-
import { a2 as y } from "../index-
|
|
1
|
+
import { a2 as y } from "../index-BzFyqcy-.js";
|
|
2
2
|
import "../ops/cpu/attentionMask.js";
|
|
3
3
|
import "../ops/webgl/attentionMask.js";
|
|
4
4
|
import "../ops/grads/attentionMask.js";
|
|
5
5
|
import "../ops/cpu/qkv.js";
|
|
6
6
|
import "../ops/webgl/qkv.js";
|
|
7
7
|
import "../ops/grads/qkv.js";
|
|
8
|
-
import "../random_width-
|
|
9
|
-
import "../register_all_kernels-
|
|
8
|
+
import "../random_width-CXVRloNK.js";
|
|
9
|
+
import "../register_all_kernels-DIGpEwcf.js";
|
|
10
10
|
import "../index-Tf7vU29b.js";
|
|
11
|
-
import "../dataset-
|
|
11
|
+
import "../dataset-DlZtKmBq.js";
|
|
12
12
|
import "../ops/cpu/rope.js";
|
|
13
13
|
import "../ops/webgl/rope.js";
|
|
14
14
|
import "../ops/grads/rope.js";
|
|
@@ -41,7 +41,7 @@ import "../ops/webgl/adamMoments.js";
|
|
|
41
41
|
import "../papaparse.min-C8l2Kvo1.js";
|
|
42
42
|
import "../ops/cpu/gelu.js";
|
|
43
43
|
import "../ops/webgl/gelu.js";
|
|
44
|
-
import "../gelu-
|
|
44
|
+
import "../gelu-Bp_-935b.js";
|
|
45
45
|
import "../ops/webgl/log.js";
|
|
46
46
|
import "../checks/normRMS.js";
|
|
47
47
|
import "../checks/normRMSGrad.js";
|
|
@@ -1,7 +1,7 @@
|
|
|
1
|
-
import {
|
|
2
|
-
import { e as _ } from "./axis_util-
|
|
3
|
-
import { r as m } from "./reshape-
|
|
4
|
-
import { s as T } from "./sum-
|
|
1
|
+
import { E as r, F as x, G as p, ah as h, ai as E, aj as $, p as d, c as S, q as K } from "./index-BzFyqcy-.js";
|
|
2
|
+
import { e as _ } from "./axis_util-TbGYJ208.js";
|
|
3
|
+
import { r as m } from "./reshape-CnIwVG1c.js";
|
|
4
|
+
import { s as T } from "./sum-CJ0ULhmt.js";
|
|
5
5
|
/**
|
|
6
6
|
* @license
|
|
7
7
|
* Copyright 2020 Google LLC. All Rights Reserved.
|
|
@@ -22,7 +22,7 @@ function b(s, o = null, n = !1) {
|
|
|
22
22
|
const t = { x: x(s, "x", "max") }, e = { reductionIndices: o, keepDims: n };
|
|
23
23
|
return p.runKernel(h, t, e);
|
|
24
24
|
}
|
|
25
|
-
const
|
|
25
|
+
const G = /* @__PURE__ */ r({ max_: b });
|
|
26
26
|
/**
|
|
27
27
|
* @license
|
|
28
28
|
* Copyright 2018 Google LLC. All Rights Reserved.
|
|
@@ -82,7 +82,7 @@ const j = /* @__PURE__ */ r({ log_: N });
|
|
|
82
82
|
* =============================================================================
|
|
83
83
|
*/
|
|
84
84
|
function q(s, o = null, n = !1) {
|
|
85
|
-
const a = x(s, "x", "logSumExp"), t = d(o, a.shape), e =
|
|
85
|
+
const a = x(s, "x", "logSumExp"), t = d(o, a.shape), e = G(
|
|
86
86
|
a,
|
|
87
87
|
t,
|
|
88
88
|
!0
|
|
@@ -94,10 +94,10 @@ function q(s, o = null, n = !1) {
|
|
|
94
94
|
}
|
|
95
95
|
return c;
|
|
96
96
|
}
|
|
97
|
-
const
|
|
97
|
+
const F = /* @__PURE__ */ r({ logSumExp_: q });
|
|
98
98
|
export {
|
|
99
99
|
j as a,
|
|
100
100
|
M as e,
|
|
101
|
-
|
|
102
|
-
|
|
101
|
+
F as l,
|
|
102
|
+
G as m
|
|
103
103
|
};
|
package/dist/main.d.ts
CHANGED
|
@@ -16,6 +16,7 @@ export type { ITokeniser } from './tokeniser/type';
|
|
|
16
16
|
export type { TrainingProgress, TrainingLogEntry } from './training/Trainer';
|
|
17
17
|
export type { GPTConfig } from './models/config';
|
|
18
18
|
export { estimateParameterCount, estimateMemoryUsage, estimateTrainingMemoryUsage, estimateResources, validateConfig, } from './utilities/parameters';
|
|
19
|
+
export { default as topP } from './utilities/topP';
|
|
19
20
|
export { selectBackend } from './backend';
|
|
20
21
|
export { default as performanceTest } from './utilities/performance';
|
|
21
22
|
export declare const layers: {
|
package/dist/main.js
CHANGED
|
@@ -6,8 +6,9 @@ import { default as to } from "./utilities/waitForModel.js";
|
|
|
6
6
|
import { default as eo } from "./data/textLoader.js";
|
|
7
7
|
import { default as io } from "./Generator.js";
|
|
8
8
|
import { default as fo } from "./models/model.js";
|
|
9
|
-
import { estimateMemoryUsage as lo, estimateParameterCount as xo, estimateResources as
|
|
10
|
-
import "./
|
|
9
|
+
import { estimateMemoryUsage as lo, estimateParameterCount as xo, estimateResources as uo, estimateTrainingMemoryUsage as no, validateConfig as co } from "./utilities/parameters.js";
|
|
10
|
+
import { default as ko } from "./utilities/topP.js";
|
|
11
|
+
import "./index-BzFyqcy-.js";
|
|
11
12
|
import "./ops/cpu/scatterSub.js";
|
|
12
13
|
import "./ops/webgl/scatterSub.js";
|
|
13
14
|
import "./ops/cpu/gatherSub.js";
|
|
@@ -18,10 +19,10 @@ import "./ops/grads/attentionMask.js";
|
|
|
18
19
|
import "./ops/cpu/qkv.js";
|
|
19
20
|
import "./ops/webgl/qkv.js";
|
|
20
21
|
import "./ops/grads/qkv.js";
|
|
21
|
-
import "./random_width-
|
|
22
|
-
import "./register_all_kernels-
|
|
22
|
+
import "./random_width-CXVRloNK.js";
|
|
23
|
+
import "./register_all_kernels-DIGpEwcf.js";
|
|
23
24
|
import "./index-Tf7vU29b.js";
|
|
24
|
-
import "./dataset-
|
|
25
|
+
import "./dataset-DlZtKmBq.js";
|
|
25
26
|
import "./ops/cpu/rope.js";
|
|
26
27
|
import "./ops/webgl/rope.js";
|
|
27
28
|
import "./ops/grads/rope.js";
|
|
@@ -35,7 +36,7 @@ import "./ops/webgl/matMulGelu.js";
|
|
|
35
36
|
import "./ops/grads/matMulGelu.js";
|
|
36
37
|
import "./ops/cpu/gelu.js";
|
|
37
38
|
import "./ops/webgl/gelu.js";
|
|
38
|
-
import "./gelu-
|
|
39
|
+
import "./gelu-Bp_-935b.js";
|
|
39
40
|
import "./ops/cpu/normRMS.js";
|
|
40
41
|
import "./ops/webgl/normRMS.js";
|
|
41
42
|
import "./ops/grads/normRMS.js";
|
|
@@ -44,14 +45,14 @@ import "./ops/cpu/adamMoments.js";
|
|
|
44
45
|
import "./ops/webgl/adamMoments.js";
|
|
45
46
|
import "./ops/cpu/adamAdjust.js";
|
|
46
47
|
import "./ops/webgl/adamAdjust.js";
|
|
47
|
-
import { selectBackend as
|
|
48
|
-
import { default as
|
|
48
|
+
import { selectBackend as Po } from "./backend.js";
|
|
49
|
+
import { default as go } from "./utilities/performance.js";
|
|
49
50
|
import o from "./layers/CausalSelfAttention.js";
|
|
50
51
|
import r from "./layers/MLP.js";
|
|
51
52
|
import t from "./layers/TransformerBlock.js";
|
|
52
53
|
import m from "./layers/RoPECache.js";
|
|
53
|
-
import { default as
|
|
54
|
-
import { default as
|
|
54
|
+
import { default as Bo } from "./training/AdamExt.js";
|
|
55
|
+
import { default as Eo } from "./checks/index.js";
|
|
55
56
|
const O = {
|
|
56
57
|
CausalSelfAttention: o,
|
|
57
58
|
MLP: r,
|
|
@@ -59,22 +60,23 @@ const O = {
|
|
|
59
60
|
RoPECache: m
|
|
60
61
|
};
|
|
61
62
|
export {
|
|
62
|
-
|
|
63
|
+
Bo as AdamExt,
|
|
63
64
|
oo as BPETokeniser,
|
|
64
65
|
_ as CharTokeniser,
|
|
65
66
|
io as Generator,
|
|
66
67
|
fo as Model,
|
|
67
68
|
W as NanoGPT,
|
|
68
69
|
Y as TeachableLLM,
|
|
69
|
-
|
|
70
|
+
Eo as checks,
|
|
70
71
|
lo as estimateMemoryUsage,
|
|
71
72
|
xo as estimateParameterCount,
|
|
72
|
-
|
|
73
|
-
|
|
73
|
+
uo as estimateResources,
|
|
74
|
+
no as estimateTrainingMemoryUsage,
|
|
74
75
|
O as layers,
|
|
75
76
|
eo as loadTextData,
|
|
76
|
-
|
|
77
|
-
|
|
77
|
+
go as performanceTest,
|
|
78
|
+
Po as selectBackend,
|
|
79
|
+
ko as topP,
|
|
78
80
|
co as validateConfig,
|
|
79
81
|
to as waitForModel
|
|
80
82
|
};
|
|
@@ -11,5 +11,6 @@ export default class NanoGPT extends Model<ModelForwardAttributes> {
|
|
|
11
11
|
getClassName(): string;
|
|
12
12
|
private inputPhase;
|
|
13
13
|
forward(attrs: ModelForwardAttributes, idx: Tensor, targets?: Tensor): Tensor[];
|
|
14
|
+
project(embeddings: Tensor): Tensor;
|
|
14
15
|
dispose(): void;
|
|
15
16
|
}
|
package/dist/models/NanoGPTV1.js
CHANGED
|
@@ -1,9 +1,9 @@
|
|
|
1
|
-
import { defaultConfig as
|
|
2
|
-
import
|
|
1
|
+
import { defaultConfig as u } from "./config.js";
|
|
2
|
+
import a from "../layers/TransformerBlock.js";
|
|
3
3
|
import f from "../layers/TiedEmbedding.js";
|
|
4
4
|
import g from "../layers/RoPECache.js";
|
|
5
5
|
import b from "../layers/RMSNorm.js";
|
|
6
|
-
import { t as
|
|
6
|
+
import { t as c, k as p } from "../index-BzFyqcy-.js";
|
|
7
7
|
import w from "./model.js";
|
|
8
8
|
import k from "../layers/PositionEmbedding.js";
|
|
9
9
|
class R extends w {
|
|
@@ -17,16 +17,16 @@ class R extends w {
|
|
|
17
17
|
// Final layer norm
|
|
18
18
|
ropeCache;
|
|
19
19
|
constructor(e = {}) {
|
|
20
|
-
super({ ...
|
|
20
|
+
super({ ...u, ...e }), this.wte = new f(this.config, "token_embedding", this), this.config.useRope === !1 ? this.wpe = new k(this.config, "positional_embedding", this) : this.ropeCache = new g(this.config), this.blocks = [];
|
|
21
21
|
for (let i = 0; i < this.config.nLayer; i++)
|
|
22
|
-
this.blocks.push(new
|
|
22
|
+
this.blocks.push(new a(i, this.config, this));
|
|
23
23
|
this.lnF = new b(this.config, "final_rms_norm", this);
|
|
24
24
|
}
|
|
25
25
|
getClassName() {
|
|
26
26
|
return "GenAI_NanoGPT_v1";
|
|
27
27
|
}
|
|
28
28
|
inputPhase(e, i) {
|
|
29
|
-
return
|
|
29
|
+
return c(() => {
|
|
30
30
|
const s = this.wte.embed(e);
|
|
31
31
|
if (this.config.useRope === !1) {
|
|
32
32
|
const o = this.wpe.call(i, s);
|
|
@@ -38,7 +38,7 @@ class R extends w {
|
|
|
38
38
|
});
|
|
39
39
|
}
|
|
40
40
|
forward(e, i, s) {
|
|
41
|
-
return this.validateInput(i), e.ropeCache = this.ropeCache, e.outputEmbeddings && (e.embeddings = []),
|
|
41
|
+
return this.validateInput(i), e.ropeCache = this.ropeCache, e.outputEmbeddings && (e.embeddings = []), c(() => {
|
|
42
42
|
this.startMemory();
|
|
43
43
|
let o = this.inputPhase(i, e);
|
|
44
44
|
if (e.cache && e.cache.length !== this.blocks.length)
|
|
@@ -46,11 +46,11 @@ class R extends w {
|
|
|
46
46
|
`Cache length ${e.cache.length} does not match number of blocks ${this.blocks.length}`
|
|
47
47
|
);
|
|
48
48
|
for (let t = 0; t < this.blocks.length; t++) {
|
|
49
|
-
const
|
|
49
|
+
const r = this.blocks[t], d = Math.random() * 1e9, l = {
|
|
50
50
|
...e,
|
|
51
51
|
seed: d,
|
|
52
52
|
pastKV: e.cache ? e.cache[t] : void 0
|
|
53
|
-
}, m = e.checkpointing && e.training ?
|
|
53
|
+
}, m = e.checkpointing && e.training ? r.callCheckpoint(l, o) : r.call(l, o);
|
|
54
54
|
e.outputEmbeddings ? (p(o), e.embeddings.push({ name: `block_output_${t}`, tensor: o })) : o.dispose(), o = m;
|
|
55
55
|
}
|
|
56
56
|
o = this.lnF.call(e, o);
|
|
@@ -60,6 +60,9 @@ class R extends w {
|
|
|
60
60
|
return s && (h = this.calculateLoss(n, s)), this.endMemory("Forward"), h ? [n, h] : [n];
|
|
61
61
|
});
|
|
62
62
|
}
|
|
63
|
+
project(e) {
|
|
64
|
+
return c(() => this.wte.project(e));
|
|
65
|
+
}
|
|
63
66
|
dispose() {
|
|
64
67
|
this.wte.dispose(), this.wpe && this.wpe.dispose(), this.blocks.forEach((e) => e.dispose()), this.lnF.dispose();
|
|
65
68
|
}
|
package/dist/models/model.d.ts
CHANGED
|
@@ -16,6 +16,7 @@ export default abstract class Model<T extends ModelForwardAttributes> extends Ba
|
|
|
16
16
|
trainingState: TrainingState | null;
|
|
17
17
|
abstract getClassName(): string;
|
|
18
18
|
abstract forward(attrs: T, idx: Tensor, targets?: Tensor): Tensor[];
|
|
19
|
+
abstract project(embeddings: Tensor): Tensor;
|
|
19
20
|
abstract dispose(): void;
|
|
20
21
|
getNumParams(): number;
|
|
21
22
|
protected validateInput(idx: Tensor): void;
|
package/dist/models/model.js
CHANGED
|
@@ -1,15 +1,15 @@
|
|
|
1
1
|
import i from "../layers/BaseLayer.js";
|
|
2
|
-
import "../index-
|
|
2
|
+
import "../index-BzFyqcy-.js";
|
|
3
3
|
import "../ops/cpu/attentionMask.js";
|
|
4
4
|
import "../ops/webgl/attentionMask.js";
|
|
5
5
|
import "../ops/grads/attentionMask.js";
|
|
6
6
|
import "../ops/cpu/qkv.js";
|
|
7
7
|
import "../ops/webgl/qkv.js";
|
|
8
8
|
import "../ops/grads/qkv.js";
|
|
9
|
-
import "../random_width-
|
|
10
|
-
import "../register_all_kernels-
|
|
9
|
+
import "../random_width-CXVRloNK.js";
|
|
10
|
+
import "../register_all_kernels-DIGpEwcf.js";
|
|
11
11
|
import "../index-Tf7vU29b.js";
|
|
12
|
-
import "../dataset-
|
|
12
|
+
import "../dataset-DlZtKmBq.js";
|
|
13
13
|
import "../ops/cpu/rope.js";
|
|
14
14
|
import "../ops/webgl/rope.js";
|
|
15
15
|
import "../ops/grads/rope.js";
|
|
@@ -39,7 +39,7 @@ import "../ops/cpu/gatherSub.js";
|
|
|
39
39
|
import "../ops/webgl/gatherSub.js";
|
|
40
40
|
import "../ops/cpu/gelu.js";
|
|
41
41
|
import "../ops/webgl/gelu.js";
|
|
42
|
-
import "../gelu-
|
|
42
|
+
import "../gelu-Bp_-935b.js";
|
|
43
43
|
import "../ops/webgl/log.js";
|
|
44
44
|
import "../checks/normRMS.js";
|
|
45
45
|
import "../checks/normRMSGrad.js";
|
|
@@ -1,5 +1,5 @@
|
|
|
1
|
-
import { M as n, N as t, j as m,
|
|
2
|
-
import { z as c, c as f } from "./zeros-
|
|
1
|
+
import { M as n, N as t, j as m, G as i } from "./index-BzFyqcy-.js";
|
|
2
|
+
import { z as c, c as f } from "./zeros-Bj5rMYA7.js";
|
|
3
3
|
/**
|
|
4
4
|
* @license
|
|
5
5
|
* Copyright 2018 Google LLC. All Rights Reserved.
|
package/dist/ops/adamAdjust.js
CHANGED
package/dist/ops/adamMoments.js
CHANGED
package/dist/ops/appendCache.js
CHANGED
|
@@ -1,8 +1,8 @@
|
|
|
1
|
-
import { e as a } from "../index-
|
|
1
|
+
import { e as a } from "../index-BzFyqcy-.js";
|
|
2
2
|
import "./cpu/appendCache.js";
|
|
3
3
|
import "./webgl/appendCache.js";
|
|
4
|
-
import { c as s } from "../concat-
|
|
5
|
-
import { z as c } from "../zeros-
|
|
4
|
+
import { c as s } from "../concat-B912vBbo.js";
|
|
5
|
+
import { z as c } from "../zeros-Bj5rMYA7.js";
|
|
6
6
|
function i(r, p, n, o) {
|
|
7
7
|
if (!o) {
|
|
8
8
|
const e = r.shape[2];
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
import { f as k, o as t, q as i, a as q, w } from "../../index-
|
|
1
|
+
import { f as k, o as t, q as i, a as q, w } from "../../index-BzFyqcy-.js";
|
|
2
2
|
function z(a) {
|
|
3
3
|
const { moments: s, value: r } = a.inputs, { beta1: l, beta2: u, epsilon: m, learningRate: d } = a.attrs, e = s.shape.length, c = new Array(e).fill(0), n = s.shape.slice();
|
|
4
4
|
n[e - 1] = 1;
|