@genai-fi/nanogpt 0.8.5 → 0.9.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/Generator.d.ts +4 -1
- package/dist/Generator.js +144 -124
- package/dist/{RealDiv-D_q39E3A.js → RealDiv-D4EzDsC0.js} +7 -7
- package/dist/{Reshape-Bh_jzKzV.js → Reshape-Bowtk9BP.js} +2 -2
- package/dist/{Reshape-41YpQqEo.js → Reshape-DUqYftGC.js} +1 -1
- package/dist/TeachableLLM.js +5 -5
- package/dist/Trainer.d.ts +1 -0
- package/dist/Trainer.js +3 -0
- package/dist/{axis_util-Did9235A.js → axis_util-TbGYJ208.js} +1 -1
- package/dist/backend.js +2 -2
- package/dist/{backend_util-yC3YH1jo.js → backend_util-CJIiDoV1.js} +4 -4
- package/dist/{broadcast_to-CUvOdOT5.js → broadcast_to-DzlNweb8.js} +2 -2
- package/dist/checks/appendCache.js +2 -2
- package/dist/checks/attentionMask.js +3 -3
- package/dist/checks/gelu.js +2 -2
- package/dist/checks/matMulGelu.js +5 -5
- package/dist/checks/normRMS.js +4 -4
- package/dist/checks/normRMSGrad.js +3 -3
- package/dist/checks/qkv.js +2 -2
- package/dist/checks/rope.js +2 -2
- package/dist/{concat-pHiVqR3L.js → concat-B912vBbo.js} +1 -1
- package/dist/{dataset-DPPl-iLT.js → dataset-DlZtKmBq.js} +3 -3
- package/dist/{dropout-CcKSfOYE.js → dropout-C-csYCLj.js} +6 -6
- package/dist/{exports_initializers-DKk7-bsx.js → exports_initializers-B8iZMgQ0.js} +1 -1
- package/dist/{gather-CPg6ZlQA.js → gather-Dnpgw-YQ.js} +1 -1
- package/dist/{gelu-BkcmEEyD.js → gelu-Bp_-935b.js} +1 -1
- package/dist/{gpgpu_math-D_ODOLix.js → gpgpu_math-CDaYiyE_.js} +2 -2
- package/dist/{index-DdmHGZjq.js → index-BzFyqcy-.js} +13 -13
- package/dist/{index-evZ57wr4.js → index-C1rx_Ajs.js} +10 -10
- package/dist/{kernel_funcs_utils-CDfFpUab.js → kernel_funcs_utils-DKLK0Mg3.js} +3 -3
- package/dist/layers/BaseLayer.js +2 -2
- package/dist/layers/CausalSelfAttention.js +6 -6
- package/dist/layers/MLP.js +5 -5
- package/dist/layers/PositionEmbedding.js +5 -5
- package/dist/layers/RMSNorm.js +3 -3
- package/dist/layers/RoPECache.js +4 -4
- package/dist/layers/TiedEmbedding.js +5 -5
- package/dist/layers/TransformerBlock.js +1 -1
- package/dist/loader/loadTransformers.js +1 -1
- package/dist/loader/oldZipLoad.js +5 -5
- package/dist/{log_sum_exp-C8yFJfZz.js → log_sum_exp-DO6z8tSE.js} +9 -9
- package/dist/main.d.ts +1 -0
- package/dist/main.js +18 -16
- package/dist/{mat_mul-Dpy2mMRu.js → mat_mul-DzjTFx-u.js} +1 -1
- package/dist/{mod-CbibJi3D.js → mod-Dobti4j4.js} +1 -1
- package/dist/models/NanoGPTV1.d.ts +1 -0
- package/dist/models/NanoGPTV1.js +12 -9
- package/dist/models/model.d.ts +1 -0
- package/dist/models/model.js +5 -5
- package/dist/{mulmat_packed_gpu-q_Gmwyld.js → mulmat_packed_gpu-BT60jmzP.js} +1 -1
- package/dist/{ones-BAqVh-eA.js → ones-tIJeHlq-.js} +2 -2
- package/dist/ops/adamAdjust.js +1 -1
- package/dist/ops/adamMoments.js +1 -1
- package/dist/ops/appendCache.js +3 -3
- package/dist/ops/attentionMask.js +1 -1
- package/dist/ops/cpu/adamAdjust.js +1 -1
- package/dist/ops/cpu/adamMoments.js +2 -2
- package/dist/ops/cpu/appendCache.js +2 -2
- package/dist/ops/cpu/attentionMask.js +5 -5
- package/dist/ops/cpu/fusedSoftmax.js +2 -2
- package/dist/ops/cpu/gatherSub.js +5 -5
- package/dist/ops/cpu/gelu.js +1 -1
- package/dist/ops/cpu/matMulGelu.js +2 -2
- package/dist/ops/cpu/matMulMul.js +1 -1
- package/dist/ops/cpu/mulDropout.js +1 -1
- package/dist/ops/cpu/normRMS.js +1 -1
- package/dist/ops/cpu/qkv.js +3 -3
- package/dist/ops/cpu/rope.js +5 -5
- package/dist/ops/cpu/scatterSub.js +13 -13
- package/dist/ops/fusedSoftmax.js +1 -1
- package/dist/ops/gatherSub.js +1 -1
- package/dist/ops/gelu.js +2 -2
- package/dist/ops/grads/attentionMask.js +1 -1
- package/dist/ops/grads/fusedSoftmax.js +2 -2
- package/dist/ops/grads/gelu.js +2 -2
- package/dist/ops/grads/matMulGelu.js +1 -1
- package/dist/ops/grads/normRMS.js +1 -1
- package/dist/ops/grads/qkv.js +1 -1
- package/dist/ops/grads/rope.js +1 -1
- package/dist/ops/matMulGelu.js +1 -1
- package/dist/ops/matMulMul.js +1 -1
- package/dist/ops/mulDrop.js +1 -1
- package/dist/ops/normRMS.js +1 -1
- package/dist/ops/qkv.js +1 -1
- package/dist/ops/rope.js +4 -4
- package/dist/ops/scatterSub.js +1 -1
- package/dist/ops/webgl/adamAdjust.js +2 -2
- package/dist/ops/webgl/adamMoments.js +1 -1
- package/dist/ops/webgl/appendCache.js +1 -1
- package/dist/ops/webgl/attentionMask.js +1 -1
- package/dist/ops/webgl/fusedSoftmax.js +4 -4
- package/dist/ops/webgl/gatherSub.js +1 -1
- package/dist/ops/webgl/gelu.js +2 -2
- package/dist/ops/webgl/log.js +3 -3
- package/dist/ops/webgl/matMulGelu.js +4 -4
- package/dist/ops/webgl/matMulMul.js +1 -1
- package/dist/ops/webgl/mulDropout.js +1 -1
- package/dist/ops/webgl/normRMS.js +2 -2
- package/dist/ops/webgl/qkv.js +1 -1
- package/dist/ops/webgl/rope.js +1 -1
- package/dist/ops/webgl/scatterSub.js +1 -1
- package/dist/ops/webgpu/adamAdjust.js +3 -3
- package/dist/ops/webgpu/adamMoments.js +3 -3
- package/dist/ops/webgpu/appendCache.js +3 -3
- package/dist/ops/webgpu/attentionMask.js +3 -3
- package/dist/ops/webgpu/gatherSub.js +3 -3
- package/dist/ops/webgpu/gelu.js +37 -35
- package/dist/ops/webgpu/normRMS.js +2 -2
- package/dist/ops/webgpu/normRMSGrad.js +5 -5
- package/dist/ops/webgpu/qkv.js +3 -3
- package/dist/ops/webgpu/rope.js +3 -3
- package/dist/ops/webgpu/scatterSub.js +3 -3
- package/dist/ops/webgpu/utils/reductions.js +4 -4
- package/dist/{ops-542ai2vG.js → ops-LuCMAnmM.js} +65 -65
- package/dist/{random_width-DKGeiFuR.js → random_width-CXVRloNK.js} +23 -23
- package/dist/{range-BcUvLuf5.js → range-CWcz7xFA.js} +3 -3
- package/dist/{reciprocal-DhDWSKiD.js → reciprocal-C4rNcM-S.js} +1 -1
- package/dist/{register_all_kernels-Do9VvZmo.js → register_all_kernels-DIGpEwcf.js} +31 -31
- package/dist/{relu-B1AXs7p5.js → relu-BjCh_SYb.js} +1 -1
- package/dist/{reshape-WeJkT3ja.js → reshape-CnIwVG1c.js} +1 -1
- package/dist/{scatter_nd_util-B7yDhiQr.js → scatter_nd_util-BQdz--Gn.js} +1 -1
- package/dist/{selu_util-BgUO9gHY.js → selu_util-OtRzVwW5.js} +23 -23
- package/dist/{shared-V6D_md-c.js → shared-DmRsFyaJ.js} +6 -6
- package/dist/{shared-CZiWmQCI.js → shared-DuP7ue-R.js} +1 -1
- package/dist/{sin-CPxad7Am.js → sin-gpDNRxE0.js} +1 -1
- package/dist/{slice-B7jXtPnp.js → slice-d0Vo9XTN.js} +1 -1
- package/dist/{softmax-BfsyI4As.js → softmax-D7Jj3p_P.js} +1 -1
- package/dist/{split-BPxr8_8m.js → split-DK2k5eHf.js} +1 -1
- package/dist/{stack-BNwLzE43.js → stack-DFatutCx.js} +1 -1
- package/dist/{sum-ByFINZgi.js → sum-CJ0ULhmt.js} +1 -1
- package/dist/{tensor-DbqgIV9B.js → tensor-CZr4dh61.js} +1 -1
- package/dist/{tensor1d-CtJq5BOv.js → tensor1d-vML0r3q6.js} +1 -1
- package/dist/{tensor2d-CObBWBkW.js → tensor2d-D76QGjF3.js} +1 -1
- package/dist/{tensor4d-DLtk7Nxh.js → tensor4d-Df1WlVDY.js} +1 -1
- package/dist/training/Adam.js +2 -2
- package/dist/training/AdamExt.js +1 -1
- package/dist/training/DatasetBuilder.js +2 -2
- package/dist/training/FullTrainer.js +1 -1
- package/dist/training/Trainer.js +2 -2
- package/dist/training/sparseCrossEntropy.js +3 -3
- package/dist/utilities/dummy.js +2 -2
- package/dist/utilities/multinomialCPU.js +2 -2
- package/dist/utilities/performance.js +1 -1
- package/dist/utilities/profile.js +1 -1
- package/dist/utilities/safetensors.js +2 -2
- package/dist/utilities/topP.d.ts +1 -0
- package/dist/utilities/topP.js +13 -0
- package/dist/utilities/weights.js +2 -2
- package/dist/{variable-DPFOJyRG.js → variable-Bm2OFwGI.js} +1 -1
- package/dist/{webgpu_program-Dhk9R5aG.js → webgpu_program-DkQJOJSd.js} +1 -1
- package/dist/{webgpu_util-BqGnZg8t.js → webgpu_util-pLEV9tks.js} +1 -1
- package/dist/{zeros-Dnwix0p4.js → zeros-Bj5rMYA7.js} +1 -1
- package/package.json +1 -1
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
import {
|
|
1
|
+
import { G as e, R as f } from "./index-BzFyqcy-.js";
|
|
2
2
|
/**
|
|
3
3
|
* @license
|
|
4
4
|
* Copyright 2018 Google LLC. All Rights Reserved.
|
|
@@ -15,12 +15,12 @@ import { E as e, R as f } from "./index-DdmHGZjq.js";
|
|
|
15
15
|
* limitations under the License.
|
|
16
16
|
* =============================================================================
|
|
17
17
|
*/
|
|
18
|
-
function
|
|
18
|
+
function i(n, o, r = 1, a = "float32") {
|
|
19
19
|
if (r === 0)
|
|
20
20
|
throw new Error("Cannot have a step of zero");
|
|
21
21
|
const t = { start: n, stop: o, step: r, dtype: a };
|
|
22
22
|
return e.runKernel(f, {}, t);
|
|
23
23
|
}
|
|
24
24
|
export {
|
|
25
|
-
|
|
25
|
+
i as r
|
|
26
26
|
};
|
|
@@ -1,36 +1,36 @@
|
|
|
1
|
-
import {
|
|
2
|
-
import { e as Tr, s as Dr, l as Er, a as Fr, b as Pr, m as Or, c as Ar, r as Ms, f as $l, g as kl, h as wl, i as Nl, j as vl, k as Sl, n as Rl, o as Tl, q as Dl, t as El, u as Fl, v as Pl, w as Ol, x as Al, y as _l, z as Vl, p as Ll, A as Wl, B as Ml, C as Bl, F as Gl, G as zl, H as Ul, I as Hl } from "./random_width-
|
|
3
|
-
import { r as re } from "./reshape-
|
|
4
|
-
import { b as Xl } from "./broadcast_to-
|
|
5
|
-
import { c as os } from "./concat-
|
|
6
|
-
import { c as Kl, s as ql } from "./sin-
|
|
7
|
-
import { w as _r, r as Vr, n as ss, b as Bs, v as Gs, x as Lr, h as jl, g as Yl, e as Ql, c as Zl, f as Jl, j as eu, m as tu, q as su, k as nu, p as ou, y as au, z as ru, A as iu, B as cu, s as lu, d as uu, t as du, u as pu } from "./ops-
|
|
8
|
-
import { m as Tt } from "./mat_mul-
|
|
9
|
-
import { w as Wr, k as Ye, h as Le, x as hu, y as fu, z as mu, C as gu, v as xu, i as ot, j as lt, d as De, e as $t, g as vs, S as Mr, a as Br, A as Gr, B as zr, p as Cu, q as bu, r as Iu, u as yu } from "./selu_util-
|
|
10
|
-
import { e as $u, l as ku, a as wu, m as Nu } from "./log_sum_exp-
|
|
11
|
-
import { f as vu } from "./dropout-
|
|
12
|
-
import { g as Su } from "./gather-
|
|
13
|
-
import { c as zs, z as Ur } from "./zeros-
|
|
14
|
-
import { s as as } from "./slice-
|
|
15
|
-
import { m as Ru } from "./mod-
|
|
16
|
-
import { r as Tu } from "./reciprocal-
|
|
17
|
-
import { r as Du } from "./relu-
|
|
18
|
-
import { s as Us } from "./split-
|
|
19
|
-
import { s as Eu } from "./softmax-
|
|
20
|
-
import { s as Fu } from "./stack-
|
|
21
|
-
import { s as Pu } from "./sum-
|
|
22
|
-
import { a as j, u as le, c as ut, i as dt, b as Ou, d as Pt, t as Pe, e as kt, f as gt, g as Hr, r as Ot, h as Be, j as Au, k as _u, l as Pn, z as Vu, m as On, n as Xr, o as Lu, p as Wu, q as Mu, v as Bu, w as Gu, x as zu, y as Uu, A as Hu, B as Xu, C as Ku, D as ft, E as qu, F as ju, G as Kr, H as Yu, I as Qu, J as Zu, K as Ju, L as ed, M as td, N as sd, O as nd, P as od, Q as ad, R as rd, S as id, T as cd, U as ld, V as ud, W as dd, X as pd, Y as hd, Z as fd, _ as md, $ as gd, a0 as xd, a1 as Cd, a2 as bd, a3 as Id, a4 as yd, a5 as $d, a6 as kd, a7 as wd, a8 as Nd, a9 as vd, aa as Sd, ab as Rd, ac as Td, ad as Dd, ae as Ed, af as Fd, ag as Pd, ah as Od, ai as Ad } from "./shared-
|
|
23
|
-
import { m as xt, A as Ss, B as Rs, C as Ts, D as qr, F as jr, H as Yr, G as je, I as Qr, J as Zr, K as Jr, L as ei, M as ti, z as si, y as ni, x as oi, w as ai, u as ri, E as ii, T as ci, U as _d, V as Vd, W as Ld, X as Wd, Y as Md, Z as Bd, N as li, O as ui, P as di, Q as pi, c as hi, f as Gd, S as zd, _ as Ud } from "./backend_util-
|
|
24
|
-
import { g as ye, a as $e, b as Re, c as Ee, e as Oe, h as Ds } from "./axis_util-
|
|
1
|
+
import { E as ae, F as ne, G as he, co as ps, cp as hs, cr as Zs, cs as fs, ct as ms, cv as gs, Q as Ro, cu as xs, cw as Cs, bw as To, n as Y, df as Js, cC as en, o as Do, A as tn, by as Eo, cG as bs, cH as Is, cI as ys, aq as wc, cL as sn, z as Nc, a as nn, l as Se, dn as $s, cO as on, a0 as It, bC as Fo, cS as ks, di as an, dl as rn, b as Po, du as cn, cU as ws, dx as ln, dy as un, ap as xe, dz as S, aW as vc, q as Sc, T as Oo, dA as Rc, cV as Tc, x as Dc, w as Ec, aX as Fc, c as Pc, ag as V, d4 as Ao, d5 as _o, e as Me, aR as Lt, d9 as Vo, aP as Lo, d6 as Oc, aO as Wt, an as Ke, da as Wo, as as dn, at as Ac, j as z, bn as Ge, au as _c, _ as pn, av as hn, V as Vc, a5 as Lc, U as Mo, a3 as se, cg as Bo, cq as Go, bJ as zo, p as me, ab as st, bK as Uo, bL as Ho, bM as Xo, af as ct, bN as Ko, cx as qo, cy as jo, bQ as Yo, bP as Qo, aS as Zo, de as Jo, bR as fn, cA as ea, a$ as ta, K as sa, bS as na, bE as Te, cc as oa, bT as aa, bU as ra, cB as ia, bV as ca, ac as mn, bW as gn, bd as la, bX as ua, u as nt, N as Wc, bY as da, bZ as pa, b_ as ha, ce as fa, cf as ma, dg as ga, bv as Ns, bp as Ft, bs as xn, cD as Xn, dB as mt, dC as xa, cE as Kn, dh as Mc, a1 as Bc, aU as Ca, cF as ba, b$ as Cn, aY as Ia, aC as ya, aA as yt, db as $a, dc as ka, be as wa, cd as Na, dk as va, a8 as Sa, H as Ra, dm as Ta, b2 as bn, b4 as In, c1 as yn, cK as Da, ah as Gc, c2 as Ea, c3 as Fa, cM as Pa, cN as Oa, dp as Aa, b5 as _a, aV as Va, bo as La, Y as $n, S as Wa, a6 as Ma, bg as Ba, bi as Ga, bh as za, c4 as Ua, cW as Ha, c5 as Xa, P as Ka, a4 as qa, c6 as ja, cP as kn, dD as Ya, dE as Qa, dF as Za, R as Ja, Z as wn, bj as er, cQ as tr, bk as sr, cR as nr, c8 as or, bf as ar, b9 as Nn, a7 as rr, dq as ir, aT as cr, c9 as vn, ad as Sn, ca as Rn, c0 as Tn, c7 as lr, dG as ur, dH as dr, dr as pr, ds as hr, dt as fr, W as mr, cT as gr, aw as Dn, dv as xr, dI as Cr, dJ as br, bO as En, dw as Ir, X as yr, bl as $r, ay as Fn, bb as kr, cb as wr, f as Nr, dK as vr, dL as qn, d7 as jn, d8 as zc, t as Uc, dM as Hc, dN as Xc, bB as Kc, bc as qc, bm as jc, bt as Yc, $ as Qc, bu as Zc, b7 as Jc, b8 as el, bq as tl, br as sl, aL as Sr, bx as nl, ai as ol, ao as al, bz as rl, dj as il, aZ as cl, a_ as ll, b0 as ul, b1 as dl, aj as pl, bA as hl, b6 as fl, bH as ml, b3 as gl, aB as Rr, bD as xl, ar as Cl, bF as bl, ba as Il, bG as yl } from "./index-BzFyqcy-.js";
|
|
2
|
+
import { e as Tr, s as Dr, l as Er, a as Fr, b as Pr, m as Or, c as Ar, r as Ms, f as $l, g as kl, h as wl, i as Nl, j as vl, k as Sl, n as Rl, o as Tl, q as Dl, t as El, u as Fl, v as Pl, w as Ol, x as Al, y as _l, z as Vl, p as Ll, A as Wl, B as Ml, C as Bl, F as Gl, G as zl, H as Ul, I as Hl } from "./random_width-CXVRloNK.js";
|
|
3
|
+
import { r as re } from "./reshape-CnIwVG1c.js";
|
|
4
|
+
import { b as Xl } from "./broadcast_to-DzlNweb8.js";
|
|
5
|
+
import { c as os } from "./concat-B912vBbo.js";
|
|
6
|
+
import { c as Kl, s as ql } from "./sin-gpDNRxE0.js";
|
|
7
|
+
import { w as _r, r as Vr, n as ss, b as Bs, v as Gs, x as Lr, h as jl, g as Yl, e as Ql, c as Zl, f as Jl, j as eu, m as tu, q as su, k as nu, p as ou, y as au, z as ru, A as iu, B as cu, s as lu, d as uu, t as du, u as pu } from "./ops-LuCMAnmM.js";
|
|
8
|
+
import { m as Tt } from "./mat_mul-DzjTFx-u.js";
|
|
9
|
+
import { w as Wr, k as Ye, h as Le, x as hu, y as fu, z as mu, C as gu, v as xu, i as ot, j as lt, d as De, e as $t, g as vs, S as Mr, a as Br, A as Gr, B as zr, p as Cu, q as bu, r as Iu, u as yu } from "./selu_util-OtRzVwW5.js";
|
|
10
|
+
import { e as $u, l as ku, a as wu, m as Nu } from "./log_sum_exp-DO6z8tSE.js";
|
|
11
|
+
import { f as vu } from "./dropout-C-csYCLj.js";
|
|
12
|
+
import { g as Su } from "./gather-Dnpgw-YQ.js";
|
|
13
|
+
import { c as zs, z as Ur } from "./zeros-Bj5rMYA7.js";
|
|
14
|
+
import { s as as } from "./slice-d0Vo9XTN.js";
|
|
15
|
+
import { m as Ru } from "./mod-Dobti4j4.js";
|
|
16
|
+
import { r as Tu } from "./reciprocal-C4rNcM-S.js";
|
|
17
|
+
import { r as Du } from "./relu-BjCh_SYb.js";
|
|
18
|
+
import { s as Us } from "./split-DK2k5eHf.js";
|
|
19
|
+
import { s as Eu } from "./softmax-D7Jj3p_P.js";
|
|
20
|
+
import { s as Fu } from "./stack-DFatutCx.js";
|
|
21
|
+
import { s as Pu } from "./sum-CJ0ULhmt.js";
|
|
22
|
+
import { a as j, u as le, c as ut, i as dt, b as Ou, d as Pt, t as Pe, e as kt, f as gt, g as Hr, r as Ot, h as Be, j as Au, k as _u, l as Pn, z as Vu, m as On, n as Xr, o as Lu, p as Wu, q as Mu, v as Bu, w as Gu, x as zu, y as Uu, A as Hu, B as Xu, C as Ku, D as ft, E as qu, F as ju, G as Kr, H as Yu, I as Qu, J as Zu, K as Ju, L as ed, M as td, N as sd, O as nd, P as od, Q as ad, R as rd, S as id, T as cd, U as ld, V as ud, W as dd, X as pd, Y as hd, Z as fd, _ as md, $ as gd, a0 as xd, a1 as Cd, a2 as bd, a3 as Id, a4 as yd, a5 as $d, a6 as kd, a7 as wd, a8 as Nd, a9 as vd, aa as Sd, ab as Rd, ac as Td, ad as Dd, ae as Ed, af as Fd, ag as Pd, ah as Od, ai as Ad } from "./shared-DmRsFyaJ.js";
|
|
23
|
+
import { m as xt, A as Ss, B as Rs, C as Ts, D as qr, F as jr, H as Yr, G as je, I as Qr, J as Zr, K as Jr, L as ei, M as ti, z as si, y as ni, x as oi, w as ai, u as ri, E as ii, T as ci, U as _d, V as Vd, W as Ld, X as Wd, Y as Md, Z as Bd, N as li, O as ui, P as di, Q as pi, c as hi, f as Gd, S as zd, _ as Ud } from "./backend_util-CJIiDoV1.js";
|
|
24
|
+
import { g as ye, a as $e, b as Re, c as Ee, e as Oe, h as Ds } from "./axis_util-TbGYJ208.js";
|
|
25
25
|
import { s as Hd } from "./index-C4L8Cm77.js";
|
|
26
26
|
import { n as fi, b as mi, a as gi } from "./non_max_suppression_impl-CsEgBuMA.js";
|
|
27
|
-
import { c as wt } from "./scatter_nd_util-
|
|
28
|
-
import { h as Yn, j as Xd, k as Kd, l as qd, m as jd, n as Yd, o as Qd, P as An, p as ze, u as We, q as xi, c as Ci, T as _e, E as bi, g as Ii, a as yi, r as Zd, s as Jd, t as Z, v as Mt, w as ep, x as Qn, y as tp, z as sp, A as Bt, B as np, C as op, D as Hs, F as jt, G as Yt, H as ap, I as rp, J as Zn, K as ip, L as cp, M as _s, N as lp, O as up, Q as dp, R as Qt, S as Vs, U as pp, f as Ce, V as we, W as Zt, X as Jt, Y as hp, d as Jn, e as eo, i as $i, Z as fp, _ as mp, $ as gp, a0 as xp, a1 as Cp, a2 as bp, a3 as Gt } from "./gpgpu_math-
|
|
29
|
-
import { s as ki, a as Ip, t as wi, b as yp, c as $p, d as Ni, e as kp, n as wp, f as Np, g as vp, h as Sp, i as Rp, j as Tp, k as Dp, l as Ep, o as Fp, p as Pp, q as Op, r as Ap, u as _p, v as Vp, w as Lp, x as Wp, y as Mp, z as Bp, A as Gp, B as zp, C as Up, D as Hp, E as Xp, F as Kp, G as qp, H as jp, I as Yp, J as Qp, K as Zp, L as Jp, M as vi, N as eh, O as th, P as sh, Q as nh, R as oh, S as ah, T as rh, U as ih, V as ch, W as lh } from "./shared-
|
|
30
|
-
import { a as ve, c as uh, U as it, d as tt, e as qe, A as to, f as Nt, B as _n, h as Vn, m as At, u as oe, C as Ue, b as ke, i as Ve, j as Ln, k as pt, l as vt, n as dh, o as ph, p as hh, q as fh } from "./kernel_funcs_utils-
|
|
31
|
-
import { R as mh, r as H, a as gh } from "./Reshape-
|
|
32
|
-
import { M as Si } from "./mulmat_packed_gpu-
|
|
33
|
-
import { t as Ri, s as Wn, a as zt, m as xh, r as Ch, b as bh, c as Ih, d as yh } from "./RealDiv-
|
|
27
|
+
import { c as wt } from "./scatter_nd_util-BQdz--Gn.js";
|
|
28
|
+
import { h as Yn, j as Xd, k as Kd, l as qd, m as jd, n as Yd, o as Qd, P as An, p as ze, u as We, q as xi, c as Ci, T as _e, E as bi, g as Ii, a as yi, r as Zd, s as Jd, t as Z, v as Mt, w as ep, x as Qn, y as tp, z as sp, A as Bt, B as np, C as op, D as Hs, F as jt, G as Yt, H as ap, I as rp, J as Zn, K as ip, L as cp, M as _s, N as lp, O as up, Q as dp, R as Qt, S as Vs, U as pp, f as Ce, V as we, W as Zt, X as Jt, Y as hp, d as Jn, e as eo, i as $i, Z as fp, _ as mp, $ as gp, a0 as xp, a1 as Cp, a2 as bp, a3 as Gt } from "./gpgpu_math-CDaYiyE_.js";
|
|
29
|
+
import { s as ki, a as Ip, t as wi, b as yp, c as $p, d as Ni, e as kp, n as wp, f as Np, g as vp, h as Sp, i as Rp, j as Tp, k as Dp, l as Ep, o as Fp, p as Pp, q as Op, r as Ap, u as _p, v as Vp, w as Lp, x as Wp, y as Mp, z as Bp, A as Gp, B as zp, C as Up, D as Hp, E as Xp, F as Kp, G as qp, H as jp, I as Yp, J as Qp, K as Zp, L as Jp, M as vi, N as eh, O as th, P as sh, Q as nh, R as oh, S as ah, T as rh, U as ih, V as ch, W as lh } from "./shared-DuP7ue-R.js";
|
|
30
|
+
import { a as ve, c as uh, U as it, d as tt, e as qe, A as to, f as Nt, B as _n, h as Vn, m as At, u as oe, C as Ue, b as ke, i as Ve, j as Ln, k as pt, l as vt, n as dh, o as ph, p as hh, q as fh } from "./kernel_funcs_utils-DKLK0Mg3.js";
|
|
31
|
+
import { R as mh, r as H, a as gh } from "./Reshape-Bowtk9BP.js";
|
|
32
|
+
import { M as Si } from "./mulmat_packed_gpu-BT60jmzP.js";
|
|
33
|
+
import { t as Ri, s as Wn, a as zt, m as xh, r as Ch, b as bh, c as Ih, d as yh } from "./RealDiv-D4EzDsC0.js";
|
|
34
34
|
/**
|
|
35
35
|
* @license
|
|
36
36
|
* Copyright 2018 Google LLC. All Rights Reserved.
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
import { j as p, a3 as w } from "./index-
|
|
1
|
+
import { j as p, a3 as w } from "./index-BzFyqcy-.js";
|
|
2
2
|
function k(o, t, r) {
|
|
3
3
|
const n = t.rank > 1 ? t.shape[t.rank - 1] : 1, e = t.rank > 1 ? t.rank - 1 : 1, h = `Must have updates.shape = indices.shape[:batchDim] + shape[sliceDim:], got updates.shape: ${r.shape}, indices.shape: ${t.shape}, shape: ${o}, sliceDim: ${n}, and batchDim: ${e}.`;
|
|
4
4
|
if (r.rank < e)
|
|
@@ -1,7 +1,7 @@
|
|
|
1
|
-
import { n as D, aq as H, C,
|
|
2
|
-
import { r as fe } from "./relu-
|
|
3
|
-
import { r as ce } from "./reshape-
|
|
4
|
-
import { s as ae } from "./sum-
|
|
1
|
+
import { n as D, aq as H, E as C, F as N, G, ar as te, as as ne, at as se, au as re, av as ie, aw as oe, a as le, ax as ue, ay as O } from "./index-BzFyqcy-.js";
|
|
2
|
+
import { r as fe } from "./relu-BjCh_SYb.js";
|
|
3
|
+
import { r as ce } from "./reshape-CnIwVG1c.js";
|
|
4
|
+
import { s as ae } from "./sum-CJ0ULhmt.js";
|
|
5
5
|
/**
|
|
6
6
|
* @license
|
|
7
7
|
* Copyright 2020 Google LLC. All Rights Reserved.
|
|
@@ -85,9 +85,9 @@ function he(e, t, n, s, r, u = !1, i = "channelsLast", o) {
|
|
|
85
85
|
[c, l, a, p, g] = e;
|
|
86
86
|
else
|
|
87
87
|
throw new Error(`Unknown dataFormat ${i}`);
|
|
88
|
-
const [h, d, A, , m] = t, [b, k, f] = W(n), [w, E, I] = W(s), y = L(h, w), x = L(d, E), $ = L(A, I), { padInfo: _, outDepth: M, outHeight: S, outWidth:
|
|
88
|
+
const [h, d, A, , m] = t, [b, k, f] = W(n), [w, E, I] = W(s), y = L(h, w), x = L(d, E), $ = L(A, I), { padInfo: _, outDepth: M, outHeight: S, outWidth: R } = me(r, a, p, g, b, k, f, y, x, $, o), V = u ? m * l : m;
|
|
89
89
|
let U;
|
|
90
|
-
return i === "channelsFirst" ? U = [c, V, M, S,
|
|
90
|
+
return i === "channelsFirst" ? U = [c, V, M, S, R] : i === "channelsLast" && (U = [c, M, S, R, V]), {
|
|
91
91
|
batchSize: c,
|
|
92
92
|
dataFormat: i,
|
|
93
93
|
inDepth: a,
|
|
@@ -96,7 +96,7 @@ function he(e, t, n, s, r, u = !1, i = "channelsLast", o) {
|
|
|
96
96
|
inChannels: l,
|
|
97
97
|
outDepth: M,
|
|
98
98
|
outHeight: S,
|
|
99
|
-
outWidth:
|
|
99
|
+
outWidth: R,
|
|
100
100
|
outChannels: V,
|
|
101
101
|
padInfo: _,
|
|
102
102
|
strideDepth: b,
|
|
@@ -118,14 +118,14 @@ function he(e, t, n, s, r, u = !1, i = "channelsLast", o) {
|
|
|
118
118
|
}
|
|
119
119
|
function ge(e, t, n, s, r) {
|
|
120
120
|
s == null && (s = B(e, t, n));
|
|
121
|
-
const u = e[0], i = e[1], o =
|
|
121
|
+
const u = e[0], i = e[1], o = F((u - t + 2 * s) / n + 1, r), c = F((i - t + 2 * s) / n + 1, r);
|
|
122
122
|
return [o, c];
|
|
123
123
|
}
|
|
124
124
|
function pe(e, t, n, s, r, u) {
|
|
125
125
|
r == null && (r = B(e, t[0], s[0]));
|
|
126
126
|
const i = [0, 0, 0, n];
|
|
127
127
|
for (let o = 0; o < 3; o++)
|
|
128
|
-
e[o] + 2 * r >= t[o] && (i[o] =
|
|
128
|
+
e[o] + 2 * r >= t[o] && (i[o] = F((e[o] - t[o] + 2 * r) / s[o] + 1, u));
|
|
129
129
|
return i;
|
|
130
130
|
}
|
|
131
131
|
function B(e, t, n, s = 1) {
|
|
@@ -155,7 +155,7 @@ function de(e, t, n, s, r, u, i, o, c) {
|
|
|
155
155
|
a = { top: 0, bottom: 0, left: 0, right: 0, type: "VALID" }, p = Math.ceil((t - u + 1) / s), g = Math.ceil((n - i + 1) / r);
|
|
156
156
|
else if (typeof e == "object") {
|
|
157
157
|
const l = c === "channelsLast" ? e[1][0] : e[2][0], h = c === "channelsLast" ? e[1][1] : e[2][1], d = c === "channelsLast" ? e[2][0] : e[3][0], A = c === "channelsLast" ? e[2][1] : e[3][1];
|
|
158
|
-
a = { top: l, bottom: h, left: d, right: A, type: l === 0 && h === 0 && d === 0 && A === 0 ? "VALID" : "EXPLICIT" }, p =
|
|
158
|
+
a = { top: l, bottom: h, left: d, right: A, type: l === 0 && h === 0 && d === 0 && A === 0 ? "VALID" : "EXPLICIT" }, p = F((t - u + l + h) / s + 1, o), g = F((n - i + d + A) / r + 1, o);
|
|
159
159
|
} else
|
|
160
160
|
throw Error(`Unknown padding parameter: ${e}`);
|
|
161
161
|
return { padInfo: a, outHeight: p, outWidth: g };
|
|
@@ -182,7 +182,7 @@ function me(e, t, n, s, r, u, i, o, c, a, p) {
|
|
|
182
182
|
throw Error(`Unknown padding parameter: ${e}`);
|
|
183
183
|
return { padInfo: g, outDepth: l, outHeight: h, outWidth: d };
|
|
184
184
|
}
|
|
185
|
-
function
|
|
185
|
+
function F(e, t) {
|
|
186
186
|
if (!t)
|
|
187
187
|
return Math.trunc(e);
|
|
188
188
|
switch (t) {
|
|
@@ -498,7 +498,7 @@ function Y(e, t, n, s, r) {
|
|
|
498
498
|
}
|
|
499
499
|
for (let o = 0; o < u.length; o++) {
|
|
500
500
|
const c = r[o];
|
|
501
|
-
u[o] < 0 && (u[o] += c), u[o] =
|
|
501
|
+
u[o] < 0 && (u[o] += c), u[o] = O(0, u[o], r[o]);
|
|
502
502
|
}
|
|
503
503
|
return u;
|
|
504
504
|
}
|
|
@@ -511,16 +511,16 @@ function z(e, t, n, s, r, u) {
|
|
|
511
511
|
const o = n[r] || 1;
|
|
512
512
|
(e & 1 << r || u & 1 << r || i == null) && (o > 0 ? i = Number.MIN_SAFE_INTEGER : i = Number.MAX_SAFE_INTEGER);
|
|
513
513
|
const c = s[r];
|
|
514
|
-
return i < 0 && (i += c), i =
|
|
514
|
+
return i < 0 && (i += c), i = O(0, i, c - 1), i;
|
|
515
515
|
}
|
|
516
516
|
function ee(e, t, n, s, r, u) {
|
|
517
517
|
let i = t[r];
|
|
518
518
|
const o = n[r] || 1;
|
|
519
519
|
(e & 1 << r || u & 1 << r || i == null) && (o > 0 ? i = Number.MAX_SAFE_INTEGER : i = Number.MIN_SAFE_INTEGER);
|
|
520
520
|
const c = s[r];
|
|
521
|
-
return i < 0 && (i += c), o > 0 ? i =
|
|
521
|
+
return i < 0 && (i += c), o > 0 ? i = O(0, i, c) : i = O(-1, i, c - 1), i;
|
|
522
522
|
}
|
|
523
|
-
function
|
|
523
|
+
function Fe(e, t, n) {
|
|
524
524
|
let s = n.length;
|
|
525
525
|
for (let r = 0; r < n.length; r++)
|
|
526
526
|
if (n[r] > 1) {
|
|
@@ -532,13 +532,13 @@ function Oe(e, t, n) {
|
|
|
532
532
|
return !1;
|
|
533
533
|
return !0;
|
|
534
534
|
}
|
|
535
|
-
function
|
|
535
|
+
function Oe(e, t) {
|
|
536
536
|
let n = e.length > 0 ? e[e.length - 1] : 1;
|
|
537
537
|
for (let s = 0; s < e.length - 1; s++)
|
|
538
538
|
n += e[s] * t[s];
|
|
539
539
|
return n;
|
|
540
540
|
}
|
|
541
|
-
function
|
|
541
|
+
function Re(e, t, n) {
|
|
542
542
|
let s;
|
|
543
543
|
const r = e.shape.length;
|
|
544
544
|
typeof t == "number" ? s = [t, ...new Array(r - 1).fill(0)] : t.length < r ? s = t.concat(new Array(r - t.length).fill(0)) : s = t.slice(), s.forEach((i) => {
|
|
@@ -654,12 +654,12 @@ function K(e, t, n, s, r, u) {
|
|
|
654
654
|
const et = /* @__PURE__ */ Object.freeze(/* @__PURE__ */ Object.defineProperty({
|
|
655
655
|
__proto__: null,
|
|
656
656
|
assertParamsValid: Le,
|
|
657
|
-
computeFlatOffset:
|
|
657
|
+
computeFlatOffset: Oe,
|
|
658
658
|
computeOutShape: Ge,
|
|
659
659
|
getNormalizedAxes: Te,
|
|
660
|
-
isSliceContinous:
|
|
660
|
+
isSliceContinous: Fe,
|
|
661
661
|
maskToAxes: Ce,
|
|
662
|
-
parseSliceParams:
|
|
662
|
+
parseSliceParams: Re,
|
|
663
663
|
sliceInfo: Ve,
|
|
664
664
|
startForAxis: z,
|
|
665
665
|
startIndicesWithElidedDims: Q,
|
|
@@ -705,12 +705,12 @@ export {
|
|
|
705
705
|
Qe as m,
|
|
706
706
|
et as n,
|
|
707
707
|
qe as o,
|
|
708
|
-
|
|
708
|
+
Re as p,
|
|
709
709
|
Le as q,
|
|
710
|
-
|
|
710
|
+
Fe as r,
|
|
711
711
|
ze as s,
|
|
712
712
|
P as t,
|
|
713
|
-
|
|
713
|
+
Oe as u,
|
|
714
714
|
Ne as v,
|
|
715
715
|
Ee as w,
|
|
716
716
|
$e as x,
|
|
@@ -1,9 +1,9 @@
|
|
|
1
|
-
import { n as Lt, bm as Ce, j as V, l as Pt, a3 as K, bn as et, ae as ht, bo as dt, bp as at, aa as De, ab as st, az as We, b8 as $e, bq as Ue, br as ze, bs as Be, bt as At, ap as H, bu as qt, bv as W, bw as _t, bx as Vt, ai as Ct, by as Dt, ao as Wt, bz as $t, aZ as Ut, a_ as zt, b0 as Bt, b1 as jt, aj as Gt, bA as Zt, b6 as Ht, bB as Kt, b3 as je, aA as Ge, b7 as Xt, bc as Ze, bC as He, p as Jt, u as Ke, t as Xe, bD as Qt, bE as It, ar as Yt, $ as Je, bF as te, ba as ee, bG as ne, aP as pt, bH as se, bI as ot } from "./index-
|
|
2
|
-
import { f as it, m as kt, g as Qe, a as Ye, R as tn, v as en, d as nn, e as sn, h as on, i as rn, j as an, k as ln, l as cn, n as un, o as hn, p as fn, q as Nt, r as dn, s as gn, t as mn } from "./backend_util-
|
|
3
|
-
import { g as pn, a as wn, e as In, c as bn } from "./axis_util-
|
|
4
|
-
import { b as xn } from "./broadcast_to-
|
|
5
|
-
import { r as En } from "./reshape-
|
|
6
|
-
import { p as Fn, q as yn, r as kn, u as Nn } from "./selu_util-
|
|
1
|
+
import { n as Lt, bm as Ce, j as V, l as Pt, a3 as K, bn as et, ae as ht, bo as dt, bp as at, aa as De, ab as st, az as We, b8 as $e, bq as Ue, br as ze, bs as Be, bt as At, ap as H, bu as qt, bv as W, bw as _t, bx as Vt, ai as Ct, by as Dt, ao as Wt, bz as $t, aZ as Ut, a_ as zt, b0 as Bt, b1 as jt, aj as Gt, bA as Zt, b6 as Ht, bB as Kt, b3 as je, aA as Ge, b7 as Xt, bc as Ze, bC as He, p as Jt, u as Ke, t as Xe, bD as Qt, bE as It, ar as Yt, $ as Je, bF as te, ba as ee, bG as ne, aP as pt, bH as se, bI as ot } from "./index-BzFyqcy-.js";
|
|
2
|
+
import { f as it, m as kt, g as Qe, a as Ye, R as tn, v as en, d as nn, e as sn, h as on, i as rn, j as an, k as ln, l as cn, n as un, o as hn, p as fn, q as Nt, r as dn, s as gn, t as mn } from "./backend_util-CJIiDoV1.js";
|
|
3
|
+
import { g as pn, a as wn, e as In, c as bn } from "./axis_util-TbGYJ208.js";
|
|
4
|
+
import { b as xn } from "./broadcast_to-DzlNweb8.js";
|
|
5
|
+
import { r as En } from "./reshape-CnIwVG1c.js";
|
|
6
|
+
import { p as Fn, q as yn, r as kn, u as Nn } from "./selu_util-OtRzVwW5.js";
|
|
7
7
|
import { g as vn } from "./_commonjsHelpers-ByX85dGu.js";
|
|
8
8
|
function Sn(e, t) {
|
|
9
9
|
for (var n = 0; n < t.length; n++) {
|
package/dist/training/Adam.js
CHANGED
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
import { adamAdjust as b } from "../ops/adamAdjust.js";
|
|
2
2
|
import { adamMoments as d } from "../ops/adamMoments.js";
|
|
3
|
-
import { O as g, e as h, t as o, d as B } from "../index-
|
|
4
|
-
import { z as M } from "../zeros-
|
|
3
|
+
import { O as g, e as h, t as o, d as B } from "../index-BzFyqcy-.js";
|
|
4
|
+
import { z as M } from "../zeros-Bj5rMYA7.js";
|
|
5
5
|
/**
|
|
6
6
|
* @license
|
|
7
7
|
* Copyright 2018 Google LLC. All Rights Reserved.
|
package/dist/training/AdamExt.js
CHANGED
package/dist/training/Trainer.js
CHANGED
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
import { DatasetBuilder as m, flattenTokens as c, PAGE_FACTOR as g } from "./DatasetBuilder.js";
|
|
2
2
|
import u from "./AdamExt.js";
|
|
3
|
-
import { t as f, v as y, d as p } from "../index-
|
|
4
|
-
import { z as h } from "../zeros-
|
|
3
|
+
import { t as f, v as y, d as p } from "../index-BzFyqcy-.js";
|
|
4
|
+
import { z as h } from "../zeros-Bj5rMYA7.js";
|
|
5
5
|
class x {
|
|
6
6
|
constructor(t, e, i = 1e-3) {
|
|
7
7
|
this.tokenizer = e, this.model = t, this.learningRate = i, this.resetOptimizer(), this.datasetBuilder = new m(e, t.config.blockSize);
|
|
@@ -1,8 +1,8 @@
|
|
|
1
1
|
import { gatherSub as x } from "../ops/gatherSub.js";
|
|
2
2
|
import { scatterSub as L } from "../ops/scatterSub.js";
|
|
3
|
-
import {
|
|
4
|
-
import { s as y } from "../softmax-
|
|
5
|
-
import { m as z, l as v } from "../log_sum_exp-
|
|
3
|
+
import { z as C, t as u, A as E, c as G } from "../index-BzFyqcy-.js";
|
|
4
|
+
import { s as y } from "../softmax-D7Jj3p_P.js";
|
|
5
|
+
import { m as z, l as v } from "../log_sum_exp-DO6z8tSE.js";
|
|
6
6
|
function k(t, s) {
|
|
7
7
|
return u(() => {
|
|
8
8
|
const n = t.shape[t.shape.length - 1], c = t.shape.slice(0, -1).reduce((o, e) => o * e, 1), h = t.shape.length > 2 ? t.reshape([c, n]) : t, p = s.shape.length > 1 ? s.reshape([c]).cast("int32") : s.cast("int32"), r = z(h, -1, !0), a = G(h, r), d = v(a, -1);
|
package/dist/utilities/dummy.js
CHANGED
|
@@ -1,5 +1,5 @@
|
|
|
1
|
-
import { m as y, v as P, e as S } from "../index-
|
|
2
|
-
import { z as i } from "../zeros-
|
|
1
|
+
import { m as y, v as P, e as S } from "../index-BzFyqcy-.js";
|
|
2
|
+
import { z as i } from "../zeros-Bj5rMYA7.js";
|
|
3
3
|
async function w(s) {
|
|
4
4
|
const t = i([1, s.config.blockSize], "int32"), [e, n] = s.forward({ training: !1 }, t);
|
|
5
5
|
await e.data(), e.dispose(), n && n.dispose(), t.dispose();
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
export default function topP(probs: number[][], tP: number): number[];
|
|
@@ -0,0 +1,13 @@
|
|
|
1
|
+
function c(s, a) {
|
|
2
|
+
const t = s[0].map((o, r) => ({ prob: o, index: r })).sort((o, r) => r.prob - o.prob);
|
|
3
|
+
let n = 0;
|
|
4
|
+
const e = new Array(t.length).fill(0);
|
|
5
|
+
for (const o of t)
|
|
6
|
+
if (n += o.prob, e[o.index] = o.prob, n >= a)
|
|
7
|
+
break;
|
|
8
|
+
const b = e.reduce((o, r) => o + r, 0);
|
|
9
|
+
return e.map((o) => o / b);
|
|
10
|
+
}
|
|
11
|
+
export {
|
|
12
|
+
c as default
|
|
13
|
+
};
|
|
@@ -1,5 +1,5 @@
|
|
|
1
|
-
import "../index-
|
|
2
|
-
import { t as p } from "../tensor-
|
|
1
|
+
import "../index-BzFyqcy-.js";
|
|
2
|
+
import { t as p } from "../tensor-CZr4dh61.js";
|
|
3
3
|
function h(n) {
|
|
4
4
|
const e = n.reduce((s, o) => s + o.length, 0), a = new Float32Array(e);
|
|
5
5
|
let t = 0;
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
import {
|
|
1
|
+
import { E as m, F as r, a4 as l, G as c, aa as i, M as p, ab as u, j as f } from "./index-BzFyqcy-.js";
|
|
2
2
|
/**
|
|
3
3
|
* @license
|
|
4
4
|
* Copyright 2020 Google LLC. All Rights Reserved.
|