@genai-fi/nanogpt 0.15.2 → 0.15.3
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/Generator.js +42 -41
- package/dist/{RealDiv-CJpH9Bif.js → RealDiv-Blil1IAl.js} +7 -7
- package/dist/{Reshape-CKzb2DIN.js → Reshape-CZVlscuS.js} +2 -2
- package/dist/{Reshape-C4ZzbS5c.js → Reshape-rNDnWBJS.js} +1 -1
- package/dist/TeachableLLM.js +10 -10
- package/dist/{axis_util-BBaWKQoo.js → axis_util-BTeTGnZF.js} +1 -1
- package/dist/backend.js +2 -2
- package/dist/backend_util-DGV1tIji.js +425 -0
- package/dist/{backend_webgpu-BwfUOSiJ.js → backend_webgpu-WReHKYZJ.js} +3 -3
- package/dist/{broadcast_to-CxKUM6zp.js → broadcast_to-BHFjzMSF.js} +2 -2
- package/dist/checks/appendCache.js +2 -2
- package/dist/checks/attentionMask.js +3 -3
- package/dist/checks/gelu.js +2 -2
- package/dist/checks/matMulGelu.js +2 -2
- package/dist/checks/normRMS.js +4 -4
- package/dist/checks/normRMSGrad.js +3 -3
- package/dist/checks/packUnpack.js +2 -2
- package/dist/checks/qkv.js +2 -2
- package/dist/checks/rope.js +2 -2
- package/dist/{clip_by_value-lDwNWeyI.js → clip_by_value-q6njgxYg.js} +1 -1
- package/dist/{complex-NXAORdbW.js → complex-W1ugWfNb.js} +1 -1
- package/dist/{concat-DCm6KW65.js → concat-ByAvdM_j.js} +1 -1
- package/dist/{concat_util-DT0Mofs3.js → concat_util-Bk6ay4Ob.js} +1 -1
- package/dist/data/parquet.js +1 -1
- package/dist/{dataset-Bwcib9pp.js → dataset-CtujTjY_.js} +3 -3
- package/dist/{dropout_util-Crmm4aOV.js → dropout_util-D1mAkyan.js} +1 -1
- package/dist/{expand_dims-DgU0Vlpg.js → expand_dims-B_9x_xWm.js} +1 -1
- package/dist/{exports_initializers-VKuLTIiX.js → exports_initializers-Br2S2v4K.js} +1 -1
- package/dist/{floor-Bhmfrtly.js → floor-DJ37xPdi.js} +1 -1
- package/dist/{gather-FIoUa4Zd.js → gather-DvRBFTfQ.js} +1 -1
- package/dist/{gelu-CmkPheOK.js → gelu-Bq6zXPEw.js} +1 -1
- package/dist/{gpgpu_math-D83bWKYw.js → gpgpu_math-C0Hfh1As.js} +7 -7
- package/dist/{index-nwvWLdRt.js → index-BSjeovee.js} +105 -104
- package/dist/{index-D0b5F1JD.js → index-BU-PZJ0l.js} +311 -315
- package/dist/{index-CSl8jhsR.js → index-CynxJ6AT.js} +83 -83
- package/dist/{index-lJWNfe6P.js → index-SkD4n5bj.js} +1 -1
- package/dist/{kernel_funcs_utils-Bu6bS4D_.js → kernel_funcs_utils-BNsajF26.js} +3 -3
- package/dist/layers/BaseLayer.js +1 -1
- package/dist/layers/CausalSelfAttention.js +6 -6
- package/dist/layers/LoRA.js +5 -5
- package/dist/layers/MLP.js +4 -4
- package/dist/layers/PositionEmbedding.js +5 -5
- package/dist/layers/RMSNorm.js +3 -3
- package/dist/layers/RoPECache.js +4 -4
- package/dist/layers/TiedEmbedding.js +6 -6
- package/dist/layers/TransformerBlock.js +1 -1
- package/dist/layers/WeightStore.js +3 -3
- package/dist/loader/loadTransformers.js +1 -1
- package/dist/loader/oldZipLoad.js +9 -9
- package/dist/main.js +9 -9
- package/dist/{matMul16-bI7XM831.js → matMul16-qjE_mKX8.js} +6 -6
- package/dist/{matMulGelu-Cbtq3pxJ.js → matMulGelu-BM8qerU0.js} +4 -4
- package/dist/{mat_mul-BQY_GSqm.js → mat_mul-dDBRouCf.js} +1 -1
- package/dist/{mod-ChddM4vN.js → mod-COvikySw.js} +1 -1
- package/dist/models/NanoGPTV1.js +2 -2
- package/dist/models/NanoGPTV2.js +2 -2
- package/dist/models/model.js +9 -9
- package/dist/{not_equal-duCIyEXv.js → not_equal-C7_nnOW4.js} +5 -5
- package/dist/{ones-Piv0gZxv.js → ones-B0Fr32MP.js} +3 -3
- package/dist/ops/adamAdjust.js +1 -1
- package/dist/ops/adamMoments.js +1 -1
- package/dist/ops/add16.js +1 -1
- package/dist/ops/appendCache.js +3 -3
- package/dist/ops/attentionMask.js +1 -1
- package/dist/ops/concat16.js +2 -2
- package/dist/ops/cpu/adamAdjust.js +1 -1
- package/dist/ops/cpu/adamMoments.js +2 -2
- package/dist/ops/cpu/appendCache.js +2 -2
- package/dist/ops/cpu/attentionMask.js +6 -6
- package/dist/ops/cpu/fusedSoftmax.js +2 -2
- package/dist/ops/cpu/gatherSub.js +3 -3
- package/dist/ops/cpu/gelu.js +1 -1
- package/dist/ops/cpu/matMul16.js +2 -2
- package/dist/ops/cpu/matMulGelu.js +3 -3
- package/dist/ops/cpu/matMulMul.js +1 -1
- package/dist/ops/cpu/mulDropout.js +1 -1
- package/dist/ops/cpu/normRMS.js +1 -1
- package/dist/ops/cpu/qkv.js +3 -3
- package/dist/ops/cpu/rope.js +5 -5
- package/dist/ops/cpu/scatterSub.js +5 -5
- package/dist/ops/dot16.js +2 -2
- package/dist/ops/dropout.js +3 -3
- package/dist/ops/dropout16.js +1 -1
- package/dist/ops/gatherSub.js +1 -1
- package/dist/ops/gelu.js +2 -2
- package/dist/ops/globalNorm.js +2 -2
- package/dist/ops/grads/add16.js +1 -1
- package/dist/ops/grads/attentionMask.js +2 -2
- package/dist/ops/grads/dropout16.js +1 -1
- package/dist/ops/grads/gelu.js +2 -2
- package/dist/ops/grads/matMul16.js +3 -3
- package/dist/ops/grads/matMulGelu.js +1 -1
- package/dist/ops/grads/mul16.js +1 -1
- package/dist/ops/grads/normRMS.js +1 -1
- package/dist/ops/grads/pack16.js +3 -3
- package/dist/ops/grads/qkv.js +3 -3
- package/dist/ops/grads/rope.js +2 -2
- package/dist/ops/grads/softmax16.js +1 -1
- package/dist/ops/grads/unpack16.js +2 -2
- package/dist/ops/matMul16.js +3 -3
- package/dist/ops/matMulGelu.js +2 -2
- package/dist/ops/matMulMul.js +1 -1
- package/dist/ops/mul16.js +1 -1
- package/dist/ops/mulDrop.js +1 -1
- package/dist/ops/normRMS.js +1 -1
- package/dist/ops/pack16.js +2 -2
- package/dist/ops/qkv.js +1 -1
- package/dist/ops/reshape16.js +2 -2
- package/dist/ops/rope.js +2 -2
- package/dist/ops/scatterSub.js +1 -1
- package/dist/ops/slice16.js +2 -2
- package/dist/ops/softmax16.js +1 -1
- package/dist/ops/sub16.js +1 -1
- package/dist/ops/sum16.js +2 -2
- package/dist/ops/transpose16.js +3 -3
- package/dist/ops/unpack16.js +2 -2
- package/dist/ops/webgl/adamAdjust.js +2 -2
- package/dist/ops/webgl/adamMoments.js +1 -1
- package/dist/ops/webgl/appendCache.js +1 -1
- package/dist/ops/webgl/attentionMask.js +1 -1
- package/dist/ops/webgl/dropout16.js +1 -1
- package/dist/ops/webgl/fusedSoftmax.js +4 -4
- package/dist/ops/webgl/gatherSub.js +1 -1
- package/dist/ops/webgl/gelu.js +2 -2
- package/dist/ops/webgl/log.js +3 -3
- package/dist/ops/webgl/matMul16.js +5 -5
- package/dist/ops/webgl/matMulGelu.js +4 -4
- package/dist/ops/webgl/matMulMul.js +2 -2
- package/dist/ops/webgl/mulDropout.js +1 -1
- package/dist/ops/webgl/normRMS.js +2 -2
- package/dist/ops/webgl/qkv.js +1 -1
- package/dist/ops/webgl/rope.js +1 -1
- package/dist/ops/webgl/scatterSub.js +1 -1
- package/dist/ops/webgpu/adamAdjust.js +3 -3
- package/dist/ops/webgpu/adamMoments.js +3 -3
- package/dist/ops/webgpu/add16.js +1 -1
- package/dist/ops/webgpu/appendCache.js +3 -3
- package/dist/ops/webgpu/attentionMask.js +2 -2
- package/dist/ops/webgpu/attentionMask32_program.js +2 -2
- package/dist/ops/webgpu/clipScale.js +1 -1
- package/dist/ops/webgpu/concat16.js +5 -5
- package/dist/ops/webgpu/dropout16.js +3 -3
- package/dist/ops/webgpu/gatherSub.js +3 -3
- package/dist/ops/webgpu/gelu.js +3 -3
- package/dist/ops/webgpu/matMul16.js +5 -5
- package/dist/ops/webgpu/matMul16_program.js +2 -2
- package/dist/ops/webgpu/mul16.js +1 -1
- package/dist/ops/webgpu/norm2.js +1 -1
- package/dist/ops/webgpu/normRMS.js +2 -2
- package/dist/ops/webgpu/normRMSGrad.js +4 -4
- package/dist/ops/webgpu/pack16.js +1 -1
- package/dist/ops/webgpu/pack16_program.js +2 -2
- package/dist/ops/webgpu/qkv.js +2 -2
- package/dist/ops/webgpu/rope.js +3 -3
- package/dist/ops/webgpu/scatterSub.js +3 -3
- package/dist/ops/webgpu/slice16.js +4 -4
- package/dist/ops/webgpu/softmax16.js +2 -2
- package/dist/ops/webgpu/softmax16_program.js +2 -2
- package/dist/ops/webgpu/softmax16_subgroup_program.js +2 -2
- package/dist/ops/webgpu/softmax16grad.js +1 -1
- package/dist/ops/webgpu/sub16.js +1 -1
- package/dist/ops/webgpu/sum16.js +3 -3
- package/dist/ops/webgpu/transpose16.js +2 -2
- package/dist/ops/webgpu/transpose16_program.js +2 -2
- package/dist/ops/webgpu/transpose16_shared_program.js +3 -3
- package/dist/ops/webgpu/unpack16.js +3 -3
- package/dist/ops/webgpu/utils/binary_op.js +3 -3
- package/dist/ops/webgpu/utils/reductions.js +5 -5
- package/dist/{ops-BXr-37bF.js → ops-DJqZQEpR.js} +86 -86
- package/dist/{pack16-DO9GrRdk.js → pack16-CQUYvE0Y.js} +2 -2
- package/dist/{parquet-BNNuofNs.js → parquet-CXSmguvD.js} +2065 -2065
- package/dist/patches/webgpu_backend.js +4 -4
- package/dist/patches/webgpu_base.js +1 -1
- package/dist/patches/webgpu_program.js +2 -2
- package/dist/{random_normal-CO9xf9dz.js → random_normal-m_v8bCWs.js} +1 -1
- package/dist/{random_width-CliSj-et.js → random_width-DvNaD5W3.js} +131 -131
- package/dist/{range-Dx4PwA2-.js → range-HI-DFEwl.js} +1 -1
- package/dist/{readers-DwZhCW0C.js → readers-EC5q8HtM.js} +2 -2
- package/dist/{relu-BnpM8PVa.js → relu-CdxfMLya.js} +1 -1
- package/dist/{reshape-DVh8yLpI.js → reshape-Dxch7IXb.js} +1 -1
- package/dist/{resize_nearest_neighbor-Dl7ehaQl.js → resize_nearest_neighbor-B8XxmKCX.js} +34 -34
- package/dist/{rope-DjON_IMj.js → rope-DaRtCQFa.js} +1 -1
- package/dist/{scatter_nd_util-SSoGmfpx.js → scatter_nd_util-DJ8GpL1I.js} +1 -1
- package/dist/segment_util-CXELxApp.js +43 -0
- package/dist/{selu_util-C0DN3KhX.js → selu_util-CPAAI9PC.js} +5 -5
- package/dist/{shared-DgNUoqSc.js → shared-DORJR6eU.js} +45 -45
- package/dist/{shared-CefTy5O1.js → shared-DVZEsT-0.js} +1 -1
- package/dist/{slice-BluUPHKL.js → slice-DR1nQEmX.js} +1 -1
- package/dist/slice_util-DDbd6eyd.js +153 -0
- package/dist/{softmax-HULrSwJC.js → softmax-CRzm-wNL.js} +1 -1
- package/dist/{split-QwVeUPZt.js → split-B3dYPTIQ.js} +1 -1
- package/dist/{squeeze-Brkwo5OI.js → squeeze-D8r4RiDQ.js} +2 -2
- package/dist/{stack-C_8ubcjt.js → stack-CVsp4-gn.js} +1 -1
- package/dist/{step-wz0MZ7BP.js → step-A_sBP7En.js} +1 -1
- package/dist/{sum-iKJXG43N.js → sum-DfuUvBem.js} +1 -1
- package/dist/{tensor-Dfy8cN1y.js → tensor-Gz_zmSjb.js} +1 -1
- package/dist/{tensor1d-CoOFcAZs.js → tensor1d-D218DD0-.js} +1 -1
- package/dist/{tensor2d-C8gFDiIC.js → tensor2d-BieJDjvb.js} +1 -1
- package/dist/{tensor4d-Bvqzr_Wu.js → tensor4d-Bptdqjb1.js} +1 -1
- package/dist/{tfjs_backend-9QO-TAAZ.js → tfjs_backend-DmRY5T6A.js} +29 -29
- package/dist/{tile-CcpklBqG.js → tile-ksYNlaAo.js} +1 -1
- package/dist/training/AdamW.js +2 -2
- package/dist/training/BasicTrainer.js +2 -2
- package/dist/training/DatasetBuilder.js +3 -3
- package/dist/training/Evaluator.js +2 -2
- package/dist/training/SFTDatasetBuilder.js +3 -3
- package/dist/training/orthoGrad.js +1 -1
- package/dist/training/sparseCrossEntropy.js +4 -4
- package/dist/training/validation.js +9 -9
- package/dist/{transpose-CwEYsCv1.js → transpose-C4a4Zcdu.js} +2 -2
- package/dist/{unsorted_segment_sum-DRVX2bX2.js → unsorted_segment_sum-Cx23B-vz.js} +14 -14
- package/dist/utilities/dummy.js +2 -2
- package/dist/utilities/multinomialCPU.js +2 -2
- package/dist/utilities/packed.js +1 -1
- package/dist/utilities/performance.js +1 -1
- package/dist/utilities/profile.js +1 -1
- package/dist/utilities/safetensors.js +2 -2
- package/dist/utilities/sentences.js +5 -5
- package/dist/utilities/weights.js +2 -2
- package/dist/{variable-CqrRzzxM.js → variable-BEihhVWu.js} +1 -1
- package/dist/{webgpu_program-BlAY4Q29.js → webgpu_program-BhNO5Knw.js} +1 -1
- package/dist/{webgpu_util-D1Ynuktt.js → webgpu_util-CASYKKsD.js} +1 -1
- package/dist/{zeros-B8VPk-mx.js → zeros-CkHJh2fz.js} +2 -2
- package/dist/{zeros_like-DfWM-ezN.js → zeros_like-CGnKYJEe.js} +62 -62
- package/package.json +1 -1
- package/dist/backend_util-DLIicY0X.js +0 -473
- package/dist/slice_util-DK4kHJjN.js +0 -261
package/dist/Generator.js
CHANGED
|
@@ -1,40 +1,41 @@
|
|
|
1
1
|
import { E as Ui } from "./index-DvYrXKkX.js";
|
|
2
|
-
import { o as Hi, q as Xi, E as Ki,
|
|
3
|
-
import { n as Mc } from "./random_width-
|
|
4
|
-
import { t as Bc } from "./zeros_like-
|
|
2
|
+
import { o as Hi, q as Xi, E as Ki, dl as Ss, a5 as pe, ab as _, as as oo, at as ao, e as Oe, aY as Dt, ay as ro, az as io, au as ji, av as Ft, aD as Ge, ae as co, aG as ws, aH as qi, U as G, af as _e, aI as Yi, H as Ns, aJ as Rs, R as Qi, aj as Zi, x as te, D as lo, _ as Ne, a9 as ee, bb as uo, c7 as Ts, c8 as Es, cO as po, bm as ho, ah as ue, Q as Ye, bn as fo, bo as mo, c9 as go, ca as Ds, cb as Fs, cc as Ps, cd as Os, ce as As, bp as xo, ac as nt, cy as Co, cP as bo, cQ as Io, bs as yo, br as ko, bd as $o, de as vo, C as _s, cS as So, ao as wo, z as No, bt as Ro, c2 as $e, cD as To, bu as Eo, cz as Do, cT as Fo, cA as Po, bv as Ls, bw as Vs, bf as Oo, bx as Ao, am as Qe, V as Ji, by as _o, cB as Lo, cf as Vo, bz as Wo, cF as Mo, cG as Bo, df as Go, cg as zo, bX as ns, bR as St, bU as Ws, cU as yn, dt as ut, du as Uo, cV as kn, dg as ec, N as tc, be as Ho, cW as Xo, bB as Ms, A as Ko, aX as jo, aV as mt, cp as qo, dc as Yo, dd as Qo, bg as Zo, cE as Jo, di as ea, al as ta, G as sa, cq as na, ch as Bs, ci as Gs, cj as zs, dj as oa, b3 as Us, b4 as Hs, bD as Xs, cl as Ks, ck as aa, cY as ra, aM as sc, bE as ia, cC as ca, cZ as la, c_ as ua, dk as da, aP as pa, aZ as ha, cm as fa, bQ as ma, M as js, I as ga, bi as xa, bk as Ca, bj as ba, bF as Ia, d3 as ya, bG as ka, P as $a, a6 as va, bH as Sa, c$ as qs, dv as wa, dw as Na, dx as Ra, Z as Ta, cn as Ys, b9 as Ea, d0 as Da, ba as Fa, d1 as Pa, bJ as Oa, bh as Aa, b6 as Qs, ak as _a, dm as La, aL as Va, bL as Zs, co as Js, bM as en, bN as tn, bC as sn, bI as Wa, dy as Ma, dz as Ba, dn as Ga, dp as za, dq as Ua, J as Ha, d2 as Xa, aK as nn, cr as Ka, dr as ja, dA as qa, dB as Ya, cs as on, bq as an, ds as Qa, T as Za, ct as Ja, bl as er, dC as rn, cu as tr, b8 as sr, bO as nr, c as or, dD as ar, dE as $n, aw as vn, ax as nc, t as rr, a as oc, dF as ac, dG as rc, c0 as ic, ar as cc, bP as lc, bV as uc, S as dc, bW as pc, aQ as hc, aq as fc, bS as mc, bT as gc, bY as xc, aS as ir, bA as Cc, aN as bc, bZ as Ic, F as yc, b_ as kc, dh as $c, a$ as vc, b0 as Sc, b1 as wc, b2 as Nc, aO as Rc, b$ as Tc, b5 as Ec, c5 as Dc, ap as Fc, c1 as Pc, aW as cr, bK as Oc, aF as Ac, c3 as _c, b7 as Lc, c4 as Vc, k as Wc } from "./index-BU-PZJ0l.js";
|
|
3
|
+
import { n as Mc } from "./random_width-DvNaD5W3.js";
|
|
4
|
+
import { t as Bc } from "./zeros_like-CGnKYJEe.js";
|
|
5
5
|
import "./index-Cp39cXWe.js";
|
|
6
|
-
import "./dataset-
|
|
7
|
-
import { a as j, u as ae, c as ot, i as at, b as Gc, d as wt, t as Re, e as gt, f as dt, g as lr, r as Nt, h as Ae, j as zc, k as Uc, l as cn, z as Hc, m as ln, n as ur, o as Xc, p as Kc, q as jc, v as qc, w as Yc, x as Qc, y as Zc, A as Jc, B as el, C as tl, D as lt, E as sl, F as nl, G as dr, H as ol, I as al, J as rl, K as il, L as cl, M as ll, N as ul, O as dl, P as pl, Q as hl, R as fl, S as ml, T as gl, U as xl, V as Cl, W as bl, X as Il, Y as yl, Z as kl, _ as $l, $ as vl, a0 as Sl, a1 as wl, a2 as Nl, a3 as Rl, a4 as Tl, a5 as El, a6 as Dl, a7 as Fl, a8 as Pl, a9 as Ol, aa as Al, ab as _l, ac as Ll, ad as Vl, ae as Wl, af as Ml, ag as Bl, ah as Gl, ai as zl } from "./shared-
|
|
6
|
+
import "./dataset-CtujTjY_.js";
|
|
7
|
+
import { a as j, u as ae, c as ot, i as at, b as Gc, d as wt, t as Re, e as gt, f as dt, g as lr, r as Nt, h as Ae, j as zc, k as Uc, l as cn, z as Hc, m as ln, n as ur, o as Xc, p as Kc, q as jc, v as qc, w as Yc, x as Qc, y as Zc, A as Jc, B as el, C as tl, D as lt, E as sl, F as nl, G as dr, H as ol, I as al, J as rl, K as il, L as cl, M as ll, N as ul, O as dl, P as pl, Q as hl, R as fl, S as ml, T as gl, U as xl, V as Cl, W as bl, X as Il, Y as yl, Z as kl, _ as $l, $ as vl, a0 as Sl, a1 as wl, a2 as Nl, a3 as Rl, a4 as Tl, a5 as El, a6 as Dl, a7 as Fl, a8 as Pl, a9 as Ol, aa as Al, ab as _l, ac as Ll, ad as Vl, ae as Wl, af as Ml, ag as Bl, ah as Gl, ai as zl } from "./shared-DORJR6eU.js";
|
|
8
8
|
import { m as pt, g as pr, s as Ul, c as Hl, b as Xl, d as Kl, a as jl, e as ql } from "./complex_util-Yc1A_gV1.js";
|
|
9
|
-
import { a as ge, b as xe, d as ke, c as ve, e as Te, g as os } from "./axis_util-
|
|
10
|
-
import { k as Ze, h as Le, i as Je, j as rt, b as Se, d as xt, g as as } from "./step-
|
|
11
|
-
import { z as rs, A as is, B as cs, C as hr, D as fr, F as mr, G as gr, H as xr, I as Cr, J as br, y as Ir, x as yr, w as kr, u as $r, t as vr, E as Sr, K as wr, L as Nr, M as Rr,
|
|
12
|
-
import { a as
|
|
9
|
+
import { a as ge, b as xe, d as ke, c as ve, e as Te, g as os } from "./axis_util-BTeTGnZF.js";
|
|
10
|
+
import { k as Ze, h as Le, i as Je, j as rt, b as Se, d as xt, g as as } from "./step-A_sBP7En.js";
|
|
11
|
+
import { z as rs, A as is, B as cs, C as hr, D as fr, F as mr, G as gr, H as xr, I as Cr, J as br, y as Ir, x as yr, w as kr, u as $r, t as vr, E as Sr, K as wr, L as Nr, M as Rr, c as Tr, f as Yl } from "./backend_util-DGV1tIji.js";
|
|
12
|
+
import { a as Er, c as Ue } from "./concat_util-Bk6ay4Ob.js";
|
|
13
|
+
import { c as Dr, a as Ql, s as Zl } from "./segment_util-CXELxApp.js";
|
|
13
14
|
import { s as Jl } from "./index-CieiGp4Y.js";
|
|
14
15
|
import { n as Fr, b as Pr, a as Or } from "./non_max_suppression_impl-B2W7YjZB.js";
|
|
15
|
-
import { c as Ct } from "./scatter_nd_util-
|
|
16
|
-
import { S as Ar, a as _r } from "./selu_util-
|
|
17
|
-
import {
|
|
18
|
-
import { h as Sn, j as ou, k as au, l as ru, m as iu, n as cu, o as lu, P as un, p as Ve, u as Pe, q as Wr, c as Mr, T as De, E as Br, g as Gr, a as zr, r as uu, s as du, t as Y, v as
|
|
19
|
-
import { s as Hr, a as Fu, t as Xr, b as Pu, c as Ou, d as Kr, e as Au, n as _u, f as Lu, g as Vu, h as Wu, i as Mu, j as Bu, k as Gu, l as zu, o as Uu, p as Hu, q as Xu, r as Ku, u as ju, v as qu, w as Yu, x as Qu, y as Zu, z as Ju, A as ed, B as td, C as sd, D as nd, E as od, F as ad, G as rd, H as id, I as cd, J as ld, K as ud, L as dd, M as jr, N as pd, O as hd, P as fd, Q as md, R as gd, S as xd, T as Cd, U as bd, V as Id, W as yd } from "./shared-
|
|
20
|
-
import { a as ye, c as kd, U as st, d as qe, e as ze, A as En, f as bt, B as dn, h as pn, m as Rt, u as se, C as We, b as Ce, i as Fe, j as hn, k as it, l as It, n as $d, o as vd, p as Sd, q as wd } from "./kernel_funcs_utils-
|
|
21
|
-
import { R as Nd, r as U, a as Rd } from "./Reshape-
|
|
22
|
-
import { M as qr } from "./matMulGelu-
|
|
23
|
-
import { t as Yr, s as fn, a as _t, m as Td, r as Ed, b as Dd, c as Fd, d as Pd } from "./RealDiv-
|
|
24
|
-
import { z as Od } from "./zeros-
|
|
16
|
+
import { c as Ct } from "./scatter_nd_util-DJ8GpL1I.js";
|
|
17
|
+
import { S as Ar, a as _r } from "./selu_util-CPAAI9PC.js";
|
|
18
|
+
import { s as Lr, b as Vr, p as eu, a as tu, i as su, c as nu } from "./slice_util-DDbd6eyd.js";
|
|
19
|
+
import { h as Sn, j as ou, k as au, l as ru, m as iu, n as cu, o as lu, P as un, p as Ve, u as Pe, q as Wr, c as Mr, T as De, E as Br, g as Gr, a as zr, r as uu, s as du, t as Y, v as pu, w as wn, x as hu, y as fu, z as Pt, A as Ot, B as mu, C as gu, D as bs, F as Gt, G as zt, H as xu, I as Cu, J as Nn, K as bu, L as Iu, M as fs, N as yu, O as ku, Q as $u, R as Ut, S as ms, U as vu, f as he, V as be, W as Ht, X as Xt, Y as Su, d as Rn, e as Tn, i as Ur, Z as wu, _ as Nu, $ as Ru, a0 as Tu, a1 as Eu, a2 as Du, a3 as At } from "./gpgpu_math-C0Hfh1As.js";
|
|
20
|
+
import { s as Hr, a as Fu, t as Xr, b as Pu, c as Ou, d as Kr, e as Au, n as _u, f as Lu, g as Vu, h as Wu, i as Mu, j as Bu, k as Gu, l as zu, o as Uu, p as Hu, q as Xu, r as Ku, u as ju, v as qu, w as Yu, x as Qu, y as Zu, z as Ju, A as ed, B as td, C as sd, D as nd, E as od, F as ad, G as rd, H as id, I as cd, J as ld, K as ud, L as dd, M as jr, N as pd, O as hd, P as fd, Q as md, R as gd, S as xd, T as Cd, U as bd, V as Id, W as yd } from "./shared-DVZEsT-0.js";
|
|
21
|
+
import { a as ye, c as kd, U as st, d as qe, e as ze, A as En, f as bt, B as dn, h as pn, m as Rt, u as se, C as We, b as Ce, i as Fe, j as hn, k as it, l as It, n as $d, o as vd, p as Sd, q as wd } from "./kernel_funcs_utils-BNsajF26.js";
|
|
22
|
+
import { R as Nd, r as U, a as Rd } from "./Reshape-CZVlscuS.js";
|
|
23
|
+
import { M as qr } from "./matMulGelu-BM8qerU0.js";
|
|
24
|
+
import { t as Yr, s as fn, a as _t, m as Td, r as Ed, b as Dd, c as Fd, d as Pd } from "./RealDiv-Blil1IAl.js";
|
|
25
|
+
import { z as Od } from "./zeros-CkHJh2fz.js";
|
|
25
26
|
import "./ops/cpu/attentionMask.js";
|
|
26
27
|
import "./ops/webgl/attentionMask.js";
|
|
27
28
|
import "./ops/grads/attentionMask.js";
|
|
28
29
|
import "./ops/cpu/rope.js";
|
|
29
30
|
import "./ops/webgl/rope.js";
|
|
30
|
-
import "./rope-
|
|
31
|
+
import "./rope-DaRtCQFa.js";
|
|
31
32
|
import "./ops/cpu/appendCache.js";
|
|
32
33
|
import "./ops/webgl/appendCache.js";
|
|
33
34
|
import "./ops/grads/softmax16.js";
|
|
34
|
-
import "./matMul16-
|
|
35
|
+
import "./matMul16-qjE_mKX8.js";
|
|
35
36
|
import "./ops/webgl/matMul16.js";
|
|
36
37
|
import "./ops/cpu/matMul16.js";
|
|
37
|
-
import "./pack16-
|
|
38
|
+
import "./pack16-CQUYvE0Y.js";
|
|
38
39
|
import "./ops/transpose16.js";
|
|
39
40
|
import "./ops/reshape16.js";
|
|
40
41
|
import "./ops/cpu/qkv.js";
|
|
@@ -64,17 +65,17 @@ import "./ops/cpu/matMulGelu.js";
|
|
|
64
65
|
import "./ops/grads/matMulGelu.js";
|
|
65
66
|
import "./ops/cpu/gelu.js";
|
|
66
67
|
import "./ops/webgl/gelu.js";
|
|
67
|
-
import "./gelu-
|
|
68
|
+
import "./gelu-Bq6zXPEw.js";
|
|
68
69
|
import "./ops/webgl/log.js";
|
|
69
70
|
import "./checks/normRMS.js";
|
|
70
71
|
import "./checks/normRMSGrad.js";
|
|
71
72
|
import Wd from "./utilities/multinomialCPU.js";
|
|
72
|
-
import { r as Dn } from "./reshape-
|
|
73
|
-
import { t as Kt } from "./tensor2d-
|
|
74
|
-
import { z as Md } from "./unsorted_segment_sum-
|
|
75
|
-
import { s as gs } from "./softmax-
|
|
76
|
-
import { g as Bd } from "./gather-
|
|
77
|
-
import { c as Gd } from "./concat-
|
|
73
|
+
import { r as Dn } from "./reshape-Dxch7IXb.js";
|
|
74
|
+
import { t as Kt } from "./tensor2d-BieJDjvb.js";
|
|
75
|
+
import { z as Md } from "./unsorted_segment_sum-Cx23B-vz.js";
|
|
76
|
+
import { s as gs } from "./softmax-CRzm-wNL.js";
|
|
77
|
+
import { g as Bd } from "./gather-DvRBFTfQ.js";
|
|
78
|
+
import { c as Gd } from "./concat-ByAvdM_j.js";
|
|
78
79
|
function zd(a, t, e, n = !1) {
|
|
79
80
|
const s = Xi(a, "logits", "multinomial"), o = s.size, r = s.rank;
|
|
80
81
|
if (o < 2)
|
|
@@ -847,7 +848,7 @@ const jp = {
|
|
|
847
848
|
};
|
|
848
849
|
function ft(a) {
|
|
849
850
|
const { inputs: t, backend: e, attrs: n } = a, { axis: s } = n, o = ue(s, t[0].shape)[0], r = t.map((m) => m.shape);
|
|
850
|
-
|
|
851
|
+
Er(r, o);
|
|
851
852
|
let c = Ue(t.map((m) => m.shape), o);
|
|
852
853
|
if (G(c) === 0)
|
|
853
854
|
return e.makeTensorInfo(c, t[0].dtype, []);
|
|
@@ -1857,7 +1858,7 @@ function lf(a) {
|
|
|
1857
1858
|
}
|
|
1858
1859
|
let p = c;
|
|
1859
1860
|
c == null && (p = 0);
|
|
1860
|
-
const d = G(o.shape), h =
|
|
1861
|
+
const d = G(o.shape), h = Dr(s, o, i, p), f = ce({
|
|
1861
1862
|
inputs: { x: s },
|
|
1862
1863
|
backend: e,
|
|
1863
1864
|
attrs: {
|
|
@@ -2591,7 +2592,7 @@ const Gm = {
|
|
|
2591
2592
|
kernelName: Aa,
|
|
2592
2593
|
backendName: "cpu",
|
|
2593
2594
|
kernelFunc: ({ inputs: a, attrs: t, backend: e }) => {
|
|
2594
|
-
const { image: n } = a, { radians: s, fillValue: o, center: r } = t, c = e, i = _e(n.dtype, G(n.shape)), [l, u, p, d] = n.shape, [h, f] =
|
|
2595
|
+
const { image: n } = a, { radians: s, fillValue: o, center: r } = t, c = e, i = _e(n.dtype, G(n.shape)), [l, u, p, d] = n.shape, [h, f] = Nr(r, u, p), m = 255, x = Math.sin(s), g = Math.cos(s), C = c.data.get(n.dataId).values;
|
|
2595
2596
|
for (let b = 0; b < l; b++) {
|
|
2596
2597
|
const y = b * p * u * d;
|
|
2597
2598
|
for (let k = 0; k < u; k++) {
|
|
@@ -2850,7 +2851,7 @@ const vg = {
|
|
|
2850
2851
|
kernelFunc: $g
|
|
2851
2852
|
};
|
|
2852
2853
|
function Sg(a) {
|
|
2853
|
-
const { inputs: t, backend: e, attrs: n } = a, { x: s } = t, { numOrSizeSplits: o, axis: r } = n, c = ue(r, s.shape)[0], i =
|
|
2854
|
+
const { inputs: t, backend: e, attrs: n } = a, { x: s } = t, { numOrSizeSplits: o, axis: r } = n, c = ue(r, s.shape)[0], i = Rr(s, o, c), l = new Array(s.shape.length).fill(0), u = s.shape.slice();
|
|
2854
2855
|
return i.map((p) => {
|
|
2855
2856
|
const d = [...u];
|
|
2856
2857
|
d[c] = p;
|
|
@@ -5056,7 +5057,7 @@ class fC {
|
|
|
5056
5057
|
function Ii(a, t, e, n = null) {
|
|
5057
5058
|
let s = t.shape[0], o = t.shape[1];
|
|
5058
5059
|
n != null && (s = n.shape[0], o = n.shape[1]);
|
|
5059
|
-
const r =
|
|
5060
|
+
const r = Tr(o), c = { windowSize: r, inSize: o, batchSize: s, outSize: Math.ceil(o / r) }, i = new hC(c, e, n == null), l = [t];
|
|
5060
5061
|
n != null && l.push(n);
|
|
5061
5062
|
const u = a.runWebGLProgram(i, l, "int32");
|
|
5062
5063
|
if (u.shape[1] === 1)
|
|
@@ -5065,7 +5066,7 @@ function Ii(a, t, e, n = null) {
|
|
|
5065
5066
|
return a.disposeIntermediateTensorInfo(u), p;
|
|
5066
5067
|
}
|
|
5067
5068
|
function yi(a, t, e, n = null) {
|
|
5068
|
-
const s = n != null ? n.shape : t.shape, o = s[s.length - 1], r =
|
|
5069
|
+
const s = n != null ? n.shape : t.shape, o = s[s.length - 1], r = Tr(o), c = new fC(s, r, e, n == null), i = n == null ? [t] : [t, n], l = a.runWebGLProgram(c, i, "int32");
|
|
5069
5070
|
if (l.shape.length === t.shape.length) {
|
|
5070
5071
|
const u = yi(a, t, e, l);
|
|
5071
5072
|
return a.disposeIntermediateTensorInfo(l), u;
|
|
@@ -6179,7 +6180,7 @@ function Eb(a, t, e) {
|
|
|
6179
6180
|
}
|
|
6180
6181
|
function vi(a) {
|
|
6181
6182
|
const { inputs: t, backend: e, attrs: n } = a, { axis: s } = n, o = ue(s, t[0].shape)[0], r = t.map((l) => l.shape);
|
|
6182
|
-
|
|
6183
|
+
Er(r, o);
|
|
6183
6184
|
const c = Ue(t.map((l) => l.shape), o);
|
|
6184
6185
|
if (G(c) === 0)
|
|
6185
6186
|
return e.makeTensorInfo(c, t[0].dtype, []);
|
|
@@ -8582,7 +8583,7 @@ function Oi(a) {
|
|
|
8582
8583
|
te(y <= I - 1 && y >= 0, () => `GatherV2: the index value ${y} is not in [0, ${I - 1}]`);
|
|
8583
8584
|
}
|
|
8584
8585
|
}
|
|
8585
|
-
const l =
|
|
8586
|
+
const l = Dr(s, o, i, c), u = G(o.shape), p = [], d = U({
|
|
8586
8587
|
inputs: { x: s },
|
|
8587
8588
|
backend: e,
|
|
8588
8589
|
attrs: {
|
|
@@ -10357,7 +10358,7 @@ const Ik = {
|
|
|
10357
10358
|
kernelName: Aa,
|
|
10358
10359
|
backendName: "webgl",
|
|
10359
10360
|
kernelFunc: ({ inputs: a, attrs: t, backend: e }) => {
|
|
10360
|
-
const { image: n } = a, { radians: s, fillValue: o, center: r } = t, c = e, i = new bk(n.shape, o), [l, u] =
|
|
10361
|
+
const { image: n } = a, { radians: s, fillValue: o, center: r } = t, c = e, i = new bk(n.shape, o), [l, u] = Nr(r, n.shape[1], n.shape[2]), p = [[l, u, Math.sin(s), Math.cos(s)]];
|
|
10361
10362
|
return c.runWebGLProgram(i, [n], n.dtype, p);
|
|
10362
10363
|
}
|
|
10363
10364
|
};
|
|
@@ -10772,7 +10773,7 @@ const h$ = {
|
|
|
10772
10773
|
kernelFunc: p$
|
|
10773
10774
|
};
|
|
10774
10775
|
function f$(a) {
|
|
10775
|
-
const { inputs: t, backend: e, attrs: n } = a, { x: s } = t, { numOrSizeSplits: o, axis: r } = n, c = ue(r, s.shape)[0], i =
|
|
10776
|
+
const { inputs: t, backend: e, attrs: n } = a, { x: s } = t, { numOrSizeSplits: o, axis: r } = n, c = ue(r, s.shape)[0], i = Rr(s, o, c), l = s.shape.length, u = new Array(l).fill(0), p = s.shape.slice();
|
|
10776
10777
|
return i.map((d) => {
|
|
10777
10778
|
const h = [...p];
|
|
10778
10779
|
h[c] = d;
|
|
@@ -11678,7 +11679,7 @@ const lv = [
|
|
|
11678
11679
|
function uv(a, t) {
|
|
11679
11680
|
return a.length === t ? a : a.length > t ? a.slice(0, t) : a.concat(Array(t - a.length).fill(""));
|
|
11680
11681
|
}
|
|
11681
|
-
class
|
|
11682
|
+
class AS extends Ui {
|
|
11682
11683
|
constructor(t, e) {
|
|
11683
11684
|
super(), this.model = t, this.tokeniser = e, this.actualTokeniser = e;
|
|
11684
11685
|
}
|
|
@@ -11874,6 +11875,6 @@ class OS extends Ui {
|
|
|
11874
11875
|
}
|
|
11875
11876
|
}
|
|
11876
11877
|
export {
|
|
11877
|
-
|
|
11878
|
+
AS as default,
|
|
11878
11879
|
cv as isConversation
|
|
11879
11880
|
};
|
|
@@ -1,10 +1,10 @@
|
|
|
1
|
-
import { aE as E, ab as T, ah as O, U as V, aW as B, N as F, aM as U, aX as W } from "./index-
|
|
2
|
-
import { r as $ } from "./Reshape-
|
|
3
|
-
import { a as A, b as k, d as C, c as N, e as R } from "./axis_util-
|
|
4
|
-
import { t as K, m as _ } from "./shared-
|
|
5
|
-
import { c as j } from "./backend_util-
|
|
6
|
-
import { f as y } from "./gpgpu_math-
|
|
7
|
-
import { g as G, b as L } from "./kernel_funcs_utils-
|
|
1
|
+
import { aE as E, ab as T, ah as O, U as V, aW as B, N as F, aM as U, aX as W } from "./index-BU-PZJ0l.js";
|
|
2
|
+
import { r as $ } from "./Reshape-CZVlscuS.js";
|
|
3
|
+
import { a as A, b as k, d as C, c as N, e as R } from "./axis_util-BTeTGnZF.js";
|
|
4
|
+
import { t as K, m as _ } from "./shared-DVZEsT-0.js";
|
|
5
|
+
import { c as j } from "./backend_util-DGV1tIji.js";
|
|
6
|
+
import { f as y } from "./gpgpu_math-C0Hfh1As.js";
|
|
7
|
+
import { g as G, b as L } from "./kernel_funcs_utils-BNsajF26.js";
|
|
8
8
|
class w {
|
|
9
9
|
constructor(s, e) {
|
|
10
10
|
this.variableNames = ["x"];
|
|
@@ -1,5 +1,5 @@
|
|
|
1
|
-
import { R as C, U as c, aj as R, x as f } from "./index-
|
|
2
|
-
import { u as g, g as I, a as x, b as F, c as $, d as u, e as m, i as l } from "./gpgpu_math-
|
|
1
|
+
import { R as C, U as c, aj as R, x as f } from "./index-BU-PZJ0l.js";
|
|
2
|
+
import { u as g, g as I, a as x, b as F, c as $, d as u, e as m, i as l } from "./gpgpu_math-C0Hfh1As.js";
|
|
3
3
|
class S {
|
|
4
4
|
constructor(t, i) {
|
|
5
5
|
this.variableNames = ["A"], this.packedInputs = !0, this.packedOutput = !0, this.customUniforms = [{ name: "inputShape", type: "ivec3" }], this.outputShape = t, this.enableShapeUniforms = g(this.outputShape.length);
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
import { U as h, aj as d, x as c, R as m } from "./index-
|
|
1
|
+
import { U as h, aj as d, x as c, R as m } from "./index-BU-PZJ0l.js";
|
|
2
2
|
function i(n) {
|
|
3
3
|
const { inputs: p, attrs: o } = n, { x: e } = p, { shape: r } = o, a = h(e.shape), s = d(r, a), t = h(s);
|
|
4
4
|
return c(a === t, () => `The new shape (${s}) has ${t} elements and the old shape (${e.shape}) has ${a} elements. The new shape and old shape must have the same number of elements.`), n.backend.incRef(e.dataId), { dataId: e.dataId, shape: s, dtype: e.dtype };
|
package/dist/TeachableLLM.js
CHANGED
|
@@ -5,24 +5,24 @@ import u from "./Generator.js";
|
|
|
5
5
|
import h from "./Trainer.js";
|
|
6
6
|
import { E as f } from "./index-DvYrXKkX.js";
|
|
7
7
|
import { dummyPassTrainAsync as l } from "./utilities/dummy.js";
|
|
8
|
-
import "./index-
|
|
9
|
-
import "./random_width-
|
|
10
|
-
import "./zeros_like-
|
|
8
|
+
import "./index-BU-PZJ0l.js";
|
|
9
|
+
import "./random_width-DvNaD5W3.js";
|
|
10
|
+
import "./zeros_like-CGnKYJEe.js";
|
|
11
11
|
import "./index-Cp39cXWe.js";
|
|
12
|
-
import "./dataset-
|
|
12
|
+
import "./dataset-CtujTjY_.js";
|
|
13
13
|
import "./ops/cpu/attentionMask.js";
|
|
14
14
|
import "./ops/webgl/attentionMask.js";
|
|
15
15
|
import "./ops/grads/attentionMask.js";
|
|
16
16
|
import "./ops/cpu/rope.js";
|
|
17
17
|
import "./ops/webgl/rope.js";
|
|
18
|
-
import "./rope-
|
|
18
|
+
import "./rope-DaRtCQFa.js";
|
|
19
19
|
import "./ops/cpu/appendCache.js";
|
|
20
20
|
import "./ops/webgl/appendCache.js";
|
|
21
21
|
import "./ops/grads/softmax16.js";
|
|
22
|
-
import "./matMul16-
|
|
22
|
+
import "./matMul16-qjE_mKX8.js";
|
|
23
23
|
import "./ops/webgl/matMul16.js";
|
|
24
24
|
import "./ops/cpu/matMul16.js";
|
|
25
|
-
import "./pack16-
|
|
25
|
+
import "./pack16-CQUYvE0Y.js";
|
|
26
26
|
import "./ops/transpose16.js";
|
|
27
27
|
import "./ops/reshape16.js";
|
|
28
28
|
import "./ops/cpu/qkv.js";
|
|
@@ -43,11 +43,11 @@ import "./ops/webgl/gatherSub.js";
|
|
|
43
43
|
import "./ops/cpu/scatterSub.js";
|
|
44
44
|
import "./ops/webgl/scatterSub.js";
|
|
45
45
|
import "./ops/cpu/matMulGelu.js";
|
|
46
|
-
import "./matMulGelu-
|
|
46
|
+
import "./matMulGelu-BM8qerU0.js";
|
|
47
47
|
import "./ops/grads/matMulGelu.js";
|
|
48
48
|
import "./ops/cpu/gelu.js";
|
|
49
49
|
import "./ops/webgl/gelu.js";
|
|
50
|
-
import "./gelu-
|
|
50
|
+
import "./gelu-Bq6zXPEw.js";
|
|
51
51
|
import "./ops/webgl/log.js";
|
|
52
52
|
import "./ops/cpu/adamMoments.js";
|
|
53
53
|
import "./ops/webgl/adamMoments.js";
|
|
@@ -175,7 +175,7 @@ class a {
|
|
|
175
175
|
const n = this.ee.listeners("trainStep");
|
|
176
176
|
for (const i of n)
|
|
177
177
|
await i(o);
|
|
178
|
-
}), this._trainer && this._trainer !== e && this._trainer.
|
|
178
|
+
}), this._trainer && this._trainer !== e && this._trainer.removeAllListeners(), this._trainer = e, e;
|
|
179
179
|
}
|
|
180
180
|
async train(t, r, e) {
|
|
181
181
|
const o = this.trainer(e, r);
|
package/dist/backend.js
CHANGED
|
@@ -1,9 +1,9 @@
|
|
|
1
|
-
import { g as o, s as e, r as s } from "./index-
|
|
1
|
+
import { g as o, s as e, r as s } from "./index-BU-PZJ0l.js";
|
|
2
2
|
async function c(t, a) {
|
|
3
3
|
if (o() !== t) {
|
|
4
4
|
if (t === "webgpu") {
|
|
5
5
|
const { registerWebGPUBackend: i } = await import("./patches/webgpu_base.js");
|
|
6
|
-
i(a), await import("./index-
|
|
6
|
+
i(a), await import("./index-BSjeovee.js"), await import("./ops/webgpu/index.js");
|
|
7
7
|
}
|
|
8
8
|
await e(t), await s(), console.log(`Backend set to ${t}`);
|
|
9
9
|
}
|