@genai-fi/nanogpt 0.17.4 → 0.18.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/Generator.d.ts +2 -15
- package/dist/Generator.js +45 -34
- package/dist/{RealDiv-CGwv0liw.js → RealDiv-ioj6Z-ox.js} +9 -9
- package/dist/{Reshape-BW__R4mZ.js → Reshape-BZC-ebeR.js} +7 -7
- package/dist/{Reshape-CPBkTIH2.js → Reshape-pwprEaej.js} +1 -1
- package/dist/TeachableLLM.d.ts +3 -8
- package/dist/TeachableLLM.js +61 -44
- package/dist/Trainer.d.ts +6 -4
- package/dist/Trainer.js +107 -92
- package/dist/{axis_util-GTVlo58H.js → axis_util-QWWgLjut.js} +1 -1
- package/dist/backend.js +2 -2
- package/dist/{backend_util-GaFarB78.js → backend_util-qwSFfxYx.js} +21 -21
- package/dist/{backend_webgpu-BqASlsbV.js → backend_webgpu-DI2wXEC2.js} +8 -8
- package/dist/{broadcast_to-eS93CCN_.js → broadcast_to-C_EJTVTZ.js} +2 -2
- package/dist/checks/appendCache.js +2 -2
- package/dist/checks/attentionMask.js +5 -5
- package/dist/checks/gelu.js +2 -2
- package/dist/checks/matMulGelu.js +2 -2
- package/dist/checks/normRMS.js +6 -6
- package/dist/checks/normRMSGrad.js +3 -3
- package/dist/checks/packUnpack.js +6 -6
- package/dist/checks/qkv.js +2 -2
- package/dist/checks/rope.js +2 -2
- package/dist/{clip_by_value-DDA7rrcT.js → clip_by_value-CLAD4h_I.js} +1 -1
- package/dist/complex-3DpPEG9B.js +11 -0
- package/dist/{concat-CAQpCret.js → concat-Dqk7Xk7h.js} +5 -5
- package/dist/{concat_util-D18dJ4fD.js → concat_util-C1Mxe27t.js} +1 -1
- package/dist/{dataset-CGGp1z9P.js → dataset-DlqAN81i.js} +3 -3
- package/dist/{dropout_util--NxWuYg2.js → dropout_util-N0z8Os-K.js} +1 -1
- package/dist/{expand_dims-Bkd1YD5x.js → expand_dims-D0rBtgT1.js} +4 -4
- package/dist/{exports_initializers-CYzKLjN7.js → exports_initializers-DIOZQt_L.js} +1 -1
- package/dist/{floor-BQtb-Azg.js → floor-CymuCmTO.js} +1 -1
- package/dist/{gather-qIqEqaGn.js → gather-DEyjXNb1.js} +1 -1
- package/dist/{gelu-B220X1Go.js → gelu-DpTCC3eB.js} +1 -1
- package/dist/{gpgpu_math-BwvV12df.js → gpgpu_math-3bCb5ooU.js} +25 -25
- package/dist/{index-CjOWnMXP.js → index-BQvB7LCC.js} +15 -15
- package/dist/{index-CUXkjxiT.js → index-DSGwv2Yx.js} +33 -33
- package/dist/inference/types.d.ts +16 -0
- package/dist/inference/types.js +1 -0
- package/dist/{kernel_funcs_utils-pq0CK9co.js → kernel_funcs_utils-DGqzNlHT.js} +6 -6
- package/dist/layers/BaseLayer.js +4 -4
- package/dist/layers/CausalSelfAttention.js +6 -6
- package/dist/layers/LoRA.js +4 -4
- package/dist/layers/MLP.js +4 -4
- package/dist/layers/PositionEmbedding.js +5 -5
- package/dist/layers/RMSNorm.js +3 -3
- package/dist/layers/RoPECache.js +4 -4
- package/dist/layers/TiedEmbedding.js +6 -6
- package/dist/layers/TransformerBlock.js +1 -1
- package/dist/layers/WeightStore.js +2 -2
- package/dist/loader/load.d.ts +2 -8
- package/dist/loader/loadTransformers.d.ts +2 -8
- package/dist/loader/loadTransformers.js +13 -11
- package/dist/loader/newZipLoad.d.ts +2 -8
- package/dist/loader/newZipLoad.js +25 -10
- package/dist/loader/oldZipLoad.js +13 -13
- package/dist/loader/save.d.ts +9 -2
- package/dist/loader/save.js +64 -55
- package/dist/loader/types.d.ts +29 -1
- package/dist/main.d.ts +2 -0
- package/dist/main.js +45 -43
- package/dist/{matMul16-BcVC_E62.js → matMul16-BIT70Vya.js} +3 -3
- package/dist/{matMulGelu-JNLZqKQp.js → matMulGelu-CsZnh18H.js} +18 -18
- package/dist/mat_mul-DP86qZtZ.js +11 -0
- package/dist/mod-BXjLYwvM.js +11 -0
- package/dist/models/NanoGPTV1.js +2 -2
- package/dist/models/NanoGPTV2.js +2 -2
- package/dist/models/model.d.ts +3 -2
- package/dist/models/model.js +13 -13
- package/dist/{not_equal-hurPF26l.js → not_equal-CkQKkKZy.js} +15 -15
- package/dist/{ones-BytntneX.js → ones-DbVB5N58.js} +3 -3
- package/dist/ops/adamAdjust.js +3 -3
- package/dist/ops/adamMoments.js +3 -3
- package/dist/ops/add16.js +1 -1
- package/dist/ops/appendCache.js +6 -6
- package/dist/ops/attentionMask.js +3 -3
- package/dist/ops/concat16.js +3 -3
- package/dist/ops/cpu/adamAdjust.js +9 -9
- package/dist/ops/cpu/adamMoments.js +5 -5
- package/dist/ops/cpu/appendCache.js +2 -2
- package/dist/ops/cpu/attentionMask.js +6 -6
- package/dist/ops/cpu/fusedSoftmax.js +4 -4
- package/dist/ops/cpu/gatherSub.js +5 -5
- package/dist/ops/cpu/gelu.js +4 -4
- package/dist/ops/cpu/matMul16.js +2 -2
- package/dist/ops/cpu/matMulGelu.js +7 -7
- package/dist/ops/cpu/matMulMul.js +2 -2
- package/dist/ops/cpu/mulDropout.js +5 -5
- package/dist/ops/cpu/normRMS.js +1 -1
- package/dist/ops/cpu/qkv.js +3 -3
- package/dist/ops/cpu/rope.js +5 -5
- package/dist/ops/cpu/scatterSub.js +5 -5
- package/dist/ops/dot16.js +2 -2
- package/dist/ops/dropout.js +6 -6
- package/dist/ops/dropout16.js +1 -1
- package/dist/ops/gatherSub.js +1 -1
- package/dist/ops/gelu.js +2 -2
- package/dist/ops/globalNorm.js +7 -7
- package/dist/ops/grads/add16.js +1 -1
- package/dist/ops/grads/attentionMask.js +2 -2
- package/dist/ops/grads/dropout16.js +1 -1
- package/dist/ops/grads/gelu.js +2 -2
- package/dist/ops/grads/matMul16.js +3 -3
- package/dist/ops/grads/matMulGelu.js +1 -1
- package/dist/ops/grads/mul16.js +1 -1
- package/dist/ops/grads/normRMS.js +7 -7
- package/dist/ops/grads/pack16.js +3 -3
- package/dist/ops/grads/qkv.js +11 -11
- package/dist/ops/grads/rope.js +2 -2
- package/dist/ops/grads/softmax16.js +1 -1
- package/dist/ops/grads/unpack16.js +2 -2
- package/dist/ops/matMul16.js +3 -3
- package/dist/ops/matMulGelu.js +6 -6
- package/dist/ops/matMulMul.js +3 -3
- package/dist/ops/mul16.js +1 -1
- package/dist/ops/mulDrop.js +3 -3
- package/dist/ops/normRMS.js +4 -4
- package/dist/ops/pack16.js +2 -2
- package/dist/ops/qkv.js +3 -3
- package/dist/ops/reshape16.js +6 -6
- package/dist/ops/rope.js +2 -2
- package/dist/ops/scatterSub.js +1 -1
- package/dist/ops/slice16.js +2 -2
- package/dist/ops/softmax16.js +1 -1
- package/dist/ops/sub16.js +1 -1
- package/dist/ops/sum16.js +6 -6
- package/dist/ops/transpose16.js +3 -3
- package/dist/ops/unpack16.js +2 -2
- package/dist/ops/webgl/adamAdjust.js +2 -2
- package/dist/ops/webgl/adamMoments.js +1 -1
- package/dist/ops/webgl/appendCache.js +1 -1
- package/dist/ops/webgl/attentionMask.js +1 -1
- package/dist/ops/webgl/dropout16.js +1 -1
- package/dist/ops/webgl/fusedSoftmax.js +7 -7
- package/dist/ops/webgl/gatherSub.js +3 -3
- package/dist/ops/webgl/gelu.js +2 -2
- package/dist/ops/webgl/log.js +3 -3
- package/dist/ops/webgl/matMul16.js +13 -13
- package/dist/ops/webgl/matMulGelu.js +4 -4
- package/dist/ops/webgl/matMulMul.js +2 -2
- package/dist/ops/webgl/mulDropout.js +1 -1
- package/dist/ops/webgl/normRMS.js +2 -2
- package/dist/ops/webgl/qkv.js +1 -1
- package/dist/ops/webgl/rope.js +1 -1
- package/dist/ops/webgl/scatterSub.js +2 -2
- package/dist/ops/webgpu/adamAdjust.js +3 -3
- package/dist/ops/webgpu/adamMoments.js +3 -3
- package/dist/ops/webgpu/add16.js +6 -6
- package/dist/ops/webgpu/appendCache.js +3 -3
- package/dist/ops/webgpu/attentionMask.js +2 -2
- package/dist/ops/webgpu/attentionMask32_program.js +2 -2
- package/dist/ops/webgpu/clipScale.js +7 -7
- package/dist/ops/webgpu/concat16.js +5 -5
- package/dist/ops/webgpu/dropout16.js +6 -6
- package/dist/ops/webgpu/gatherSub.js +3 -3
- package/dist/ops/webgpu/gelu.js +8 -8
- package/dist/ops/webgpu/matMul16.js +16 -16
- package/dist/ops/webgpu/matMul16_program.js +2 -2
- package/dist/ops/webgpu/mul16.js +5 -5
- package/dist/ops/webgpu/norm2.js +1 -1
- package/dist/ops/webgpu/normRMS.js +2 -2
- package/dist/ops/webgpu/normRMSGrad.js +4 -4
- package/dist/ops/webgpu/pack16.js +4 -4
- package/dist/ops/webgpu/pack16_program.js +2 -2
- package/dist/ops/webgpu/qkv.js +2 -2
- package/dist/ops/webgpu/rope.js +3 -3
- package/dist/ops/webgpu/scatterSub.js +3 -3
- package/dist/ops/webgpu/slice16.js +4 -4
- package/dist/ops/webgpu/softmax16.js +4 -4
- package/dist/ops/webgpu/softmax16_program.js +2 -2
- package/dist/ops/webgpu/softmax16_subgroup_program.js +2 -2
- package/dist/ops/webgpu/softmax16grad.js +4 -4
- package/dist/ops/webgpu/sub16.js +6 -6
- package/dist/ops/webgpu/sum16.js +3 -3
- package/dist/ops/webgpu/transpose16.js +8 -8
- package/dist/ops/webgpu/transpose16_program.js +2 -2
- package/dist/ops/webgpu/transpose16_shared_program.js +3 -3
- package/dist/ops/webgpu/unpack16.js +3 -3
- package/dist/ops/webgpu/utils/binary_op.js +3 -3
- package/dist/ops/webgpu/utils/reductions.js +5 -5
- package/dist/{ops-CsXeTq1P.js → ops-CURIZSVt.js} +100 -100
- package/dist/{pack16-bqltoUlR.js → pack16-WlOSOuZA.js} +2 -2
- package/dist/patches/webgpu_backend.js +6 -6
- package/dist/patches/webgpu_base.js +1 -1
- package/dist/patches/webgpu_program.js +2 -2
- package/dist/{random_normal-IBRrha8a.js → random_normal-CIm8lk2-.js} +1 -1
- package/dist/{random_width-DN5ZtQkM.js → random_width-B_fVXhGx.js} +131 -131
- package/dist/{range-C-CjF-LI.js → range-BDxO73mk.js} +1 -1
- package/dist/{readers-iz5u3HBo.js → readers-17HLdxVM.js} +2 -2
- package/dist/relu-DTvZKBsZ.js +9 -0
- package/dist/{reshape-BDOuCSNW.js → reshape-BIN71H3p.js} +1 -1
- package/dist/{resize_nearest_neighbor-BojqlfRe.js → resize_nearest_neighbor-C6_0dAnK.js} +41 -41
- package/dist/{rope-0j_f1TPm.js → rope-CC5RjmKU.js} +4 -4
- package/dist/{scatter_nd_util-ByNJaL6I.js → scatter_nd_util-C-x73Cj6.js} +1 -1
- package/dist/{segment_util-Dasb2Zaf.js → segment_util-4zuHV5IG.js} +2 -2
- package/dist/{selu_util-BLhIqRkw.js → selu_util-BXdhy_W6.js} +5 -5
- package/dist/{shared-CagdqkLh.js → shared-DRWDyk9w.js} +6 -6
- package/dist/{shared-3agzAqQ_.js → shared-zTaJ5siv.js} +1 -1
- package/dist/slice-BvItlgXu.js +12 -0
- package/dist/{slice_util-CC35pLmT.js → slice_util-DPY56GzQ.js} +5 -5
- package/dist/{softmax-D4q1LJN7.js → softmax-BLGJqdwx.js} +1 -1
- package/dist/split-BN9LkEgS.js +9 -0
- package/dist/{squeeze-ho4wLUek.js → squeeze-O_YWJpw_.js} +2 -2
- package/dist/{stack-DudVrtmG.js → stack-z6QE7kmP.js} +1 -1
- package/dist/{step-BTxPtq1r.js → step-DQY6_ABw.js} +4 -4
- package/dist/{sum-BpiwSWvg.js → sum-D39FeU5h.js} +3 -3
- package/dist/{tensor-BWFldCso.js → tensor-D8e0Gd7c.js} +1 -1
- package/dist/{tensor1d-LMGMIUlr.js → tensor1d-BMl0eZYV.js} +1 -1
- package/dist/{tensor2d-BnXMKScO.js → tensor2d-DTtQ1QcT.js} +1 -1
- package/dist/{tensor4d-C6UCG_u8.js → tensor4d-Dj4rDssL.js} +1 -1
- package/dist/{tfjs_backend-BGnG-ppu.js → tfjs_backend-Bk3PmK91.js} +65 -65
- package/dist/{tile-CFy-xTO6.js → tile-CsWlVKKz.js} +1 -1
- package/dist/tokeniser/BaseTokeniser.d.ts +4 -1
- package/dist/tokeniser/BaseTokeniser.js +21 -5
- package/dist/tokeniser/CharTokeniser.d.ts +1 -1
- package/dist/tokeniser/CharTokeniser.js +62 -50
- package/dist/tokeniser/bpe.d.ts +1 -1
- package/dist/tokeniser/bpe.js +41 -35
- package/dist/tokeniser/type.d.ts +3 -1
- package/dist/training/AdamW.d.ts +3 -0
- package/dist/training/AdamW.js +59 -30
- package/dist/training/BasicTrainer.d.ts +1 -0
- package/dist/training/BasicTrainer.js +112 -92
- package/dist/training/DatasetBuilder.js +3 -3
- package/dist/training/Evaluator.js +2 -2
- package/dist/training/LRScheduler.d.ts +1 -0
- package/dist/training/LRScheduler.js +18 -12
- package/dist/training/PreTrainer.js +3 -3
- package/dist/training/SFTDatasetBuilder.js +3 -3
- package/dist/training/SFTTrainer.js +1 -1
- package/dist/training/orthoGrad.js +1 -1
- package/dist/training/sparseCrossEntropy.js +30 -30
- package/dist/training/types.d.ts +5 -3
- package/dist/training/validation.js +13 -13
- package/dist/{transpose-9kRxIXWR.js → transpose-Qxz-4os3.js} +7 -7
- package/dist/{unsorted_segment_sum-DJvk5xnh.js → unsorted_segment_sum-BfFVV9Zm.js} +20 -20
- package/dist/utilities/datasetID.d.ts +2 -0
- package/dist/utilities/datasetID.js +21 -0
- package/dist/utilities/dummy.js +6 -6
- package/dist/utilities/multinomialCPU.js +2 -2
- package/dist/utilities/packed.js +1 -1
- package/dist/utilities/performance.js +1 -1
- package/dist/utilities/profile.js +1 -1
- package/dist/utilities/safetensors.js +2 -2
- package/dist/utilities/sentences.js +5 -5
- package/dist/utilities/weights.js +2 -2
- package/dist/{variable-Ck482e3n.js → variable-SSATClyt.js} +1 -1
- package/dist/{webgpu_program-B4HmApL1.js → webgpu_program-CbjdYLYk.js} +1 -1
- package/dist/{webgpu_util-DYlGSwOJ.js → webgpu_util-DuofJBMo.js} +7 -7
- package/dist/{zeros-DvZpK8s6.js → zeros-Bw0puq_w.js} +2 -2
- package/dist/{zeros_like-CWjDdwr-.js → zeros_like-rOHr54NY.js} +69 -69
- package/package.json +3 -3
- package/dist/complex-DI35Q-gW.js +0 -11
- package/dist/mat_mul-DhG0Newp.js +0 -11
- package/dist/mod-CSdCpRjf.js +0 -11
- package/dist/relu-J_X6MUzx.js +0 -9
- package/dist/slice-BzS11Qh0.js +0 -12
- package/dist/split-C2Sj255c.js +0 -9
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
import { o as a,
|
|
1
|
+
import { o as a, n as f, v as m, f as y, E as c, C as p } from "./index-DSGwv2Yx.js";
|
|
2
2
|
function u(o, s, t) {
|
|
3
3
|
const r = f(o, "x", "clipByValue");
|
|
4
4
|
if (m(s <= t, () => `Error in clip: min (${s}) must be less than or equal to max (${t}).`), s === t)
|
|
@@ -0,0 +1,11 @@
|
|
|
1
|
+
import { o as t, n as s, a6 as c, E as m, a7 as r } from "./index-DSGwv2Yx.js";
|
|
2
|
+
function l(o, n) {
|
|
3
|
+
const a = s(o, "real", "complex"), e = s(n, "imag", "complex");
|
|
4
|
+
c(a.shape, e.shape, `real and imag shapes, ${a.shape} and ${e.shape}, must match in call to tf.complex().`);
|
|
5
|
+
const p = { real: a, imag: e };
|
|
6
|
+
return m.runKernel(r, p);
|
|
7
|
+
}
|
|
8
|
+
const i = /* @__PURE__ */ t({ complex_: l });
|
|
9
|
+
export {
|
|
10
|
+
i as c
|
|
11
|
+
};
|
|
@@ -1,5 +1,5 @@
|
|
|
1
|
-
import { o as s,
|
|
2
|
-
function
|
|
1
|
+
import { o as s, v as a, w as p, u as i, E as l, x as u } from "./index-DSGwv2Yx.js";
|
|
2
|
+
function f(o, e = 0) {
|
|
3
3
|
a(o.length >= 1, () => "Pass at least one tensor to concat");
|
|
4
4
|
const t = p(o, "tensors", "concat", "string_or_numeric");
|
|
5
5
|
if (t[0].dtype === "complex64" && t.forEach((n) => {
|
|
@@ -9,9 +9,9 @@ function h(o, e = 0) {
|
|
|
9
9
|
}), t.length === 1)
|
|
10
10
|
return i(t[0]);
|
|
11
11
|
const r = t, c = { axis: e };
|
|
12
|
-
return l.runKernel(
|
|
12
|
+
return l.runKernel(u, r, c);
|
|
13
13
|
}
|
|
14
|
-
const
|
|
14
|
+
const m = /* @__PURE__ */ s({ concat_: f });
|
|
15
15
|
export {
|
|
16
|
-
|
|
16
|
+
m as c
|
|
17
17
|
};
|
|
@@ -1,7 +1,7 @@
|
|
|
1
|
-
import { ag as h, aA as S, ab as N,
|
|
1
|
+
import { ag as h, aA as S, ab as N, l as v, aB as o, aC as p, aD as g, v as k, t as y } from "./index-DSGwv2Yx.js";
|
|
2
2
|
import { s as R } from "./index-CieiGp4Y.js";
|
|
3
|
-
import { s as B } from "./stack-
|
|
4
|
-
import { t as $ } from "./tensor-
|
|
3
|
+
import { s as B } from "./stack-z6QE7kmP.js";
|
|
4
|
+
import { t as $ } from "./tensor-D8e0Gd7c.js";
|
|
5
5
|
function _(s, t) {
|
|
6
6
|
return b(s, t);
|
|
7
7
|
}
|
|
@@ -1,11 +1,11 @@
|
|
|
1
|
-
import { o as e,
|
|
2
|
-
function
|
|
1
|
+
import { o as e, n as a, v as i, E as m, y as p } from "./index-DSGwv2Yx.js";
|
|
2
|
+
function c(t, n = 0) {
|
|
3
3
|
const s = a(t, "x", "expandDims", "string_or_numeric");
|
|
4
4
|
i(n <= s.rank, () => "Axis must be <= rank of the tensor");
|
|
5
5
|
const r = { input: s }, o = { dim: n };
|
|
6
6
|
return m.runKernel(p, r, o);
|
|
7
7
|
}
|
|
8
|
-
const
|
|
8
|
+
const x = /* @__PURE__ */ e({ expandDims_: c });
|
|
9
9
|
export {
|
|
10
|
-
|
|
10
|
+
x as e
|
|
11
11
|
};
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
import { o as g,
|
|
1
|
+
import { o as g, n as t, E as h, G as p } from "./index-DSGwv2Yx.js";
|
|
2
2
|
function u(n, s, r = 0, e = 0) {
|
|
3
3
|
const o = t(n, "x", "gather"), a = t(s, "indices", "gather", "int32"), c = { x: o, indices: a }, i = { axis: r, batchDims: e };
|
|
4
4
|
return h.runKernel(p, c, i);
|
|
@@ -1,5 +1,5 @@
|
|
|
1
|
-
import { ab as $,
|
|
2
|
-
import { b as se } from "./backend_util-
|
|
1
|
+
import { ab as $, N as E, aR as X, ac as T, aS as ae, I as N, aT as G, v as ie, a9 as k, ad as ce } from "./index-DSGwv2Yx.js";
|
|
2
|
+
import { b as se } from "./backend_util-qwSFfxYx.js";
|
|
3
3
|
const w = {}, M = {
|
|
4
4
|
alpha: !1,
|
|
5
5
|
antialias: !1,
|
|
@@ -215,7 +215,7 @@ function Ot(e, t, n) {
|
|
|
215
215
|
function It(e, t) {
|
|
216
216
|
v(e, () => e.bindFramebuffer(e.FRAMEBUFFER, t)), v(e, () => e.framebufferTexture2D(e.FRAMEBUFFER, e.COLOR_ATTACHMENT0, e.TEXTURE_2D, null, 0));
|
|
217
217
|
}
|
|
218
|
-
function
|
|
218
|
+
function Lt(e) {
|
|
219
219
|
const t = e.checkFramebufferStatus(e.FRAMEBUFFER);
|
|
220
220
|
if (t !== e.FRAMEBUFFER_COMPLETE)
|
|
221
221
|
throw new Error("Error binding framebuffer: " + Se(e, t));
|
|
@@ -258,7 +258,7 @@ function J(e) {
|
|
|
258
258
|
e[e.length - 1]
|
|
259
259
|
];
|
|
260
260
|
}
|
|
261
|
-
function
|
|
261
|
+
function Ut(e) {
|
|
262
262
|
let t = [1, 1, 1];
|
|
263
263
|
return e.length === 0 || e.length === 1 && e[0] === 1 || (t = [Z(e), ...J(e)]), t;
|
|
264
264
|
}
|
|
@@ -378,7 +378,7 @@ function Xt(e, t) {
|
|
|
378
378
|
n != null && ie(n.dtype !== "complex64", () => `${t} does not support complex64 tensors in the WebGL backend.`);
|
|
379
379
|
});
|
|
380
380
|
}
|
|
381
|
-
function
|
|
381
|
+
function L() {
|
|
382
382
|
let e, t, n, r, o, a, i, c, s, l;
|
|
383
383
|
return $().getNumber("WEBGL_VERSION") === 2 ? (e = "#version 300 es", t = "in", n = "out", r = "in", o = "texture", a = "outputColor", i = "out vec4 outputColor;", c = $().getBool("WEBGL2_ISNAN_CUSTOM") ? `
|
|
384
384
|
bool isnan_custom(float val) {
|
|
@@ -567,8 +567,8 @@ function Fe(e, t, n) {
|
|
|
567
567
|
});
|
|
568
568
|
const o = r.join(`
|
|
569
569
|
`), a = e.map((x) => _e(x, t, n.packedInputs, n.enableShapeUniforms)).join(`
|
|
570
|
-
`), i = t.texShape, c =
|
|
571
|
-
let l, u, f =
|
|
570
|
+
`), i = t.texShape, c = L(), s = Ne(c);
|
|
571
|
+
let l, u, f = Le(c);
|
|
572
572
|
return t.isPacked ? (l = Ae(t.logicalShape, i, n.enableShapeUniforms), u = Ie(c)) : (l = we(t.logicalShape, i, n.enableShapeUniforms), u = Oe(c)), n.packedInputs && (f += be), [
|
|
573
573
|
f,
|
|
574
574
|
s,
|
|
@@ -580,7 +580,7 @@ function Fe(e, t, n) {
|
|
|
580
580
|
].join(`
|
|
581
581
|
`);
|
|
582
582
|
}
|
|
583
|
-
function
|
|
583
|
+
function U(e, t = !1) {
|
|
584
584
|
const n = e.shapeInfo.logicalShape;
|
|
585
585
|
switch (n.length) {
|
|
586
586
|
case 0:
|
|
@@ -617,7 +617,7 @@ function te(e, t) {
|
|
|
617
617
|
}
|
|
618
618
|
function _e(e, t, n = !1, r) {
|
|
619
619
|
let o = "";
|
|
620
|
-
n ? o += te(e, r) : o +=
|
|
620
|
+
n ? o += te(e, r) : o += U(e, r);
|
|
621
621
|
const a = e.shapeInfo.logicalShape, i = t.logicalShape;
|
|
622
622
|
return a.length <= i.length && (n ? o += ot(e, t) : o += at(e, t)), o;
|
|
623
623
|
}
|
|
@@ -676,7 +676,7 @@ function Ie(e) {
|
|
|
676
676
|
}
|
|
677
677
|
`;
|
|
678
678
|
}
|
|
679
|
-
function
|
|
679
|
+
function Le(e) {
|
|
680
680
|
return `${e.version}
|
|
681
681
|
precision highp float;
|
|
682
682
|
precision highp int;
|
|
@@ -732,12 +732,12 @@ function Ue(e) {
|
|
|
732
732
|
return fract((p3.x + p3.y) * p3.z);
|
|
733
733
|
}
|
|
734
734
|
|
|
735
|
-
${
|
|
735
|
+
${Ue}
|
|
736
736
|
${De}
|
|
737
737
|
${ge}
|
|
738
738
|
`;
|
|
739
739
|
}
|
|
740
|
-
const
|
|
740
|
+
const Ue = `
|
|
741
741
|
vec2 uvFromFlat(int texNumR, int texNumC, int index) {
|
|
742
742
|
int texR = index / texNumC;
|
|
743
743
|
int texC = index - texR * texNumC;
|
|
@@ -1112,7 +1112,7 @@ function O(e) {
|
|
|
1112
1112
|
return `offset${e}`;
|
|
1113
1113
|
}
|
|
1114
1114
|
function He(e) {
|
|
1115
|
-
const t = e.name, n = "get" + t.charAt(0).toUpperCase() + t.slice(1), r =
|
|
1115
|
+
const t = e.name, n = "get" + t.charAt(0).toUpperCase() + t.slice(1), r = L();
|
|
1116
1116
|
return `
|
|
1117
1117
|
vec4 ${n}() {
|
|
1118
1118
|
return ${r.texture2D}(${t}, halfCR);
|
|
@@ -1147,7 +1147,7 @@ function qe(e, t) {
|
|
|
1147
1147
|
`;
|
|
1148
1148
|
}
|
|
1149
1149
|
function je(e, t) {
|
|
1150
|
-
const n = e.name, r = "get" + n.charAt(0).toUpperCase() + n.slice(1), o = e.shapeInfo.texShape, a =
|
|
1150
|
+
const n = e.name, r = "get" + n.charAt(0).toUpperCase() + n.slice(1), o = e.shapeInfo.texShape, a = L();
|
|
1151
1151
|
if (t)
|
|
1152
1152
|
return `
|
|
1153
1153
|
vec4 ${r}(int index) {
|
|
@@ -1215,7 +1215,7 @@ function Ye(e, t) {
|
|
|
1215
1215
|
`;
|
|
1216
1216
|
}
|
|
1217
1217
|
function Ke(e, t) {
|
|
1218
|
-
const n = e.shapeInfo.logicalShape, r = e.name, o = "get" + r.charAt(0).toUpperCase() + r.slice(1), a = e.shapeInfo.texShape, i = a[0], c = a[1], s =
|
|
1218
|
+
const n = e.shapeInfo.logicalShape, r = e.name, o = "get" + r.charAt(0).toUpperCase() + r.slice(1), a = e.shapeInfo.texShape, i = a[0], c = a[1], s = L();
|
|
1219
1219
|
if (a != null && T(n, a))
|
|
1220
1220
|
return t ? `
|
|
1221
1221
|
vec4 ${o}(int row, int col) {
|
|
@@ -1269,7 +1269,7 @@ function Ze(e, t) {
|
|
|
1269
1269
|
if (s.length < n.length) {
|
|
1270
1270
|
const d = g(e, s), x = ["row", "col"];
|
|
1271
1271
|
return `
|
|
1272
|
-
${
|
|
1272
|
+
${U(d, t)}
|
|
1273
1273
|
float ${o}(int row, int col) {
|
|
1274
1274
|
return ${o}(${b(x, c)});
|
|
1275
1275
|
}
|
|
@@ -1334,7 +1334,7 @@ function Je(e, t) {
|
|
|
1334
1334
|
}
|
|
1335
1335
|
`;
|
|
1336
1336
|
}
|
|
1337
|
-
const c =
|
|
1337
|
+
const c = L();
|
|
1338
1338
|
if (t)
|
|
1339
1339
|
return `
|
|
1340
1340
|
vec4 ${o}(int b, int row, int col) {
|
|
@@ -1360,7 +1360,7 @@ function Qe(e, t) {
|
|
|
1360
1360
|
if (l.length < n.length) {
|
|
1361
1361
|
const p = g(e, l), m = ["row", "col", "depth"];
|
|
1362
1362
|
return `
|
|
1363
|
-
${
|
|
1363
|
+
${U(p, t)}
|
|
1364
1364
|
float ${o}(int row, int col, int depth) {
|
|
1365
1365
|
return ${o}(${b(m, s)});
|
|
1366
1366
|
}
|
|
@@ -1430,7 +1430,7 @@ function Qe(e, t) {
|
|
|
1430
1430
|
`;
|
|
1431
1431
|
}
|
|
1432
1432
|
function et(e, t) {
|
|
1433
|
-
const n = e.name, r = "get" + n.charAt(0).toUpperCase() + n.slice(1), o =
|
|
1433
|
+
const n = e.name, r = "get" + n.charAt(0).toUpperCase() + n.slice(1), o = L();
|
|
1434
1434
|
if (t)
|
|
1435
1435
|
return `
|
|
1436
1436
|
vec4 ${r}(int b2, int b, int row, int col) {
|
|
@@ -1464,7 +1464,7 @@ function tt(e, t) {
|
|
|
1464
1464
|
if (s.length < n.length) {
|
|
1465
1465
|
const R = g(e, s), F = ["row", "col", "depth", "depth2"];
|
|
1466
1466
|
return `
|
|
1467
|
-
${
|
|
1467
|
+
${U(R, t)}
|
|
1468
1468
|
float ${o}(int row, int col, int depth, int depth2) {
|
|
1469
1469
|
return ${o}(${b(F, l)});
|
|
1470
1470
|
}
|
|
@@ -1550,7 +1550,7 @@ function nt(e) {
|
|
|
1550
1550
|
if (s.length < t.length) {
|
|
1551
1551
|
const p = g(e, s), m = ["row", "col", "depth", "depth2", "depth3"];
|
|
1552
1552
|
return `
|
|
1553
|
-
${
|
|
1553
|
+
${U(p)}
|
|
1554
1554
|
float ${r}(int row, int col, int depth, int depth2, int depth3) {
|
|
1555
1555
|
return ${r}(${b(m, l)});
|
|
1556
1556
|
}
|
|
@@ -1607,7 +1607,7 @@ function rt(e) {
|
|
|
1607
1607
|
if (o.length < t.length) {
|
|
1608
1608
|
const m = g(e, o), S = ["row", "col", "depth", "depth2", "depth3", "depth4"];
|
|
1609
1609
|
return `
|
|
1610
|
-
${
|
|
1610
|
+
${U(m)}
|
|
1611
1611
|
float ${r}(int row, int col, int depth,
|
|
1612
1612
|
int depth2, int depth3, int depth4) {
|
|
1613
1613
|
return ${r}(${b(S, a)});
|
|
@@ -1979,12 +1979,12 @@ export {
|
|
|
1979
1979
|
wt as O,
|
|
1980
1980
|
H as P,
|
|
1981
1981
|
Nt as Q,
|
|
1982
|
-
|
|
1982
|
+
Lt as R,
|
|
1983
1983
|
Ot as S,
|
|
1984
1984
|
q as T,
|
|
1985
1985
|
ut as U,
|
|
1986
1986
|
j as V,
|
|
1987
|
-
|
|
1987
|
+
Ut as W,
|
|
1988
1988
|
xt as X,
|
|
1989
1989
|
ht as Y,
|
|
1990
1990
|
Yt as Z,
|
|
@@ -2008,7 +2008,7 @@ export {
|
|
|
2008
2008
|
yt as m,
|
|
2009
2009
|
Pt as n,
|
|
2010
2010
|
Vt as o,
|
|
2011
|
-
|
|
2011
|
+
L as p,
|
|
2012
2012
|
Q as q,
|
|
2013
2013
|
St as r,
|
|
2014
2014
|
Rt as s,
|
|
@@ -1,20 +1,20 @@
|
|
|
1
|
-
import { W as Mt } from "./backend_webgpu-
|
|
2
|
-
import { ae as Et, ab as X,
|
|
3
|
-
import { i as Qi, a as Zi, c as b, f as v, M as Y, b as nt, d as ut, e as dt } from "./webgpu_util-
|
|
1
|
+
import { W as Mt } from "./backend_webgpu-DI2wXEC2.js";
|
|
2
|
+
import { ae as Et, ab as X, v as L, dc as Ut, dd as Ht, bX as Gt, N as D, _ as j, bb as Xt, ai as Ye, aU as Kt, a7 as qt, am as fe, bP as Yt, c7 as jt, c8 as Qt, bV as Zt, cO as Jt, ar as es, ac as De, ah as te, aW as ts, bm as ss, bn as os, bo as is, c9 as as, ca as rs, cb as ns, cc as us, cd as ds, ce as ls, aM as cs, aP as hs, bp as ps, cy as fs, cP as ms, cQ as gs, B as xs, S as Cs, br as ws, bd as ys, de as Ss, aQ as bs, aq as vs, bS as ks, bT as Is, af as Rs, bY as Ps, C as $s, cS as Ds, ao as Ns, x as zs, bt as As, cD as Fs, bu as Ws, cz as Ls, cT as Vs, cA as Bs, bv as Ts, bw as _s, bf as Os, bx as Ms, by as Es, cB as Us, cf as Hs, bz as Gs, cF as Xs, cG as Ks, df as qs, cg as Ys, cU as js, cV as Qs, dg as Zs, c0 as Js, K as eo, be as to, aG as so, cW as oo, bA as io, bB as ao, aN as ro, y as no, bZ as uo, cp as lo, bg as co, F as ho, b_ as po, dh as fo, a9 as at, bs as mo, cE as go, di as xo, al as Co, G as wo, a5 as ke, a$ as yo, b0 as So, cq as bo, ch as vo, ci as ko, cj as Io, aH as Ro, b1 as Po, b2 as $o, dj as Do, aO as No, b3 as zo, b4 as Ao, bD as Fo, cl as Wo, ck as Lo, cY as Vo, b$ as Bo, bE as To, cC as _o, cZ as Oo, c_ as Mo, dk as Eo, aZ as Uo, b5 as Ho, cm as Go, M as Xo, D as Ko, dl as qo, ap as Yo, bi as jo, bj as Qo, bF as Zo, d3 as Jo, bG as ei, P as ti, a6 as si, bH as oi, c$ as ii, aI as ai, c1 as ri, X as ni, aX as ui, cn as di, A as li, aJ as ci, b9 as hi, d0 as pi, ba as fi, d1 as mi, bJ as gi, bh as xi, b6 as Ci, bK as wi, ak as yi, dm as Si, aL as bi, bL as vi, aF as ki, co as Ii, bM as Ri, bN as Pi, bC as $i, bI as Di, dn as Ni, dp as zi, T as Ai, av as rt, dq as Fi, L as Wi, H as Li, c3 as Vi, d2 as Bi, b7 as Ti, aK as _i, cr as Oi, dr as Mi, c5 as Ei, cs as Ui, bq as Hi, ds as Gi, ct as Xi, bl as Ki, b8 as qi, bO as Yi, a as ji } from "./index-DSGwv2Yx.js";
|
|
3
|
+
import { i as Qi, a as Zi, c as b, f as v, M as Y, b as nt, d as ut, e as dt } from "./webgpu_util-DuofJBMo.js";
|
|
4
4
|
import { g as _e, B as F } from "./binary_op_util-pKXltfxI.js";
|
|
5
|
-
import { S as Ji, a as ea } from "./selu_util-
|
|
6
|
-
import { E as ta, t as sa, u as oa, w as ia, x as aa, y as ra, f as je, z as lt, A as ct, B as ht, C as na, D as ua, F as da, G as la, H as ca, I as ha, J as pa, K as fa, L as ma, M as ga } from "./backend_util-
|
|
7
|
-
import { t as W, e as S, h as Q, b as G, c as Ie, P as pt, d as xa, a as Ca } from "./webgpu_program-
|
|
8
|
-
import { r as R, a as wa } from "./Reshape-
|
|
9
|
-
import { s as ya } from "./shared-
|
|
10
|
-
import { c as Oe, a as Ce, b as we, d as Me, e as Sa, g as ft } from "./axis_util-
|
|
11
|
-
import { h as ye, i as Ne, j as Se, b as Z, d as Ee, g as Ue, k as mt } from "./step-
|
|
12
|
-
import { p as ba, a as va, s as ka, b as Ia } from "./slice_util-
|
|
13
|
-
import { z as Ra } from "./zeros-
|
|
14
|
-
import { c as me, a as Pa } from "./concat_util-
|
|
15
|
-
import { c as $a, a as Da } from "./segment_util-
|
|
5
|
+
import { S as Ji, a as ea } from "./selu_util-BXdhy_W6.js";
|
|
6
|
+
import { E as ta, t as sa, u as oa, w as ia, x as aa, y as ra, f as je, z as lt, A as ct, B as ht, C as na, D as ua, F as da, G as la, H as ca, I as ha, J as pa, K as fa, L as ma, M as ga } from "./backend_util-qwSFfxYx.js";
|
|
7
|
+
import { t as W, e as S, h as Q, b as G, c as Ie, P as pt, d as xa, a as Ca } from "./webgpu_program-CbjdYLYk.js";
|
|
8
|
+
import { r as R, a as wa } from "./Reshape-pwprEaej.js";
|
|
9
|
+
import { s as ya } from "./shared-DRWDyk9w.js";
|
|
10
|
+
import { c as Oe, a as Ce, b as we, d as Me, e as Sa, g as ft } from "./axis_util-QWWgLjut.js";
|
|
11
|
+
import { h as ye, i as Ne, j as Se, b as Z, d as Ee, g as Ue, k as mt } from "./step-DQY6_ABw.js";
|
|
12
|
+
import { p as ba, a as va, s as ka, b as Ia } from "./slice_util-DPY56GzQ.js";
|
|
13
|
+
import { z as Ra } from "./zeros-Bw0puq_w.js";
|
|
14
|
+
import { c as me, a as Pa } from "./concat_util-C1Mxe27t.js";
|
|
15
|
+
import { c as $a, a as Da } from "./segment_util-4zuHV5IG.js";
|
|
16
16
|
import { n as Na, a as za } from "./non_max_suppression_impl-B2W7YjZB.js";
|
|
17
|
-
import { c as He } from "./scatter_nd_util-
|
|
17
|
+
import { c as He } from "./scatter_nd_util-C-x73Cj6.js";
|
|
18
18
|
Qi() && Et(
|
|
19
19
|
"webgpu",
|
|
20
20
|
async () => {
|
|
@@ -3226,34 +3226,34 @@ function vs() {
|
|
|
3226
3226
|
vs();
|
|
3227
3227
|
export {
|
|
3228
3228
|
di as $,
|
|
3229
|
-
|
|
3230
|
-
|
|
3229
|
+
Ja as A,
|
|
3230
|
+
ur as B,
|
|
3231
3231
|
yr as C,
|
|
3232
|
-
|
|
3232
|
+
So as D,
|
|
3233
3233
|
f as E,
|
|
3234
3234
|
Yr as F,
|
|
3235
3235
|
Qr as G,
|
|
3236
|
-
|
|
3237
|
-
|
|
3238
|
-
|
|
3239
|
-
|
|
3240
|
-
|
|
3236
|
+
wo as H,
|
|
3237
|
+
Gs as I,
|
|
3238
|
+
Rt as J,
|
|
3239
|
+
yo as K,
|
|
3240
|
+
se as L,
|
|
3241
3241
|
Na as M,
|
|
3242
|
-
|
|
3242
|
+
z as N,
|
|
3243
3243
|
H as O,
|
|
3244
3244
|
Oa as P,
|
|
3245
|
-
|
|
3245
|
+
Ue as Q,
|
|
3246
3246
|
Xa as R,
|
|
3247
3247
|
uo as S,
|
|
3248
3248
|
Co as T,
|
|
3249
|
-
|
|
3250
|
-
|
|
3251
|
-
|
|
3252
|
-
|
|
3253
|
-
|
|
3254
|
-
|
|
3249
|
+
Cs as U,
|
|
3250
|
+
Tn as V,
|
|
3251
|
+
vn as W,
|
|
3252
|
+
qa as X,
|
|
3253
|
+
ni as Y,
|
|
3254
|
+
hs as Z,
|
|
3255
3255
|
os as _,
|
|
3256
|
-
|
|
3256
|
+
Ho as a,
|
|
3257
3257
|
ea as a$,
|
|
3258
3258
|
gi as a0,
|
|
3259
3259
|
tt as a1,
|
|
@@ -3318,7 +3318,7 @@ export {
|
|
|
3318
3318
|
$s as ax,
|
|
3319
3319
|
xt as ay,
|
|
3320
3320
|
he as az,
|
|
3321
|
-
|
|
3321
|
+
q as b,
|
|
3322
3322
|
Qe as b$,
|
|
3323
3323
|
na as b0,
|
|
3324
3324
|
la as b1,
|
|
@@ -3383,7 +3383,7 @@ export {
|
|
|
3383
3383
|
Fr as bx,
|
|
3384
3384
|
Mr as by,
|
|
3385
3385
|
xr as bz,
|
|
3386
|
-
|
|
3386
|
+
Jo as c,
|
|
3387
3387
|
en as c$,
|
|
3388
3388
|
tn as c0,
|
|
3389
3389
|
za as c1,
|
|
@@ -3448,7 +3448,7 @@ export {
|
|
|
3448
3448
|
gs as cx,
|
|
3449
3449
|
cr as cy,
|
|
3450
3450
|
Tr as cz,
|
|
3451
|
-
|
|
3451
|
+
$ as d,
|
|
3452
3452
|
to as d0,
|
|
3453
3453
|
Za as d1,
|
|
3454
3454
|
Bo as d2,
|
|
@@ -3491,26 +3491,26 @@ export {
|
|
|
3491
3491
|
ja as dx,
|
|
3492
3492
|
ko as dy,
|
|
3493
3493
|
Io as dz,
|
|
3494
|
-
|
|
3494
|
+
ei as e,
|
|
3495
3495
|
as as f,
|
|
3496
3496
|
ai as g,
|
|
3497
|
-
|
|
3498
|
-
|
|
3499
|
-
|
|
3497
|
+
S as h,
|
|
3498
|
+
nt as i,
|
|
3499
|
+
V as j,
|
|
3500
3500
|
Fn as k,
|
|
3501
|
-
|
|
3501
|
+
M as l,
|
|
3502
3502
|
b as m,
|
|
3503
|
-
|
|
3503
|
+
T as n,
|
|
3504
3504
|
N as o,
|
|
3505
3505
|
Qt as p,
|
|
3506
|
-
|
|
3506
|
+
Ct as q,
|
|
3507
3507
|
ri as r,
|
|
3508
3508
|
si as s,
|
|
3509
3509
|
A as t,
|
|
3510
|
-
|
|
3511
|
-
|
|
3512
|
-
|
|
3513
|
-
|
|
3514
|
-
|
|
3515
|
-
|
|
3510
|
+
Jn as u,
|
|
3511
|
+
p as v,
|
|
3512
|
+
An as w,
|
|
3513
|
+
wr as x,
|
|
3514
|
+
Kr as y,
|
|
3515
|
+
K as z
|
|
3516
3516
|
};
|
|
@@ -0,0 +1,16 @@
|
|
|
1
|
+
import { Conversation } from '../tokeniser/type';
|
|
2
|
+
export interface GeneratorConversation extends Conversation {
|
|
3
|
+
_completed?: boolean;
|
|
4
|
+
_timestamp?: number;
|
|
5
|
+
}
|
|
6
|
+
export interface GenerateOptions {
|
|
7
|
+
temperature?: number;
|
|
8
|
+
topK?: number;
|
|
9
|
+
topP?: number;
|
|
10
|
+
usePadding?: boolean;
|
|
11
|
+
attentionScores?: boolean;
|
|
12
|
+
includeProbabilities?: boolean;
|
|
13
|
+
embeddings?: 'embedding' | 'logits' | 'softmax' | 'all';
|
|
14
|
+
targets?: number[];
|
|
15
|
+
loraName?: string;
|
|
16
|
+
}
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
|
|
@@ -1,6 +1,6 @@
|
|
|
1
|
-
import { _ as B,
|
|
2
|
-
import { u as O, f as H } from "./gpgpu_math-
|
|
3
|
-
import { f as v } from "./backend_util-
|
|
1
|
+
import { _ as B, N as G, aU as K, a7 as W, aH as z, aV as V, ab as N, aI as F, am as S } from "./index-DSGwv2Yx.js";
|
|
2
|
+
import { u as O, f as H } from "./gpgpu_math-3bCb5ooU.js";
|
|
3
|
+
import { f as v } from "./backend_util-qwSFfxYx.js";
|
|
4
4
|
function Y(t, e) {
|
|
5
5
|
return ["x", "y", "z", "w", "u", "v"].slice(0, e).map((s) => `${t}.${s}`);
|
|
6
6
|
}
|
|
@@ -200,12 +200,12 @@ const be = {
|
|
|
200
200
|
backendName: "webgl",
|
|
201
201
|
kernelFunc: oe
|
|
202
202
|
};
|
|
203
|
-
const
|
|
203
|
+
const k = "return (a < 0.) ? b * a : a;", U = `
|
|
204
204
|
vec4 aLessThanZero = vec4(lessThan(a, vec4(0.)));
|
|
205
205
|
return (aLessThanZero * (b * a)) + ((vec4(1.0) - aLessThanZero) * a);
|
|
206
206
|
`;
|
|
207
207
|
function ue(t) {
|
|
208
|
-
const { inputs: e, backend: s } = t, { x: r, alpha: u } = e, n = N().getBool("WEBGL_PACK_BINARY_OPERATIONS") ? new E(
|
|
208
|
+
const { inputs: e, backend: s } = t, { x: r, alpha: u } = e, n = N().getBool("WEBGL_PACK_BINARY_OPERATIONS") ? new E(U, r.shape, u.shape) : new b(k, r.shape, u.shape);
|
|
209
209
|
return s.runWebGLProgram(n, [r, u], "float32");
|
|
210
210
|
}
|
|
211
211
|
const Ne = {
|
|
@@ -273,7 +273,7 @@ function Ae(t, e = !1) {
|
|
|
273
273
|
if (t === "relu6")
|
|
274
274
|
return e ? ae : Q;
|
|
275
275
|
if (t === "prelu")
|
|
276
|
-
return e ?
|
|
276
|
+
return e ? U : k;
|
|
277
277
|
if (t === "leakyrelu")
|
|
278
278
|
return e ? R : w;
|
|
279
279
|
if (t === "sigmoid")
|
package/dist/layers/BaseLayer.js
CHANGED
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
import { a2 as p,
|
|
1
|
+
import { a2 as p, e as s, a4 as g } from "../index-DSGwv2Yx.js";
|
|
2
2
|
import b from "./WeightStore.js";
|
|
3
3
|
class T {
|
|
4
4
|
parent;
|
|
@@ -59,11 +59,11 @@ class T {
|
|
|
59
59
|
checkpointingFn(t, ...e) {
|
|
60
60
|
const r = this.trainableVariables;
|
|
61
61
|
return p((...i) => {
|
|
62
|
-
const o = i[i.length - 1], a = i.slice(0, e.length),
|
|
63
|
-
return o(a), { value:
|
|
62
|
+
const o = i[i.length - 1], a = i.slice(0, e.length), n = this.forward(t, ...a);
|
|
63
|
+
return o(a), { value: n, gradFunc: (h, l) => {
|
|
64
64
|
const c = s().state.activeTape;
|
|
65
65
|
s().state.activeTape = [];
|
|
66
|
-
const d = g((...u) => this.forward(t, ...u.slice(0, a.length)))([...l, ...r],
|
|
66
|
+
const d = g((...u) => this.forward(t, ...u.slice(0, a.length)))([...l, ...r], h);
|
|
67
67
|
return s().state.activeTape = c, d;
|
|
68
68
|
} };
|
|
69
69
|
})(...e, ...r);
|
|
@@ -1,11 +1,11 @@
|
|
|
1
1
|
import { attentionMask as R } from "../ops/attentionMask.js";
|
|
2
2
|
import J from "./BaseLayer.js";
|
|
3
|
-
import { r as v } from "../rope-
|
|
3
|
+
import { r as v } from "../rope-CC5RjmKU.js";
|
|
4
4
|
import { appendCache as A } from "../ops/appendCache.js";
|
|
5
|
-
import { k as c, t as L } from "../index-
|
|
5
|
+
import { k as c, t as L } from "../index-DSGwv2Yx.js";
|
|
6
6
|
import { softmax16 as y } from "../ops/softmax16.js";
|
|
7
|
-
import { b as M } from "../matMul16-
|
|
8
|
-
import { p as K } from "../pack16-
|
|
7
|
+
import { b as M } from "../matMul16-BIT70Vya.js";
|
|
8
|
+
import { p as K } from "../pack16-WlOSOuZA.js";
|
|
9
9
|
import { transpose16 as j } from "../ops/transpose16.js";
|
|
10
10
|
import { dot16 as E } from "../ops/dot16.js";
|
|
11
11
|
import { reshape16 as _ } from "../ops/reshape16.js";
|
|
@@ -13,8 +13,8 @@ import { isPackedTensor as l } from "../utilities/packed.js";
|
|
|
13
13
|
import { qkv as q } from "../ops/qkv.js";
|
|
14
14
|
import { normRMS as O } from "../ops/normRMS.js";
|
|
15
15
|
import { dropout16 as x } from "../ops/dropout16.js";
|
|
16
|
-
import { v as P } from "../variable-
|
|
17
|
-
import { r as S } from "../random_normal-
|
|
16
|
+
import { v as P } from "../variable-SSATClyt.js";
|
|
17
|
+
import { r as S } from "../random_normal-CIm8lk2-.js";
|
|
18
18
|
class it extends J {
|
|
19
19
|
constructor(t, o, s, i) {
|
|
20
20
|
super(o, i), this.attentionConfig = s, this.index = t, this.units = o.nEmbed * 3, this.projUnits = o.nEmbed, this.ATTN = `block_${this.index}_cAttn`, this.PROJ = `block_${this.index}_cProj`, this.addVariable(this.ATTN), this.addVariable(this.PROJ), this.divisor = 1 / Math.sqrt(o.nEmbed / o.nHead);
|
package/dist/layers/LoRA.js
CHANGED
|
@@ -1,8 +1,8 @@
|
|
|
1
|
-
import {
|
|
1
|
+
import { b as m, t as n } from "../index-DSGwv2Yx.js";
|
|
2
2
|
import { p } from "../index-DmeWGGmS.js";
|
|
3
|
-
import { v as g } from "../variable-
|
|
4
|
-
import { r as S } from "../random_normal-
|
|
5
|
-
import { z as _ } from "../zeros-
|
|
3
|
+
import { v as g } from "../variable-SSATClyt.js";
|
|
4
|
+
import { r as S } from "../random_normal-CIm8lk2-.js";
|
|
5
|
+
import { z as _ } from "../zeros-Bw0puq_w.js";
|
|
6
6
|
class B {
|
|
7
7
|
weightStore;
|
|
8
8
|
alpha;
|
package/dist/layers/MLP.js
CHANGED
|
@@ -1,10 +1,10 @@
|
|
|
1
|
-
import { t as M } from "../index-
|
|
1
|
+
import { t as M } from "../index-DSGwv2Yx.js";
|
|
2
2
|
import f from "./BaseLayer.js";
|
|
3
|
-
import { b as h } from "../matMul16-
|
|
3
|
+
import { b as h } from "../matMul16-BIT70Vya.js";
|
|
4
4
|
import { reshape16 as d } from "../ops/reshape16.js";
|
|
5
5
|
import { dropout16 as L } from "../ops/dropout16.js";
|
|
6
|
-
import { v as n } from "../variable-
|
|
7
|
-
import { r as m } from "../random_normal-
|
|
6
|
+
import { v as n } from "../variable-SSATClyt.js";
|
|
7
|
+
import { r as m } from "../random_normal-CIm8lk2-.js";
|
|
8
8
|
class N extends f {
|
|
9
9
|
index;
|
|
10
10
|
hiddenUnits;
|
|
@@ -1,9 +1,9 @@
|
|
|
1
|
-
import { t as c, an as p,
|
|
1
|
+
import { t as c, an as p, b as s } from "../index-DSGwv2Yx.js";
|
|
2
2
|
import f from "./BaseLayer.js";
|
|
3
|
-
import { E as u } from "../random_width-
|
|
4
|
-
import { r as b } from "../exports_initializers-
|
|
5
|
-
import { m as g } from "../mod-
|
|
6
|
-
import { r as l } from "../range-
|
|
3
|
+
import { E as u } from "../random_width-B_fVXhGx.js";
|
|
4
|
+
import { r as b } from "../exports_initializers-DIOZQt_L.js";
|
|
5
|
+
import { m as g } from "../mod-BXjLYwvM.js";
|
|
6
|
+
import { r as l } from "../range-BDxO73mk.js";
|
|
7
7
|
function h(e) {
|
|
8
8
|
return new u(e);
|
|
9
9
|
}
|
package/dist/layers/RMSNorm.js
CHANGED
|
@@ -1,8 +1,8 @@
|
|
|
1
|
-
import { t as i } from "../index-
|
|
1
|
+
import { t as i } from "../index-DSGwv2Yx.js";
|
|
2
2
|
import e from "./BaseLayer.js";
|
|
3
3
|
import { normRMS as m } from "../ops/normRMS.js";
|
|
4
|
-
import { v as a } from "../variable-
|
|
5
|
-
import { o as M } from "../ones-
|
|
4
|
+
import { v as a } from "../variable-SSATClyt.js";
|
|
5
|
+
import { o as M } from "../ones-DbVB5N58.js";
|
|
6
6
|
class l extends e {
|
|
7
7
|
GAMMA;
|
|
8
8
|
rmsConfig;
|
package/dist/layers/RoPECache.js
CHANGED
|
@@ -1,7 +1,7 @@
|
|
|
1
|
-
import {
|
|
2
|
-
import { r as l } from "../zeros_like-
|
|
3
|
-
import { c as f, s as m } from "../unsorted_segment_sum-
|
|
4
|
-
import { r as h } from "../range-
|
|
1
|
+
import { d as a, b as n, p as c, t as p, k as r } from "../index-DSGwv2Yx.js";
|
|
2
|
+
import { r as l } from "../zeros_like-rOHr54NY.js";
|
|
3
|
+
import { c as f, s as m } from "../unsorted_segment_sum-BfFVV9Zm.js";
|
|
4
|
+
import { r as h } from "../range-BDxO73mk.js";
|
|
5
5
|
class x {
|
|
6
6
|
constructor(s) {
|
|
7
7
|
this.config = s;
|