@genai-fi/nanogpt 0.5.5 → 0.6.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/Generator.js +8 -7
- package/dist/NanoGPTModel.js +8 -8
- package/dist/{Reshape-Biok_3X1.js → Reshape-CLOrdpve.js} +2 -2
- package/dist/TeachableLLM.js +18 -17
- package/dist/{TiedEmbedding-8S8xn8e6.js → TiedEmbedding-BhxWO8QR.js} +5 -5
- package/dist/{axis_util-BczFISHz.js → axis_util-D17qZRQm.js} +1 -1
- package/dist/{broadcast_to-B7NGsBSh.js → broadcast_to-BMQLjvt_.js} +2 -2
- package/dist/{concat-DdKPyAtw.js → concat-DhZfF1GY.js} +1 -1
- package/dist/{dataset-iqT4Otvb.js → dataset-oilnemHf.js} +3 -3
- package/dist/{dropout-B09InSJS.js → dropout-CrMQPCeG.js} +1 -1
- package/dist/{gather-D6MsdXqc.js → gather-DZCMHZuN.js} +1 -1
- package/dist/{gpgpu_math-BFbOyvk4.js → gpgpu_math-Ctc31slO.js} +1 -1
- package/dist/{index-Du-bmOP8.js → index-bMBtI-WR.js} +50 -50
- package/dist/{kernel_funcs_utils-DShm7-0k.js → kernel_funcs_utils-CNmjLWnB.js} +26 -24
- package/dist/layers/BaseLayer.js +2 -2
- package/dist/layers/CausalSelfAttention.js +6 -6
- package/dist/layers/MLP.js +5 -5
- package/dist/layers/RMSNorm.js +3 -3
- package/dist/layers/RoPECache.js +3 -3
- package/dist/layers/TiedEmbedding.js +6 -6
- package/dist/layers/TransformerBlock.js +1 -1
- package/dist/{log_sum_exp-CxfBtUaG.js → log_sum_exp-BHdkCb4s.js} +5 -5
- package/dist/main.d.ts +1 -0
- package/dist/main.js +20 -19
- package/dist/{mat_mul-CbiqIe2d.js → mat_mul-BsrLfy81.js} +1 -1
- package/dist/{max-0Xnlpv8k.js → max-DechV4Bc.js} +1 -1
- package/dist/{norm-01kY9I2B.js → norm-B9hWHZH1.js} +5 -5
- package/dist/{ones-CrutWGas.js → ones-g0K8jVwm.js} +2 -2
- package/dist/ops/appendCache.js +3 -3
- package/dist/ops/attentionMask.js +1 -1
- package/dist/ops/cpu/appendCache.js +2 -2
- package/dist/ops/cpu/attentionMask.js +5 -5
- package/dist/ops/cpu/fusedSoftmax.js +2 -2
- package/dist/ops/cpu/gatherSub.js +3 -3
- package/dist/ops/cpu/gelu.js +1 -1
- package/dist/ops/cpu/matMulGelu.js +1 -1
- package/dist/ops/cpu/matMulMul.js +1 -1
- package/dist/ops/cpu/mulDropout.js +1 -1
- package/dist/ops/cpu/normRMS.js +1 -1
- package/dist/ops/cpu/qkv.js +3 -3
- package/dist/ops/cpu/rope.js +5 -5
- package/dist/ops/cpu/scatterSub.js +4 -4
- package/dist/ops/fusedSoftmax.js +1 -1
- package/dist/ops/gatherSub.js +1 -1
- package/dist/ops/gelu.js +1 -1
- package/dist/ops/grads/attentionMask.js +15 -11
- package/dist/ops/grads/fusedSoftmax.js +12 -10
- package/dist/ops/grads/gelu.js +1 -1
- package/dist/ops/grads/matMulGelu.js +1 -1
- package/dist/ops/grads/normRMS.js +1 -1
- package/dist/ops/grads/qkv.js +1 -1
- package/dist/ops/grads/rope.js +1 -1
- package/dist/ops/log.d.ts +0 -0
- package/dist/ops/log.js +1 -0
- package/dist/ops/matMulGelu.js +1 -1
- package/dist/ops/matMulMul.js +1 -1
- package/dist/ops/mulDrop.js +1 -1
- package/dist/ops/node/sparseCrossEntropy.js +1 -1
- package/dist/ops/normRMS.js +1 -1
- package/dist/ops/qkv.js +1 -1
- package/dist/ops/scatterSub.js +1 -1
- package/dist/ops/webgl/appendCache.js +1 -1
- package/dist/ops/webgl/attentionMask.js +1 -1
- package/dist/ops/webgl/fusedSoftmax.js +205 -3022
- package/dist/ops/webgl/gatherSub.js +1 -1
- package/dist/ops/webgl/gelu.js +2 -2
- package/dist/ops/webgl/log.d.ts +17 -0
- package/dist/ops/webgl/log.js +39 -0
- package/dist/ops/webgl/matMulGelu.js +4 -4
- package/dist/ops/webgl/matMulMul.js +1 -1
- package/dist/ops/webgl/mulDropout.js +1 -1
- package/dist/ops/webgl/normRMS.js +2 -2
- package/dist/ops/webgl/qkv.js +1 -1
- package/dist/ops/webgl/rope.js +1 -1
- package/dist/ops/webgl/scatterSub.js +1 -1
- package/dist/{ops-CJNniCAV.js → ops-Mv7Ta72x.js} +13 -13
- package/dist/{random_width-C-v-35bY.js → random_width-BBAWzDym.js} +23 -23
- package/dist/{range-Bvs1hidm.js → range-DMaG9A3G.js} +1 -1
- package/dist/{reshape-BH7eBpwq.js → reshape-T4yDEqoF.js} +1 -1
- package/dist/shared-XNAoXhOa.js +2826 -0
- package/dist/{sin-CPAZXNjH.js → sin-EEhbrRO_.js} +1 -1
- package/dist/{slice_util-DskXqRZa.js → slice_util-Ddk0uxGJ.js} +1 -1
- package/dist/{softmax-DhWoBa7r.js → softmax-B2_IKPDR.js} +1 -1
- package/dist/{split-BCUhuU7B.js → split-dcks18H1.js} +1 -1
- package/dist/{stack-BV1v7l3S.js → stack-lpJ5kYvE.js} +1 -1
- package/dist/{sum-Cvq06317.js → sum-CutF5lj2.js} +1 -1
- package/dist/{tensor-DgTOPY6h.js → tensor-C15NA2LA.js} +1 -1
- package/dist/{tensor2d-CRWjDyUe.js → tensor2d-DZ_e5eKM.js} +1 -1
- package/dist/{tfjs_backend-D9Ytje0G.js → tfjs_backend-BDb8r9qx.js} +28 -28
- package/dist/training/AdamExt.js +1 -1
- package/dist/training/DatasetBuilder.js +2 -2
- package/dist/training/FullTrainer.js +1 -1
- package/dist/training/Trainer.js +3 -3
- package/dist/training/sparseCrossEntropy.js +4 -4
- package/dist/utilities/dummy.js +2 -2
- package/dist/utilities/generate.js +3 -3
- package/dist/utilities/load.d.ts +25 -0
- package/dist/utilities/load.js +89 -37
- package/dist/utilities/profile.js +4 -4
- package/dist/utilities/safetensors.d.ts +3 -0
- package/dist/utilities/safetensors.js +83 -0
- package/dist/utilities/save.js +47 -29
- package/dist/utilities/weights.js +2 -2
- package/dist/{variable-DZ3fF0R2.js → variable-CdRKKp8x.js} +1 -1
- package/dist/{zeros-BaHhQTWf.js → zeros-CAbHfODe.js} +1 -1
- package/package.json +1 -1
package/dist/utilities/save.js
CHANGED
|
@@ -1,43 +1,61 @@
|
|
|
1
|
-
import { j as
|
|
2
|
-
import
|
|
3
|
-
import
|
|
4
|
-
|
|
5
|
-
async function
|
|
6
|
-
const
|
|
7
|
-
|
|
8
|
-
const
|
|
9
|
-
|
|
10
|
-
|
|
11
|
-
|
|
12
|
-
|
|
13
|
-
|
|
14
|
-
|
|
15
|
-
|
|
16
|
-
|
|
17
|
-
|
|
18
|
-
|
|
19
|
-
|
|
20
|
-
|
|
21
|
-
|
|
22
|
-
|
|
1
|
+
import { j as p } from "../jszip.min-CjP2V1VV.js";
|
|
2
|
+
import b from "../tokeniser/CharTokeniser.js";
|
|
3
|
+
import { save_safetensors as l } from "./safetensors.js";
|
|
4
|
+
import { VERSION as y } from "./load.js";
|
|
5
|
+
async function N(e, a, n) {
|
|
6
|
+
const f = n?.includeLog ?? !0, s = /* @__PURE__ */ new Map();
|
|
7
|
+
e.saveWeights(s);
|
|
8
|
+
const i = new p(), r = {};
|
|
9
|
+
s.forEach((t, o) => {
|
|
10
|
+
t.length === 1 && (r[o] = t[0]);
|
|
11
|
+
});
|
|
12
|
+
const g = await l(r);
|
|
13
|
+
i.file("model.safetensors", g, { binary: !0 });
|
|
14
|
+
const c = {
|
|
15
|
+
model_type: "GenAI_NanoGPT_1",
|
|
16
|
+
vocab_size: a.getVocab().length,
|
|
17
|
+
hidden_size: e.config.gpt.nEmbed,
|
|
18
|
+
num_hidden_layers: e.config.gpt.nLayer,
|
|
19
|
+
num_attention_heads: e.config.gpt.nHead,
|
|
20
|
+
block_size: e.config.gpt.blockSize,
|
|
21
|
+
dropout: e.config.gpt.dropout,
|
|
22
|
+
biasInLinear: e.config.gpt.biasInLinear,
|
|
23
|
+
biasInLayerNorm: e.config.gpt.biasInLayerNorm,
|
|
24
|
+
mlpFactor: e.config.gpt.mlpFactor,
|
|
25
|
+
useRope: e.config.gpt.useRope
|
|
26
|
+
};
|
|
27
|
+
if (i.file("config.json", JSON.stringify(c, void 0, 4), {
|
|
28
|
+
binary: !1
|
|
29
|
+
}), i.file(
|
|
30
|
+
"meta.json",
|
|
31
|
+
JSON.stringify(
|
|
32
|
+
{
|
|
33
|
+
version: y,
|
|
34
|
+
application: "@genai-fi/nanogpt",
|
|
35
|
+
meta: n?.metadata,
|
|
36
|
+
name: n?.name
|
|
37
|
+
},
|
|
38
|
+
void 0,
|
|
39
|
+
4
|
|
40
|
+
),
|
|
23
41
|
{
|
|
24
42
|
binary: !1
|
|
25
43
|
}
|
|
26
|
-
),
|
|
44
|
+
), i.file(
|
|
27
45
|
"tokeniser.json",
|
|
28
46
|
JSON.stringify({
|
|
29
|
-
type: a instanceof
|
|
47
|
+
type: a instanceof b ? "char" : "bpe",
|
|
30
48
|
vocab: a.getVocab(),
|
|
31
49
|
merges: await a.getMerges()
|
|
32
50
|
}),
|
|
33
51
|
{
|
|
34
52
|
binary: !1
|
|
35
53
|
}
|
|
36
|
-
),
|
|
37
|
-
for (const [
|
|
38
|
-
|
|
39
|
-
return
|
|
54
|
+
), f && i.file("log.json", JSON.stringify(e.log), { binary: !1 }), n?.files)
|
|
55
|
+
for (const [t, o] of Object.entries(n.files))
|
|
56
|
+
i.file(t, JSON.stringify(o), { binary: !1 });
|
|
57
|
+
return i.generateAsync({ type: "blob" });
|
|
40
58
|
}
|
|
41
59
|
export {
|
|
42
|
-
|
|
60
|
+
N as saveModel
|
|
43
61
|
};
|
|
@@ -1,5 +1,5 @@
|
|
|
1
|
-
import "../index-
|
|
2
|
-
import { t as p } from "../tensor-
|
|
1
|
+
import "../index-bMBtI-WR.js";
|
|
2
|
+
import { t as p } from "../tensor-C15NA2LA.js";
|
|
3
3
|
function h(n) {
|
|
4
4
|
const e = n.reduce((s, o) => s + o.length, 0), a = new Float32Array(e);
|
|
5
5
|
let t = 0;
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
import { o as m, j as r, X as l, E as c, Y as i, n as p, Z as u, q as f } from "./index-
|
|
1
|
+
import { o as m, j as r, X as l, E as c, Y as i, n as p, Z as u, q as f } from "./index-bMBtI-WR.js";
|
|
2
2
|
/**
|
|
3
3
|
* @license
|
|
4
4
|
* Copyright 2020 Google LLC. All Rights Reserved.
|