@genai-fi/nanogpt 0.17.4 → 0.18.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (258) hide show
  1. package/dist/Generator.d.ts +2 -15
  2. package/dist/Generator.js +45 -34
  3. package/dist/{RealDiv-CGwv0liw.js → RealDiv-ioj6Z-ox.js} +9 -9
  4. package/dist/{Reshape-BW__R4mZ.js → Reshape-BZC-ebeR.js} +7 -7
  5. package/dist/{Reshape-CPBkTIH2.js → Reshape-pwprEaej.js} +1 -1
  6. package/dist/TeachableLLM.d.ts +3 -8
  7. package/dist/TeachableLLM.js +61 -44
  8. package/dist/Trainer.d.ts +6 -4
  9. package/dist/Trainer.js +107 -92
  10. package/dist/{axis_util-GTVlo58H.js → axis_util-QWWgLjut.js} +1 -1
  11. package/dist/backend.js +2 -2
  12. package/dist/{backend_util-GaFarB78.js → backend_util-qwSFfxYx.js} +21 -21
  13. package/dist/{backend_webgpu-BqASlsbV.js → backend_webgpu-DI2wXEC2.js} +8 -8
  14. package/dist/{broadcast_to-eS93CCN_.js → broadcast_to-C_EJTVTZ.js} +2 -2
  15. package/dist/checks/appendCache.js +2 -2
  16. package/dist/checks/attentionMask.js +5 -5
  17. package/dist/checks/gelu.js +2 -2
  18. package/dist/checks/matMulGelu.js +2 -2
  19. package/dist/checks/normRMS.js +6 -6
  20. package/dist/checks/normRMSGrad.js +3 -3
  21. package/dist/checks/packUnpack.js +6 -6
  22. package/dist/checks/qkv.js +2 -2
  23. package/dist/checks/rope.js +2 -2
  24. package/dist/{clip_by_value-DDA7rrcT.js → clip_by_value-CLAD4h_I.js} +1 -1
  25. package/dist/complex-3DpPEG9B.js +11 -0
  26. package/dist/{concat-CAQpCret.js → concat-Dqk7Xk7h.js} +5 -5
  27. package/dist/{concat_util-D18dJ4fD.js → concat_util-C1Mxe27t.js} +1 -1
  28. package/dist/{dataset-CGGp1z9P.js → dataset-DlqAN81i.js} +3 -3
  29. package/dist/{dropout_util--NxWuYg2.js → dropout_util-N0z8Os-K.js} +1 -1
  30. package/dist/{expand_dims-Bkd1YD5x.js → expand_dims-D0rBtgT1.js} +4 -4
  31. package/dist/{exports_initializers-CYzKLjN7.js → exports_initializers-DIOZQt_L.js} +1 -1
  32. package/dist/{floor-BQtb-Azg.js → floor-CymuCmTO.js} +1 -1
  33. package/dist/{gather-qIqEqaGn.js → gather-DEyjXNb1.js} +1 -1
  34. package/dist/{gelu-B220X1Go.js → gelu-DpTCC3eB.js} +1 -1
  35. package/dist/{gpgpu_math-BwvV12df.js → gpgpu_math-3bCb5ooU.js} +25 -25
  36. package/dist/{index-CjOWnMXP.js → index-BQvB7LCC.js} +15 -15
  37. package/dist/{index-CUXkjxiT.js → index-DSGwv2Yx.js} +33 -33
  38. package/dist/inference/types.d.ts +16 -0
  39. package/dist/inference/types.js +1 -0
  40. package/dist/{kernel_funcs_utils-pq0CK9co.js → kernel_funcs_utils-DGqzNlHT.js} +6 -6
  41. package/dist/layers/BaseLayer.js +4 -4
  42. package/dist/layers/CausalSelfAttention.js +6 -6
  43. package/dist/layers/LoRA.js +4 -4
  44. package/dist/layers/MLP.js +4 -4
  45. package/dist/layers/PositionEmbedding.js +5 -5
  46. package/dist/layers/RMSNorm.js +3 -3
  47. package/dist/layers/RoPECache.js +4 -4
  48. package/dist/layers/TiedEmbedding.js +6 -6
  49. package/dist/layers/TransformerBlock.js +1 -1
  50. package/dist/layers/WeightStore.js +2 -2
  51. package/dist/loader/load.d.ts +2 -8
  52. package/dist/loader/loadTransformers.d.ts +2 -8
  53. package/dist/loader/loadTransformers.js +13 -11
  54. package/dist/loader/newZipLoad.d.ts +2 -8
  55. package/dist/loader/newZipLoad.js +25 -10
  56. package/dist/loader/oldZipLoad.js +13 -13
  57. package/dist/loader/save.d.ts +9 -2
  58. package/dist/loader/save.js +64 -55
  59. package/dist/loader/types.d.ts +29 -1
  60. package/dist/main.d.ts +2 -0
  61. package/dist/main.js +45 -43
  62. package/dist/{matMul16-BcVC_E62.js → matMul16-BIT70Vya.js} +3 -3
  63. package/dist/{matMulGelu-JNLZqKQp.js → matMulGelu-CsZnh18H.js} +18 -18
  64. package/dist/mat_mul-DP86qZtZ.js +11 -0
  65. package/dist/mod-BXjLYwvM.js +11 -0
  66. package/dist/models/NanoGPTV1.js +2 -2
  67. package/dist/models/NanoGPTV2.js +2 -2
  68. package/dist/models/model.d.ts +3 -2
  69. package/dist/models/model.js +13 -13
  70. package/dist/{not_equal-hurPF26l.js → not_equal-CkQKkKZy.js} +15 -15
  71. package/dist/{ones-BytntneX.js → ones-DbVB5N58.js} +3 -3
  72. package/dist/ops/adamAdjust.js +3 -3
  73. package/dist/ops/adamMoments.js +3 -3
  74. package/dist/ops/add16.js +1 -1
  75. package/dist/ops/appendCache.js +6 -6
  76. package/dist/ops/attentionMask.js +3 -3
  77. package/dist/ops/concat16.js +3 -3
  78. package/dist/ops/cpu/adamAdjust.js +9 -9
  79. package/dist/ops/cpu/adamMoments.js +5 -5
  80. package/dist/ops/cpu/appendCache.js +2 -2
  81. package/dist/ops/cpu/attentionMask.js +6 -6
  82. package/dist/ops/cpu/fusedSoftmax.js +4 -4
  83. package/dist/ops/cpu/gatherSub.js +5 -5
  84. package/dist/ops/cpu/gelu.js +4 -4
  85. package/dist/ops/cpu/matMul16.js +2 -2
  86. package/dist/ops/cpu/matMulGelu.js +7 -7
  87. package/dist/ops/cpu/matMulMul.js +2 -2
  88. package/dist/ops/cpu/mulDropout.js +5 -5
  89. package/dist/ops/cpu/normRMS.js +1 -1
  90. package/dist/ops/cpu/qkv.js +3 -3
  91. package/dist/ops/cpu/rope.js +5 -5
  92. package/dist/ops/cpu/scatterSub.js +5 -5
  93. package/dist/ops/dot16.js +2 -2
  94. package/dist/ops/dropout.js +6 -6
  95. package/dist/ops/dropout16.js +1 -1
  96. package/dist/ops/gatherSub.js +1 -1
  97. package/dist/ops/gelu.js +2 -2
  98. package/dist/ops/globalNorm.js +7 -7
  99. package/dist/ops/grads/add16.js +1 -1
  100. package/dist/ops/grads/attentionMask.js +2 -2
  101. package/dist/ops/grads/dropout16.js +1 -1
  102. package/dist/ops/grads/gelu.js +2 -2
  103. package/dist/ops/grads/matMul16.js +3 -3
  104. package/dist/ops/grads/matMulGelu.js +1 -1
  105. package/dist/ops/grads/mul16.js +1 -1
  106. package/dist/ops/grads/normRMS.js +7 -7
  107. package/dist/ops/grads/pack16.js +3 -3
  108. package/dist/ops/grads/qkv.js +11 -11
  109. package/dist/ops/grads/rope.js +2 -2
  110. package/dist/ops/grads/softmax16.js +1 -1
  111. package/dist/ops/grads/unpack16.js +2 -2
  112. package/dist/ops/matMul16.js +3 -3
  113. package/dist/ops/matMulGelu.js +6 -6
  114. package/dist/ops/matMulMul.js +3 -3
  115. package/dist/ops/mul16.js +1 -1
  116. package/dist/ops/mulDrop.js +3 -3
  117. package/dist/ops/normRMS.js +4 -4
  118. package/dist/ops/pack16.js +2 -2
  119. package/dist/ops/qkv.js +3 -3
  120. package/dist/ops/reshape16.js +6 -6
  121. package/dist/ops/rope.js +2 -2
  122. package/dist/ops/scatterSub.js +1 -1
  123. package/dist/ops/slice16.js +2 -2
  124. package/dist/ops/softmax16.js +1 -1
  125. package/dist/ops/sub16.js +1 -1
  126. package/dist/ops/sum16.js +6 -6
  127. package/dist/ops/transpose16.js +3 -3
  128. package/dist/ops/unpack16.js +2 -2
  129. package/dist/ops/webgl/adamAdjust.js +2 -2
  130. package/dist/ops/webgl/adamMoments.js +1 -1
  131. package/dist/ops/webgl/appendCache.js +1 -1
  132. package/dist/ops/webgl/attentionMask.js +1 -1
  133. package/dist/ops/webgl/dropout16.js +1 -1
  134. package/dist/ops/webgl/fusedSoftmax.js +7 -7
  135. package/dist/ops/webgl/gatherSub.js +3 -3
  136. package/dist/ops/webgl/gelu.js +2 -2
  137. package/dist/ops/webgl/log.js +3 -3
  138. package/dist/ops/webgl/matMul16.js +13 -13
  139. package/dist/ops/webgl/matMulGelu.js +4 -4
  140. package/dist/ops/webgl/matMulMul.js +2 -2
  141. package/dist/ops/webgl/mulDropout.js +1 -1
  142. package/dist/ops/webgl/normRMS.js +2 -2
  143. package/dist/ops/webgl/qkv.js +1 -1
  144. package/dist/ops/webgl/rope.js +1 -1
  145. package/dist/ops/webgl/scatterSub.js +2 -2
  146. package/dist/ops/webgpu/adamAdjust.js +3 -3
  147. package/dist/ops/webgpu/adamMoments.js +3 -3
  148. package/dist/ops/webgpu/add16.js +6 -6
  149. package/dist/ops/webgpu/appendCache.js +3 -3
  150. package/dist/ops/webgpu/attentionMask.js +2 -2
  151. package/dist/ops/webgpu/attentionMask32_program.js +2 -2
  152. package/dist/ops/webgpu/clipScale.js +7 -7
  153. package/dist/ops/webgpu/concat16.js +5 -5
  154. package/dist/ops/webgpu/dropout16.js +6 -6
  155. package/dist/ops/webgpu/gatherSub.js +3 -3
  156. package/dist/ops/webgpu/gelu.js +8 -8
  157. package/dist/ops/webgpu/matMul16.js +16 -16
  158. package/dist/ops/webgpu/matMul16_program.js +2 -2
  159. package/dist/ops/webgpu/mul16.js +5 -5
  160. package/dist/ops/webgpu/norm2.js +1 -1
  161. package/dist/ops/webgpu/normRMS.js +2 -2
  162. package/dist/ops/webgpu/normRMSGrad.js +4 -4
  163. package/dist/ops/webgpu/pack16.js +4 -4
  164. package/dist/ops/webgpu/pack16_program.js +2 -2
  165. package/dist/ops/webgpu/qkv.js +2 -2
  166. package/dist/ops/webgpu/rope.js +3 -3
  167. package/dist/ops/webgpu/scatterSub.js +3 -3
  168. package/dist/ops/webgpu/slice16.js +4 -4
  169. package/dist/ops/webgpu/softmax16.js +4 -4
  170. package/dist/ops/webgpu/softmax16_program.js +2 -2
  171. package/dist/ops/webgpu/softmax16_subgroup_program.js +2 -2
  172. package/dist/ops/webgpu/softmax16grad.js +4 -4
  173. package/dist/ops/webgpu/sub16.js +6 -6
  174. package/dist/ops/webgpu/sum16.js +3 -3
  175. package/dist/ops/webgpu/transpose16.js +8 -8
  176. package/dist/ops/webgpu/transpose16_program.js +2 -2
  177. package/dist/ops/webgpu/transpose16_shared_program.js +3 -3
  178. package/dist/ops/webgpu/unpack16.js +3 -3
  179. package/dist/ops/webgpu/utils/binary_op.js +3 -3
  180. package/dist/ops/webgpu/utils/reductions.js +5 -5
  181. package/dist/{ops-CsXeTq1P.js → ops-CURIZSVt.js} +100 -100
  182. package/dist/{pack16-bqltoUlR.js → pack16-WlOSOuZA.js} +2 -2
  183. package/dist/patches/webgpu_backend.js +6 -6
  184. package/dist/patches/webgpu_base.js +1 -1
  185. package/dist/patches/webgpu_program.js +2 -2
  186. package/dist/{random_normal-IBRrha8a.js → random_normal-CIm8lk2-.js} +1 -1
  187. package/dist/{random_width-DN5ZtQkM.js → random_width-B_fVXhGx.js} +131 -131
  188. package/dist/{range-C-CjF-LI.js → range-BDxO73mk.js} +1 -1
  189. package/dist/{readers-iz5u3HBo.js → readers-17HLdxVM.js} +2 -2
  190. package/dist/relu-DTvZKBsZ.js +9 -0
  191. package/dist/{reshape-BDOuCSNW.js → reshape-BIN71H3p.js} +1 -1
  192. package/dist/{resize_nearest_neighbor-BojqlfRe.js → resize_nearest_neighbor-C6_0dAnK.js} +41 -41
  193. package/dist/{rope-0j_f1TPm.js → rope-CC5RjmKU.js} +4 -4
  194. package/dist/{scatter_nd_util-ByNJaL6I.js → scatter_nd_util-C-x73Cj6.js} +1 -1
  195. package/dist/{segment_util-Dasb2Zaf.js → segment_util-4zuHV5IG.js} +2 -2
  196. package/dist/{selu_util-BLhIqRkw.js → selu_util-BXdhy_W6.js} +5 -5
  197. package/dist/{shared-CagdqkLh.js → shared-DRWDyk9w.js} +6 -6
  198. package/dist/{shared-3agzAqQ_.js → shared-zTaJ5siv.js} +1 -1
  199. package/dist/slice-BvItlgXu.js +12 -0
  200. package/dist/{slice_util-CC35pLmT.js → slice_util-DPY56GzQ.js} +5 -5
  201. package/dist/{softmax-D4q1LJN7.js → softmax-BLGJqdwx.js} +1 -1
  202. package/dist/split-BN9LkEgS.js +9 -0
  203. package/dist/{squeeze-ho4wLUek.js → squeeze-O_YWJpw_.js} +2 -2
  204. package/dist/{stack-DudVrtmG.js → stack-z6QE7kmP.js} +1 -1
  205. package/dist/{step-BTxPtq1r.js → step-DQY6_ABw.js} +4 -4
  206. package/dist/{sum-BpiwSWvg.js → sum-D39FeU5h.js} +3 -3
  207. package/dist/{tensor-BWFldCso.js → tensor-D8e0Gd7c.js} +1 -1
  208. package/dist/{tensor1d-LMGMIUlr.js → tensor1d-BMl0eZYV.js} +1 -1
  209. package/dist/{tensor2d-BnXMKScO.js → tensor2d-DTtQ1QcT.js} +1 -1
  210. package/dist/{tensor4d-C6UCG_u8.js → tensor4d-Dj4rDssL.js} +1 -1
  211. package/dist/{tfjs_backend-BGnG-ppu.js → tfjs_backend-Bk3PmK91.js} +65 -65
  212. package/dist/{tile-CFy-xTO6.js → tile-CsWlVKKz.js} +1 -1
  213. package/dist/tokeniser/BaseTokeniser.d.ts +4 -1
  214. package/dist/tokeniser/BaseTokeniser.js +21 -5
  215. package/dist/tokeniser/CharTokeniser.d.ts +1 -1
  216. package/dist/tokeniser/CharTokeniser.js +62 -50
  217. package/dist/tokeniser/bpe.d.ts +1 -1
  218. package/dist/tokeniser/bpe.js +41 -35
  219. package/dist/tokeniser/type.d.ts +3 -1
  220. package/dist/training/AdamW.d.ts +3 -0
  221. package/dist/training/AdamW.js +59 -30
  222. package/dist/training/BasicTrainer.d.ts +1 -0
  223. package/dist/training/BasicTrainer.js +112 -92
  224. package/dist/training/DatasetBuilder.js +3 -3
  225. package/dist/training/Evaluator.js +2 -2
  226. package/dist/training/LRScheduler.d.ts +1 -0
  227. package/dist/training/LRScheduler.js +18 -12
  228. package/dist/training/PreTrainer.js +3 -3
  229. package/dist/training/SFTDatasetBuilder.js +3 -3
  230. package/dist/training/SFTTrainer.js +1 -1
  231. package/dist/training/orthoGrad.js +1 -1
  232. package/dist/training/sparseCrossEntropy.js +30 -30
  233. package/dist/training/types.d.ts +5 -3
  234. package/dist/training/validation.js +13 -13
  235. package/dist/{transpose-9kRxIXWR.js → transpose-Qxz-4os3.js} +7 -7
  236. package/dist/{unsorted_segment_sum-DJvk5xnh.js → unsorted_segment_sum-BfFVV9Zm.js} +20 -20
  237. package/dist/utilities/datasetID.d.ts +2 -0
  238. package/dist/utilities/datasetID.js +21 -0
  239. package/dist/utilities/dummy.js +6 -6
  240. package/dist/utilities/multinomialCPU.js +2 -2
  241. package/dist/utilities/packed.js +1 -1
  242. package/dist/utilities/performance.js +1 -1
  243. package/dist/utilities/profile.js +1 -1
  244. package/dist/utilities/safetensors.js +2 -2
  245. package/dist/utilities/sentences.js +5 -5
  246. package/dist/utilities/weights.js +2 -2
  247. package/dist/{variable-Ck482e3n.js → variable-SSATClyt.js} +1 -1
  248. package/dist/{webgpu_program-B4HmApL1.js → webgpu_program-CbjdYLYk.js} +1 -1
  249. package/dist/{webgpu_util-DYlGSwOJ.js → webgpu_util-DuofJBMo.js} +7 -7
  250. package/dist/{zeros-DvZpK8s6.js → zeros-Bw0puq_w.js} +2 -2
  251. package/dist/{zeros_like-CWjDdwr-.js → zeros_like-rOHr54NY.js} +69 -69
  252. package/package.json +3 -3
  253. package/dist/complex-DI35Q-gW.js +0 -11
  254. package/dist/mat_mul-DhG0Newp.js +0 -11
  255. package/dist/mod-CSdCpRjf.js +0 -11
  256. package/dist/relu-J_X6MUzx.js +0 -9
  257. package/dist/slice-BzS11Qh0.js +0 -12
  258. package/dist/split-C2Sj255c.js +0 -9
@@ -1,4 +1,4 @@
1
- import { o as a, q as f, x as m, f as y, E as c, C as p } from "./index-CUXkjxiT.js";
1
+ import { o as a, n as f, v as m, f as y, E as c, C as p } from "./index-DSGwv2Yx.js";
2
2
  function u(o, s, t) {
3
3
  const r = f(o, "x", "clipByValue");
4
4
  if (m(s <= t, () => `Error in clip: min (${s}) must be less than or equal to max (${t}).`), s === t)
@@ -0,0 +1,11 @@
1
+ import { o as t, n as s, a6 as c, E as m, a7 as r } from "./index-DSGwv2Yx.js";
2
+ function l(o, n) {
3
+ const a = s(o, "real", "complex"), e = s(n, "imag", "complex");
4
+ c(a.shape, e.shape, `real and imag shapes, ${a.shape} and ${e.shape}, must match in call to tf.complex().`);
5
+ const p = { real: a, imag: e };
6
+ return m.runKernel(r, p);
7
+ }
8
+ const i = /* @__PURE__ */ t({ complex_: l });
9
+ export {
10
+ i as c
11
+ };
@@ -1,5 +1,5 @@
1
- import { o as s, x as a, y as p, w as i, E as l, z as f } from "./index-CUXkjxiT.js";
2
- function h(o, e = 0) {
1
+ import { o as s, v as a, w as p, u as i, E as l, x as u } from "./index-DSGwv2Yx.js";
2
+ function f(o, e = 0) {
3
3
  a(o.length >= 1, () => "Pass at least one tensor to concat");
4
4
  const t = p(o, "tensors", "concat", "string_or_numeric");
5
5
  if (t[0].dtype === "complex64" && t.forEach((n) => {
@@ -9,9 +9,9 @@ function h(o, e = 0) {
9
9
  }), t.length === 1)
10
10
  return i(t[0]);
11
11
  const r = t, c = { axis: e };
12
- return l.runKernel(f, r, c);
12
+ return l.runKernel(u, r, c);
13
13
  }
14
- const u = /* @__PURE__ */ s({ concat_: h });
14
+ const m = /* @__PURE__ */ s({ concat_: f });
15
15
  export {
16
- u as c
16
+ m as c
17
17
  };
@@ -1,4 +1,4 @@
1
- import { x as s } from "./index-CUXkjxiT.js";
1
+ import { v as s } from "./index-DSGwv2Yx.js";
2
2
  function h(n, o) {
3
3
  const t = n[0].length;
4
4
  n.forEach((a, c) => {
@@ -1,7 +1,7 @@
1
- import { ag as h, aA as S, ab as N, d as v, aB as o, aC as p, aD as g, x as k, t as y } from "./index-CUXkjxiT.js";
1
+ import { ag as h, aA as S, ab as N, l as v, aB as o, aC as p, aD as g, v as k, t as y } from "./index-DSGwv2Yx.js";
2
2
  import { s as R } from "./index-CieiGp4Y.js";
3
- import { s as B } from "./stack-DudVrtmG.js";
4
- import { t as $ } from "./tensor-BWFldCso.js";
3
+ import { s as B } from "./stack-z6QE7kmP.js";
4
+ import { t as $ } from "./tensor-D8e0Gd7c.js";
5
5
  function _(s, t) {
6
6
  return b(s, t);
7
7
  }
@@ -1,4 +1,4 @@
1
- import { o as u, u as f, a5 as i, ac as m } from "./index-CUXkjxiT.js";
1
+ import { o as u, q as f, a5 as i, ac as m } from "./index-DSGwv2Yx.js";
2
2
  import { U as c } from "./rand_util-CZ7yLoUm.js";
3
3
  function g(n, r = 0, t = 1, e = "float32", a) {
4
4
  f(n);
@@ -1,11 +1,11 @@
1
- import { o as e, q as a, x as i, E as m, A as p } from "./index-CUXkjxiT.js";
2
- function x(t, n = 0) {
1
+ import { o as e, n as a, v as i, E as m, y as p } from "./index-DSGwv2Yx.js";
2
+ function c(t, n = 0) {
3
3
  const s = a(t, "x", "expandDims", "string_or_numeric");
4
4
  i(n <= s.rank, () => "Axis must be <= rank of the tensor");
5
5
  const r = { input: s }, o = { dim: n };
6
6
  return m.runKernel(p, r, o);
7
7
  }
8
- const u = /* @__PURE__ */ e({ expandDims_: x });
8
+ const x = /* @__PURE__ */ e({ expandDims_: c });
9
9
  export {
10
- u as e
10
+ x as e
11
11
  };
@@ -1,4 +1,4 @@
1
- import { R as o } from "./random_width-DN5ZtQkM.js";
1
+ import { R as o } from "./random_width-B_fVXhGx.js";
2
2
  function m(r) {
3
3
  return new o(r);
4
4
  }
@@ -1,4 +1,4 @@
1
- import { o as n, q as s, E as t, F as f } from "./index-CUXkjxiT.js";
1
+ import { o as n, n as s, E as t, F as f } from "./index-DSGwv2Yx.js";
2
2
  function a(o) {
3
3
  const r = { x: s(o, "x", "floor", "float32") };
4
4
  return t.runKernel(f, r);
@@ -1,4 +1,4 @@
1
- import { o as g, q as t, E as h, G as p } from "./index-CUXkjxiT.js";
1
+ import { o as g, n as t, E as h, G as p } from "./index-DSGwv2Yx.js";
2
2
  function u(n, s, r = 0, e = 0) {
3
3
  const o = t(n, "x", "gather"), a = t(s, "indices", "gather", "int32"), c = { x: o, indices: a }, i = { axis: r, batchDims: e };
4
4
  return h.runKernel(p, c, i);
@@ -1,4 +1,4 @@
1
- import { e as t, h as n } from "./index-CUXkjxiT.js";
1
+ import { c as t, e as n } from "./index-DSGwv2Yx.js";
2
2
  import "./ops/cpu/gelu.js";
3
3
  import "./ops/webgl/gelu.js";
4
4
  const a = {
@@ -1,5 +1,5 @@
1
- import { ab as $, U as E, aR as X, ac as T, aS as ae, K as N, aT as G, x as ie, a9 as k, ad as ce } from "./index-CUXkjxiT.js";
2
- import { b as se } from "./backend_util-GaFarB78.js";
1
+ import { ab as $, N as E, aR as X, ac as T, aS as ae, I as N, aT as G, v as ie, a9 as k, ad as ce } from "./index-DSGwv2Yx.js";
2
+ import { b as se } from "./backend_util-qwSFfxYx.js";
3
3
  const w = {}, M = {
4
4
  alpha: !1,
5
5
  antialias: !1,
@@ -215,7 +215,7 @@ function Ot(e, t, n) {
215
215
  function It(e, t) {
216
216
  v(e, () => e.bindFramebuffer(e.FRAMEBUFFER, t)), v(e, () => e.framebufferTexture2D(e.FRAMEBUFFER, e.COLOR_ATTACHMENT0, e.TEXTURE_2D, null, 0));
217
217
  }
218
- function Ut(e) {
218
+ function Lt(e) {
219
219
  const t = e.checkFramebufferStatus(e.FRAMEBUFFER);
220
220
  if (t !== e.FRAMEBUFFER_COMPLETE)
221
221
  throw new Error("Error binding framebuffer: " + Se(e, t));
@@ -258,7 +258,7 @@ function J(e) {
258
258
  e[e.length - 1]
259
259
  ];
260
260
  }
261
- function Lt(e) {
261
+ function Ut(e) {
262
262
  let t = [1, 1, 1];
263
263
  return e.length === 0 || e.length === 1 && e[0] === 1 || (t = [Z(e), ...J(e)]), t;
264
264
  }
@@ -378,7 +378,7 @@ function Xt(e, t) {
378
378
  n != null && ie(n.dtype !== "complex64", () => `${t} does not support complex64 tensors in the WebGL backend.`);
379
379
  });
380
380
  }
381
- function U() {
381
+ function L() {
382
382
  let e, t, n, r, o, a, i, c, s, l;
383
383
  return $().getNumber("WEBGL_VERSION") === 2 ? (e = "#version 300 es", t = "in", n = "out", r = "in", o = "texture", a = "outputColor", i = "out vec4 outputColor;", c = $().getBool("WEBGL2_ISNAN_CUSTOM") ? `
384
384
  bool isnan_custom(float val) {
@@ -567,8 +567,8 @@ function Fe(e, t, n) {
567
567
  });
568
568
  const o = r.join(`
569
569
  `), a = e.map((x) => _e(x, t, n.packedInputs, n.enableShapeUniforms)).join(`
570
- `), i = t.texShape, c = U(), s = Ne(c);
571
- let l, u, f = Ue(c);
570
+ `), i = t.texShape, c = L(), s = Ne(c);
571
+ let l, u, f = Le(c);
572
572
  return t.isPacked ? (l = Ae(t.logicalShape, i, n.enableShapeUniforms), u = Ie(c)) : (l = we(t.logicalShape, i, n.enableShapeUniforms), u = Oe(c)), n.packedInputs && (f += be), [
573
573
  f,
574
574
  s,
@@ -580,7 +580,7 @@ function Fe(e, t, n) {
580
580
  ].join(`
581
581
  `);
582
582
  }
583
- function L(e, t = !1) {
583
+ function U(e, t = !1) {
584
584
  const n = e.shapeInfo.logicalShape;
585
585
  switch (n.length) {
586
586
  case 0:
@@ -617,7 +617,7 @@ function te(e, t) {
617
617
  }
618
618
  function _e(e, t, n = !1, r) {
619
619
  let o = "";
620
- n ? o += te(e, r) : o += L(e, r);
620
+ n ? o += te(e, r) : o += U(e, r);
621
621
  const a = e.shapeInfo.logicalShape, i = t.logicalShape;
622
622
  return a.length <= i.length && (n ? o += ot(e, t) : o += at(e, t)), o;
623
623
  }
@@ -676,7 +676,7 @@ function Ie(e) {
676
676
  }
677
677
  `;
678
678
  }
679
- function Ue(e) {
679
+ function Le(e) {
680
680
  return `${e.version}
681
681
  precision highp float;
682
682
  precision highp int;
@@ -732,12 +732,12 @@ function Ue(e) {
732
732
  return fract((p3.x + p3.y) * p3.z);
733
733
  }
734
734
 
735
- ${Le}
735
+ ${Ue}
736
736
  ${De}
737
737
  ${ge}
738
738
  `;
739
739
  }
740
- const Le = `
740
+ const Ue = `
741
741
  vec2 uvFromFlat(int texNumR, int texNumC, int index) {
742
742
  int texR = index / texNumC;
743
743
  int texC = index - texR * texNumC;
@@ -1112,7 +1112,7 @@ function O(e) {
1112
1112
  return `offset${e}`;
1113
1113
  }
1114
1114
  function He(e) {
1115
- const t = e.name, n = "get" + t.charAt(0).toUpperCase() + t.slice(1), r = U();
1115
+ const t = e.name, n = "get" + t.charAt(0).toUpperCase() + t.slice(1), r = L();
1116
1116
  return `
1117
1117
  vec4 ${n}() {
1118
1118
  return ${r.texture2D}(${t}, halfCR);
@@ -1147,7 +1147,7 @@ function qe(e, t) {
1147
1147
  `;
1148
1148
  }
1149
1149
  function je(e, t) {
1150
- const n = e.name, r = "get" + n.charAt(0).toUpperCase() + n.slice(1), o = e.shapeInfo.texShape, a = U();
1150
+ const n = e.name, r = "get" + n.charAt(0).toUpperCase() + n.slice(1), o = e.shapeInfo.texShape, a = L();
1151
1151
  if (t)
1152
1152
  return `
1153
1153
  vec4 ${r}(int index) {
@@ -1215,7 +1215,7 @@ function Ye(e, t) {
1215
1215
  `;
1216
1216
  }
1217
1217
  function Ke(e, t) {
1218
- const n = e.shapeInfo.logicalShape, r = e.name, o = "get" + r.charAt(0).toUpperCase() + r.slice(1), a = e.shapeInfo.texShape, i = a[0], c = a[1], s = U();
1218
+ const n = e.shapeInfo.logicalShape, r = e.name, o = "get" + r.charAt(0).toUpperCase() + r.slice(1), a = e.shapeInfo.texShape, i = a[0], c = a[1], s = L();
1219
1219
  if (a != null && T(n, a))
1220
1220
  return t ? `
1221
1221
  vec4 ${o}(int row, int col) {
@@ -1269,7 +1269,7 @@ function Ze(e, t) {
1269
1269
  if (s.length < n.length) {
1270
1270
  const d = g(e, s), x = ["row", "col"];
1271
1271
  return `
1272
- ${L(d, t)}
1272
+ ${U(d, t)}
1273
1273
  float ${o}(int row, int col) {
1274
1274
  return ${o}(${b(x, c)});
1275
1275
  }
@@ -1334,7 +1334,7 @@ function Je(e, t) {
1334
1334
  }
1335
1335
  `;
1336
1336
  }
1337
- const c = U();
1337
+ const c = L();
1338
1338
  if (t)
1339
1339
  return `
1340
1340
  vec4 ${o}(int b, int row, int col) {
@@ -1360,7 +1360,7 @@ function Qe(e, t) {
1360
1360
  if (l.length < n.length) {
1361
1361
  const p = g(e, l), m = ["row", "col", "depth"];
1362
1362
  return `
1363
- ${L(p, t)}
1363
+ ${U(p, t)}
1364
1364
  float ${o}(int row, int col, int depth) {
1365
1365
  return ${o}(${b(m, s)});
1366
1366
  }
@@ -1430,7 +1430,7 @@ function Qe(e, t) {
1430
1430
  `;
1431
1431
  }
1432
1432
  function et(e, t) {
1433
- const n = e.name, r = "get" + n.charAt(0).toUpperCase() + n.slice(1), o = U();
1433
+ const n = e.name, r = "get" + n.charAt(0).toUpperCase() + n.slice(1), o = L();
1434
1434
  if (t)
1435
1435
  return `
1436
1436
  vec4 ${r}(int b2, int b, int row, int col) {
@@ -1464,7 +1464,7 @@ function tt(e, t) {
1464
1464
  if (s.length < n.length) {
1465
1465
  const R = g(e, s), F = ["row", "col", "depth", "depth2"];
1466
1466
  return `
1467
- ${L(R, t)}
1467
+ ${U(R, t)}
1468
1468
  float ${o}(int row, int col, int depth, int depth2) {
1469
1469
  return ${o}(${b(F, l)});
1470
1470
  }
@@ -1550,7 +1550,7 @@ function nt(e) {
1550
1550
  if (s.length < t.length) {
1551
1551
  const p = g(e, s), m = ["row", "col", "depth", "depth2", "depth3"];
1552
1552
  return `
1553
- ${L(p)}
1553
+ ${U(p)}
1554
1554
  float ${r}(int row, int col, int depth, int depth2, int depth3) {
1555
1555
  return ${r}(${b(m, l)});
1556
1556
  }
@@ -1607,7 +1607,7 @@ function rt(e) {
1607
1607
  if (o.length < t.length) {
1608
1608
  const m = g(e, o), S = ["row", "col", "depth", "depth2", "depth3", "depth4"];
1609
1609
  return `
1610
- ${L(m)}
1610
+ ${U(m)}
1611
1611
  float ${r}(int row, int col, int depth,
1612
1612
  int depth2, int depth3, int depth4) {
1613
1613
  return ${r}(${b(S, a)});
@@ -1979,12 +1979,12 @@ export {
1979
1979
  wt as O,
1980
1980
  H as P,
1981
1981
  Nt as Q,
1982
- Ut as R,
1982
+ Lt as R,
1983
1983
  Ot as S,
1984
1984
  q as T,
1985
1985
  ut as U,
1986
1986
  j as V,
1987
- Lt as W,
1987
+ Ut as W,
1988
1988
  xt as X,
1989
1989
  ht as Y,
1990
1990
  Yt as Z,
@@ -2008,7 +2008,7 @@ export {
2008
2008
  yt as m,
2009
2009
  Pt as n,
2010
2010
  Vt as o,
2011
- U as p,
2011
+ L as p,
2012
2012
  Q as q,
2013
2013
  St as r,
2014
2014
  Rt as s,
@@ -1,20 +1,20 @@
1
- import { W as Mt } from "./backend_webgpu-BqASlsbV.js";
2
- import { ae as Et, ab as X, x as L, dc as Ut, dd as Ht, bX as Gt, U as D, _ as j, bb as Xt, ai as Ye, aU as Kt, a7 as qt, am as fe, bP as Yt, c7 as jt, c8 as Qt, bV as Zt, cO as Jt, ar as es, ac as De, ah as te, aW as ts, bm as ss, bn as os, bo as is, c9 as as, ca as rs, cb as ns, cc as us, cd as ds, ce as ls, aM as cs, aP as hs, bp as ps, cy as fs, cP as ms, cQ as gs, D as xs, S as Cs, br as ws, bd as ys, de as Ss, aQ as bs, aq as vs, bS as ks, bT as Is, af as Rs, bY as Ps, C as $s, cS as Ds, ao as Ns, z as zs, bt as As, cD as Fs, bu as Ws, cz as Ls, cT as Vs, cA as Bs, bv as Ts, bw as _s, bf as Os, bx as Ms, by as Es, cB as Us, cf as Hs, bz as Gs, cF as Xs, cG as Ks, df as qs, cg as Ys, cU as js, cV as Qs, dg as Zs, c0 as Js, N as eo, be as to, aG as so, cW as oo, bA as io, bB as ao, aN as ro, A as no, bZ as uo, cp as lo, bg as co, F as ho, b_ as po, dh as fo, a9 as at, bs as mo, cE as go, di as xo, al as Co, G as wo, a5 as ke, a$ as yo, b0 as So, cq as bo, ch as vo, ci as ko, cj as Io, aH as Ro, b1 as Po, b2 as $o, dj as Do, aO as No, b3 as zo, b4 as Ao, bD as Fo, cl as Wo, ck as Lo, cY as Vo, b$ as Bo, bE as To, cC as _o, cZ as Oo, c_ as Mo, dk as Eo, aZ as Uo, b5 as Ho, cm as Go, M as Xo, I as Ko, dl as qo, ap as Yo, bi as jo, bj as Qo, bF as Zo, d3 as Jo, bG as ei, P as ti, a6 as si, bH as oi, c$ as ii, aI as ai, c1 as ri, Z as ni, aX as ui, cn as di, H as li, aJ as ci, b9 as hi, d0 as pi, ba as fi, d1 as mi, bJ as gi, bh as xi, b6 as Ci, bK as wi, ak as yi, dm as Si, aL as bi, bL as vi, aF as ki, co as Ii, bM as Ri, bN as Pi, bC as $i, bI as Di, dn as Ni, dp as zi, T as Ai, av as rt, dq as Fi, Q as Wi, J as Li, c3 as Vi, d2 as Bi, b7 as Ti, aK as _i, cr as Oi, dr as Mi, c5 as Ei, cs as Ui, bq as Hi, ds as Gi, ct as Xi, bl as Ki, b8 as qi, bO as Yi, c as ji } from "./index-CUXkjxiT.js";
3
- import { i as Qi, a as Zi, c as b, f as v, M as Y, b as nt, d as ut, e as dt } from "./webgpu_util-DYlGSwOJ.js";
1
+ import { W as Mt } from "./backend_webgpu-DI2wXEC2.js";
2
+ import { ae as Et, ab as X, v as L, dc as Ut, dd as Ht, bX as Gt, N as D, _ as j, bb as Xt, ai as Ye, aU as Kt, a7 as qt, am as fe, bP as Yt, c7 as jt, c8 as Qt, bV as Zt, cO as Jt, ar as es, ac as De, ah as te, aW as ts, bm as ss, bn as os, bo as is, c9 as as, ca as rs, cb as ns, cc as us, cd as ds, ce as ls, aM as cs, aP as hs, bp as ps, cy as fs, cP as ms, cQ as gs, B as xs, S as Cs, br as ws, bd as ys, de as Ss, aQ as bs, aq as vs, bS as ks, bT as Is, af as Rs, bY as Ps, C as $s, cS as Ds, ao as Ns, x as zs, bt as As, cD as Fs, bu as Ws, cz as Ls, cT as Vs, cA as Bs, bv as Ts, bw as _s, bf as Os, bx as Ms, by as Es, cB as Us, cf as Hs, bz as Gs, cF as Xs, cG as Ks, df as qs, cg as Ys, cU as js, cV as Qs, dg as Zs, c0 as Js, K as eo, be as to, aG as so, cW as oo, bA as io, bB as ao, aN as ro, y as no, bZ as uo, cp as lo, bg as co, F as ho, b_ as po, dh as fo, a9 as at, bs as mo, cE as go, di as xo, al as Co, G as wo, a5 as ke, a$ as yo, b0 as So, cq as bo, ch as vo, ci as ko, cj as Io, aH as Ro, b1 as Po, b2 as $o, dj as Do, aO as No, b3 as zo, b4 as Ao, bD as Fo, cl as Wo, ck as Lo, cY as Vo, b$ as Bo, bE as To, cC as _o, cZ as Oo, c_ as Mo, dk as Eo, aZ as Uo, b5 as Ho, cm as Go, M as Xo, D as Ko, dl as qo, ap as Yo, bi as jo, bj as Qo, bF as Zo, d3 as Jo, bG as ei, P as ti, a6 as si, bH as oi, c$ as ii, aI as ai, c1 as ri, X as ni, aX as ui, cn as di, A as li, aJ as ci, b9 as hi, d0 as pi, ba as fi, d1 as mi, bJ as gi, bh as xi, b6 as Ci, bK as wi, ak as yi, dm as Si, aL as bi, bL as vi, aF as ki, co as Ii, bM as Ri, bN as Pi, bC as $i, bI as Di, dn as Ni, dp as zi, T as Ai, av as rt, dq as Fi, L as Wi, H as Li, c3 as Vi, d2 as Bi, b7 as Ti, aK as _i, cr as Oi, dr as Mi, c5 as Ei, cs as Ui, bq as Hi, ds as Gi, ct as Xi, bl as Ki, b8 as qi, bO as Yi, a as ji } from "./index-DSGwv2Yx.js";
3
+ import { i as Qi, a as Zi, c as b, f as v, M as Y, b as nt, d as ut, e as dt } from "./webgpu_util-DuofJBMo.js";
4
4
  import { g as _e, B as F } from "./binary_op_util-pKXltfxI.js";
5
- import { S as Ji, a as ea } from "./selu_util-BLhIqRkw.js";
6
- import { E as ta, t as sa, u as oa, w as ia, x as aa, y as ra, f as je, z as lt, A as ct, B as ht, C as na, D as ua, F as da, G as la, H as ca, I as ha, J as pa, K as fa, L as ma, M as ga } from "./backend_util-GaFarB78.js";
7
- import { t as W, e as S, h as Q, b as G, c as Ie, P as pt, d as xa, a as Ca } from "./webgpu_program-B4HmApL1.js";
8
- import { r as R, a as wa } from "./Reshape-CPBkTIH2.js";
9
- import { s as ya } from "./shared-CagdqkLh.js";
10
- import { c as Oe, a as Ce, b as we, d as Me, e as Sa, g as ft } from "./axis_util-GTVlo58H.js";
11
- import { h as ye, i as Ne, j as Se, b as Z, d as Ee, g as Ue, k as mt } from "./step-BTxPtq1r.js";
12
- import { p as ba, a as va, s as ka, b as Ia } from "./slice_util-CC35pLmT.js";
13
- import { z as Ra } from "./zeros-DvZpK8s6.js";
14
- import { c as me, a as Pa } from "./concat_util-D18dJ4fD.js";
15
- import { c as $a, a as Da } from "./segment_util-Dasb2Zaf.js";
5
+ import { S as Ji, a as ea } from "./selu_util-BXdhy_W6.js";
6
+ import { E as ta, t as sa, u as oa, w as ia, x as aa, y as ra, f as je, z as lt, A as ct, B as ht, C as na, D as ua, F as da, G as la, H as ca, I as ha, J as pa, K as fa, L as ma, M as ga } from "./backend_util-qwSFfxYx.js";
7
+ import { t as W, e as S, h as Q, b as G, c as Ie, P as pt, d as xa, a as Ca } from "./webgpu_program-CbjdYLYk.js";
8
+ import { r as R, a as wa } from "./Reshape-pwprEaej.js";
9
+ import { s as ya } from "./shared-DRWDyk9w.js";
10
+ import { c as Oe, a as Ce, b as we, d as Me, e as Sa, g as ft } from "./axis_util-QWWgLjut.js";
11
+ import { h as ye, i as Ne, j as Se, b as Z, d as Ee, g as Ue, k as mt } from "./step-DQY6_ABw.js";
12
+ import { p as ba, a as va, s as ka, b as Ia } from "./slice_util-DPY56GzQ.js";
13
+ import { z as Ra } from "./zeros-Bw0puq_w.js";
14
+ import { c as me, a as Pa } from "./concat_util-C1Mxe27t.js";
15
+ import { c as $a, a as Da } from "./segment_util-4zuHV5IG.js";
16
16
  import { n as Na, a as za } from "./non_max_suppression_impl-B2W7YjZB.js";
17
- import { c as He } from "./scatter_nd_util-ByNJaL6I.js";
17
+ import { c as He } from "./scatter_nd_util-C-x73Cj6.js";
18
18
  Qi() && Et(
19
19
  "webgpu",
20
20
  async () => {
@@ -3226,34 +3226,34 @@ function vs() {
3226
3226
  vs();
3227
3227
  export {
3228
3228
  di as $,
3229
- Kr as A,
3230
- K as B,
3229
+ Ja as A,
3230
+ ur as B,
3231
3231
  yr as C,
3232
- ur as D,
3232
+ So as D,
3233
3233
  f as E,
3234
3234
  Yr as F,
3235
3235
  Qr as G,
3236
- Ja as H,
3237
- So as I,
3238
- wo as J,
3239
- Gs as K,
3240
- Rt as L,
3236
+ wo as H,
3237
+ Gs as I,
3238
+ Rt as J,
3239
+ yo as K,
3240
+ se as L,
3241
3241
  Na as M,
3242
- yo as N,
3242
+ z as N,
3243
3243
  H as O,
3244
3244
  Oa as P,
3245
- se as Q,
3245
+ Ue as Q,
3246
3246
  Xa as R,
3247
3247
  uo as S,
3248
3248
  Co as T,
3249
- z as U,
3250
- Ue as V,
3251
- Cs as W,
3252
- Tn as X,
3253
- vn as Y,
3254
- qa as Z,
3249
+ Cs as U,
3250
+ Tn as V,
3251
+ vn as W,
3252
+ qa as X,
3253
+ ni as Y,
3254
+ hs as Z,
3255
3255
  os as _,
3256
- q as a,
3256
+ Ho as a,
3257
3257
  ea as a$,
3258
3258
  gi as a0,
3259
3259
  tt as a1,
@@ -3318,7 +3318,7 @@ export {
3318
3318
  $s as ax,
3319
3319
  xt as ay,
3320
3320
  he as az,
3321
- ni as b,
3321
+ q as b,
3322
3322
  Qe as b$,
3323
3323
  na as b0,
3324
3324
  la as b1,
@@ -3383,7 +3383,7 @@ export {
3383
3383
  Fr as bx,
3384
3384
  Mr as by,
3385
3385
  xr as bz,
3386
- Ho as c,
3386
+ Jo as c,
3387
3387
  en as c$,
3388
3388
  tn as c0,
3389
3389
  za as c1,
@@ -3448,7 +3448,7 @@ export {
3448
3448
  gs as cx,
3449
3449
  cr as cy,
3450
3450
  Tr as cz,
3451
- M as d,
3451
+ $ as d,
3452
3452
  to as d0,
3453
3453
  Za as d1,
3454
3454
  Bo as d2,
@@ -3491,26 +3491,26 @@ export {
3491
3491
  ja as dx,
3492
3492
  ko as dy,
3493
3493
  Io as dz,
3494
- Jo as e,
3494
+ ei as e,
3495
3495
  as as f,
3496
3496
  ai as g,
3497
- ei as h,
3498
- $ as i,
3499
- S as j,
3497
+ S as h,
3498
+ nt as i,
3499
+ V as j,
3500
3500
  Fn as k,
3501
- nt as l,
3501
+ M as l,
3502
3502
  b as m,
3503
- V as n,
3503
+ T as n,
3504
3504
  N as o,
3505
3505
  Qt as p,
3506
- T as q,
3506
+ Ct as q,
3507
3507
  ri as r,
3508
3508
  si as s,
3509
3509
  A as t,
3510
- Ct as u,
3511
- hs as v,
3512
- Jn as w,
3513
- p as x,
3514
- An as y,
3515
- wr as z
3510
+ Jn as u,
3511
+ p as v,
3512
+ An as w,
3513
+ wr as x,
3514
+ Kr as y,
3515
+ K as z
3516
3516
  };
@@ -0,0 +1,16 @@
1
+ import { Conversation } from '../tokeniser/type';
2
+ export interface GeneratorConversation extends Conversation {
3
+ _completed?: boolean;
4
+ _timestamp?: number;
5
+ }
6
+ export interface GenerateOptions {
7
+ temperature?: number;
8
+ topK?: number;
9
+ topP?: number;
10
+ usePadding?: boolean;
11
+ attentionScores?: boolean;
12
+ includeProbabilities?: boolean;
13
+ embeddings?: 'embedding' | 'logits' | 'softmax' | 'all';
14
+ targets?: number[];
15
+ loraName?: string;
16
+ }
@@ -0,0 +1 @@
1
+
@@ -1,6 +1,6 @@
1
- import { _ as B, U as G, aU as K, a7 as W, aH as z, aV as V, ab as N, aI as F, am as S } from "./index-CUXkjxiT.js";
2
- import { u as O, f as H } from "./gpgpu_math-BwvV12df.js";
3
- import { f as v } from "./backend_util-GaFarB78.js";
1
+ import { _ as B, N as G, aU as K, a7 as W, aH as z, aV as V, ab as N, aI as F, am as S } from "./index-DSGwv2Yx.js";
2
+ import { u as O, f as H } from "./gpgpu_math-3bCb5ooU.js";
3
+ import { f as v } from "./backend_util-qwSFfxYx.js";
4
4
  function Y(t, e) {
5
5
  return ["x", "y", "z", "w", "u", "v"].slice(0, e).map((s) => `${t}.${s}`);
6
6
  }
@@ -200,12 +200,12 @@ const be = {
200
200
  backendName: "webgl",
201
201
  kernelFunc: oe
202
202
  };
203
- const U = "return (a < 0.) ? b * a : a;", k = `
203
+ const k = "return (a < 0.) ? b * a : a;", U = `
204
204
  vec4 aLessThanZero = vec4(lessThan(a, vec4(0.)));
205
205
  return (aLessThanZero * (b * a)) + ((vec4(1.0) - aLessThanZero) * a);
206
206
  `;
207
207
  function ue(t) {
208
- const { inputs: e, backend: s } = t, { x: r, alpha: u } = e, n = N().getBool("WEBGL_PACK_BINARY_OPERATIONS") ? new E(k, r.shape, u.shape) : new b(U, r.shape, u.shape);
208
+ const { inputs: e, backend: s } = t, { x: r, alpha: u } = e, n = N().getBool("WEBGL_PACK_BINARY_OPERATIONS") ? new E(U, r.shape, u.shape) : new b(k, r.shape, u.shape);
209
209
  return s.runWebGLProgram(n, [r, u], "float32");
210
210
  }
211
211
  const Ne = {
@@ -273,7 +273,7 @@ function Ae(t, e = !1) {
273
273
  if (t === "relu6")
274
274
  return e ? ae : Q;
275
275
  if (t === "prelu")
276
- return e ? k : U;
276
+ return e ? U : k;
277
277
  if (t === "leakyrelu")
278
278
  return e ? R : w;
279
279
  if (t === "sigmoid")
@@ -1,4 +1,4 @@
1
- import { a2 as p, h as s, a4 as g } from "../index-CUXkjxiT.js";
1
+ import { a2 as p, e as s, a4 as g } from "../index-DSGwv2Yx.js";
2
2
  import b from "./WeightStore.js";
3
3
  class T {
4
4
  parent;
@@ -59,11 +59,11 @@ class T {
59
59
  checkpointingFn(t, ...e) {
60
60
  const r = this.trainableVariables;
61
61
  return p((...i) => {
62
- const o = i[i.length - 1], a = i.slice(0, e.length), h = this.forward(t, ...a);
63
- return o(a), { value: h, gradFunc: (n, l) => {
62
+ const o = i[i.length - 1], a = i.slice(0, e.length), n = this.forward(t, ...a);
63
+ return o(a), { value: n, gradFunc: (h, l) => {
64
64
  const c = s().state.activeTape;
65
65
  s().state.activeTape = [];
66
- const d = g((...u) => this.forward(t, ...u.slice(0, a.length)))([...l, ...r], n);
66
+ const d = g((...u) => this.forward(t, ...u.slice(0, a.length)))([...l, ...r], h);
67
67
  return s().state.activeTape = c, d;
68
68
  } };
69
69
  })(...e, ...r);
@@ -1,11 +1,11 @@
1
1
  import { attentionMask as R } from "../ops/attentionMask.js";
2
2
  import J from "./BaseLayer.js";
3
- import { r as v } from "../rope-0j_f1TPm.js";
3
+ import { r as v } from "../rope-CC5RjmKU.js";
4
4
  import { appendCache as A } from "../ops/appendCache.js";
5
- import { k as c, t as L } from "../index-CUXkjxiT.js";
5
+ import { k as c, t as L } from "../index-DSGwv2Yx.js";
6
6
  import { softmax16 as y } from "../ops/softmax16.js";
7
- import { b as M } from "../matMul16-BcVC_E62.js";
8
- import { p as K } from "../pack16-bqltoUlR.js";
7
+ import { b as M } from "../matMul16-BIT70Vya.js";
8
+ import { p as K } from "../pack16-WlOSOuZA.js";
9
9
  import { transpose16 as j } from "../ops/transpose16.js";
10
10
  import { dot16 as E } from "../ops/dot16.js";
11
11
  import { reshape16 as _ } from "../ops/reshape16.js";
@@ -13,8 +13,8 @@ import { isPackedTensor as l } from "../utilities/packed.js";
13
13
  import { qkv as q } from "../ops/qkv.js";
14
14
  import { normRMS as O } from "../ops/normRMS.js";
15
15
  import { dropout16 as x } from "../ops/dropout16.js";
16
- import { v as P } from "../variable-Ck482e3n.js";
17
- import { r as S } from "../random_normal-IBRrha8a.js";
16
+ import { v as P } from "../variable-SSATClyt.js";
17
+ import { r as S } from "../random_normal-CIm8lk2-.js";
18
18
  class it extends J {
19
19
  constructor(t, o, s, i) {
20
20
  super(o, i), this.attentionConfig = s, this.index = t, this.units = o.nEmbed * 3, this.projUnits = o.nEmbed, this.ATTN = `block_${this.index}_cAttn`, this.PROJ = `block_${this.index}_cProj`, this.addVariable(this.ATTN), this.addVariable(this.PROJ), this.divisor = 1 / Math.sqrt(o.nEmbed / o.nHead);
@@ -1,8 +1,8 @@
1
- import { a as m, t as n } from "../index-CUXkjxiT.js";
1
+ import { b as m, t as n } from "../index-DSGwv2Yx.js";
2
2
  import { p } from "../index-DmeWGGmS.js";
3
- import { v as g } from "../variable-Ck482e3n.js";
4
- import { r as S } from "../random_normal-IBRrha8a.js";
5
- import { z as _ } from "../zeros-DvZpK8s6.js";
3
+ import { v as g } from "../variable-SSATClyt.js";
4
+ import { r as S } from "../random_normal-CIm8lk2-.js";
5
+ import { z as _ } from "../zeros-Bw0puq_w.js";
6
6
  class B {
7
7
  weightStore;
8
8
  alpha;
@@ -1,10 +1,10 @@
1
- import { t as M } from "../index-CUXkjxiT.js";
1
+ import { t as M } from "../index-DSGwv2Yx.js";
2
2
  import f from "./BaseLayer.js";
3
- import { b as h } from "../matMul16-BcVC_E62.js";
3
+ import { b as h } from "../matMul16-BIT70Vya.js";
4
4
  import { reshape16 as d } from "../ops/reshape16.js";
5
5
  import { dropout16 as L } from "../ops/dropout16.js";
6
- import { v as n } from "../variable-Ck482e3n.js";
7
- import { r as m } from "../random_normal-IBRrha8a.js";
6
+ import { v as n } from "../variable-SSATClyt.js";
7
+ import { r as m } from "../random_normal-CIm8lk2-.js";
8
8
  class N extends f {
9
9
  index;
10
10
  hiddenUnits;
@@ -1,9 +1,9 @@
1
- import { t as c, an as p, a as s } from "../index-CUXkjxiT.js";
1
+ import { t as c, an as p, b as s } from "../index-DSGwv2Yx.js";
2
2
  import f from "./BaseLayer.js";
3
- import { E as u } from "../random_width-DN5ZtQkM.js";
4
- import { r as b } from "../exports_initializers-CYzKLjN7.js";
5
- import { m as g } from "../mod-CSdCpRjf.js";
6
- import { r as l } from "../range-C-CjF-LI.js";
3
+ import { E as u } from "../random_width-B_fVXhGx.js";
4
+ import { r as b } from "../exports_initializers-DIOZQt_L.js";
5
+ import { m as g } from "../mod-BXjLYwvM.js";
6
+ import { r as l } from "../range-BDxO73mk.js";
7
7
  function h(e) {
8
8
  return new u(e);
9
9
  }
@@ -1,8 +1,8 @@
1
- import { t as i } from "../index-CUXkjxiT.js";
1
+ import { t as i } from "../index-DSGwv2Yx.js";
2
2
  import e from "./BaseLayer.js";
3
3
  import { normRMS as m } from "../ops/normRMS.js";
4
- import { v as a } from "../variable-Ck482e3n.js";
5
- import { o as M } from "../ones-BytntneX.js";
4
+ import { v as a } from "../variable-SSATClyt.js";
5
+ import { o as M } from "../ones-DbVB5N58.js";
6
6
  class l extends e {
7
7
  GAMMA;
8
8
  rmsConfig;
@@ -1,7 +1,7 @@
1
- import { i as a, a as n, p as c, t as p, k as r } from "../index-CUXkjxiT.js";
2
- import { r as l } from "../zeros_like-CWjDdwr-.js";
3
- import { c as f, s as m } from "../unsorted_segment_sum-DJvk5xnh.js";
4
- import { r as h } from "../range-C-CjF-LI.js";
1
+ import { d as a, b as n, p as c, t as p, k as r } from "../index-DSGwv2Yx.js";
2
+ import { r as l } from "../zeros_like-rOHr54NY.js";
3
+ import { c as f, s as m } from "../unsorted_segment_sum-BfFVV9Zm.js";
4
+ import { r as h } from "../range-BDxO73mk.js";
5
5
  class x {
6
6
  constructor(s) {
7
7
  this.config = s;