@genai-fi/nanogpt 0.10.2 → 0.10.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (249) hide show
  1. package/dist/Generator.js +11761 -171
  2. package/dist/{RealDiv-zz7FpkKX.js → RealDiv-KAPDe8zB.js} +23 -25
  3. package/dist/Reshape-BYkmUnAv.js +14 -0
  4. package/dist/{Reshape-CHdUjC72.js → Reshape-Zt6eb7yh.js} +18 -20
  5. package/dist/TeachableLLM.js +10 -11
  6. package/dist/{axis_util-BsIr9ZNu.js → axis_util-BaG7mf5A.js} +3 -3
  7. package/dist/backend.js +2 -2
  8. package/dist/{backend_util-B1XRLuq9.js → backend_util-RCe-rHaj.js} +72 -73
  9. package/dist/{backend_webgpu-CqpfEImu.js → backend_webgpu-DE3ACOLx.js} +45 -47
  10. package/dist/broadcast_to-B3eYlZm7.js +28 -0
  11. package/dist/checks/appendCache.js +2 -2
  12. package/dist/checks/attentionMask.js +3 -3
  13. package/dist/checks/gelu.js +2 -2
  14. package/dist/checks/matMulGelu.js +7 -11
  15. package/dist/checks/normRMS.js +9 -9
  16. package/dist/checks/normRMSGrad.js +3 -3
  17. package/dist/checks/packUnpack.js +2 -2
  18. package/dist/checks/qkv.js +12 -13
  19. package/dist/checks/rope.js +2 -2
  20. package/dist/clip_by_value-BnO7-a88.js +12 -0
  21. package/dist/complex-DjxcVmoX.js +11 -0
  22. package/dist/concat-BV8bt5H-.js +17 -0
  23. package/dist/{concat_util-iBYIyuQe.js → concat_util-DpW8mL_l.js} +1 -1
  24. package/dist/{dataset-D2P7rHAw.js → dataset-BcwmTGYc.js} +137 -139
  25. package/dist/dropout-BcvN9JYi.js +92 -0
  26. package/dist/expand_dims-DT4tEPwA.js +11 -0
  27. package/dist/{exports_initializers-CZSUJoVE.js → exports_initializers-Hta_rEnm.js} +1 -1
  28. package/dist/floor-D5QdR_le.js +9 -0
  29. package/dist/gather-D3JcZUaI.js +9 -0
  30. package/dist/{gelu-Bmhopi0J.js → gelu-CjNPL4OH.js} +10 -11
  31. package/dist/{gpgpu_math-DsCcikas.js → gpgpu_math-DAOmgtXR.js} +841 -1015
  32. package/dist/{index-DRyE072i.js → index-BwexR4lA.js} +262 -263
  33. package/dist/index-DOvlwCh-.js +3520 -0
  34. package/dist/{kernel_funcs_utils-CWfOAPGO.js → kernel_funcs_utils-CCzYdUZg.js} +130 -132
  35. package/dist/layers/BaseLayer.js +15 -16
  36. package/dist/layers/CausalSelfAttention.js +6 -6
  37. package/dist/layers/MLP.js +4 -4
  38. package/dist/layers/PositionEmbedding.js +7 -7
  39. package/dist/layers/RMSNorm.js +3 -3
  40. package/dist/layers/RoPECache.js +9 -9
  41. package/dist/layers/TiedEmbedding.js +6 -6
  42. package/dist/layers/TransformerBlock.js +1 -1
  43. package/dist/loader/loadTransformers.js +1 -1
  44. package/dist/loader/oldZipLoad.js +13 -14
  45. package/dist/log_sum_exp-ngO0-4pK.js +39 -0
  46. package/dist/main.js +49 -50
  47. package/dist/{matMul16-fEAJ4smh.js → matMul16-BWRSOCWB.js} +14 -15
  48. package/dist/matMulGelu-CzfgT6Wq.js +163 -0
  49. package/dist/mat_mul-SjpJRLyL.js +11 -0
  50. package/dist/mod-AnXEvvpo.js +11 -0
  51. package/dist/models/NanoGPTV1.js +2 -2
  52. package/dist/models/model.js +13 -14
  53. package/dist/ones-D2rT0xk2.js +14 -0
  54. package/dist/ops/adamAdjust.js +1 -1
  55. package/dist/ops/adamMoments.js +1 -1
  56. package/dist/ops/add16.js +1 -1
  57. package/dist/ops/appendCache.js +3 -3
  58. package/dist/ops/attentionMask.js +1 -1
  59. package/dist/ops/concat16.js +2 -2
  60. package/dist/ops/cpu/adamAdjust.js +13 -14
  61. package/dist/ops/cpu/adamMoments.js +6 -7
  62. package/dist/ops/cpu/appendCache.js +7 -8
  63. package/dist/ops/cpu/attentionMask.js +7 -7
  64. package/dist/ops/cpu/fusedSoftmax.js +10 -11
  65. package/dist/ops/cpu/gatherSub.js +9 -10
  66. package/dist/ops/cpu/gelu.js +9 -10
  67. package/dist/ops/cpu/matMul16.js +6 -7
  68. package/dist/ops/cpu/matMulGelu.js +5 -6
  69. package/dist/ops/cpu/matMulMul.js +3 -4
  70. package/dist/ops/cpu/mulDropout.js +3 -4
  71. package/dist/ops/cpu/normRMS.js +10 -11
  72. package/dist/ops/cpu/qkv.js +8 -9
  73. package/dist/ops/cpu/rope.js +5 -6
  74. package/dist/ops/cpu/scatterSub.js +17 -19
  75. package/dist/ops/dot16.js +2 -2
  76. package/dist/ops/gatherSub.js +1 -1
  77. package/dist/ops/gelu.js +2 -2
  78. package/dist/ops/grads/add16.js +11 -12
  79. package/dist/ops/grads/attentionMask.js +5 -6
  80. package/dist/ops/grads/gelu.js +3 -4
  81. package/dist/ops/grads/matMul16.js +4 -5
  82. package/dist/ops/grads/matMulGelu.js +9 -10
  83. package/dist/ops/grads/normRMS.js +7 -8
  84. package/dist/ops/grads/pack16.js +4 -5
  85. package/dist/ops/grads/qkv.js +17 -19
  86. package/dist/ops/grads/rope.js +3 -5
  87. package/dist/ops/grads/softmax16.js +3 -4
  88. package/dist/ops/grads/unpack16.js +3 -4
  89. package/dist/ops/grads/utils.d.ts +1 -0
  90. package/dist/ops/grads/utils.js +8 -4
  91. package/dist/ops/matMul16.js +3 -3
  92. package/dist/ops/matMulGelu.js +2 -2
  93. package/dist/ops/matMulMul.js +1 -1
  94. package/dist/ops/mul16.js +1 -1
  95. package/dist/ops/mulDrop.js +1 -1
  96. package/dist/ops/normRMS.js +1 -1
  97. package/dist/ops/pack16.js +3 -4
  98. package/dist/ops/qkv.js +4 -8
  99. package/dist/ops/reshape16.js +14 -16
  100. package/dist/ops/rope.d.ts +1 -1
  101. package/dist/ops/rope.js +3 -8
  102. package/dist/ops/scatterSub.js +1 -1
  103. package/dist/ops/slice16.js +2 -2
  104. package/dist/ops/softmax16.js +5 -8
  105. package/dist/ops/sub16.js +1 -1
  106. package/dist/ops/sum16.js +2 -2
  107. package/dist/ops/transpose16.js +23 -24
  108. package/dist/ops/unpack16.js +2 -2
  109. package/dist/ops/webgl/adamAdjust.js +2 -3
  110. package/dist/ops/webgl/adamMoments.js +1 -2
  111. package/dist/ops/webgl/appendCache.js +1 -2
  112. package/dist/ops/webgl/attentionMask.js +4 -5
  113. package/dist/ops/webgl/fusedSoftmax.js +4 -6
  114. package/dist/ops/webgl/gatherSub.js +6 -7
  115. package/dist/ops/webgl/gelu.js +2 -3
  116. package/dist/ops/webgl/log.js +11 -12
  117. package/dist/ops/webgl/matMul16.js +10 -11
  118. package/dist/ops/webgl/matMulGelu.js +7 -111
  119. package/dist/ops/webgl/matMulMul.js +9 -10
  120. package/dist/ops/webgl/mulDropout.js +8 -9
  121. package/dist/ops/webgl/normRMS.js +2 -3
  122. package/dist/ops/webgl/qkv.js +5 -6
  123. package/dist/ops/webgl/rope.js +7 -8
  124. package/dist/ops/webgl/scatterSub.js +5 -6
  125. package/dist/ops/webgpu/adamAdjust.js +10 -12
  126. package/dist/ops/webgpu/adamMoments.js +8 -10
  127. package/dist/ops/webgpu/add16.js +8 -9
  128. package/dist/ops/webgpu/appendCache.js +23 -25
  129. package/dist/ops/webgpu/attentionMask.js +8 -10
  130. package/dist/ops/webgpu/attentionMask32_program.js +2 -2
  131. package/dist/ops/webgpu/concat16.js +12 -14
  132. package/dist/ops/webgpu/gatherSub.js +11 -13
  133. package/dist/ops/webgpu/gelu.js +28 -29
  134. package/dist/ops/webgpu/matMul16.js +26 -28
  135. package/dist/ops/webgpu/matMul16_program.js +4 -5
  136. package/dist/ops/webgpu/mul16.js +9 -10
  137. package/dist/ops/webgpu/normRMS.js +15 -17
  138. package/dist/ops/webgpu/normRMSGrad.js +21 -28
  139. package/dist/ops/webgpu/pack16.js +12 -13
  140. package/dist/ops/webgpu/pack16_program.js +2 -2
  141. package/dist/ops/webgpu/qkv.js +16 -18
  142. package/dist/ops/webgpu/rope.js +25 -27
  143. package/dist/ops/webgpu/scatterSub.js +7 -9
  144. package/dist/ops/webgpu/slice16.js +21 -23
  145. package/dist/ops/webgpu/softmax16.js +17 -19
  146. package/dist/ops/webgpu/softmax16_program.js +2 -2
  147. package/dist/ops/webgpu/softmax16_subgroup_program.js +2 -2
  148. package/dist/ops/webgpu/softmax16grad.js +7 -8
  149. package/dist/ops/webgpu/sub16.js +7 -8
  150. package/dist/ops/webgpu/sum16.js +18 -20
  151. package/dist/ops/webgpu/transpose16.js +19 -20
  152. package/dist/ops/webgpu/transpose16_program.js +2 -2
  153. package/dist/ops/webgpu/transpose16_shared_program.js +11 -12
  154. package/dist/ops/webgpu/unpack16.js +3 -4
  155. package/dist/ops/webgpu/utils/binary_op.js +7 -8
  156. package/dist/ops/webgpu/utils/reductions.js +14 -22
  157. package/dist/ops-B5yanEdW.js +476 -0
  158. package/dist/pack16-nQ6JaLo-.js +39 -0
  159. package/dist/patches/webgpu_backend.js +19 -20
  160. package/dist/patches/webgpu_base.js +1 -1
  161. package/dist/patches/webgpu_program.js +21 -22
  162. package/dist/{random_width-BVV9HveY.js → random_width-or-CEftb.js} +2506 -2761
  163. package/dist/range-BklejeeW.js +10 -0
  164. package/dist/relu-CP0ZcxWO.js +9 -0
  165. package/dist/reshape-ByE68wS9.js +9 -0
  166. package/dist/resize_nearest_neighbor-B19mCEg2.js +175 -0
  167. package/dist/rope-Ir4mTyD1.js +24 -0
  168. package/dist/{scatter_nd_util-C7zXRT_h.js → scatter_nd_util-lvSiX8q4.js} +1 -1
  169. package/dist/selu_util-kbhpTdYD.js +44 -0
  170. package/dist/{shared-CHhxz-O5.js → shared-DT1TkE6w.js} +1 -1
  171. package/dist/{shared-D2NP_CpY.js → shared-dntlHIDQ.js} +343 -345
  172. package/dist/slice-BfEGSH82.js +12 -0
  173. package/dist/{slice_util-DyjSAD0u.js → slice_util-uTKwiEpW.js} +1 -1
  174. package/dist/{softmax-C9JQEtnO.js → softmax-CA5jFsLR.js} +4 -5
  175. package/dist/split-CVLc0w--.js +9 -0
  176. package/dist/squeeze-C7Z2srUo.js +10 -0
  177. package/dist/stack-Cf4n9h0N.js +11 -0
  178. package/dist/step-CINUs5QB.js +261 -0
  179. package/dist/sum-DWAtNGez.js +11 -0
  180. package/dist/tensor-DJoc7gJU.js +8 -0
  181. package/dist/tensor1d-D11P_7Dp.js +11 -0
  182. package/dist/{tensor2d-CSB4KOb0.js → tensor2d-Bs9wZRc7.js} +6 -7
  183. package/dist/{tensor4d-D7bLqGqz.js → tensor4d-BARPdTaS.js} +6 -7
  184. package/dist/{tfjs_backend-CNkSTL0c.js → tfjs_backend-y1cvNhLA.js} +255 -264
  185. package/dist/tile-mbfagpsB.js +11 -0
  186. package/dist/training/Adam.js +2 -2
  187. package/dist/training/AdamExt.js +1 -1
  188. package/dist/training/DatasetBuilder.js +2 -2
  189. package/dist/training/FullTrainer.js +1 -1
  190. package/dist/training/Trainer.js +2 -2
  191. package/dist/training/sparseCrossEntropy.js +5 -5
  192. package/dist/transpose-ClWiBS_b.js +36 -0
  193. package/dist/unsorted_segment_sum-BDDhB_E6.js +277 -0
  194. package/dist/utilities/dummy.js +3 -3
  195. package/dist/utilities/multinomialCPU.js +2 -2
  196. package/dist/utilities/packed.d.ts +1 -4
  197. package/dist/utilities/packed.js +10 -745
  198. package/dist/utilities/performance.js +1 -1
  199. package/dist/utilities/profile.js +1 -1
  200. package/dist/utilities/safetensors.js +2 -2
  201. package/dist/utilities/sentences.js +5 -5
  202. package/dist/utilities/weights.js +2 -2
  203. package/dist/{variable-DzfrwYuP.js → variable-WawDEaAb.js} +1 -1
  204. package/dist/{webgpu_program-DzaQiqel.js → webgpu_program-DuOXPQol.js} +178 -172
  205. package/dist/{webgpu_util-0_ubCEHJ.js → webgpu_util-RxEF33Rj.js} +34 -35
  206. package/dist/zeros-KnWaWf-X.js +13 -0
  207. package/dist/zeros_like-DvE73F4e.js +721 -0
  208. package/package.json +4 -2
  209. package/dist/Reshape-CDVLyVfz.js +0 -16
  210. package/dist/broadcast_to-B0ChcDaz.js +0 -30
  211. package/dist/complex-BBiRlsVq.js +0 -13
  212. package/dist/concat-DmBLPVGC.js +0 -19
  213. package/dist/dropout-B1x1kYMa.js +0 -99
  214. package/dist/expand_dims-ouvfxQ1n.js +0 -13
  215. package/dist/gather-CH9sdacz.js +0 -10
  216. package/dist/index-D6Q1lPZO.js +0 -2157
  217. package/dist/log_sum_exp-D3ftBNY5.js +0 -41
  218. package/dist/mat_mul-C59XWcJd.js +0 -12
  219. package/dist/mod-DESSvHIU.js +0 -12
  220. package/dist/mulmat_packed_gpu-Coh6qbJk.js +0 -55
  221. package/dist/ones-jU9jlQvM.js +0 -15
  222. package/dist/ops-BFDtP6th.js +0 -645
  223. package/dist/pack16-CmVZs6af.js +0 -41
  224. package/dist/patches/PackedTensor.d.ts +0 -12
  225. package/dist/patches/PackedTensor.js +0 -11
  226. package/dist/patches/engine.d.ts +0 -261
  227. package/dist/patches/engine.js +0 -12
  228. package/dist/patches/tape.d.ts +0 -12
  229. package/dist/patches/tape.js +0 -5
  230. package/dist/range-ZZZD60Fx.js +0 -11
  231. package/dist/reciprocal-CrYlsAGD.js +0 -10
  232. package/dist/register_all_kernels-nvj2k7OC.js +0 -12307
  233. package/dist/relu-BYDneVPn.js +0 -10
  234. package/dist/reshape-CaPQzFvz.js +0 -10
  235. package/dist/rope-s4W2XO9B.js +0 -32
  236. package/dist/selu_util-BGPXmd4B.js +0 -303
  237. package/dist/sin-Djs4aQiu.js +0 -16
  238. package/dist/slice-DvovR5wq.js +0 -13
  239. package/dist/split-DBck65sX.js +0 -10
  240. package/dist/squeeze-C00Ipm_7.js +0 -11
  241. package/dist/stack-ChnHwRpX.js +0 -13
  242. package/dist/sum-ywRJj3Zr.js +0 -12
  243. package/dist/tensor-0r5yOo2R.js +0 -8
  244. package/dist/tensor-CzmOBsdf.js +0 -909
  245. package/dist/tensor1d-BlUT89BP.js +0 -12
  246. package/dist/tensor_util-DfwaWayG.js +0 -523
  247. package/dist/tile-CR074jmp.js +0 -13
  248. package/dist/transpose-DH4gmHvu.js +0 -38
  249. package/dist/zeros-DBFVbpv5.js +0 -14
@@ -1,12 +0,0 @@
1
- import { x as n, y as t } from "./index-D6Q1lPZO.js";
2
- import { c as s } from "./tensor-CzmOBsdf.js";
3
- function p(r, e) {
4
- s(r);
5
- const o = n(r, e);
6
- if (o.length !== 1)
7
- throw new Error("tensor1d() requires values to be a flat/TypedArray");
8
- return t(r, null, o, e);
9
- }
10
- export {
11
- p as t
12
- };
@@ -1,523 +0,0 @@
1
- import { e as g, D as F, v as P, F as D, b as M, T as w } from "./tensor-CzmOBsdf.js";
2
- const A = 1e-7, G = 1e-4;
3
- class z {
4
- constructor(s, o) {
5
- this.backend = s, this.dataMover = o, this.data = /* @__PURE__ */ new WeakMap(), this.dataIdsCount = 0;
6
- }
7
- get(s) {
8
- return this.data.has(s) || this.dataMover.moveData(this.backend, s), this.data.get(s);
9
- }
10
- set(s, o) {
11
- this.dataIdsCount++, this.data.set(s, o);
12
- }
13
- has(s) {
14
- return this.data.has(s);
15
- }
16
- delete(s) {
17
- return this.dataIdsCount--, this.data.delete(s);
18
- }
19
- numDataIds() {
20
- return this.dataIdsCount;
21
- }
22
- }
23
- class K {
24
- refCount(s) {
25
- return d("refCount");
26
- }
27
- incRef(s) {
28
- return d("incRef");
29
- }
30
- timerAvailable() {
31
- return !0;
32
- }
33
- time(s) {
34
- return d("time");
35
- }
36
- read(s) {
37
- return d("read");
38
- }
39
- readSync(s) {
40
- return d("readSync");
41
- }
42
- readToGPU(s, o) {
43
- return d("readToGPU");
44
- }
45
- numDataIds() {
46
- return d("numDataIds");
47
- }
48
- disposeData(s, o) {
49
- return d("disposeData");
50
- }
51
- write(s, o, c) {
52
- return d("write");
53
- }
54
- move(s, o, c, a, r) {
55
- return d("move");
56
- }
57
- createTensorFromGPUData(s, o, c) {
58
- return d("createTensorFromGPUData");
59
- }
60
- memory() {
61
- return d("memory");
62
- }
63
- /** Returns the highest precision for floats in bits (e.g. 16 or 32) */
64
- floatPrecision() {
65
- return d("floatPrecision");
66
- }
67
- /** Returns the smallest representable number. */
68
- epsilon() {
69
- return this.floatPrecision() === 32 ? A : G;
70
- }
71
- dispose() {
72
- return d("dispose");
73
- }
74
- }
75
- function d(t) {
76
- throw new Error(`'${t}' not yet implemented or not found in the registry. This kernel may not be supported by the tfjs backend you have chosen`);
77
- }
78
- const _ = "Abs", U = "Acos", W = "Acosh", j = "Add", H = "AddN", X = "All", Y = "Any", Z = "ArgMax", J = "ArgMin", Q = "Asin", tt = "Asinh", st = "Atan", ot = "Atanh", et = "Atan2", nt = "AvgPool", at = "AvgPoolGrad", rt = "AvgPool3D", ct = "AvgPool3DGrad", it = "BatchMatMul", lt = "BatchToSpaceND", ut = "Bincount", pt = "BitwiseAnd", dt = "BroadcastTo", ft = "BroadcastArgs", ht = "Cast", gt = "Ceil", mt = "ClipByValue", bt = "Complex", St = "ComplexAbs", Dt = "Concat", Rt = "Conv2D", Tt = "Conv2DBackpropFilter", kt = "Conv2DBackpropInput", Nt = "Conv3D", xt = "Conv3DBackpropFilterV2", vt = "Conv3DBackpropInputV2", Pt = "Cos", Ct = "Cosh", Ft = "Cumprod", yt = "Cumsum", It = "CropAndResize", Bt = "DenseBincount", Et = "DepthToSpace", Mt = "DepthwiseConv2dNative", wt = "DepthwiseConv2dNativeBackpropFilter", At = "DepthwiseConv2dNativeBackpropInput", Gt = "Diag", Lt = "Dilation2D", $t = "Dilation2DBackpropInput", Ot = "Dilation2DBackpropFilter", qt = "Draw", Vt = "RealDiv", zt = "Einsum", Kt = "Elu", _t = "EluGrad", Ut = "Erf", Wt = "Equal", jt = "Exp", Ht = "ExpandDims", Xt = "Expm1", Yt = "FFT", Zt = "Fill", Jt = "FlipLeftRight", Qt = "Floor", ts = "FloorDiv", ss = "FusedBatchNorm", os = "GatherV2", es = "GatherNd", ns = "Greater", as = "GreaterEqual", rs = "Identity", cs = "IFFT", is = "Imag", ls = "IsFinite", us = "IsInf", ps = "IsNan", ds = "LeakyRelu", fs = "Less", hs = "LessEqual", gs = "LinSpace", ms = "Log", bs = "Log1p", Ss = "LogicalAnd", Ds = "LogicalNot", Rs = "LogicalOr", Ts = "LogSoftmax", ks = "LRN", Ns = "LRNGrad", xs = "Max", vs = "Maximum", Ps = "MaxPool", Cs = "MaxPoolGrad", Fs = "MaxPool3D", ys = "MaxPool3DGrad", Is = "MaxPoolWithArgmax", Bs = "Mean", Es = "Min", Ms = "Minimum", ws = "MirrorPad", As = "Mod", Gs = "Multinomial", Ls = "Multiply", $s = "Neg", Os = "NotEqual", qs = "NonMaxSuppressionV3", Vs = "NonMaxSuppressionV4", zs = "NonMaxSuppressionV5", Ks = "OnesLike", _s = "OneHot", Us = "Pack", Ws = "PadV2", js = "Pow", Hs = "Prelu", Xs = "Prod", Ys = "RaggedGather", Zs = "RaggedRange", Js = "RaggedTensorToTensor", Qs = "Range", to = "Real", so = "Reciprocal", oo = "Relu", eo = "Reshape", no = "ResizeNearestNeighbor", ao = "ResizeNearestNeighborGrad", ro = "ResizeBilinear", co = "ResizeBilinearGrad", io = "Relu6", lo = "Reverse", uo = "Round", po = "Rsqrt", fo = "ScatterNd", ho = "TensorScatterUpdate", go = "SearchSorted", mo = "Select", bo = "Selu", So = "Slice", Do = "Sin", Ro = "Sinh", To = "Sign", ko = "Sigmoid", No = "Softplus", xo = "Sqrt", vo = "Sum", Po = "SpaceToBatchND", Co = "SplitV", Fo = "Softmax", yo = "SparseFillEmptyRows", Io = "SparseReshape", Bo = "SparseSegmentMean", Eo = "SparseSegmentSum", Mo = "SparseToDense", wo = "SquaredDifference", Ao = "Square", Go = "StaticRegexReplace", Lo = "StridedSlice", $o = "StringNGrams", Oo = "StringSplit", qo = "StringToHashBucketFast", Vo = "Sub", zo = "Tan", Ko = "Tanh", _o = "Tile", Uo = "TopK", Wo = "Transform", jo = "Transpose", Ho = "Unique", Xo = "Unpack", Yo = "UnsortedSegmentSum", Zo = "ZerosLike", Jo = "Step", Qo = "FromPixels", te = "RotateWithOffset", se = "_FusedMatMul", oe = "FusedConv2D", ee = "FusedDepthwiseConv2D";
79
- function y(...t) {
80
- g().getBool("IS_TEST") || g().getBool("PROD") || console.warn(...t);
81
- }
82
- function ne(...t) {
83
- g().getBool("IS_TEST") || g().getBool("PROD") || console.log(...t);
84
- }
85
- const S = F("kernelRegistry", () => /* @__PURE__ */ new Map()), R = F("gradRegistry", () => /* @__PURE__ */ new Map());
86
- function ae(t, s) {
87
- const o = I(t, s);
88
- return S.get(o);
89
- }
90
- function re(t) {
91
- return R.get(t);
92
- }
93
- function ce(t) {
94
- const s = S.entries(), o = [];
95
- for (; ; ) {
96
- const { done: c, value: a } = s.next();
97
- if (c)
98
- break;
99
- const [r, l] = a, [p] = r.split("_");
100
- p === t && o.push(l);
101
- }
102
- return o;
103
- }
104
- function ie(t) {
105
- const { kernelName: s, backendName: o } = t, c = I(s, o);
106
- S.has(c) && y(`The kernel '${s}' for backend '${o}' is already registered`), S.set(c, t);
107
- }
108
- function le(t) {
109
- const { kernelName: s } = t;
110
- R.has(s) && g().getBool("DEBUG") && y(`Overriding the gradient for '${s}'`), R.set(s, t);
111
- }
112
- function I(t, s) {
113
- return `${s}_${t}`;
114
- }
115
- class ue {
116
- constructor(s, o) {
117
- this.backendTimer = s, this.logger = o, o == null && (this.logger = new $());
118
- }
119
- profileKernel(s, o, c) {
120
- let a;
121
- const r = () => {
122
- a = c();
123
- };
124
- let l;
125
- const p = P();
126
- if (this.backendTimer.timerAvailable())
127
- l = this.backendTimer.time(r);
128
- else {
129
- r();
130
- for (const e of a)
131
- e.dataSync();
132
- l = Promise.resolve({ kernelMs: P() - p });
133
- }
134
- if (g().getBool("CHECK_COMPUTATION_FOR_ERRORS"))
135
- for (let e = 0; e < a.length; e++) {
136
- const i = a[e];
137
- i.data().then((u) => {
138
- L(u, i.dtype, s);
139
- });
140
- }
141
- return {
142
- kernelName: s,
143
- outputs: a,
144
- inputs: o,
145
- timeMs: l.then((e) => e.kernelMs),
146
- extraInfo: l.then((e) => e.getExtraProfileInfo != null ? e.getExtraProfileInfo() : "")
147
- };
148
- }
149
- logKernelProfile(s) {
150
- const { kernelName: o, outputs: c, timeMs: a, inputs: r, extraInfo: l } = s;
151
- c.forEach((p) => {
152
- Promise.all([p.data(), a, l]).then((n) => {
153
- this.logger.logKernelProfile(o, p, n[0], n[1], r, n[2]);
154
- });
155
- });
156
- }
157
- }
158
- function L(t, s, o) {
159
- if (s !== "float32")
160
- return !1;
161
- for (let c = 0; c < t.length; c++) {
162
- const a = t[c];
163
- if (isNaN(a) || !isFinite(a))
164
- return console.warn(`Found ${a} in the result of '${o}'`), !0;
165
- }
166
- return !1;
167
- }
168
- class $ {
169
- logKernelProfile(s, o, c, a, r, l) {
170
- const p = typeof a == "number" ? D(`${a}ms`, 9) : a.error, n = D(s, 25), e = o.rank, i = o.size, u = D(o.shape.toString(), 14);
171
- let f = "";
172
- for (const h in r) {
173
- const m = r[h];
174
- if (m != null) {
175
- const b = m.shape || o.shape, v = b.length;
176
- f += `${h}: ${v}D ${v > 0 ? b : ""} `;
177
- }
178
- }
179
- console.log(`%c${n} %c${p} %c${e}D ${u} %c${i} %c${f} %c${l}`, "font-weight:bold", "color:red", "color:blue", "color: orange", "color: green", "color: steelblue");
180
- }
181
- }
182
- function pe(t, s, o) {
183
- const c = {}, a = {};
184
- for (let n = 0; n < s.length; n++)
185
- c[s[n].id] = !0;
186
- for (let n = 0; n < t.length; n++) {
187
- const e = t[n], i = e.inputs;
188
- for (const u in i) {
189
- const f = i[u];
190
- let h = !1;
191
- for (let m = 0; m < s.length; m++)
192
- if (c[f.id]) {
193
- e.outputs.forEach((b) => c[b.id] = !0), h = !0, a[e.id] = !0;
194
- break;
195
- }
196
- if (h)
197
- break;
198
- }
199
- }
200
- const r = {};
201
- r[o.id] = !0;
202
- const l = {};
203
- for (let n = t.length - 1; n >= 0; n--) {
204
- const e = t[n], i = e.inputs;
205
- for (let u = 0; u < e.outputs.length; u++)
206
- if (r[e.outputs[u].id]) {
207
- for (const f in i)
208
- r[i[f].id] = !0, l[e.id] = !0;
209
- break;
210
- }
211
- }
212
- const p = [];
213
- for (let n = 0; n < t.length; n++) {
214
- const e = t[n];
215
- if (a[e.id] && l[e.id]) {
216
- const i = {};
217
- for (const f in e.inputs) {
218
- const h = e.inputs[f];
219
- c[h.id] && (i[f] = h);
220
- }
221
- const u = Object.assign({}, e);
222
- u.inputs = i, u.outputs = e.outputs, p.push(u);
223
- }
224
- }
225
- return p;
226
- }
227
- function de(t, s, o, c) {
228
- for (let a = s.length - 1; a >= 0; a--) {
229
- const r = s[a], l = [];
230
- if (r.outputs.forEach((n) => {
231
- const e = t[n.id];
232
- e != null ? l.push(e) : l.push(null);
233
- }), r.gradient == null)
234
- throw new Error(`Cannot compute gradient: gradient function not found for ${r.kernelName}.`);
235
- const p = r.gradient(l);
236
- for (const n in r.inputs) {
237
- if (!(n in p))
238
- throw new Error(`Cannot backprop through input ${n}. Available gradients found: ${Object.keys(p)}.`);
239
- const e = o(() => p[n]());
240
- if (e.dtype !== "float32")
241
- throw new Error(`Error in gradient for op ${r.kernelName}. The gradient of input ${n} must have 'float32' dtype, but has '${e.dtype}'`);
242
- const i = r.inputs[n];
243
- if (!M(e.shape, i.shape))
244
- throw new Error(`Error in gradient for op ${r.kernelName}. The gradient of input '${n}' has shape '${e.shape}', which does not match the shape of the input '${i.shape}'`);
245
- if (t[i.id] == null)
246
- t[i.id] = e;
247
- else {
248
- const u = t[i.id];
249
- t[i.id] = c(u, e), u.dispose();
250
- }
251
- }
252
- }
253
- }
254
- var C;
255
- (function(t) {
256
- t.R0 = "R0", t.R1 = "R1", t.R2 = "R2", t.R3 = "R3", t.R4 = "R4", t.R5 = "R5", t.R6 = "R6";
257
- })(C || (C = {}));
258
- var T;
259
- (function(t) {
260
- t.float32 = "float32", t.int32 = "int32", t.bool = "int32", t.complex64 = "complex64";
261
- })(T || (T = {}));
262
- var k;
263
- (function(t) {
264
- t.float32 = "float32", t.int32 = "int32", t.bool = "bool", t.complex64 = "complex64";
265
- })(k || (k = {}));
266
- var N;
267
- (function(t) {
268
- t.float32 = "float32", t.int32 = "float32", t.bool = "float32", t.complex64 = "complex64";
269
- })(N || (N = {}));
270
- var x;
271
- (function(t) {
272
- t.float32 = "complex64", t.int32 = "complex64", t.bool = "complex64", t.complex64 = "complex64";
273
- })(x || (x = {}));
274
- const O = {
275
- float32: N,
276
- int32: T,
277
- bool: k,
278
- complex64: x
279
- };
280
- function B(t, s) {
281
- if (t === "string" || s === "string") {
282
- if (t === "string" && s === "string")
283
- return "string";
284
- throw new Error(`Can not upcast ${t} with ${s}`);
285
- }
286
- return O[t][s];
287
- }
288
- function fe(t) {
289
- return B(t, "int32");
290
- }
291
- function he(t) {
292
- return t != null && typeof t == "object" && "texture" in t && t.texture instanceof WebGLTexture;
293
- }
294
- function ge(t) {
295
- return typeof GPUBuffer < "u" && t != null && typeof t == "object" && "buffer" in t && t.buffer instanceof GPUBuffer;
296
- }
297
- function me(t, s) {
298
- if (t.dtype === s.dtype)
299
- return [t, s];
300
- const o = B(t.dtype, s.dtype);
301
- return [t.cast(o), s.cast(o)];
302
- }
303
- function be(t, s) {
304
- return s.some((o) => o.id === t.id);
305
- }
306
- function Se(t) {
307
- const s = [];
308
- return E(t, s, /* @__PURE__ */ new Set()), s;
309
- }
310
- function E(t, s, o) {
311
- if (t == null)
312
- return;
313
- if (t instanceof w) {
314
- s.push(t);
315
- return;
316
- }
317
- if (!q(t))
318
- return;
319
- const c = t;
320
- for (const a in c) {
321
- const r = c[a];
322
- o.has(r) || (o.add(r), E(r, s, o));
323
- }
324
- }
325
- function q(t) {
326
- return Array.isArray(t) || typeof t == "object";
327
- }
328
- export {
329
- Vt as $,
330
- j as A,
331
- it as B,
332
- Dt as C,
333
- is as D,
334
- Ht as E,
335
- to as F,
336
- os as G,
337
- jo as H,
338
- rs as I,
339
- z as J,
340
- K,
341
- ms as L,
342
- As as M,
343
- $s as N,
344
- be as O,
345
- Us as P,
346
- Qt as Q,
347
- Qs as R,
348
- Fo as S,
349
- _o as T,
350
- ko as U,
351
- Kt as V,
352
- ds as W,
353
- Hs as X,
354
- io as Y,
355
- Jo as Z,
356
- fe as _,
357
- le as a,
358
- Bt as a$,
359
- ne as a0,
360
- mt as a1,
361
- se as a2,
362
- de as a3,
363
- he as a4,
364
- ge as a5,
365
- ts as a6,
366
- Ls as a7,
367
- St as a8,
368
- _ as a9,
369
- zs as aA,
370
- Vs as aB,
371
- ro as aC,
372
- no as aD,
373
- Wo as aE,
374
- pt as aF,
375
- gt as aG,
376
- Wt as aH,
377
- Xt as aI,
378
- Xs as aJ,
379
- po as aK,
380
- Go as aL,
381
- X as aM,
382
- Y as aN,
383
- Z as aO,
384
- nt as aP,
385
- rt as aQ,
386
- Ko as aR,
387
- lt as aS,
388
- ss as aT,
389
- Rt as aU,
390
- kt as aV,
391
- Nt as aW,
392
- vt as aX,
393
- Ct as aY,
394
- Ft as aZ,
395
- yt as a_,
396
- Zt as aa,
397
- Zo as ab,
398
- js as ac,
399
- xo as ad,
400
- Vo as ae,
401
- vs as af,
402
- ut as ag,
403
- mo as ah,
404
- zt as ai,
405
- Es as aj,
406
- ns as ak,
407
- as as al,
408
- fs as am,
409
- hs as an,
410
- bs as ao,
411
- Ss as ap,
412
- Bs as aq,
413
- Ms as ar,
414
- Os as as,
415
- uo as at,
416
- wo as au,
417
- Xo as av,
418
- It as aw,
419
- Jt as ax,
420
- te as ay,
421
- qs as az,
422
- eo as b,
423
- Mo as b$,
424
- Mt as b0,
425
- Ut as b1,
426
- No as b2,
427
- Ds as b3,
428
- Ps as b4,
429
- Fs as b5,
430
- _s as b6,
431
- Ks as b7,
432
- Ws as b8,
433
- Po as b9,
434
- us as bA,
435
- ps as bB,
436
- Ts as bC,
437
- Ns as bD,
438
- ks as bE,
439
- ys as bF,
440
- Cs as bG,
441
- ws as bH,
442
- co as bI,
443
- ao as bJ,
444
- To as bK,
445
- Ao as bL,
446
- zo as bM,
447
- ft as bN,
448
- Et as bO,
449
- Gt as bP,
450
- qt as bQ,
451
- Yt as bR,
452
- Qo as bS,
453
- ee as bT,
454
- cs as bU,
455
- gs as bV,
456
- Rs as bW,
457
- Is as bX,
458
- go as bY,
459
- Bo as bZ,
460
- Eo as b_,
461
- lo as ba,
462
- bo as bb,
463
- Ro as bc,
464
- Yo as bd,
465
- Tt as be,
466
- oe as bf,
467
- wt as bg,
468
- At as bh,
469
- U as bi,
470
- W as bj,
471
- H as bk,
472
- J as bl,
473
- Q as bm,
474
- tt as bn,
475
- et as bo,
476
- st as bp,
477
- ot as bq,
478
- ct as br,
479
- at as bs,
480
- dt as bt,
481
- xt as bu,
482
- Lt as bv,
483
- Ot as bw,
484
- $t as bx,
485
- _t as by,
486
- ls as bz,
487
- Co as c,
488
- Lo as c0,
489
- $o as c1,
490
- ho as c2,
491
- Uo as c3,
492
- Ho as c4,
493
- Ys as c5,
494
- Zs as c6,
495
- Js as c7,
496
- yo as c8,
497
- Io as c9,
498
- Oo as ca,
499
- qo as cb,
500
- so as d,
501
- oo as e,
502
- So as f,
503
- vo as g,
504
- bt as h,
505
- Gs as i,
506
- fo as j,
507
- es as k,
508
- Pt as l,
509
- me as m,
510
- Do as n,
511
- ue as o,
512
- ce as p,
513
- ae as q,
514
- ie as r,
515
- re as s,
516
- Se as t,
517
- B as u,
518
- pe as v,
519
- y as w,
520
- ht as x,
521
- xs as y,
522
- jt as z
523
- };
@@ -1,13 +0,0 @@
1
- import { A as a, B as e, E as i } from "./index-D6Q1lPZO.js";
2
- import { T as m } from "./tensor_util-DfwaWayG.js";
3
- import { a as c } from "./tensor-CzmOBsdf.js";
4
- function l(n, t) {
5
- const r = e(n, "x", "tile", "string_or_numeric");
6
- c(r.rank === t.length, () => `Error in transpose: rank of input ${r.rank} must match length of reps ${t}.`);
7
- const o = { x: r }, s = { reps: t };
8
- return i.runKernel(m, o, s);
9
- }
10
- const x = /* @__PURE__ */ a({ tile_: l });
11
- export {
12
- x as t
13
- };
@@ -1,38 +0,0 @@
1
- import { A as u, B as i, E as a, t as m } from "./index-D6Q1lPZO.js";
2
- import { D as $, N as g, F as x, H as c } from "./tensor_util-DfwaWayG.js";
3
- import { c as k } from "./complex-BBiRlsVq.js";
4
- import { a as l } from "./tensor-CzmOBsdf.js";
5
- function K(r) {
6
- const e = { input: i(r, "input", "imag") };
7
- return a.runKernel($, e);
8
- }
9
- const h = /* @__PURE__ */ u({ imag_: K });
10
- function E(r) {
11
- const e = { x: i(r, "x", "neg") };
12
- return a.runKernel(g, e);
13
- }
14
- const N = /* @__PURE__ */ u({ neg_: E });
15
- function _(r) {
16
- const e = { input: i(r, "input", "real") };
17
- return a.runKernel(x, e);
18
- }
19
- const b = /* @__PURE__ */ u({ real_: _ });
20
- function d(r, t, e) {
21
- const n = i(r, "x", "transpose");
22
- if (t == null && (t = n.shape.map((s, o) => o).reverse()), l(n.rank === t.length, () => `Error in transpose: rank of input ${n.rank} must match length of perm ${t}.`), t.forEach((s) => {
23
- l(s >= 0 && s < n.rank, () => `All entries in 'perm' must be between 0 and ${n.rank - 1} but got ${t}`);
24
- }), n.rank <= 1)
25
- return n.clone();
26
- const f = { x: n }, p = { perm: t };
27
- return n.dtype === "complex64" ? m(() => {
28
- let s = b(n), o = h(n);
29
- return s = a.runKernel(c, { x: s }, p), o = a.runKernel(c, { x: o }, p), e && (o = N(o)), k(s, o);
30
- }) : a.runKernel(c, f, p);
31
- }
32
- const I = /* @__PURE__ */ u({ transpose_: d });
33
- export {
34
- h as i,
35
- N as n,
36
- b as r,
37
- I as t
38
- };
@@ -1,14 +0,0 @@
1
- import { E as m } from "./index-D6Q1lPZO.js";
2
- import { c as n } from "./complex-BBiRlsVq.js";
3
- import { d as i, f, s as c } from "./tensor-CzmOBsdf.js";
4
- function e(o, r = "float32") {
5
- if (i(o), r === "complex64") {
6
- const a = e(o, "float32"), t = e(o, "float32");
7
- return n(a, t);
8
- }
9
- const s = f(c(o), r);
10
- return m.makeTensor(s, o, r);
11
- }
12
- export {
13
- e as z
14
- };