npm - @huggingface/transformers - Versions diffs - 4.0.0-next.8 → 4.0.0-next.9 - Mend

@huggingface/transformers 4.0.0-next.8 → 4.0.0-next.9

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (44) hide show

package/README.md +2 -2
package/dist/ort-wasm-simd-threaded.jsep.mjs +26 -26
package/dist/transformers.js +338 -230
package/dist/transformers.min.js +22 -18
package/dist/transformers.node.cjs +339 -228
package/dist/transformers.node.min.cjs +23 -19
package/dist/transformers.node.min.mjs +23 -19
package/dist/transformers.node.mjs +336 -228
package/dist/transformers.web.js +220 -112
package/dist/transformers.web.min.js +18 -14
package/package.json +2 -2
package/src/env.js +1 -1
package/src/models/gemma3/image_processing_gemma3.js +3 -0
package/src/models/gemma3/modeling_gemma3.js +4 -1
package/src/models/gemma3/processing_gemma3.js +45 -0
package/src/models/image_processors.js +1 -0
package/src/models/modeling_utils.js +46 -25
package/src/models/processors.js +1 -0
package/src/models/qwen2_vl/modeling_qwen2_vl.js +39 -32
package/src/models/registry.js +2 -8
package/src/utils/model_registry/ModelRegistry.js +36 -0
package/src/utils/model_registry/get_available_dtypes.js +68 -0
package/src/utils/model_registry/get_model_files.js +7 -60
package/src/utils/model_registry/resolve_model_type.js +66 -0
package/types/models/gemma3/image_processing_gemma3.d.ts +4 -0
package/types/models/gemma3/image_processing_gemma3.d.ts.map +1 -0
package/types/models/gemma3/modeling_gemma3.d.ts +4 -1
package/types/models/gemma3/modeling_gemma3.d.ts.map +1 -1
package/types/models/gemma3/processing_gemma3.d.ts +20 -0
package/types/models/gemma3/processing_gemma3.d.ts.map +1 -0
package/types/models/image_processors.d.ts +1 -0
package/types/models/modeling_utils.d.ts +2 -3
package/types/models/modeling_utils.d.ts.map +1 -1
package/types/models/processors.d.ts +1 -0
package/types/models/qwen2_vl/modeling_qwen2_vl.d.ts.map +1 -1
package/types/models/registry.d.ts.map +1 -1
package/types/utils/model_registry/ModelRegistry.d.ts +27 -0
package/types/utils/model_registry/ModelRegistry.d.ts.map +1 -1
package/types/utils/model_registry/get_available_dtypes.d.ts +26 -0
package/types/utils/model_registry/get_available_dtypes.d.ts.map +1 -0
package/types/utils/model_registry/get_model_files.d.ts +25 -0
package/types/utils/model_registry/get_model_files.d.ts.map +1 -1
package/types/utils/model_registry/resolve_model_type.d.ts +24 -0
package/types/utils/model_registry/resolve_model_type.d.ts.map +1 -0

package/dist/transformers.js CHANGED Viewed

@@ -20,7 +20,7 @@ var node_path_default = {};
 var node_url_default = {};
 // src/env.js
-var VERSION = "4.0.0-next.8";
+var VERSION = "4.0.0-next.9";
 var HAS_SELF = typeof self !== "undefined";
 var IS_FS_AVAILABLE = !isEmpty(node_fs_default);
 var IS_PATH_AVAILABLE = !isEmpty(node_path_default);
@@ -5754,14 +5754,14 @@ var Random = class {
    * @returns {number} A normally distributed random value.
    */
   gauss(mu = 0, sigma = 1) {
-    let z = this._gauss_next;
+    let z2 = this._gauss_next;
     this._gauss_next = null;
-    if (z === null) {
+    if (z2 === null) {
       const x2pi = this.random() * 2 * Math.PI, g2rad = Math.sqrt(-2 * Math.log(1 - this.random()));
-      z = Math.cos(x2pi) * g2rad;
+      z2 = Math.cos(x2pi) * g2rad;
       this._gauss_next = Math.sin(x2pi) * g2rad;
     }
-    return mu + z * sigma;
+    return mu + z2 * sigma;
   }
   /**
    * Shuffles an array in-place using the Fisher-Yates algorithm.
@@ -7485,7 +7485,7 @@ __export(onnxruntime_node_exports, {
 });
 var onnxruntime_node_default = {};
-// ../../node_modules/.pnpm/onnxruntime-web@1.25.0-dev.20260307-d626b568e0/node_modules/onnxruntime-web/dist/ort.webgpu.bundle.min.mjs
+// ../../node_modules/.pnpm/onnxruntime-web@1.25.0-dev.20260323-a99aad9d36/node_modules/onnxruntime-web/dist/ort.webgpu.bundle.min.mjs
 var ort_webgpu_bundle_min_exports = {};
 __export(ort_webgpu_bundle_min_exports, {
   InferenceSession: () => Jf,
@@ -8253,7 +8253,7 @@ async function ts(a = {}) {
     throw L(e = "Aborted(" + e + ")"), W = true, e = new WebAssembly.RuntimeError(e + ". Build with -sASSERTIONS for more info."), R?.(e), e;
   }
   function Ye() {
-    return { a: { f: Vs, J: js, k: Hs, p: Ys, l: qs, ta: Js, b: Xs, ca: Qs, Ka: Sn, s: Zs, da: Ln, _a: On, Ga: Bn, Ia: Mn, $a: Cn, Ya: Un, Ra: Dn, Xa: Pn, pa: _n, Ha: Rn, Yb: Nn, Za: kn, Fa: Wn, eb: Ks, Da: ti, Tb: ri, Rb: oi, Ca: si, M: ii, I: ui, Sb: fi, ka: yi, Ub: bi, Ua: wi, Wb: Ti, La: vi, Pb: Ei, la: Si, Ta: Ar, bb: Ai, U: Oi, n: Di, c: Er, sb: Pi, w: _i, L: Ri, z: Ni, j: ki, o: Yn, tb: Wi, G: Fi, T: Gi, h: $i, u: zi, m: Vi, i: ji, Oa: Hi, Pa: Yi, Qa: qi, Ma: Qn, Na: Zn, Qb: Kn, fb: Xi, db: Ki, Y: eu, rb: tu, ma: ru, cb: Qi, gb: nu, ab: ou, Xb: au, N: Ji, hb: su, X: iu, Vb: uu, ob: bu, C: wu, sa: gu, ra: Tu, qb: vu, W: Eu, v: Su, nb: Au, mb: Iu, lb: xu, pb: Lu, kb: Ou, jb: Bu, ib: Mu, Va: ao, Wa: so, Ja: br, ea: io, oa: uo, Sa: fo, na: co, Db: Gf, xa: Df, Eb: Ff, ya: Uf, F: Ef, e: ff, r: sf, x: af, D: gf, Ib: Bf, ba: Lf, B: df, za: Mf, $: Pf, ha: Of, Fb: kf, Gb: Nf, Ba: Sf, Aa: xf, Jb: Af, wa: Wf, aa: Cf, d: cf, A: lf, q: uf, Cb: $f, t: mf, y: Tf, H: pf, E: hf, K: vf, S: _f, ja: wf, _: Rf, Kb: bf, Lb: yf, P: If2, g: Uu, a: Fe, Ob: qe, Hb: Du, ia: Pu, O: _u, qa: Ru, Mb: Nu, Q: ku, zb: Wu, Ab: Fu, ua: Gu, fa: $u, R: zu, Ea: Vu, va: ju, Z: Hu, xb: Yu, Zb: qu, V: Ju, Bb: Xu, ub: Qu, vb: Ku, wb: ef, ga: tf, yb: rf, Nb: nf } };
+    return { a: { f: Vs, J: js, k: Hs, p: Ys, l: qs, ta: Js, b: Xs, ca: Qs, Ka: Sn, q: Zs, da: Ln, _a: On, Ga: Bn, Ia: Mn, $a: Cn, Ya: Un, Ra: Dn, Xa: Pn, pa: _n, Ha: Rn, Yb: Nn, Za: kn, Fa: Wn, eb: Ks, Da: ti, Tb: ri, Rb: oi, Ca: si, M: ii, I: ui, Sb: fi, ka: yi, Ub: bi, Ua: wi, Wb: Ti, La: vi, Pb: Ei, la: Si, Ta: Ar, bb: Ai, U: Oi, n: Di, c: Er, sb: Pi, w: _i, L: Ri, z: Ni, j: ki, o: Yn, tb: Wi, G: Fi, T: Gi, h: $i, u: zi, m: Vi, i: ji, Oa: Hi, Pa: Yi, Qa: qi, Ma: Qn, Na: Zn, Qb: Kn, fb: Xi, db: Ki, Y: eu, rb: tu, ma: ru, cb: Qi, gb: nu, ab: ou, Xb: au, N: Ji, hb: su, X: iu, Vb: uu, ob: bu, C: wu, sa: gu, ra: Tu, qb: vu, W: Eu, v: Su, nb: Au, mb: Iu, lb: xu, pb: Lu, kb: Ou, jb: Bu, ib: Mu, Va: ao, Wa: so, Ja: br, ea: io, oa: uo, Sa: fo, na: co, Db: Gf, xa: Df, Eb: Ff, ya: Uf, F: Ef, e: ff, s: sf, x: af, D: gf, Ib: Bf, ba: Lf, B: lf, za: Mf, $: Pf, ha: Of, Fb: kf, Gb: Nf, Ba: Sf, Aa: xf, Jb: Af, wa: Wf, aa: Cf, d: uf, A: df, r: cf, Cb: $f, t: mf, y: Tf, H: pf, E: hf, K: vf, S: _f, ja: wf, _: Rf, Kb: bf, Lb: yf, P: If2, g: Uu, a: Fe, Ob: qe, Hb: Du, ia: Pu, O: _u, qa: Ru, Mb: Nu, Q: ku, zb: Wu, Ab: Fu, ua: Gu, fa: $u, R: zu, Ea: Vu, va: ju, Z: Hu, xb: Yu, Zb: qu, V: Ju, Bb: Xu, ub: Qu, vb: Ku, wb: ef, ga: tf, yb: rf, Nb: nf } };
   }
   async function bt() {
     function e(o, u) {
@@ -8316,14 +8316,14 @@ async function ts(a = {}) {
     gt.push(t), Je[e.Nc] = t, t.Nc = e.Nc;
     var n = { Oc: "run", he: e.ge, Wc: e.Wc, Nc: e.Nc };
     return t.postMessage(n, e.Yc), 0;
-  }, z = 0, V = (e, t, ...n) => {
+  }, G = 0, V = (e, t, ...n) => {
     var o, u = 16 * n.length, c = P(), h = Ft(u), b = h >>> 3;
     for (o of n) typeof o == "bigint" ? ((p(), pe)[b++ >>> 0] = 1n, (p(), pe)[b++ >>> 0] = o) : ((p(), pe)[b++ >>> 0] = 0n, (p(), ae)[b++ >>> 0] = o);
     return e = Lo(e, 0, u, h, t), D(c), e;
   };
   function qe(e) {
     if (i) return V(0, 1, e);
-    if (S = e, !(0 < z)) {
+    if (S = e, !(0 < G)) {
       for (var t of gt) Se(t);
       for (t of We) Se(t);
       We = [], gt = [], Je = {}, W = true;
@@ -8368,7 +8368,7 @@ async function ts(a = {}) {
     We.push(e);
   }
   var Fe, zs = (e, t) => {
-    z = 0, e = zr(e, t), 0 < z ? S = e : Fr(e);
+    G = 0, e = zr(e, t), 0 < G ? S = e : Fr(e);
   }, Ct = [], Ut = 0, me = (e) => -9007199254740992 > e || 9007199254740992 < e ? NaN : Number(e);
   function Vs(e) {
     var t = new wr(e >>>= 0);
@@ -8720,7 +8720,7 @@ async function ts(a = {}) {
   }
   var he = (e) => {
     if (!W) try {
-      if (e(), !(0 < z)) try {
+      if (e(), !(0 < G)) try {
         i ? Wt() && Fr(S) : br(S);
       } catch (t) {
         t instanceof wt || t == "unwind" || y(0, t);
@@ -8748,7 +8748,7 @@ async function ts(a = {}) {
     return (t ? Vr[t] : of[e])(...Ir);
   }
   var Ei = () => {
-    z = 0;
+    G = 0;
   };
   function Si(e) {
     e >>>= 0, i ? postMessage({ Oc: "cleanupThread", ie: e }) : yn(Je[e]);
@@ -8768,7 +8768,7 @@ async function ts(a = {}) {
       try {
         return e(...n);
       } finally {
-        W || (_t.pop(), Me && Ge === 1 && _t.length === 0 && (Ge = 0, z += 1, Pt(wa), typeof Fibers < "u" && Fibers.De()));
+        W || (_t.pop(), Me && Ge === 1 && _t.length === 0 && (Ge = 0, G += 1, Pt(wa), typeof Fibers < "u" && Fibers.De()));
       }
     };
     return jn.set(e, t), t;
@@ -8783,7 +8783,7 @@ async function ts(a = {}) {
             try {
               var c = (function() {
                 var E = (p(), x)[Me + 8 >>> 2 >>> 0];
-                return E = Vn.get(E), E = jn.get(E), --z, E();
+                return E = Vn.get(E), E = jn.get(E), --G, E();
               })();
             } catch (E) {
               c = E, u = true;
@@ -8974,7 +8974,7 @@ async function ts(a = {}) {
     return L(ct(e >>> 0, t >>> 0));
   }
   var ou = () => {
-    throw z += 1, "unwind";
+    throw G += 1, "unwind";
   };
   function au() {
     return 4294901760;
@@ -9067,15 +9067,15 @@ async function ts(a = {}) {
       }
       (b = (p(), A)[c + 24 >>> 2 >>> 0]) && (b = { label: Ne(b + 4) }, e.defaultQueue = b), e.label = Ne(c + 4);
     }
-    z += 1, lt(t, h.requestDevice(e).then((B) => {
-      --z, he(() => {
-        ce[u >>> 0] = B.queue, ce[o >>> 0] = B, lt(n, B.lost.then((ue) => {
+    G += 1, lt(t, h.requestDevice(e).then((B) => {
+      --G, he(() => {
+        ce[u >>> 0] = B.queue, ce[o >>> 0] = B, G += 1, lt(n, B.lost.then((ue) => {
           he(() => {
             B.onuncapturederror = () => {
             };
             var ye = P(), fe = Ce(ue.message);
             _r(n, yu[ue.reason], fe), D(ye);
-          });
+          }), --G;
         })), B.onuncapturederror = (ue) => {
           var ye = 5;
           ue.error instanceof GPUValidationError ? ye = 2 : ue.error instanceof GPUOutOfMemoryError ? ye = 3 : ue.error instanceof GPUInternalError && (ye = 4);
@@ -9084,7 +9084,7 @@ async function ts(a = {}) {
         }, "adapterInfo" in B || (B.adapterInfo = h.info), kr(t, 1, o, 0);
       });
     }, (B) => {
-      --z, he(() => {
+      --G, he(() => {
         var ue = P(), ye = Ce(B.message);
         kr(t, 3, o, ye), n && _r(n, 4, ye), D(ue);
       });
@@ -9127,12 +9127,12 @@ async function ts(a = {}) {
   function vu(e, t, n, o, u) {
     e >>>= 0, t = me(t), n = me(n), u >>>= 0;
     var c = O(e);
-    Re[e] = [], u == 4294967295 && (u = void 0), z += 1, lt(t, c.mapAsync(n, o >>> 0, u).then(() => {
-      --z, he(() => {
+    Re[e] = [], u == 4294967295 && (u = void 0), G += 1, lt(t, c.mapAsync(n, o >>> 0, u).then(() => {
+      --G, he(() => {
         Rr(t, 1, 0);
       });
     }, (h) => {
-      --z, he(() => {
+      --G, he(() => {
         P();
         var b = Ce(h.message);
         Rr(t, h.name === "AbortError" ? 4 : h.name === "OperationError" ? 3 : 0, b), delete Re[e];
@@ -9161,12 +9161,12 @@ async function ts(a = {}) {
     return ce[n >>> 0] = u, o && (Re[n] = []), true;
   }
   function Iu(e, t, n, o) {
-    e >>>= 0, t = me(t), o >>>= 0, n = du(n >>> 0), e = O(e), z += 1, lt(t, e.createComputePipelineAsync(n).then((u) => {
-      --z, he(() => {
+    e >>>= 0, t = me(t), o >>>= 0, n = du(n >>> 0), e = O(e), G += 1, lt(t, e.createComputePipelineAsync(n).then((u) => {
+      --G, he(() => {
         ce[o >>> 0] = u, Pr(t, 1, o, 0);
       });
     }, (u) => {
-      --z, he(() => {
+      --G, he(() => {
         var c = P(), h = Ce(u.message);
         Pr(t, u.reason === "validation" ? 3 : u.reason === "internal" ? 4 : 0, o, h), D(c);
       });
@@ -9181,15 +9181,15 @@ async function ts(a = {}) {
     (e = O(e)).onuncapturederror = null, e.destroy();
   };
   function Ou(e, t) {
-    t = me(t), e = O(e >>> 0), z += 1, lt(t, e.popErrorScope().then((n) => {
-      --z, he(() => {
+    t = me(t), e = O(e >>> 0), G += 1, lt(t, e.popErrorScope().then((n) => {
+      --G, he(() => {
         var o = 5;
         n ? n instanceof GPUValidationError ? o = 2 : n instanceof GPUOutOfMemoryError ? o = 3 : n instanceof GPUInternalError && (o = 4) : o = 1;
         var u = P(), c = n ? Ce(n.message) : 0;
         Nr(t, 1, o, c), D(u);
       });
     }, (n) => {
-      --z, he(() => {
+      --G, he(() => {
         var o = P(), u = Ce(n.message);
         Nr(t, 1, 5, u), D(o);
       });
@@ -9200,8 +9200,8 @@ async function ts(a = {}) {
       var u = { featureLevel: pu[(p(), x)[n + 4 >>> 2 >>> 0]], powerPreference: mu[(p(), x)[n + 8 >>> 2 >>> 0]], forceFallbackAdapter: !!(p(), A)[n + 12 >>> 2 >>> 0] };
       (e = (p(), A)[n >>> 2 >>> 0]) !== 0 && (p(), u.Fe = !!(p(), A)[e + 8 >>> 2 >>> 0]);
     }
-    "gpu" in navigator ? (z += 1, lt(t, navigator.gpu.requestAdapter(u).then((c) => {
-      --z, he(() => {
+    "gpu" in navigator ? (G += 1, lt(t, navigator.gpu.requestAdapter(u).then((c) => {
+      --G, he(() => {
         if (c) ce[o >>> 0] = c, Et(t, 1, o, 0);
         else {
           var h = P(), b = Ce("WebGPU not available on this browser (requestAdapter returned null)");
@@ -9209,7 +9209,7 @@ async function ts(a = {}) {
         }
       });
     }, (c) => {
-      --z, he(() => {
+      --G, he(() => {
         var h = P(), b = Ce(c.message);
         Et(t, 4, o, b), D(h);
       });
@@ -9440,7 +9440,7 @@ async function ts(a = {}) {
         Te(`invalid type for getValue: ${t}`);
     }
   }, r.UTF8ToString = ct, r.stringToUTF8 = Pe, r.lengthBytesUTF8 = _e;
-  var lo, po, Dr, Wt, xe, pt, mo, ho, yo, bo, wo, go, To, vo, Eo, So, Ao, Pr, _r, Rr, Nr, Et, kr, Io, Wr, xo, Lo, Oo, Fr, Bo, Mo, Gr, N, St, Co, D, Ft, P, Uo, $r, Do, Po, _o, zr, Ro, No, ko, Wo, Fo, Go, $o, zo, Vo, jo, Ho, Yo, qo, Jo, Xo, Qo, Zo, Ko, ea, ta, ra, na, oa, aa, sa, ia, ua, fa, ca, da, la, pa, ma, ha, ya, ba, wa, ga, Ta, ke, of = [qe, yr, En, Ln, On, Bn, Mn, Cn, Un, Dn, Pn, _n, Rn, Nn, kn, Wn, Qn, Zn, Kn, ao, so, io, uo, fo, co], Vr = { 925676: (e, t, n, o, u) => {
+  var lo, po, Dr, Wt, xe, pt, mo, ho, yo, bo, wo, go, To, vo, Eo, So, Ao, Pr, _r, Rr, Nr, Et, kr, Io, Wr, xo, Lo, Oo, Fr, Bo, Mo, Gr, N, St, Co, D, Ft, P, Uo, $r, Do, Po, _o, zr, Ro, No, ko, Wo, Fo, Go, $o, zo, Vo, jo, Ho, Yo, qo, Jo, Xo, Qo, Zo, Ko, ea, ta, ra, na, oa, aa, sa, ia, ua, fa, ca, da, la, pa, ma, ha, ya, ba, wa, ga, Ta, ke, of = [qe, yr, En, Ln, On, Bn, Mn, Cn, Un, Dn, Pn, _n, Rn, Nn, kn, Wn, Qn, Zn, Kn, ao, so, io, uo, fo, co], Vr = { 937012: (e, t, n, o, u) => {
     if (r === void 0 || !r.Uc) return 1;
     if ((e = ct(Number(e >>> 0))).startsWith("./") && (e = e.substring(2)), !(e = r.Uc.get(e))) return 2;
     if (t = Number(t >>> 0), n = Number(n >>> 0), o = Number(o >>> 0), t + n > e.byteLength) return 3;
@@ -9460,11 +9460,11 @@ async function ts(a = {}) {
     } catch {
       return 4;
     }
-  }, 926500: (e, t, n) => {
+  }, 937836: (e, t, n) => {
     r.Sd(e, (p(), J).subarray(t >>> 0, t + n >>> 0));
-  }, 926564: () => r.me(), 926606: (e) => {
+  }, 937900: () => r.me(), 937942: (e) => {
     r.jd(e);
-  }, 926643: () => typeof wasmOffsetConverter < "u" };
+  }, 937979: () => typeof wasmOffsetConverter < "u" };
   function af(e, t, n, o) {
     var u = P();
     try {
@@ -9483,12 +9483,12 @@ async function ts(a = {}) {
       N(1, 0);
     }
   }
-  function uf(e, t, n) {
-    var o = P();
+  function uf(e) {
+    var t = P();
     try {
-      _o(e, t, n);
-    } catch (u) {
-      if (D(o), u !== u + 0) throw u;
+      Ro(e);
+    } catch (n) {
+      if (D(t), n !== n + 0) throw n;
       N(1, 0);
     }
   }
@@ -9501,25 +9501,16 @@ async function ts(a = {}) {
       N(1, 0);
     }
   }
-  function cf(e) {
-    var t = P();
-    try {
-      Ro(e);
-    } catch (n) {
-      if (D(t), n !== n + 0) throw n;
-      N(1, 0);
-    }
-  }
-  function df(e, t, n, o, u, c, h) {
-    var b = P();
+  function cf(e, t, n) {
+    var o = P();
     try {
-      return Wo(e, t, n, o, u, c, h);
-    } catch (E) {
-      if (D(b), E !== E + 0) throw E;
+      _o(e, t, n);
+    } catch (u) {
+      if (D(o), u !== u + 0) throw u;
       N(1, 0);
     }
   }
-  function lf(e, t) {
+  function df(e, t) {
     var n = P();
     try {
       Vo(e, t);
@@ -9528,6 +9519,15 @@ async function ts(a = {}) {
       N(1, 0);
     }
   }
+  function lf(e, t, n, o, u, c, h) {
+    var b = P();
+    try {
+      return Wo(e, t, n, o, u, c, h);
+    } catch (E) {
+      if (D(b), E !== E + 0) throw E;
+      N(1, 0);
+    }
+  }
   function pf(e, t, n, o, u, c) {
     var h = P();
     try {
@@ -9957,7 +9957,7 @@ var nc;
 var oc;
 var ac;
 var qt;
-var $;
+var z;
 var je = k(() => {
   "use strict";
   Yt();
@@ -10013,19 +10013,19 @@ var je = k(() => {
         rr = false, ds = true, H(M);
       });
     })), await Promise.race(C), S) throw new Error(`WebAssembly backend initializing failed due to timeout: ${r}ms`);
-  }, $ = () => {
+  }, z = () => {
     if (nn && rn) return rn;
     throw new Error("WebAssembly is not initialized yet.");
   };
 });
 var be;
 var Lt;
-var G;
+var $;
 var nr = k(() => {
   "use strict";
   je();
   be = (a, r) => {
-    let s = $(), f = s.lengthBytesUTF8(a) + 1, i = s._malloc(f);
+    let s = z(), f = s.lengthBytesUTF8(a) + 1, i = s._malloc(f);
     return s.stringToUTF8(a, i, f), r.push(i), i;
   }, Lt = (a, r, s, f) => {
     if (typeof a == "object" && a !== null) {
@@ -10039,8 +10039,8 @@ var nr = k(() => {
       else if (typeof d == "boolean") f(l, d ? "1" : "0");
       else throw new Error(`Can't handle extra config type: ${typeof d}`);
     });
-  }, G = (a) => {
-    let r = $(), s = r.stackSave();
+  }, $ = (a) => {
+    let r = z(), s = r.stackSave();
     try {
       let f = r.PTR_SIZE, i = r.stackAlloc(2 * f);
       r._OrtGetLastError(i, i + f);
@@ -10057,7 +10057,7 @@ var ps = k(() => {
   je();
   nr();
   ls = (a) => {
-    let r = $(), s = 0, f = [], i = a || {};
+    let r = z(), s = 0, f = [], i = a || {};
     try {
       if (a?.logSeverityLevel === void 0) i.logSeverityLevel = 2;
       else if (typeof a.logSeverityLevel != "number" || !Number.isInteger(a.logSeverityLevel) || a.logSeverityLevel < 0 || a.logSeverityLevel > 4) throw new Error(`log severity level is not valid: ${a.logSeverityLevel}`);
@@ -10065,9 +10065,9 @@ var ps = k(() => {
       else if (typeof a.logVerbosityLevel != "number" || !Number.isInteger(a.logVerbosityLevel)) throw new Error(`log verbosity level is not valid: ${a.logVerbosityLevel}`);
       a?.terminate === void 0 && (i.terminate = false);
       let d = 0;
-      return a?.tag !== void 0 && (d = be(a.tag, f)), s = r._OrtCreateRunOptions(i.logSeverityLevel, i.logVerbosityLevel, !!i.terminate, d), s === 0 && G("Can't create run options."), a?.extra !== void 0 && Lt(a.extra, "", /* @__PURE__ */ new WeakSet(), (l, m) => {
+      return a?.tag !== void 0 && (d = be(a.tag, f)), s = r._OrtCreateRunOptions(i.logSeverityLevel, i.logVerbosityLevel, !!i.terminate, d), s === 0 && $("Can't create run options."), a?.extra !== void 0 && Lt(a.extra, "", /* @__PURE__ */ new WeakSet(), (l, m) => {
         let y = be(l, f), w = be(m, f);
-        r._OrtAddRunConfigEntry(s, y, w) !== 0 && G(`Can't set a run config entry: ${l} - ${m}.`);
+        r._OrtAddRunConfigEntry(s, y, w) !== 0 && $(`Can't set a run config entry: ${l} - ${m}.`);
       }), [s, f];
     } catch (d) {
       throw s !== 0 && r._OrtReleaseRunOptions(s), f.forEach((l) => r._free(l)), d;
@@ -10115,7 +10115,7 @@ var hs = k(() => {
     r.use_ort_model_bytes_directly || (r.use_ort_model_bytes_directly = "1"), a.executionProviders && a.executionProviders.some((s) => (typeof s == "string" ? s : s.name) === "webgpu") && (a.enableMemPattern = false);
   }, on = (a, r, s, f) => {
     let i = be(r, f), d = be(s, f);
-    $()._OrtAddSessionConfigEntry(a, i, d) !== 0 && G(`Can't set a session config entry: ${r} - ${s}.`);
+    z()._OrtAddSessionConfigEntry(a, i, d) !== 0 && $(`Can't set a session config entry: ${r} - ${s}.`);
   }, ot = (a, r, s, f) => {
     let i = be(r, f), d = be(s, f);
     a.push([i, d]);
@@ -10146,7 +10146,7 @@ var hs = k(() => {
               }
               S.validationMode && ot(l, "validationMode", S.validationMode, s);
             }
-            let v = $().webgpuRegisterDevice(g);
+            let v = z().webgpuRegisterDevice(g);
             if (v) {
               let [S, C, R] = v;
               ot(l, "deviceId", S.toString(), s), ot(l, "webgpuInstance", C.toString(), s), ot(l, "webgpuDevice", R.toString(), s);
@@ -10161,13 +10161,13 @@ var hs = k(() => {
       }
       let m = be(d, s), y = l.length, w = 0, T = 0;
       if (y > 0) {
-        w = $()._malloc(y * $().PTR_SIZE), s.push(w), T = $()._malloc(y * $().PTR_SIZE), s.push(T);
-        for (let g = 0; g < y; g++) $().setValue(w + g * $().PTR_SIZE, l[g][0], "*"), $().setValue(T + g * $().PTR_SIZE, l[g][1], "*");
+        w = z()._malloc(y * z().PTR_SIZE), s.push(w), T = z()._malloc(y * z().PTR_SIZE), s.push(T);
+        for (let g = 0; g < y; g++) z().setValue(w + g * z().PTR_SIZE, l[g][0], "*"), z().setValue(T + g * z().PTR_SIZE, l[g][1], "*");
       }
-      await $()._OrtAppendExecutionProvider(a, m, w, T, y) !== 0 && G(`Can't append execution provider: ${d}.`);
+      await z()._OrtAppendExecutionProvider(a, m, w, T, y) !== 0 && $(`Can't append execution provider: ${d}.`);
     }
   }, ms = async (a) => {
-    let r = $(), s = 0, f = [], i = a || {};
+    let r = z(), s = 0, f = [], i = a || {};
     uc(i);
     try {
       let d = sc(i.graphOptimizationLevel ?? "all"), l = ic(i.executionMode ?? "sequential"), m = typeof i.logId == "string" ? be(i.logId, f) : 0, y = i.logSeverityLevel ?? 2;
@@ -10175,7 +10175,7 @@ var hs = k(() => {
       let w = i.logVerbosityLevel ?? 0;
       if (!Number.isInteger(w) || w < 0 || w > 4) throw new Error(`log verbosity level is not valid: ${w}`);
       let T = typeof i.optimizedModelFilePath == "string" ? be(i.optimizedModelFilePath, f) : 0;
-      if (s = r._OrtCreateSessionOptions(d, !!i.enableCpuMemArena, !!i.enableMemPattern, l, !!i.enableProfiling, 0, m, y, w, T), s === 0 && G("Can't create session options."), i.executionProviders && await fc(s, i, f), i.enableGraphCapture !== void 0) {
+      if (s = r._OrtCreateSessionOptions(d, !!i.enableCpuMemArena, !!i.enableMemPattern, l, !!i.enableProfiling, 0, m, y, w, T), s === 0 && $("Can't create session options."), i.executionProviders && await fc(s, i, f), i.enableGraphCapture !== void 0) {
         if (typeof i.enableGraphCapture != "boolean") throw new Error(`enableGraphCapture must be a boolean value: ${i.enableGraphCapture}`);
         on(s, "enableGraphCapture", i.enableGraphCapture.toString(), f);
       }
@@ -10183,13 +10183,13 @@ var hs = k(() => {
         if (typeof g != "string") throw new Error(`free dimension override name must be a string: ${g}`);
         if (typeof v != "number" || !Number.isInteger(v) || v < 0) throw new Error(`free dimension override value must be a non-negative integer: ${v}`);
         let S = be(g, f);
-        r._OrtAddFreeDimensionOverride(s, S, v) !== 0 && G(`Can't set a free dimension override: ${g} - ${v}.`);
+        r._OrtAddFreeDimensionOverride(s, S, v) !== 0 && $(`Can't set a free dimension override: ${g} - ${v}.`);
       }
       return i.extra !== void 0 && Lt(i.extra, "", /* @__PURE__ */ new WeakSet(), (g, v) => {
         on(s, g, v, f);
       }), [s, f];
     } catch (d) {
-      throw s !== 0 && r._OrtReleaseSessionOptions(s) !== 0 && G("Can't release session options."), f.forEach((l) => r._free(l)), d;
+      throw s !== 0 && r._OrtReleaseSessionOptions(s) !== 0 && $("Can't release session options."), f.forEach((l) => r._free(l)), d;
     }
   };
 });
@@ -10759,7 +10759,7 @@ var Os = k(() => {
       return l ? l.push(d) : this.temporarySessionTensorIds.set(r, [d]), d;
     }
     uploadTensor(r, s) {
-      if (!$().shouldTransferToMLTensor) throw new Error("Trying to upload to a MLTensor while shouldTransferToMLTensor is false");
+      if (!z().shouldTransferToMLTensor) throw new Error("Trying to upload to a MLTensor while shouldTransferToMLTensor is false");
       le("verbose", () => `[WebNN] uploadTensor {tensorId: ${r}, data: ${s.byteLength}}`), this.tensorManager.upload(r, s);
     }
     async downloadTensor(r, s) {
@@ -10865,11 +10865,11 @@ var Kr = k(() => {
   nr();
   sn();
   yc = (a, r) => {
-    $()._OrtInit(a, r) !== 0 && G("Can't initialize onnxruntime.");
+    z()._OrtInit(a, r) !== 0 && $("Can't initialize onnxruntime.");
   }, Jt = async (a) => {
     yc(a.wasm.numThreads, Ot(a.logLevel));
   }, Xt = async (a, r) => {
-    $().asyncInit?.();
+    z().asyncInit?.();
     let s = a.webgpu.adapter;
     if (r === "webgpu") {
       if (typeof navigator > "u" || !navigator.gpu) throw new Error("WebGPU is not supported in current environment");
@@ -10884,29 +10884,29 @@ var Kr = k(() => {
       }
     }
     if (r === "webnn" && (typeof navigator > "u" || !navigator.ml)) throw new Error("WebNN is not supported in current environment");
-    if (r === "webgpu" && $().webgpuInit((f) => {
+    if (r === "webgpu" && z().webgpuInit((f) => {
       a.webgpu.device = f;
     }), r === "webnn") {
       let f = new (Os(), $t(Ls)).WebNNBackend(a);
-      $().webnnInit([f, () => f.reserveTensorId(), (i) => f.releaseTensorId(i), async (i, d, l, m, y) => f.ensureTensor(i, d, l, m, y), (i, d) => {
+      z().webnnInit([f, () => f.reserveTensorId(), (i) => f.releaseTensorId(i), async (i, d, l, m, y) => f.ensureTensor(i, d, l, m, y), (i, d) => {
         f.uploadTensor(i, d);
       }, async (i, d) => f.downloadTensor(i, d), (i, d) => f.registerMLContext(i, d), !!a.trace]);
     }
   }, it = /* @__PURE__ */ new Map(), bc = (a) => {
-    let r = $(), s = r.stackSave();
+    let r = z(), s = r.stackSave();
     try {
       let f = r.PTR_SIZE, i = r.stackAlloc(2 * f);
-      r._OrtGetInputOutputCount(a, i, i + f) !== 0 && G("Can't get session input/output count.");
+      r._OrtGetInputOutputCount(a, i, i + f) !== 0 && $("Can't get session input/output count.");
       let l = f === 4 ? "i32" : "i64";
       return [Number(r.getValue(i, l)), Number(r.getValue(i + f, l))];
     } finally {
       r.stackRestore(s);
     }
   }, Bs = (a, r) => {
-    let s = $(), f = s.stackSave(), i = 0;
+    let s = z(), f = s.stackSave(), i = 0;
     try {
       let d = s.PTR_SIZE, l = s.stackAlloc(2 * d);
-      s._OrtGetInputOutputMetadata(a, r, l, l + d) !== 0 && G("Can't get session input/output metadata.");
+      s._OrtGetInputOutputMetadata(a, r, l, l + d) !== 0 && $("Can't get session input/output metadata.");
       let y = Number(s.getValue(l, "*"));
       i = Number(s.getValue(l + d, "*"));
       let w = s.HEAP32[i / 4];
@@ -10921,11 +10921,11 @@ var Kr = k(() => {
       s.stackRestore(f), i !== 0 && s._OrtFree(i);
     }
   }, xt = (a) => {
-    let r = $(), s = r._malloc(a.byteLength);
+    let r = z(), s = r._malloc(a.byteLength);
     if (s === 0) throw new Error(`Can't create a session. failed to allocate a buffer of size ${a.byteLength}.`);
     return r.HEAPU8.set(a, s), [s, a.byteLength];
   }, Qt = async (a, r) => {
-    let s, f, i = $();
+    let s, f, i = z();
     Array.isArray(a) ? [s, f] = a : a.buffer === i.HEAPU8.buffer ? [s, f] = [a.byteOffset, a.byteLength] : [s, f] = xt(a);
     let d = 0, l = 0, m = 0, y = [], w = [], T = [];
     try {
@@ -10946,17 +10946,17 @@ var Kr = k(() => {
         } else i.currentContext = await i.webnnCreateMLContext();
         break;
       }
-      d = await i._OrtCreateSession(s, f, l), i.webgpuOnCreateSession?.(d), d === 0 && G("Can't create a session."), i.jsepOnCreateSession?.(), i.currentContext && (i.webnnRegisterMLContext(d, i.currentContext), i.currentContext = void 0, i.shouldTransferToMLTensor = true);
+      d = await i._OrtCreateSession(s, f, l), i.webgpuOnCreateSession?.(d), d === 0 && $("Can't create a session."), i.jsepOnCreateSession?.(), i.currentContext && (i.webnnRegisterMLContext(d, i.currentContext), i.currentContext = void 0, i.shouldTransferToMLTensor = true);
       let [g, v] = bc(d), S = !!r?.enableGraphCapture, C = [], R = [], H = [], U = [], M = [];
       for (let L = 0; L < g; L++) {
         let [W, oe, p] = Bs(d, L);
-        W === 0 && G("Can't get an input name."), w.push(W);
+        W === 0 && $("Can't get an input name."), w.push(W);
         let ne = i.UTF8ToString(W);
         C.push(ne), H.push(oe === 0 ? { name: ne, isTensor: false } : { name: ne, isTensor: true, type: or(oe), shape: p });
       }
       for (let L = 0; L < v; L++) {
         let [W, oe, p] = Bs(d, L + g);
-        W === 0 && G("Can't get an output name."), T.push(W);
+        W === 0 && $("Can't get an output name."), T.push(W);
         let ne = i.UTF8ToString(W);
         R.push(ne), U.push(oe === 0 ? { name: ne, isTensor: false } : { name: ne, isTensor: true, type: or(oe), shape: p });
         {
@@ -10975,23 +10975,23 @@ var Kr = k(() => {
         }
       }
       let Y = null;
-      return M.some((L) => L === "gpu-buffer" || L === "ml-tensor" || L === "ml-tensor-cpu-output") && (m = i._OrtCreateBinding(d), m === 0 && G("Can't create IO binding."), Y = { handle: m, outputPreferredLocations: M, outputPreferredLocationsEncoded: M.map((L) => L === "ml-tensor-cpu-output" ? "ml-tensor" : L).map((L) => an(L)) }), it.set(d, [d, w, T, Y, S, false]), [d, C, R, H, U];
+      return M.some((L) => L === "gpu-buffer" || L === "ml-tensor" || L === "ml-tensor-cpu-output") && (m = i._OrtCreateBinding(d), m === 0 && $("Can't create IO binding."), Y = { handle: m, outputPreferredLocations: M, outputPreferredLocationsEncoded: M.map((L) => L === "ml-tensor-cpu-output" ? "ml-tensor" : L).map((L) => an(L)) }), it.set(d, [d, w, T, Y, S, false]), [d, C, R, H, U];
     } catch (g) {
-      throw w.forEach((v) => i._OrtFree(v)), T.forEach((v) => i._OrtFree(v)), m !== 0 && i._OrtReleaseBinding(m) !== 0 && G("Can't release IO binding."), d !== 0 && i._OrtReleaseSession(d) !== 0 && G("Can't release session."), g;
+      throw w.forEach((v) => i._OrtFree(v)), T.forEach((v) => i._OrtFree(v)), m !== 0 && i._OrtReleaseBinding(m) !== 0 && $("Can't release IO binding."), d !== 0 && i._OrtReleaseSession(d) !== 0 && $("Can't release session."), g;
     } finally {
-      i._free(s), l !== 0 && i._OrtReleaseSessionOptions(l) !== 0 && G("Can't release session options."), y.forEach((g) => i._free(g)), i.unmountExternalData?.();
+      i._free(s), l !== 0 && i._OrtReleaseSessionOptions(l) !== 0 && $("Can't release session options."), y.forEach((g) => i._free(g)), i.unmountExternalData?.();
     }
   }, Zt = (a) => {
-    let r = $(), s = it.get(a);
+    let r = z(), s = it.get(a);
     if (!s) throw new Error(`cannot release session. invalid session id: ${a}`);
     let [f, i, d, l, m] = s;
-    l && (m && r._OrtClearBoundOutputs(l.handle) !== 0 && G("Can't clear bound outputs."), r._OrtReleaseBinding(l.handle) !== 0 && G("Can't release IO binding.")), r.jsepOnReleaseSession?.(a), r.webnnOnReleaseSession?.(a), r.webgpuOnReleaseSession?.(a), i.forEach((y) => r._OrtFree(y)), d.forEach((y) => r._OrtFree(y)), r._OrtReleaseSession(f) !== 0 && G("Can't release session."), it.delete(a);
+    l && (m && r._OrtClearBoundOutputs(l.handle) !== 0 && $("Can't clear bound outputs."), r._OrtReleaseBinding(l.handle) !== 0 && $("Can't release IO binding.")), r.jsepOnReleaseSession?.(a), r.webnnOnReleaseSession?.(a), r.webgpuOnReleaseSession?.(a), i.forEach((y) => r._OrtFree(y)), d.forEach((y) => r._OrtFree(y)), r._OrtReleaseSession(f) !== 0 && $("Can't release session."), it.delete(a);
   }, Ms = async (a, r, s, f, i, d, l = false) => {
     if (!a) {
       r.push(0);
       return;
     }
-    let m = $(), y = m.PTR_SIZE, w = a[0], T = a[1], g = a[3], v = g, S, C;
+    let m = z(), y = m.PTR_SIZE, w = a[0], T = a[1], g = a[3], v = g, S, C;
     if (w === "string" && (g === "gpu-buffer" || g === "ml-tensor")) throw new Error("String tensor is not supported on GPU.");
     if (l && g !== "gpu-buffer") throw new Error(`External buffer must be provided for input/output index ${d} when enableGraphCapture is true.`);
     if (g === "gpu-buffer") {
@@ -11035,12 +11035,12 @@ var Kr = k(() => {
     try {
       T.forEach((M, Y) => m.setValue(H + Y * y, M, y === 4 ? "i32" : "i64"));
       let U = m._OrtCreateTensor(He(w), S, C, H, T.length, an(v));
-      U === 0 && G(`Can't create tensor for input/output. session=${f}, index=${d}.`), r.push(U);
+      U === 0 && $(`Can't create tensor for input/output. session=${f}, index=${d}.`), r.push(U);
     } finally {
       m.stackRestore(R);
     }
   }, Kt = async (a, r, s, f, i, d) => {
-    let l = $(), m = l.PTR_SIZE, y = it.get(a);
+    let l = z(), m = l.PTR_SIZE, y = it.get(a);
     if (!y) throw new Error(`cannot run inference. invalid session id: ${a}`);
     let w = y[0], T = y[1], g = y[2], v = y[3], S = y[4], C = y[5], R = r.length, H = f.length, U = 0, M = [], Y = [], L = [], W = [], oe = [], p = l.stackSave(), ne = l.stackAlloc(R * m), X = l.stackAlloc(R * m), J = l.stackAlloc(H * m), Ue = l.stackAlloc(H * m);
     try {
@@ -11056,33 +11056,33 @@ var Kr = k(() => {
         $e("wasm bindInputsOutputs");
         for (let q = 0; q < R; q++) {
           let we = r[q];
-          await l._OrtBindInput(_, T[we], Y[q]) !== 0 && G(`Can't bind input[${q}] for session=${a}.`);
+          await l._OrtBindInput(_, T[we], Y[q]) !== 0 && $(`Can't bind input[${q}] for session=${a}.`);
         }
         for (let q = 0; q < H; q++) {
           let we = f[q];
-          i[q]?.[3] ? (oe.push(L[q]), l._OrtBindOutput(_, g[we], L[q], 0) !== 0 && G(`Can't bind pre-allocated output[${q}] for session=${a}.`)) : l._OrtBindOutput(_, g[we], 0, pe[we]) !== 0 && G(`Can't bind output[${q}] to ${ae[q]} for session=${a}.`);
+          i[q]?.[3] ? (oe.push(L[q]), l._OrtBindOutput(_, g[we], L[q], 0) !== 0 && $(`Can't bind pre-allocated output[${q}] for session=${a}.`)) : l._OrtBindOutput(_, g[we], 0, pe[we]) !== 0 && $(`Can't bind output[${q}] to ${ae[q]} for session=${a}.`);
         }
         ze("wasm bindInputsOutputs"), it.set(a, [w, T, g, v, S, true]);
       }
       l.jsepOnRunStart?.(w), l.webnnOnRunStart?.(w);
       let Q;
-      v ? Q = await l._OrtRunWithBinding(w, v.handle, H, J, U) : Q = await l._OrtRun(w, X, ne, R, Ue, H, J, U), Q !== 0 && G("failed to call OrtRun().");
+      v ? Q = await l._OrtRunWithBinding(w, v.handle, H, J, U) : Q = await l._OrtRun(w, X, ne, R, Ue, H, J, U), Q !== 0 && $("failed to call OrtRun().");
       let x = [], A = [];
       $e("wasm ProcessOutputTensor");
       for (let _ = 0; _ < H; _++) {
         let ae = Number(l.getValue(J + _ * m, "*"));
         if (ae === L[_] || oe.includes(L[_])) {
-          x.push(i[_]), ae !== L[_] && l._OrtReleaseTensor(ae) !== 0 && G("Can't release tensor.");
+          x.push(i[_]), ae !== L[_] && l._OrtReleaseTensor(ae) !== 0 && $("Can't release tensor.");
           continue;
         }
         let pe = l.stackSave(), q = l.stackAlloc(4 * m), we = false, re, se = 0;
         try {
-          l._OrtGetTensorData(ae, q, q + m, q + 2 * m, q + 3 * m) !== 0 && G(`Can't access output tensor data on index ${_}.`);
+          l._OrtGetTensorData(ae, q, q + m, q + 2 * m, q + 3 * m) !== 0 && $(`Can't access output tensor data on index ${_}.`);
           let Te = m === 4 ? "i32" : "i64", Ye = Number(l.getValue(q, Te));
           se = l.getValue(q + m, "*");
           let bt = l.getValue(q + m * 2, "*"), wt = Number(l.getValue(q + m * 3, Te)), Se = [];
           for (let ee = 0; ee < wt; ee++) Se.push(Number(l.getValue(bt + ee * m, Te)));
-          l._OrtFree(bt) !== 0 && G("Can't free memory for tensor dims.");
+          l._OrtFree(bt) !== 0 && $("Can't free memory for tensor dims.");
           let Ae = Se.reduce((ee, Z) => ee * Z, 1);
           re = or(Ye);
           let Oe = v?.outputPreferredLocations[f[_]];
@@ -11090,24 +11090,24 @@ var Kr = k(() => {
             if (Oe === "gpu-buffer" || Oe === "ml-tensor") throw new Error("String tensor is not supported on GPU.");
             let ee = [];
             for (let Z = 0; Z < Ae; Z++) {
-              let z = l.getValue(se + Z * m, "*"), V = l.getValue(se + (Z + 1) * m, "*"), qe = Z === Ae - 1 ? void 0 : V - z;
-              ee.push(l.UTF8ToString(z, qe));
+              let G = l.getValue(se + Z * m, "*"), V = l.getValue(se + (Z + 1) * m, "*"), qe = Z === Ae - 1 ? void 0 : V - G;
+              ee.push(l.UTF8ToString(G, qe));
             }
             x.push([re, Se, ee, "cpu"]);
           } else if (Oe === "gpu-buffer" && Ae > 0) {
             let ee = l.webgpuGetBuffer;
             if (!ee) throw new Error('preferredLocation "gpu-buffer" is not supported without using WebGPU.');
-            let Z = ee(se), z = mt(Ye, Ae);
-            if (z === void 0 || !ar(re)) throw new Error(`Unsupported data type: ${re}`);
+            let Z = ee(se), G = mt(Ye, Ae);
+            if (G === void 0 || !ar(re)) throw new Error(`Unsupported data type: ${re}`);
             we = true;
             {
               l.webgpuRegisterBuffer(Z, a, se);
-              let V = l.webgpuCreateDownloader(Z, z, a);
+              let V = l.webgpuCreateDownloader(Z, G, a);
               x.push([re, Se, { gpuBuffer: Z, download: async () => {
                 let qe = await V();
                 return new (at(re))(qe);
               }, dispose: () => {
-                l._OrtReleaseTensor(ae) !== 0 && G("Can't release tensor.");
+                l._OrtReleaseTensor(ae) !== 0 && $("Can't release tensor.");
               } }, "gpu-buffer"]);
             }
           } else if (Oe === "ml-tensor" && Ae > 0) {
@@ -11122,8 +11122,8 @@ var Kr = k(() => {
           } else if (Oe === "ml-tensor-cpu-output" && Ae > 0) {
             let ee = l.webnnCreateMLTensorDownloader(se, re)(), Z = x.length;
             we = true, A.push((async () => {
-              let z = [Z, await ee];
-              return l.webnnReleaseTensorId(se), l._OrtReleaseTensor(ae), z;
+              let G = [Z, await ee];
+              return l.webnnReleaseTensorId(se), l._OrtReleaseTensor(ae), G;
             })()), x.push([re, Se, [], "cpu"]);
           } else {
             let ee = at(re), Z = new ee(Ae);
@@ -11133,7 +11133,7 @@ var Kr = k(() => {
           l.stackRestore(pe), re === "string" && se && l._free(se), we || l._OrtReleaseTensor(ae);
         }
       }
-      v && !S && (l._OrtClearBoundOutputs(v.handle) !== 0 && G("Can't clear bound outputs."), it.set(a, [w, T, g, v, S, false]));
+      v && !S && (l._OrtClearBoundOutputs(v.handle) !== 0 && $("Can't clear bound outputs."), it.set(a, [w, T, g, v, S, false]));
       for (let [_, ae] of await Promise.all(A)) x[_][2] = ae;
       return ze("wasm ProcessOutputTensor"), x;
     } finally {
@@ -11144,10 +11144,10 @@ var Kr = k(() => {
       }), Y.forEach((Q) => l._OrtReleaseTensor(Q)), L.forEach((Q) => l._OrtReleaseTensor(Q)), W.forEach((Q) => l._free(Q)), U !== 0 && l._OrtReleaseRunOptions(U), M.forEach((Q) => l._free(Q));
     }
   }, er = (a) => {
-    let r = $(), s = it.get(a);
+    let r = z(), s = it.get(a);
     if (!s) throw new Error("invalid session id");
     let f = s[0], i = r._OrtEndProfiling(f);
-    i === 0 && G("Can't get an profile file name."), r._OrtFree(i);
+    i === 0 && $("Can't get an profile file name."), r._OrtFree(i);
   }, tr = (a) => {
     let r = [];
     for (let s of a) {
@@ -11380,7 +11380,7 @@ var $s = k(() => {
 Ve();
 Ve();
 Ve();
-var Xa = "1.25.0-dev.20260307-d626b568e0";
+var Xa = "1.25.0-dev.20260323-a99aad9d36";
 var Tl = Zr;
 {
   let a = ($s(), $t(Gs)).wasmBackend;
@@ -11531,10 +11531,10 @@ var tensorToDataURL = (tensor, options) => {
     for (let i = 0; i < height; i++) {
       for (let j = 0; j < width; j++) {
         const R = (tensor.data[rTensorPointer++] - normBias[0]) * normMean[0];
-        const G2 = (tensor.data[gTensorPointer++] - normBias[1]) * normMean[1];
+        const G = (tensor.data[gTensorPointer++] - normBias[1]) * normMean[1];
         const B = (tensor.data[bTensorPointer++] - normBias[2]) * normMean[2];
         const A = aTensorPointer === -1 ? 255 : (tensor.data[aTensorPointer++] - normBias[3]) * normMean[3];
-        pixels2DContext.fillStyle = "rgba(" + R + "," + G2 + "," + B + "," + A + ")";
+        pixels2DContext.fillStyle = "rgba(" + R + "," + G + "," + B + "," + A + ")";
         pixels2DContext.fillRect(j, i, 1, 1);
       }
     }
@@ -16499,6 +16499,7 @@ var processors_exports = {};
 __export(processors_exports, {
   ChatterboxProcessor: () => ChatterboxProcessor,
   Florence2Processor: () => Florence2Processor,
+  Gemma3Processor: () => Gemma3Processor,
   Gemma3nProcessor: () => Gemma3nProcessor,
   Glm46VProcessor: () => Glm46VProcessor,
   GraniteSpeechProcessor: () => GraniteSpeechProcessor,
@@ -19498,6 +19499,7 @@ __export(image_processors_exports, {
   DonutImageProcessor: () => DonutImageProcessor,
   EfficientNetImageProcessor: () => EfficientNetImageProcessor,
   GLPNFeatureExtractor: () => GLPNFeatureExtractor,
+  Gemma3ImageProcessor: () => Gemma3ImageProcessor,
   Glm46VImageProcessor: () => Glm46VImageProcessor,
   GroundingDinoImageProcessor: () => GroundingDinoImageProcessor,
   Idefics3ImageProcessor: () => Idefics3ImageProcessor,
@@ -19682,6 +19684,10 @@ var EfficientNetImageProcessor = class extends ImageProcessor {
   }
 };
+// src/models/gemma3/image_processing_gemma3.js
+var Gemma3ImageProcessor = class extends ImageProcessor {
+};
 // src/models/qwen2_vl/image_processing_qwen2_vl.js
 var Qwen2VLImageProcessor = class extends ImageProcessor {
   constructor(config) {
@@ -20905,6 +20911,48 @@ var Florence2Processor = class extends Processor {
   }
 };
+// src/models/gemma3/processing_gemma3.js
+var Gemma3Processor = class extends Processor {
+  static tokenizer_class = AutoTokenizer;
+  static image_processor_class = AutoImageProcessor;
+  static uses_processor_config = true;
+  static uses_chat_template_file = true;
+  constructor(config, components, chat_template) {
+    super(config, components, chat_template);
+    this.image_seq_length = this.config.image_seq_length;
+    const { boi_token, image_token, eoi_token } = this.tokenizer.config;
+    this.boi_token = boi_token;
+    this.image_token = image_token;
+    this.eoi_token = eoi_token;
+    const image_tokens_expanded = image_token.repeat(this.image_seq_length);
+    this.full_image_sequence = `
+${boi_token}${image_tokens_expanded}${eoi_token}
+`;
+  }
+  /**
+   * @param {string|string[]} text
+   * @param {import('../../utils/image.js').RawImage|import('../../utils/image.js').RawImage[]} [images]
+   * @param {Object} [options]
+   */
+  async _call(text, images = null, options = {}) {
+    if (typeof text === "string") {
+      text = [text];
+    }
+    let image_inputs;
+    if (images) {
+      image_inputs = await this.image_processor(images, options);
+      text = text.map((prompt) => prompt.replaceAll(this.boi_token, this.full_image_sequence));
+    }
+    const text_inputs = this.tokenizer(text, options);
+    return {
+      ...text_inputs,
+      ...image_inputs
+    };
+  }
+};
 // src/models/gemma3n/processing_gemma3n.js
 var Gemma3nProcessor = class extends Processor {
   static image_processor_class = AutoImageProcessor;
@@ -24085,8 +24133,7 @@ var MODEL_TYPES = {
   ImageAudioTextToText: 13,
   Supertonic: 14,
   Chatterbox: 15,
-  MultimodalLanguageModelOnly: 16,
-  VoxtralRealtime: 17
+  VoxtralRealtime: 16
 };
 var MODEL_TYPE_CONFIG = {
   [MODEL_TYPES.DecoderOnly]: {
@@ -24143,12 +24190,12 @@ var MODEL_TYPE_CONFIG = {
     can_generate: true,
     forward: image_text_to_text_forward,
     prepare_inputs: multimodal_text_to_text_prepare_inputs_for_generation,
-    sessions: (config) => {
+    sessions: (config, options, textOnly) => {
       const s = {
         embed_tokens: "embed_tokens",
-        vision_encoder: "vision_encoder",
         decoder_model_merged: "decoder_model_merged"
       };
+      if (!textOnly) s["vision_encoder"] = "vision_encoder";
       if (config.is_encoder_decoder) s["model"] = "encoder_model";
       return s;
     },
@@ -24170,12 +24217,17 @@ var MODEL_TYPE_CONFIG = {
   [MODEL_TYPES.ImageAudioTextToText]: {
     can_generate: true,
     prepare_inputs: multimodal_text_to_text_prepare_inputs_for_generation,
-    sessions: () => ({
-      embed_tokens: "embed_tokens",
-      audio_encoder: "audio_encoder",
-      vision_encoder: "vision_encoder",
-      decoder_model_merged: "decoder_model_merged"
-    }),
+    sessions: (config, options, textOnly) => {
+      const s = {
+        embed_tokens: "embed_tokens",
+        decoder_model_merged: "decoder_model_merged"
+      };
+      if (!textOnly) {
+        s["audio_encoder"] = "audio_encoder";
+        s["vision_encoder"] = "vision_encoder";
+      }
+      return s;
+    },
     optional_configs: { generation_config: "generation_config.json" }
   },
   [MODEL_TYPES.Phi3V]: {
@@ -24226,14 +24278,6 @@ var MODEL_TYPE_CONFIG = {
     cache_sessions: { model: true },
     optional_configs: { generation_config: "generation_config.json" }
   },
-  [MODEL_TYPES.MultimodalLanguageModelOnly]: {
-    can_generate: true,
-    forward: image_text_to_text_forward,
-    prepare_inputs: multimodal_text_to_text_prepare_inputs_for_generation,
-    sessions: () => ({ embed_tokens: "embed_tokens", decoder_model_merged: "decoder_model_merged" }),
-    cache_sessions: { decoder_model_merged: true },
-    optional_configs: { generation_config: "generation_config.json" }
-  },
   [MODEL_TYPES.VoxtralRealtime]: {
     can_generate: true,
     prepare_inputs: decoder_prepare_inputs_for_generation,
@@ -24259,6 +24303,19 @@ function getSessionsConfig(modelType, config, options = {}) {
     optional_configs: typeConfig.optional_configs
   };
 }
+function resolveTypeConfig(modelName, config) {
+  let modelType = MODEL_TYPE_MAPPING.get(modelName);
+  let textOnly = false;
+  const nativeArch = config?.architectures?.[0];
+  if (nativeArch && nativeArch !== modelName && modelName?.endsWith("ForCausalLM") && nativeArch.endsWith("ForConditionalGeneration")) {
+    const nativeType = MODEL_TYPE_MAPPING.get(nativeArch);
+    if (nativeType !== void 0) {
+      modelType = nativeType;
+      textOnly = true;
+    }
+  }
+  return { typeConfig: MODEL_TYPE_CONFIG[modelType] ?? MODEL_TYPE_CONFIG.default, textOnly, modelType };
+}
 var MODEL_TYPE_MAPPING = /* @__PURE__ */ new Map();
 var MODEL_NAME_TO_CLASS_MAPPING = /* @__PURE__ */ new Map();
 var MODEL_CLASS_TO_NAME_MAPPING = /* @__PURE__ */ new Map();
@@ -24278,8 +24335,7 @@ var PreTrainedModel = class extends Callable2 {
     this.sessions = sessions;
     this.configs = configs;
     const modelName = MODEL_CLASS_TO_NAME_MAPPING.get(this.constructor);
-    const modelType = MODEL_TYPE_MAPPING.get(modelName);
-    const typeConfig = MODEL_TYPE_CONFIG[modelType] ?? MODEL_TYPE_CONFIG.default;
+    const { typeConfig } = resolveTypeConfig(modelName, config);
     this.can_generate = typeConfig.can_generate;
     this._forward = typeConfig.forward;
     this._prepare_inputs_for_generation = typeConfig.prepare_inputs;
@@ -24342,9 +24398,8 @@ var PreTrainedModel = class extends Callable2 {
       session_options
     };
     const modelName = MODEL_CLASS_TO_NAME_MAPPING.get(this);
-    const modelType = MODEL_TYPE_MAPPING.get(modelName);
     config = options.config = await AutoConfig.from_pretrained(pretrained_model_name_or_path, options);
-    const typeConfig = MODEL_TYPE_CONFIG[modelType] ?? MODEL_TYPE_CONFIG.default;
+    const { typeConfig, textOnly, modelType } = resolveTypeConfig(modelName, config);
     if (modelType === void 0) {
       const type = modelName ?? config?.model_type;
       if (type !== "custom") {
@@ -24353,7 +24408,7 @@ var PreTrainedModel = class extends Callable2 {
         );
       }
     }
-    const sessions = typeConfig.sessions(config, options);
+    const sessions = typeConfig.sessions(config, options, textOnly);
     const promises = [
       constructSessions(pretrained_model_name_or_path, sessions, options, typeConfig.cache_sessions)
     ];
@@ -25408,6 +25463,7 @@ __export(models_exports, {
   Gemma2Model: () => Gemma2Model,
   Gemma2PreTrainedModel: () => Gemma2PreTrainedModel,
   Gemma3ForCausalLM: () => Gemma3ForCausalLM,
+  Gemma3ForConditionalGeneration: () => Gemma3ForConditionalGeneration,
   Gemma3Model: () => Gemma3Model,
   Gemma3PreTrainedModel: () => Gemma3PreTrainedModel,
   Gemma3nForCausalLM: () => Gemma3nForCausalLM,
@@ -27126,12 +27182,35 @@ var Gemma2Model = class extends Gemma2PreTrainedModel {
 var Gemma2ForCausalLM = class extends Gemma2PreTrainedModel {
 };
+// src/models/llava/modeling_llava.js
+var LlavaPreTrainedModel = class extends PreTrainedModel {
+  forward_params = ["input_ids", "attention_mask", "pixel_values", "position_ids", "past_key_values"];
+};
+var LlavaForConditionalGeneration = class extends LlavaPreTrainedModel {
+  _merge_input_ids_with_image_features(kwargs) {
+    const vision_hidden_size = kwargs.image_features.dims.at(-1);
+    const reshaped_image_hidden_states = kwargs.image_features.view(-1, vision_hidden_size);
+    return default_merge_input_ids_with_image_features({
+      // @ts-ignore
+      image_token_id: this.config.image_token_index ?? this.config.image_token_id,
+      ...kwargs,
+      image_features: reshaped_image_hidden_states
+    });
+  }
+};
+var Moondream1ForConditionalGeneration = class extends LlavaForConditionalGeneration {
+};
+var LlavaQwen2ForCausalLM = class extends LlavaForConditionalGeneration {
+};
 // src/models/gemma3/modeling_gemma3.js
 var Gemma3PreTrainedModel = class extends PreTrainedModel {
 };
 var Gemma3Model = class extends Gemma3PreTrainedModel {
 };
-var Gemma3ForCausalLM = class extends Gemma3PreTrainedModel {
+var Gemma3ForConditionalGeneration = class extends LlavaForConditionalGeneration {
+};
+var Gemma3ForCausalLM = class extends Gemma3ForConditionalGeneration {
 };
 // src/models/gemma3n/modeling_gemma3n.js
@@ -27314,8 +27393,8 @@ var Qwen2VLForConditionalGeneration = class extends Qwen2VLPreTrainedModel {
     for (let x = 0; x < 3; ++x) {
       for (const val of llm_pos_ids_list) {
         const seg_len = val.length / 3;
-        for (let z = x * seg_len; z < (x + 1) * seg_len; ++z) {
-          llm_positions[index++] = val[z];
+        for (let z2 = x * seg_len; z2 < (x + 1) * seg_len; ++z2) {
+          llm_positions[index++] = val[z2];
         }
       }
     }
@@ -27497,40 +27576,45 @@ var Qwen2VLForConditionalGeneration = class extends Qwen2VLPreTrainedModel {
     });
   }
   prepare_inputs_for_generation(input_ids, model_inputs, generation_config) {
-    if (model_inputs.attention_mask && !model_inputs.position_ids) {
-      if (!model_inputs.past_key_values) {
-        [model_inputs.position_ids, model_inputs.rope_deltas] = this.get_rope_index(
+    if (!model_inputs.attention_mask || model_inputs.position_ids) {
+      return model_inputs;
+    }
+    const session = this.sessions["decoder_model_merged"] ?? this.sessions["model"];
+    if (!session.inputNames.includes("position_ids")) {
+      return model_inputs;
+    }
+    if (!model_inputs.past_key_values) {
+      [model_inputs.position_ids, model_inputs.rope_deltas] = this.get_rope_index(
+        model_inputs.input_ids,
+        model_inputs.image_grid_thw,
+        model_inputs.video_grid_thw,
+        model_inputs.attention_mask
+      );
+    } else {
+      model_inputs.pixel_values = null;
+      const past_length = model_inputs.past_key_values.get_seq_length();
+      if (past_length < model_inputs.input_ids.dims[1]) {
+        const [full_position_ids, rope_deltas] = this.get_rope_index(
           model_inputs.input_ids,
           model_inputs.image_grid_thw,
           model_inputs.video_grid_thw,
           model_inputs.attention_mask
         );
+        model_inputs.rope_deltas = rope_deltas;
+        model_inputs.position_ids = full_position_ids.slice(null, null, [past_length, null]);
+        model_inputs.input_ids = model_inputs.input_ids.slice(null, [past_length, null]);
       } else {
-        model_inputs.pixel_values = null;
-        const past_length = model_inputs.past_key_values.get_seq_length();
-        if (past_length < model_inputs.input_ids.dims[1]) {
-          const [full_position_ids, rope_deltas] = this.get_rope_index(
+        if (!model_inputs.rope_deltas) {
+          [, model_inputs.rope_deltas] = this.get_rope_index(
             model_inputs.input_ids,
             model_inputs.image_grid_thw,
             model_inputs.video_grid_thw,
             model_inputs.attention_mask
           );
-          model_inputs.rope_deltas = rope_deltas;
-          model_inputs.position_ids = full_position_ids.slice(null, null, [past_length, null]);
-          model_inputs.input_ids = model_inputs.input_ids.slice(null, [past_length, null]);
-        } else {
-          if (!model_inputs.rope_deltas) {
-            [, model_inputs.rope_deltas] = this.get_rope_index(
-              model_inputs.input_ids,
-              model_inputs.image_grid_thw,
-              model_inputs.video_grid_thw,
-              model_inputs.attention_mask
-            );
-          }
-          const delta = BigInt(past_length);
-          const rope_deltas_list = model_inputs.rope_deltas.map((x) => delta + x);
-          model_inputs.position_ids = stack([rope_deltas_list, rope_deltas_list, rope_deltas_list], 0);
         }
+        const delta = BigInt(past_length);
+        const rope_deltas_list = model_inputs.rope_deltas.map((x) => delta + x);
+        model_inputs.position_ids = stack([rope_deltas_list, rope_deltas_list, rope_deltas_list], 0);
       }
     }
     return model_inputs;
@@ -27813,27 +27897,6 @@ var HunYuanDenseV1Model = class extends HunYuanDenseV1PreTrainedModel {
 var HunYuanDenseV1ForCausalLM = class extends HunYuanDenseV1PreTrainedModel {
 };
-// src/models/llava/modeling_llava.js
-var LlavaPreTrainedModel = class extends PreTrainedModel {
-  forward_params = ["input_ids", "attention_mask", "pixel_values", "position_ids", "past_key_values"];
-};
-var LlavaForConditionalGeneration = class extends LlavaPreTrainedModel {
-  _merge_input_ids_with_image_features(kwargs) {
-    const vision_hidden_size = kwargs.image_features.dims.at(-1);
-    const reshaped_image_hidden_states = kwargs.image_features.view(-1, vision_hidden_size);
-    return default_merge_input_ids_with_image_features({
-      // @ts-ignore
-      image_token_id: this.config.image_token_index ?? this.config.image_token_id,
-      ...kwargs,
-      image_features: reshaped_image_hidden_states
-    });
-  }
-};
-var Moondream1ForConditionalGeneration = class extends LlavaForConditionalGeneration {
-};
-var LlavaQwen2ForCausalLM = class extends LlavaForConditionalGeneration {
-};
 // src/models/idefics3/modeling_idefics3.js
 var Idefics3ForConditionalGeneration = class extends LlavaForConditionalGeneration {
   forward_params = [
@@ -30731,6 +30794,7 @@ var MODEL_FOR_CAUSAL_LM_MAPPING_NAMES = /* @__PURE__ */ new Map([
   ["qwen3_vl", "Qwen3VLForCausalLM"],
   ["qwen3_vl_moe", "Qwen3VLMoeForCausalLM"],
   ["qwen3_5", "Qwen3_5ForCausalLM"],
+  ["qwen3_5_text", "Qwen3_5ForCausalLM"],
   ["qwen3_5_moe", "Qwen3_5MoeForCausalLM"],
   ["gemma3n", "Gemma3nForCausalLM"],
   ["phi", "PhiForCausalLM"],
@@ -30818,6 +30882,7 @@ var MODEL_FOR_IMAGE_TEXT_TO_TEXT_MAPPING_NAMES = /* @__PURE__ */ new Map([
   ["smolvlm", "SmolVLMForConditionalGeneration"],
   ["paligemma", "PaliGemmaForConditionalGeneration"],
   ["llava_qwen2", "LlavaQwen2ForCausalLM"],
+  ["gemma3", "Gemma3ForConditionalGeneration"],
   ["gemma3n", "Gemma3nForConditionalGeneration"],
   ["mistral3", "Mistral3ForConditionalGeneration"],
   ["lighton_ocr", "LightOnOcrForConditionalGeneration"],
@@ -31012,13 +31077,6 @@ var CUSTOM_MAPPING = [
   ],
   ["SupertonicForConditionalGeneration", SupertonicForConditionalGeneration, MODEL_TYPES.Supertonic],
   ["ChatterboxModel", ChatterboxModel, MODEL_TYPES.Chatterbox],
-  ["Qwen2VLForCausalLM", Qwen2VLForCausalLM, MODEL_TYPES.MultimodalLanguageModelOnly],
-  ["Qwen2_5_VLForCausalLM", Qwen2_5_VLForCausalLM, MODEL_TYPES.MultimodalLanguageModelOnly],
-  ["Qwen3VLForCausalLM", Qwen3VLForCausalLM, MODEL_TYPES.MultimodalLanguageModelOnly],
-  ["Qwen3VLMoeForCausalLM", Qwen3VLMoeForCausalLM, MODEL_TYPES.MultimodalLanguageModelOnly],
-  ["Qwen3_5ForCausalLM", Qwen3_5ForCausalLM, MODEL_TYPES.MultimodalLanguageModelOnly],
-  ["Qwen3_5MoeForCausalLM", Qwen3_5MoeForCausalLM, MODEL_TYPES.MultimodalLanguageModelOnly],
-  ["Gemma3nForCausalLM", Gemma3nForCausalLM, MODEL_TYPES.MultimodalLanguageModelOnly],
   [
     "VoxtralRealtimeForConditionalGeneration",
     VoxtralRealtimeForConditionalGeneration,
@@ -32700,6 +32758,41 @@ var TASK_ALIASES = Object.freeze({
   embeddings: "feature-extraction"
 });
+// src/utils/model_registry/resolve_model_type.js
+function resolve_model_type(config, { warn = true } = {}) {
+  const architectures = (
+    /** @type {string[]} */
+    config.architectures || []
+  );
+  for (const arch of architectures) {
+    const mappedType = MODEL_TYPE_MAPPING.get(arch);
+    if (mappedType !== void 0) {
+      return mappedType;
+    }
+  }
+  if (config.model_type) {
+    const mappedType = MODEL_TYPE_MAPPING.get(config.model_type);
+    if (mappedType !== void 0) {
+      return mappedType;
+    }
+    for (const mapping of Object.values(MODEL_MAPPING_NAMES)) {
+      if (mapping.has(config.model_type)) {
+        const resolved = MODEL_TYPE_MAPPING.get(mapping.get(config.model_type));
+        if (resolved !== void 0) {
+          return resolved;
+        }
+      }
+    }
+  }
+  if (warn) {
+    const archList = architectures.length > 0 ? architectures.join(", ") : "(none)";
+    logger.warn(
+      `[resolve_model_type] Architecture(s) not found in MODEL_TYPE_MAPPING: [${archList}] for model type '${config.model_type}'. Falling back to EncoderOnly (single model.onnx file). If you encounter issues, please report at: ${GITHUB_ISSUE_URL}`
+    );
+  }
+  return MODEL_TYPES.EncoderOnly;
+}
 // src/utils/model_registry/get_model_files.js
 function get_config(modelId, { config = null, cache_dir = null, local_files_only = false, revision = "main" } = {}) {
   if (config !== null) {
@@ -32722,43 +32815,7 @@ async function get_model_files(modelId, { config = null, dtype: overrideDtype =
   const subfolder = "onnx";
   const rawDevice = overrideDevice ?? custom_config.device;
   let dtype = overrideDtype ?? custom_config.dtype;
-  let modelType;
-  const architectures = (
-    /** @type {string[]} */
-    config.architectures || []
-  );
-  let foundInMapping = false;
-  for (const arch of architectures) {
-    const mappedType = MODEL_TYPE_MAPPING.get(arch);
-    if (mappedType !== void 0) {
-      modelType = mappedType;
-      foundInMapping = true;
-      break;
-    }
-  }
-  if (!foundInMapping && config.model_type) {
-    const mappedType = MODEL_TYPE_MAPPING.get(config.model_type);
-    if (mappedType !== void 0) {
-      modelType = mappedType;
-      foundInMapping = true;
-    }
-    if (!foundInMapping) {
-      for (const mapping of Object.values(MODEL_MAPPING_NAMES)) {
-        if (mapping.has(config.model_type)) {
-          modelType = MODEL_TYPE_MAPPING.get(mapping.get(config.model_type));
-          foundInMapping = true;
-          break;
-        }
-      }
-    }
-  }
-  if (!foundInMapping) {
-    const archList = architectures.length > 0 ? architectures.join(", ") : "(none)";
-    logger.warn(
-      `[get_model_files] Architecture(s) not found in MODEL_TYPE_MAPPING: [${archList}] for model type '${config.model_type}'. Falling back to EncoderOnly (single model.onnx file). If you encounter issues, please report at: ${GITHUB_ISSUE_URL}`
-    );
-    modelType = MODEL_TYPES.EncoderOnly;
-  }
+  const modelType = resolve_model_type(config);
   const add_model_file = (fileName, baseName = null) => {
     baseName = baseName ?? fileName;
     const selectedDevice = selectDevice(rawDevice, fileName);
@@ -33345,6 +33402,31 @@ async function clear_pipeline_cache(task, modelId, options = {}) {
   return await clear_files_from_cache(modelId, files, options);
 }
+// src/utils/model_registry/get_available_dtypes.js
+var CONCRETE_DTYPES = Object.keys(DEFAULT_DTYPE_SUFFIX_MAPPING);
+async function get_available_dtypes(modelId, { config = null, model_file_name = null, revision = "main", cache_dir = null, local_files_only = false } = {}) {
+  config = await get_config(modelId, { config, cache_dir, local_files_only, revision });
+  const subfolder = "onnx";
+  const modelType = resolve_model_type(config);
+  const { sessions } = getSessionsConfig(modelType, config, { model_file_name });
+  const baseNames = Object.values(sessions);
+  const metadataOptions = { revision, cache_dir, local_files_only };
+  const probeResults = await Promise.all(
+    CONCRETE_DTYPES.map(async (dtype) => {
+      const suffix = DEFAULT_DTYPE_SUFFIX_MAPPING[dtype] ?? "";
+      const allExist = await Promise.all(
+        baseNames.map(async (baseName) => {
+          const filename = `${subfolder}/${baseName}${suffix}.onnx`;
+          const metadata = await get_file_metadata(modelId, filename, metadataOptions);
+          return metadata.exists;
+        })
+      );
+      return { dtype, available: allExist.every(Boolean) };
+    })
+  );
+  return probeResults.filter((r) => r.available).map((r) => r.dtype);
+}
 // src/utils/model_registry/ModelRegistry.js
 var ModelRegistry = class {
   /**
@@ -33431,6 +33513,29 @@ var ModelRegistry = class {
   static async get_processor_files(modelId) {
     return get_processor_files(modelId);
   }
+  /**
+   * Detects which quantization levels (dtypes) are available for a model
+   * by checking which ONNX files exist on the hub or locally.
+   *
+   * A dtype is considered available if all required model session files
+   * exist for that dtype.
+   *
+   * @param {string} modelId - The model id (e.g., "onnx-community/all-MiniLM-L6-v2-ONNX")
+   * @param {Object} [options] - Optional parameters
+   * @param {import('../../configs.js').PretrainedConfig} [options.config=null] - Pre-loaded config
+   * @param {string} [options.model_file_name=null] - Override the model file name (excluding .onnx suffix)
+   * @param {string} [options.revision='main'] - Model revision
+   * @param {string} [options.cache_dir=null] - Custom cache directory
+   * @param {boolean} [options.local_files_only=false] - Only check local files
+   * @returns {Promise<string[]>} Array of available dtype strings (e.g., ['fp32', 'fp16', 'q4', 'q8'])
+   *
+   * @example
+   * const dtypes = await ModelRegistry.get_available_dtypes('onnx-community/all-MiniLM-L6-v2-ONNX');
+   * console.log(dtypes); // ['fp32', 'fp16', 'int8', 'uint8', 'q8', 'q4']
+   */
+  static async get_available_dtypes(modelId, options = {}) {
+    return get_available_dtypes(modelId, options);
+  }
   /**
    * Quickly checks if a model is fully cached by verifying `config.json` is present,
    * then confirming all required files are cached.
@@ -33877,8 +33982,11 @@ export {
   Gemma2Model,
   Gemma2PreTrainedModel,
   Gemma3ForCausalLM,
+  Gemma3ForConditionalGeneration,
+  Gemma3ImageProcessor,
   Gemma3Model,
   Gemma3PreTrainedModel,
+  Gemma3Processor,
   Gemma3nAudioFeatureExtractor,
   Gemma3nForCausalLM,
   Gemma3nForConditionalGeneration,
@@ -34497,7 +34605,7 @@ export {
 onnxruntime-web/dist/ort.webgpu.bundle.min.mjs:
   (*!
-   * ONNX Runtime Web v1.25.0-dev.20260307-d626b568e0
+   * ONNX Runtime Web v1.25.0-dev.20260323-a99aad9d36
    * Copyright (c) Microsoft Corporation. All rights reserved.
    * Licensed under the MIT License.
    *)