@loreai/gateway 0.18.0 → 0.19.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/embedding-worker.cjs +24 -0
- package/dist/index.cjs +455 -377
- package/dist/index.d.cts +69 -10
- package/package.json +3 -2
|
@@ -0,0 +1,24 @@
|
|
|
1
|
+
"use strict";var Zp=Object.create;var Va=Object.defineProperty;var em=Object.getOwnPropertyDescriptor;var tm=Object.getOwnPropertyNames;var sm=Object.getPrototypeOf,rm=Object.prototype.hasOwnProperty;var Bt=(D,a)=>()=>(D&&(a=D(D=0)),a);var gu=(D,a)=>{for(var e in a)Va(D,e,{get:a[e],enumerable:!0})},om=(D,a,e,i)=>{if(a&&typeof a=="object"||typeof a=="function")for(let d of tm(a))!rm.call(D,d)&&d!==e&&Va(D,d,{get:()=>a[d],enumerable:!(i=em(a,d))||i.enumerable});return D};var dr=(D,a,e)=>(e=D!=null?Zp(sm(D)):{},om(a||!D||!D.__esModule?Va(e,"default",{value:D,enumerable:!0}):e,D));var Nr,Ks,Pu,am,Tu,za=Bt(()=>{Nr=new Map,Ks=[],Pu=(D,a,e)=>{if(a&&typeof a.init=="function"&&typeof a.createInferenceSessionHandler=="function"){let i=Nr.get(D);if(i===void 0)Nr.set(D,{backend:a,priority:e});else{if(i.priority>e)return;if(i.priority===e&&i.backend!==a)throw new Error(`cannot register backend "${D}" using priority ${e}`)}if(e>=0){let d=Ks.indexOf(D);d!==-1&&Ks.splice(d,1);for(let g=0;g<Ks.length;g++)if(Nr.get(Ks[g]).priority<=e){Ks.splice(g,0,D);return}Ks.push(D)}return}throw new TypeError("not a valid backend")},am=async D=>{let a=Nr.get(D);if(!a)return"backend not found.";if(a.initialized)return a.backend;if(a.aborted)return a.error;{let e=!!a.initPromise;try{return e||(a.initPromise=a.backend.init(D)),await a.initPromise,a.initialized=!0,a.backend}catch(i){return e||(a.error=`${i}`,a.aborted=!0),a.error}finally{delete a.initPromise}}},Tu=async D=>{let a=D.executionProviders||[],e=a.map(u=>typeof u=="string"?u:u.name),i=e.length===0?Ks:e,d,g=[],I=new Set;for(let u of i){let m=await am(u);typeof m=="string"?g.push({name:u,err:m}):(d||(d=m),d===m&&I.add(u))}if(!d)throw new Error(`no available backend found. 
ERR: ${g.map(u=>`[${u.name}] ${u.err}`).join(", ")}`);for(let{name:u,err:m}of g)e.includes(u)&&console.warn(`removing requested execution provider "${u}" from session options because it is not available: ${m}`);let f=a.filter(u=>I.has(typeof u=="string"?u:u.name));return[d,new Proxy(D,{get:(u,m)=>m==="executionProviders"?f:Reflect.get(u,m)})]}});var wu=Bt(()=>{za()});var bu,xu=Bt(()=>{bu="1.21.0"});var vu,ns,Ga=Bt(()=>{xu();vu="warning",ns={wasm:{},webgl:{},webgpu:{},versions:{common:bu},set logLevel(D){if(D!==void 0){if(typeof D!="string"||["verbose","info","warning","error","fatal"].indexOf(D)===-1)throw new Error(`Unsupported logging level: ${D}`);vu=D}},get logLevel(){return vu}};Object.defineProperty(ns,"logLevel",{enumerable:!0})});var nm,Eu=Bt(()=>{Ga();nm=ns});var Fu,Cu,ku=Bt(()=>{Fu=(D,a)=>{let e=typeof document<"u"?document.createElement("canvas"):new OffscreenCanvas(1,1);e.width=D.dims[3],e.height=D.dims[2];let i=e.getContext("2d");if(i!=null){let d,g;a?.tensorLayout!==void 0&&a.tensorLayout==="NHWC"?(d=D.dims[2],g=D.dims[3]):(d=D.dims[3],g=D.dims[2]);let I=a?.format!==void 0?a.format:"RGB",f=a?.norm,u,m;f===void 0||f.mean===void 0?u=[255,255,255,255]:typeof f.mean=="number"?u=[f.mean,f.mean,f.mean,f.mean]:(u=[f.mean[0],f.mean[1],f.mean[2],0],f.mean[3]!==void 0&&(u[3]=f.mean[3])),f===void 0||f.bias===void 0?m=[0,0,0,0]:typeof f.bias=="number"?m=[f.bias,f.bias,f.bias,f.bias]:(m=[f.bias[0],f.bias[1],f.bias[2],0],f.bias[3]!==void 0&&(m[3]=f.bias[3]));let T=g*d,_=0,o=T,x=T*2,w=-1;I==="RGBA"?(_=0,o=T,x=T*2,w=T*3):I==="RGB"?(_=0,o=T,x=T*2):I==="RBG"&&(_=0,x=T,o=T*2);for(let k=0;k<g;k++)for(let G=0;G<d;G++){let b=(D.data[_++]-m[0])*u[0],C=(D.data[o++]-m[1])*u[1],B=(D.data[x++]-m[2])*u[2],P=w===-1?255:(D.data[w++]-m[3])*u[3];i.fillStyle="rgba("+b+","+C+","+B+","+P+")",i.fillRect(G,k,1,1)}if("toDataURL"in e)return e.toDataURL();throw new Error("toDataURL is not supported")}else throw new Error("Can not access image data")},Cu=(D,a)=>{let e=typeof 
document<"u"?document.createElement("canvas").getContext("2d"):new OffscreenCanvas(1,1).getContext("2d"),i;if(e!=null){let d,g,I;a?.tensorLayout!==void 0&&a.tensorLayout==="NHWC"?(d=D.dims[2],g=D.dims[1],I=D.dims[3]):(d=D.dims[3],g=D.dims[2],I=D.dims[1]);let f=a!==void 0&&a.format!==void 0?a.format:"RGB",u=a?.norm,m,T;u===void 0||u.mean===void 0?m=[255,255,255,255]:typeof u.mean=="number"?m=[u.mean,u.mean,u.mean,u.mean]:(m=[u.mean[0],u.mean[1],u.mean[2],255],u.mean[3]!==void 0&&(m[3]=u.mean[3])),u===void 0||u.bias===void 0?T=[0,0,0,0]:typeof u.bias=="number"?T=[u.bias,u.bias,u.bias,u.bias]:(T=[u.bias[0],u.bias[1],u.bias[2],0],u.bias[3]!==void 0&&(T[3]=u.bias[3]));let _=g*d;if(a!==void 0&&(a.format!==void 0&&I===4&&a.format!=="RGBA"||I===3&&a.format!=="RGB"&&a.format!=="BGR"))throw new Error("Tensor format doesn't match input tensor dims");let o=4,x=0,w=1,k=2,G=3,b=0,C=_,B=_*2,P=-1;f==="RGBA"?(b=0,C=_,B=_*2,P=_*3):f==="RGB"?(b=0,C=_,B=_*2):f==="RBG"&&(b=0,B=_,C=_*2),i=e.createImageData(d,g);for(let M=0;M<g*d;x+=o,w+=o,k+=o,G+=o,M++)i.data[x]=(D.data[b++]-T[0])*m[0],i.data[w]=(D.data[C++]-T[1])*m[1],i.data[k]=(D.data[B++]-T[2])*m[2],i.data[G]=P===-1?255:(D.data[P++]-T[3])*m[3]}else throw new Error("Can not access image data");return i}});var Wa,yu,Su,Au,Lu,Du,Iu=Bt(()=>{Rr();Wa=(D,a)=>{if(D===void 0)throw new Error("Image buffer must be defined");if(a.height===void 0||a.width===void 0)throw new Error("Image height and width must be defined");if(a.tensorLayout==="NHWC")throw new Error("NHWC Tensor layout is not supported yet");let{height:e,width:i}=a,d=a.norm??{mean:255,bias:0},g,I;typeof d.mean=="number"?g=[d.mean,d.mean,d.mean,d.mean]:g=[d.mean[0],d.mean[1],d.mean[2],d.mean[3]??255],typeof d.bias=="number"?I=[d.bias,d.bias,d.bias,d.bias]:I=[d.bias[0],d.bias[1],d.bias[2],d.bias[3]??0];let f=a.format!==void 0?a.format:"RGBA",u=a.tensorFormat!==void 0&&a.tensorFormat!==void 0?a.tensorFormat:"RGB",m=e*i,T=u==="RGBA"?new Float32Array(m*4):new 
Float32Array(m*3),_=4,o=0,x=1,w=2,k=3,G=0,b=m,C=m*2,B=-1;f==="RGB"&&(_=3,o=0,x=1,w=2,k=-1),u==="RGBA"?B=m*3:u==="RBG"?(G=0,C=m,b=m*2):u==="BGR"&&(C=0,b=m,G=m*2);for(let M=0;M<m;M++,o+=_,w+=_,x+=_,k+=_)T[G++]=(D[o]+I[0])/g[0],T[b++]=(D[x]+I[1])/g[1],T[C++]=(D[w]+I[2])/g[2],B!==-1&&k!==-1&&(T[B++]=(D[k]+I[3])/g[3]);return u==="RGBA"?new Yt("float32",T,[1,4,e,i]):new Yt("float32",T,[1,3,e,i])},yu=async(D,a)=>{let e=typeof HTMLImageElement<"u"&&D instanceof HTMLImageElement,i=typeof ImageData<"u"&&D instanceof ImageData,d=typeof ImageBitmap<"u"&&D instanceof ImageBitmap,g=typeof D=="string",I,f=a??{},u=()=>{if(typeof document<"u")return document.createElement("canvas");if(typeof OffscreenCanvas<"u")return new OffscreenCanvas(1,1);throw new Error("Canvas is not supported")},m=T=>typeof HTMLCanvasElement<"u"&&T instanceof HTMLCanvasElement||T instanceof OffscreenCanvas?T.getContext("2d"):null;if(e){let T=u();T.width=D.width,T.height=D.height;let _=m(T);if(_!=null){let o=D.height,x=D.width;if(a!==void 0&&a.resizedHeight!==void 0&&a.resizedWidth!==void 0&&(o=a.resizedHeight,x=a.resizedWidth),a!==void 0){if(f=a,a.tensorFormat!==void 0)throw new Error("Image input config format must be RGBA for HTMLImageElement");f.tensorFormat="RGBA",f.height=o,f.width=x}else f.tensorFormat="RGBA",f.height=o,f.width=x;_.drawImage(D,0,0),I=_.getImageData(0,0,x,o).data}else throw new Error("Can not access image data")}else if(i){let T,_;if(a!==void 0&&a.resizedWidth!==void 0&&a.resizedHeight!==void 0?(T=a.resizedHeight,_=a.resizedWidth):(T=D.height,_=D.width),a!==void 0&&(f=a),f.format="RGBA",f.height=T,f.width=_,a!==void 0){let o=u();o.width=_,o.height=T;let x=m(o);if(x!=null)x.putImageData(D,0,0),I=x.getImageData(0,0,_,T).data;else throw new Error("Can not access image data")}else I=D.data}else if(d){if(a===void 0)throw new Error("Please provide image config with format for Imagebitmap");let T=u();T.width=D.width,T.height=D.height;let _=m(T);if(_!=null){let o=D.height,x=D.width;return 
_.drawImage(D,0,0,x,o),I=_.getImageData(0,0,x,o).data,f.height=o,f.width=x,Wa(I,f)}else throw new Error("Can not access image data")}else{if(g)return new Promise((T,_)=>{let o=u(),x=m(o);if(!D||!x)return _();let w=new Image;w.crossOrigin="Anonymous",w.src=D,w.onload=()=>{o.width=w.width,o.height=w.height,x.drawImage(w,0,0,o.width,o.height);let k=x.getImageData(0,0,o.width,o.height);f.height=o.height,f.width=o.width,T(Wa(k.data,f))}});throw new Error("Input data provided is not supported - aborted tensor creation")}if(I!==void 0)return Wa(I,f);throw new Error("Input data provided is not supported - aborted tensor creation")},Su=(D,a)=>{let{width:e,height:i,download:d,dispose:g}=a,I=[1,i,e,4];return new Yt({location:"texture",type:"float32",texture:D,dims:I,download:d,dispose:g})},Au=(D,a)=>{let{dataType:e,dims:i,download:d,dispose:g}=a;return new Yt({location:"gpu-buffer",type:e??"float32",gpuBuffer:D,dims:i,download:d,dispose:g})},Lu=(D,a)=>{let{dataType:e,dims:i,download:d,dispose:g}=a;return new Yt({location:"ml-tensor",type:e??"float32",mlTensor:D,dims:i,download:d,dispose:g})},Du=(D,a,e)=>new Yt({location:"cpu-pinned",type:D,data:a,dims:e??[a.length]})});var Qs,ur,Ou,Bu,ju=Bt(()=>{Qs=new Map([["float32",Float32Array],["uint8",Uint8Array],["int8",Int8Array],["uint16",Uint16Array],["int16",Int16Array],["int32",Int32Array],["bool",Uint8Array],["float64",Float64Array],["uint32",Uint32Array],["int4",Uint8Array],["uint4",Uint8Array]]),ur=new Map([[Float32Array,"float32"],[Uint8Array,"uint8"],[Int8Array,"int8"],[Uint16Array,"uint16"],[Int16Array,"int16"],[Int32Array,"int32"],[Float64Array,"float64"],[Uint32Array,"uint32"]]),Ou=!1,Bu=()=>{if(!Ou){Ou=!0;let D=typeof BigInt64Array<"u"&&BigInt64Array.from,a=typeof BigUint64Array<"u"&&BigUint64Array.from,e=globalThis.Float16Array,i=typeof 
e<"u"&&e.from;D&&(Qs.set("int64",BigInt64Array),ur.set(BigInt64Array,"int64")),a&&(Qs.set("uint64",BigUint64Array),ur.set(BigUint64Array,"uint64")),i?(Qs.set("float16",e),ur.set(e,"float16")):Qs.set("float16",Uint16Array)}}});var Nu,Ru,Vu=Bt(()=>{Rr();Nu=D=>{let a=1;for(let e=0;e<D.length;e++){let i=D[e];if(typeof i!="number"||!Number.isSafeInteger(i))throw new TypeError(`dims[${e}] must be an integer, got: ${i}`);if(i<0)throw new RangeError(`dims[${e}] must be a non-negative integer, got: ${i}`);a*=i}return a},Ru=(D,a)=>{switch(D.location){case"cpu":return new Yt(D.type,D.data,a);case"cpu-pinned":return new Yt({location:"cpu-pinned",data:D.data,type:D.type,dims:a});case"texture":return new Yt({location:"texture",texture:D.texture,type:D.type,dims:a});case"gpu-buffer":return new Yt({location:"gpu-buffer",gpuBuffer:D.gpuBuffer,type:D.type,dims:a});case"ml-tensor":return new Yt({location:"ml-tensor",mlTensor:D.mlTensor,type:D.type,dims:a});default:throw new Error(`tensorReshape: tensor location ${D.location} is not supported`)}}});var Yt,Rr=Bt(()=>{ku();Iu();ju();Vu();Yt=class{constructor(a,e,i){Bu();let d,g;if(typeof a=="object"&&"location"in a)switch(this.dataLocation=a.location,d=a.type,g=a.dims,a.location){case"cpu-pinned":{let f=Qs.get(d);if(!f)throw new TypeError(`unsupported type "${d}" to create tensor from pinned buffer`);if(!(a.data instanceof f))throw new TypeError(`buffer should be of type ${f.name}`);this.cpuData=a.data;break}case"texture":{if(d!=="float32")throw new TypeError(`unsupported type "${d}" to create tensor from texture`);this.gpuTextureData=a.texture,this.downloader=a.download,this.disposer=a.dispose;break}case"gpu-buffer":{if(d!=="float32"&&d!=="float16"&&d!=="int32"&&d!=="int64"&&d!=="uint32"&&d!=="uint8"&&d!=="bool"&&d!=="uint4"&&d!=="int4")throw new TypeError(`unsupported type "${d}" to create tensor from gpu 
buffer`);this.gpuBufferData=a.gpuBuffer,this.downloader=a.download,this.disposer=a.dispose;break}case"ml-tensor":{if(d!=="float32"&&d!=="float16"&&d!=="int32"&&d!=="int64"&&d!=="uint32"&&d!=="uint64"&&d!=="int8"&&d!=="uint8"&&d!=="bool"&&d!=="uint4"&&d!=="int4")throw new TypeError(`unsupported type "${d}" to create tensor from MLTensor`);this.mlTensorData=a.mlTensor,this.downloader=a.download,this.disposer=a.dispose;break}default:throw new Error(`Tensor constructor: unsupported location '${this.dataLocation}'`)}else{let f,u;if(typeof a=="string")if(d=a,u=i,a==="string"){if(!Array.isArray(e))throw new TypeError("A string tensor's data must be a string array.");f=e}else{let m=Qs.get(a);if(m===void 0)throw new TypeError(`Unsupported tensor type: ${a}.`);if(Array.isArray(e)){if(a==="float16"&&m===Uint16Array||a==="uint4"||a==="int4")throw new TypeError(`Creating a ${a} tensor from number array is not supported. Please use ${m.name} as data.`);a==="uint64"||a==="int64"?f=m.from(e,BigInt):f=m.from(e)}else if(e instanceof m)f=e;else if(e instanceof Uint8ClampedArray)if(a==="uint8")f=Uint8Array.from(e);else throw new TypeError("A Uint8ClampedArray tensor's data must be type of uint8");else if(a==="float16"&&e instanceof Uint16Array&&m!==Uint16Array)f=new globalThis.Float16Array(e.buffer,e.byteOffset,e.length);else throw new TypeError(`A ${d} tensor's data must be type of ${m}`)}else if(u=e,Array.isArray(a)){if(a.length===0)throw new TypeError("Tensor type cannot be inferred from an empty array.");let m=typeof a[0];if(m==="string")d="string",f=a;else if(m==="boolean")d="bool",f=Uint8Array.from(a);else throw new TypeError(`Invalid element type of data array: ${m}.`)}else if(a instanceof Uint8ClampedArray)d="uint8",f=Uint8Array.from(a);else{let m=ur.get(a.constructor);if(m===void 0)throw new TypeError(`Unsupported type for tensor data: ${a.constructor}.`);d=m,f=a}if(u===void 0)u=[f.length];else if(!Array.isArray(u))throw new TypeError("A tensor's dims must be a number 
array");g=u,this.cpuData=f,this.dataLocation="cpu"}let I=Nu(g);if(this.cpuData&&I!==this.cpuData.length&&!((d==="uint4"||d==="int4")&&Math.ceil(I/2)===this.cpuData.length))throw new Error(`Tensor's size(${I}) does not match data length(${this.cpuData.length}).`);this.type=d,this.dims=g,this.size=I}static async fromImage(a,e){return yu(a,e)}static fromTexture(a,e){return Su(a,e)}static fromGpuBuffer(a,e){return Au(a,e)}static fromMLTensor(a,e){return Lu(a,e)}static fromPinnedBuffer(a,e,i){return Du(a,e,i)}toDataURL(a){return Fu(this,a)}toImageData(a){return Cu(this,a)}get data(){if(this.ensureValid(),!this.cpuData)throw new Error("The data is not on CPU. Use `getData()` to download GPU data to CPU, or use `texture` or `gpuBuffer` property to access the GPU data directly.");return this.cpuData}get location(){return this.dataLocation}get texture(){if(this.ensureValid(),!this.gpuTextureData)throw new Error("The data is not stored as a WebGL texture.");return this.gpuTextureData}get gpuBuffer(){if(this.ensureValid(),!this.gpuBufferData)throw new Error("The data is not stored as a WebGPU buffer.");return this.gpuBufferData}get mlTensor(){if(this.ensureValid(),!this.mlTensorData)throw new Error("The data is not stored as a WebNN MLTensor.");return this.mlTensorData}async getData(a){switch(this.ensureValid(),this.dataLocation){case"cpu":case"cpu-pinned":return this.data;case"texture":case"gpu-buffer":case"ml-tensor":{if(!this.downloader)throw new Error("The current tensor is not created with a specified data downloader.");if(this.isDownloading)throw new Error("The current tensor is being downloaded.");try{this.isDownloading=!0;let e=await this.downloader();return this.downloader=void 0,this.dataLocation="cpu",this.cpuData=e,a&&this.disposer&&(this.disposer(),this.disposer=void 0),e}finally{this.isDownloading=!1}}default:throw new Error(`cannot get data from location: ${this.dataLocation}`)}}dispose(){if(this.isDownloading)throw new Error("The current tensor is being 
downloaded.");this.disposer&&(this.disposer(),this.disposer=void 0),this.cpuData=void 0,this.gpuTextureData=void 0,this.gpuBufferData=void 0,this.mlTensorData=void 0,this.downloader=void 0,this.isDownloading=void 0,this.dataLocation="none"}ensureValid(){if(this.dataLocation==="none")throw new Error("The tensor is disposed.")}reshape(a){if(this.ensureValid(),this.downloader||this.disposer)throw new Error("Cannot reshape a tensor that owns GPU resource.");return Ru(this,a)}}});var Xs,Ua=Bt(()=>{Rr();Xs=Yt});var zu,Gu,Vr,zr,$a=Bt(()=>{Ga();zu=(D,a)=>{(typeof ns.trace>"u"?!ns.wasm.trace:!ns.trace)||console.timeStamp(`${D}::ORT::${a}`)},Gu=(D,a)=>{let e=new Error().stack?.split(/\r\n|\r|\n/g)||[],i=!1;for(let d=0;d<e.length;d++){if(i&&!e[d].includes("TRACE_FUNC")){let g=`FUNC_${D}::${e[d].trim().split(" ")[1]}`;a&&(g+=`::${a}`),zu("CPU",g);return}e[d].includes("TRACE_FUNC")&&(i=!0)}},Vr=D=>{(typeof ns.trace>"u"?!ns.wasm.trace:!ns.trace)||Gu("BEGIN",D)},zr=D=>{(typeof ns.trace>"u"?!ns.wasm.trace:!ns.trace)||Gu("END",D)}});var Gr,Wu=Bt(()=>{za();Ua();$a();Gr=class D{constructor(a){this.handler=a}async run(a,e,i){Vr();let d={},g={};if(typeof a!="object"||a===null||a instanceof Xs||Array.isArray(a))throw new TypeError("'feeds' must be an object that use input names as keys and OnnxValue as corresponding values.");let I=!0;if(typeof e=="object"){if(e===null)throw new TypeError("Unexpected argument[1]: cannot be null.");if(e instanceof Xs)throw new TypeError("'fetches' cannot be a Tensor");if(Array.isArray(e)){if(e.length===0)throw new TypeError("'fetches' cannot be an empty array.");I=!1;for(let m of e){if(typeof m!="string")throw new TypeError("'fetches' must be a string array or an object.");if(this.outputNames.indexOf(m)===-1)throw new RangeError(`'fetches' contains invalid output name: ${m}.`);d[m]=null}if(typeof i=="object"&&i!==null)g=i;else if(typeof i<"u")throw new TypeError("'options' must be an object.")}else{let m=!1,T=Object.getOwnPropertyNames(e);for(let _ of 
this.outputNames)if(T.indexOf(_)!==-1){let o=e[_];(o===null||o instanceof Xs)&&(m=!0,I=!1,d[_]=o)}if(m){if(typeof i=="object"&&i!==null)g=i;else if(typeof i<"u")throw new TypeError("'options' must be an object.")}else g=e}}else if(typeof e<"u")throw new TypeError("Unexpected argument[1]: must be 'fetches' or 'options'.");for(let m of this.inputNames)if(typeof a[m]>"u")throw new Error(`input '${m}' is missing in 'feeds'.`);if(I)for(let m of this.outputNames)d[m]=null;let f=await this.handler.run(a,d,g),u={};for(let m in f)if(Object.hasOwnProperty.call(f,m)){let T=f[m];T instanceof Xs?u[m]=T:u[m]=new Xs(T.type,T.data,T.dims)}return zr(),u}async release(){return this.handler.dispose()}static async create(a,e,i,d){Vr();let g,I={};if(typeof a=="string"){if(g=a,typeof e=="object"&&e!==null)I=e;else if(typeof e<"u")throw new TypeError("'options' must be an object.")}else if(a instanceof Uint8Array){if(g=a,typeof e=="object"&&e!==null)I=e;else if(typeof e<"u")throw new TypeError("'options' must be an object.")}else if(a instanceof ArrayBuffer||typeof SharedArrayBuffer<"u"&&a instanceof SharedArrayBuffer){let T=a,_=0,o=a.byteLength;if(typeof e=="object"&&e!==null)I=e;else if(typeof e=="number"){if(_=e,!Number.isSafeInteger(_))throw new RangeError("'byteOffset' must be an integer.");if(_<0||_>=T.byteLength)throw new RangeError(`'byteOffset' is out of range [0, ${T.byteLength}).`);if(o=a.byteLength-_,typeof i=="number"){if(o=i,!Number.isSafeInteger(o))throw new RangeError("'byteLength' must be an integer.");if(o<=0||_+o>T.byteLength)throw new RangeError(`'byteLength' is out of range (0, ${T.byteLength-_}].`);if(typeof d=="object"&&d!==null)I=d;else if(typeof d<"u")throw new TypeError("'options' must be an object.")}else if(typeof i<"u")throw new TypeError("'byteLength' must be a number.")}else if(typeof e<"u")throw new TypeError("'options' must be an object.");g=new Uint8Array(T,_,o)}else throw new TypeError("Unexpected argument[0]: must be 'path' or 
'buffer'.");let[f,u]=await Tu(I),m=await f.createInferenceSessionHandler(g,u);return zr(),new D(m)}startProfiling(){this.handler.startProfiling()}endProfiling(){this.handler.endProfiling()}get inputNames(){return this.handler.inputNames}get outputNames(){return this.handler.outputNames}}});var im,Uu=Bt(()=>{Wu();im=Gr});var $u=Bt(()=>{});var Ku=Bt(()=>{});var Qu=Bt(()=>{});var Xu=Bt(()=>{});var Ka={};gu(Ka,{InferenceSession:()=>im,TRACE:()=>zu,TRACE_FUNC_BEGIN:()=>Vr,TRACE_FUNC_END:()=>zr,Tensor:()=>Xs,env:()=>nm,registerBackend:()=>Pu});var Hu=Bt(()=>{wu();Eu();Uu();Ua();$u();Ku();$a();Qu();Xu()});var Yu={};gu(Yu,{ASTFeatureExtractor:()=>mm,ASTForAudioClassification:()=>hm,ASTModel:()=>Mm,ASTPreTrainedModel:()=>fm,AlbertForMaskedLM:()=>gm,AlbertForQuestionAnswering:()=>Pm,AlbertForSequenceClassification:()=>Tm,AlbertModel:()=>wm,AlbertPreTrainedModel:()=>bm,AlbertTokenizer:()=>xm,ArceeForCausalLM:()=>vm,ArceeModel:()=>Em,ArceePreTrainedModel:()=>Fm,AudioClassificationPipeline:()=>Cm,AutoConfig:()=>km,AutoFeatureExtractor:()=>ym,AutoImageProcessor:()=>Sm,AutoModel:()=>Am,AutoModelForAudioClassification:()=>Lm,AutoModelForAudioFrameClassification:()=>Dm,AutoModelForAudioTextToText:()=>Im,AutoModelForCTC:()=>Om,AutoModelForCausalLM:()=>Bm,AutoModelForDepthEstimation:()=>jm,AutoModelForDocumentQuestionAnswering:()=>Nm,AutoModelForImageClassification:()=>Rm,AutoModelForImageFeatureExtraction:()=>Vm,AutoModelForImageMatting:()=>zm,AutoModelForImageSegmentation:()=>Gm,AutoModelForImageTextToText:()=>Wm,AutoModelForImageToImage:()=>Um,AutoModelForMaskGeneration:()=>$m,AutoModelForMaskedLM:()=>Km,AutoModelForNormalEstimation:()=>Qm,AutoModelForObjectDetection:()=>Xm,AutoModelForPoseEstimation:()=>Hm,AutoModelForQuestionAnswering:()=>Jm,AutoModelForSemanticSegmentation:()=>Ym,AutoModelForSeq2SeqLM:()=>qm,AutoModelForSequenceClassification:()=>Zm,AutoModelForSpeechSeq2Seq:()=>eh,AutoModelForTextToSpectrogram:()=>th,AutoModelForTextToWaveform:()=>sh,AutoModelForTokenClassifica
tion:()=>rh,AutoModelForUniversalSegmentation:()=>oh,AutoModelForVision2Seq:()=>ah,AutoModelForXVector:()=>nh,AutoModelForZeroShotObjectDetection:()=>ih,AutoProcessor:()=>lh,AutoTokenizer:()=>ch,AutomaticSpeechRecognitionPipeline:()=>_h,BackgroundRemovalPipeline:()=>dh,BartForConditionalGeneration:()=>uh,BartForSequenceClassification:()=>ph,BartModel:()=>mh,BartPretrainedModel:()=>hh,BartTokenizer:()=>Mh,BaseModelOutput:()=>fh,BaseStreamer:()=>gh,BeitFeatureExtractor:()=>Ph,BeitForImageClassification:()=>Th,BeitModel:()=>wh,BeitPreTrainedModel:()=>bh,BertForMaskedLM:()=>xh,BertForQuestionAnswering:()=>vh,BertForSequenceClassification:()=>Eh,BertForTokenClassification:()=>Fh,BertModel:()=>Ch,BertPreTrainedModel:()=>kh,BertTokenizer:()=>yh,BitImageProcessor:()=>Sh,BlenderbotForConditionalGeneration:()=>Ah,BlenderbotModel:()=>Lh,BlenderbotPreTrainedModel:()=>Dh,BlenderbotSmallForConditionalGeneration:()=>Ih,BlenderbotSmallModel:()=>Oh,BlenderbotSmallPreTrainedModel:()=>Bh,BlenderbotSmallTokenizer:()=>jh,BlenderbotTokenizer:()=>Nh,BloomForCausalLM:()=>Rh,BloomModel:()=>Vh,BloomPreTrainedModel:()=>zh,BloomTokenizer:()=>Gh,CLIPFeatureExtractor:()=>Wh,CLIPImageProcessor:()=>Uh,CLIPModel:()=>$h,CLIPPreTrainedModel:()=>Kh,CLIPSegForImageSegmentation:()=>Qh,CLIPSegModel:()=>Xh,CLIPSegPreTrainedModel:()=>Hh,CLIPTextModel:()=>Jh,CLIPTextModelWithProjection:()=>Yh,CLIPTokenizer:()=>qh,CLIPVisionModel:()=>Zh,CLIPVisionModelWithProjection:()=>eM,CamembertForMaskedLM:()=>tM,CamembertForQuestionAnswering:()=>sM,CamembertForSequenceClassification:()=>rM,CamembertForTokenClassification:()=>oM,CamembertModel:()=>aM,CamembertPreTrainedModel:()=>nM,CamembertTokenizer:()=>iM,CausalLMOutput:()=>lM,CausalLMOutputWithPast:()=>cM,ChineseCLIPFeatureExtractor:()=>_M,ChineseCLIPModel:()=>dM,ChineseCLIPPreTrainedModel:()=>uM,ClapAudioModelWithProjection:()=>pM,ClapFeatureExtractor:()=>mM,ClapModel:()=>hM,ClapPreTrainedModel:()=>MM,ClapTextModelWithProjection:()=>fM,ClassifierFreeGuidanceLogitsPro
cessor:()=>gM,CodeGenForCausalLM:()=>PM,CodeGenModel:()=>TM,CodeGenPreTrainedModel:()=>wM,CodeGenTokenizer:()=>bM,CodeLlamaTokenizer:()=>xM,CohereForCausalLM:()=>vM,CohereModel:()=>EM,CoherePreTrainedModel:()=>FM,CohereTokenizer:()=>CM,ConvBertForMaskedLM:()=>kM,ConvBertForQuestionAnswering:()=>yM,ConvBertForSequenceClassification:()=>SM,ConvBertForTokenClassification:()=>AM,ConvBertModel:()=>LM,ConvBertPreTrainedModel:()=>DM,ConvBertTokenizer:()=>IM,ConvNextFeatureExtractor:()=>OM,ConvNextForImageClassification:()=>BM,ConvNextImageProcessor:()=>jM,ConvNextModel:()=>NM,ConvNextPreTrainedModel:()=>RM,ConvNextV2ForImageClassification:()=>VM,ConvNextV2Model:()=>zM,ConvNextV2PreTrainedModel:()=>GM,DFineForObjectDetection:()=>WM,DFineModel:()=>UM,DFinePreTrainedModel:()=>$M,DINOv3ConvNextModel:()=>KM,DINOv3ConvNextPreTrainedModel:()=>QM,DINOv3ViTImageProcessor:()=>XM,DINOv3ViTModel:()=>HM,DINOv3ViTPreTrainedModel:()=>JM,DPTFeatureExtractor:()=>YM,DPTForDepthEstimation:()=>qM,DPTImageProcessor:()=>ZM,DPTModel:()=>ef,DPTPreTrainedModel:()=>tf,DacDecoderModel:()=>sf,DacDecoderOutput:()=>rf,DacEncoderModel:()=>of,DacEncoderOutput:()=>af,DacFeatureExtractor:()=>nf,DacModel:()=>lf,DacPreTrainedModel:()=>cf,DataTypeMap:()=>_f,DebertaForMaskedLM:()=>df,DebertaForQuestionAnswering:()=>uf,DebertaForSequenceClassification:()=>pf,DebertaForTokenClassification:()=>mf,DebertaModel:()=>hf,DebertaPreTrainedModel:()=>Mf,DebertaTokenizer:()=>ff,DebertaV2ForMaskedLM:()=>gf,DebertaV2ForQuestionAnswering:()=>Pf,DebertaV2ForSequenceClassification:()=>Tf,DebertaV2ForTokenClassification:()=>wf,DebertaV2Model:()=>bf,DebertaV2PreTrainedModel:()=>xf,DebertaV2Tokenizer:()=>vf,DecisionTransformerModel:()=>Ef,DecisionTransformerPreTrainedModel:()=>Ff,DeiTFeatureExtractor:()=>Cf,DeiTForImageClassification:()=>kf,DeiTImageProcessor:()=>yf,DeiTModel:()=>Sf,DeiTPreTrainedModel:()=>Af,DepthAnythingForDepthEstimation:()=>Lf,DepthAnythingPreTrainedModel:()=>Df,DepthEstimationPipeline:()=>If,DepthProForDepth
Estimation:()=>Of,DepthProPreTrainedModel:()=>Bf,DetrFeatureExtractor:()=>jf,DetrForObjectDetection:()=>Nf,DetrForSegmentation:()=>Rf,DetrImageProcessor:()=>Vf,DetrModel:()=>zf,DetrObjectDetectionOutput:()=>Gf,DetrPreTrainedModel:()=>Wf,DetrSegmentationOutput:()=>Uf,Dinov2ForImageClassification:()=>$f,Dinov2Model:()=>Kf,Dinov2PreTrainedModel:()=>Qf,Dinov2WithRegistersForImageClassification:()=>Xf,Dinov2WithRegistersModel:()=>Hf,Dinov2WithRegistersPreTrainedModel:()=>Jf,DistilBertForMaskedLM:()=>Yf,DistilBertForQuestionAnswering:()=>qf,DistilBertForSequenceClassification:()=>Zf,DistilBertForTokenClassification:()=>eg,DistilBertModel:()=>tg,DistilBertPreTrainedModel:()=>sg,DistilBertTokenizer:()=>rg,DocumentQuestionAnsweringPipeline:()=>og,DonutFeatureExtractor:()=>ag,DonutImageProcessor:()=>ng,DonutSwinModel:()=>ig,DonutSwinPreTrainedModel:()=>lg,EdgeTamModel:()=>cg,EfficientNetForImageClassification:()=>_g,EfficientNetImageProcessor:()=>dg,EfficientNetModel:()=>ug,EfficientNetPreTrainedModel:()=>pg,ElectraForMaskedLM:()=>mg,ElectraForQuestionAnswering:()=>hg,ElectraForSequenceClassification:()=>Mg,ElectraForTokenClassification:()=>fg,ElectraModel:()=>gg,ElectraPreTrainedModel:()=>Pg,ElectraTokenizer:()=>Tg,EncodecFeatureExtractor:()=>wg,EosTokenCriteria:()=>bg,Ernie4_5ForCausalLM:()=>xg,Ernie4_5Model:()=>vg,Ernie4_5PreTrainedModel:()=>Eg,EsmForMaskedLM:()=>Fg,EsmForSequenceClassification:()=>Cg,EsmForTokenClassification:()=>kg,EsmModel:()=>yg,EsmPreTrainedModel:()=>Sg,EsmTokenizer:()=>Ag,ExaoneForCausalLM:()=>Lg,ExaoneModel:()=>Dg,ExaonePreTrainedModel:()=>Ig,FFT:()=>Og,FalconForCausalLM:()=>Bg,FalconModel:()=>jg,FalconPreTrainedModel:()=>Ng,FalconTokenizer:()=>Rg,FastViTForImageClassification:()=>Vg,FastViTModel:()=>zg,FastViTPreTrainedModel:()=>Gg,FeatureExtractionPipeline:()=>Wg,FeatureExtractor:()=>Ug,FillMaskPipeline:()=>$g,Florence2ForConditionalGeneration:()=>Kg,Florence2PreTrainedModel:()=>Qg,Florence2Processor:()=>Xg,ForcedBOSTokenLogitsProcessor:()=>Hg,For
cedEOSTokenLogitsProcessor:()=>Jg,GLPNFeatureExtractor:()=>Yg,GLPNForDepthEstimation:()=>qg,GLPNModel:()=>Zg,GLPNPreTrainedModel:()=>eP,GPT2LMHeadModel:()=>tP,GPT2Model:()=>sP,GPT2PreTrainedModel:()=>rP,GPT2Tokenizer:()=>oP,GPTBigCodeForCausalLM:()=>aP,GPTBigCodeModel:()=>nP,GPTBigCodePreTrainedModel:()=>iP,GPTJForCausalLM:()=>lP,GPTJModel:()=>cP,GPTJPreTrainedModel:()=>_P,GPTNeoForCausalLM:()=>dP,GPTNeoModel:()=>uP,GPTNeoPreTrainedModel:()=>pP,GPTNeoXForCausalLM:()=>mP,GPTNeoXModel:()=>hP,GPTNeoXPreTrainedModel:()=>MP,GPTNeoXTokenizer:()=>fP,Gemma2ForCausalLM:()=>gP,Gemma2Model:()=>PP,Gemma2PreTrainedModel:()=>TP,Gemma3ForCausalLM:()=>wP,Gemma3Model:()=>bP,Gemma3PreTrainedModel:()=>xP,Gemma3nAudioFeatureExtractor:()=>vP,Gemma3nForConditionalGeneration:()=>EP,Gemma3nPreTrainedModel:()=>FP,Gemma3nProcessor:()=>CP,GemmaForCausalLM:()=>kP,GemmaModel:()=>yP,GemmaPreTrainedModel:()=>SP,GemmaTokenizer:()=>AP,GlmForCausalLM:()=>LP,GlmModel:()=>DP,GlmPreTrainedModel:()=>IP,GraniteForCausalLM:()=>OP,GraniteModel:()=>BP,GraniteMoeHybridForCausalLM:()=>jP,GraniteMoeHybridModel:()=>NP,GraniteMoeHybridPreTrainedModel:()=>RP,GranitePreTrainedModel:()=>VP,Grok1Tokenizer:()=>zP,GroundingDinoForObjectDetection:()=>GP,GroundingDinoImageProcessor:()=>WP,GroundingDinoPreTrainedModel:()=>UP,GroundingDinoProcessor:()=>$P,GroupViTModel:()=>KP,GroupViTPreTrainedModel:()=>QP,HeliumForCausalLM:()=>XP,HeliumModel:()=>HP,HeliumPreTrainedModel:()=>JP,HerbertTokenizer:()=>YP,HieraForImageClassification:()=>qP,HieraModel:()=>ZP,HieraPreTrainedModel:()=>eT,HubertForCTC:()=>tT,HubertForSequenceClassification:()=>sT,HubertModel:()=>rT,HubertPreTrainedModel:()=>oT,IJepaForImageClassification:()=>aT,IJepaModel:()=>nT,IJepaPreTrainedModel:()=>iT,Idefics3ForConditionalGeneration:()=>lT,Idefics3ImageProcessor:()=>cT,Idefics3PreTrainedModel:()=>_T,Idefics3Processor:()=>dT,ImageClassificationPipeline:()=>uT,ImageFeatureExtractionPipeline:()=>pT,ImageFeatureExtractor:()=>mT,ImageMattingOutput:()=>hT,ImagePr
ocessor:()=>MT,ImageSegmentationPipeline:()=>fT,ImageToImagePipeline:()=>gT,ImageToTextPipeline:()=>PT,InterruptableStoppingCriteria:()=>TT,JAISLMHeadModel:()=>wT,JAISModel:()=>bT,JAISPreTrainedModel:()=>xT,JinaCLIPImageProcessor:()=>vT,JinaCLIPModel:()=>ET,JinaCLIPPreTrainedModel:()=>FT,JinaCLIPProcessor:()=>CT,JinaCLIPTextModel:()=>kT,JinaCLIPVisionModel:()=>yT,Lfm2ForCausalLM:()=>ST,Lfm2Model:()=>AT,Lfm2PreTrainedModel:()=>LT,LiteWhisperForConditionalGeneration:()=>DT,Llama4ForCausalLM:()=>IT,Llama4PreTrainedModel:()=>OT,LlamaForCausalLM:()=>BT,LlamaModel:()=>jT,LlamaPreTrainedModel:()=>NT,LlamaTokenizer:()=>RT,LlavaForConditionalGeneration:()=>VT,LlavaOnevisionForConditionalGeneration:()=>zT,LlavaOnevisionImageProcessor:()=>GT,LlavaPreTrainedModel:()=>WT,LlavaProcessor:()=>UT,LlavaQwen2ForCausalLM:()=>$T,LogitsProcessor:()=>KT,LogitsProcessorList:()=>QT,LogitsWarper:()=>XT,LongT5ForConditionalGeneration:()=>HT,LongT5Model:()=>JT,LongT5PreTrainedModel:()=>YT,M2M100ForConditionalGeneration:()=>qT,M2M100Model:()=>ZT,M2M100PreTrainedModel:()=>ew,M2M100Tokenizer:()=>tw,MBart50Tokenizer:()=>sw,MBartForCausalLM:()=>rw,MBartForConditionalGeneration:()=>ow,MBartForSequenceClassification:()=>aw,MBartModel:()=>nw,MBartPreTrainedModel:()=>iw,MBartTokenizer:()=>lw,MPNetForMaskedLM:()=>cw,MPNetForQuestionAnswering:()=>_w,MPNetForSequenceClassification:()=>dw,MPNetForTokenClassification:()=>uw,MPNetModel:()=>pw,MPNetPreTrainedModel:()=>mw,MPNetTokenizer:()=>hw,MT5ForConditionalGeneration:()=>Mw,MT5Model:()=>fw,MT5PreTrainedModel:()=>gw,MarianMTModel:()=>Pw,MarianModel:()=>Tw,MarianPreTrainedModel:()=>ww,MarianTokenizer:()=>bw,Mask2FormerImageProcessor:()=>xw,MaskFormerFeatureExtractor:()=>vw,MaskFormerForInstanceSegmentation:()=>Ew,MaskFormerImageProcessor:()=>Fw,MaskFormerModel:()=>Cw,MaskFormerPreTrainedModel:()=>kw,MaskedLMOutput:()=>yw,MaxLengthCriteria:()=>Sw,Metric3DForDepthEstimation:()=>Aw,Metric3DPreTrainedModel:()=>Lw,Metric3Dv2ForDepthEstimation:()=>Dw,Metric3Dv2Pre
TrainedModel:()=>Iw,MgpstrForSceneTextRecognition:()=>Ow,MgpstrModelOutput:()=>Bw,MgpstrPreTrainedModel:()=>jw,MgpstrProcessor:()=>Nw,MgpstrTokenizer:()=>Rw,MimiDecoderModel:()=>Vw,MimiDecoderOutput:()=>zw,MimiEncoderModel:()=>Gw,MimiEncoderOutput:()=>Ww,MimiModel:()=>Uw,MimiPreTrainedModel:()=>$w,MinLengthLogitsProcessor:()=>Kw,MinNewTokensLengthLogitsProcessor:()=>Qw,Ministral3ForCausalLM:()=>Xw,Ministral3Model:()=>Hw,Ministral3PreTrainedModel:()=>Jw,MinistralForCausalLM:()=>Yw,MinistralModel:()=>qw,MinistralPreTrainedModel:()=>Zw,Mistral3ForConditionalGeneration:()=>eb,MistralForCausalLM:()=>tb,MistralModel:()=>sb,MistralPreTrainedModel:()=>rb,MobileBertForMaskedLM:()=>ob,MobileBertForQuestionAnswering:()=>ab,MobileBertForSequenceClassification:()=>nb,MobileBertModel:()=>ib,MobileBertPreTrainedModel:()=>lb,MobileBertTokenizer:()=>cb,MobileLLMForCausalLM:()=>_b,MobileLLMModel:()=>db,MobileLLMPreTrainedModel:()=>ub,MobileNetV1FeatureExtractor:()=>pb,MobileNetV1ForImageClassification:()=>mb,MobileNetV1ForSemanticSegmentation:()=>hb,MobileNetV1ImageProcessor:()=>Mb,MobileNetV1Model:()=>fb,MobileNetV1PreTrainedModel:()=>gb,MobileNetV2FeatureExtractor:()=>Pb,MobileNetV2ForImageClassification:()=>Tb,MobileNetV2ForSemanticSegmentation:()=>wb,MobileNetV2ImageProcessor:()=>bb,MobileNetV2Model:()=>xb,MobileNetV2PreTrainedModel:()=>vb,MobileNetV3FeatureExtractor:()=>Eb,MobileNetV3ForImageClassification:()=>Fb,MobileNetV3ForSemanticSegmentation:()=>Cb,MobileNetV3ImageProcessor:()=>kb,MobileNetV3Model:()=>yb,MobileNetV3PreTrainedModel:()=>Sb,MobileNetV4FeatureExtractor:()=>Ab,MobileNetV4ForImageClassification:()=>Lb,MobileNetV4ForSemanticSegmentation:()=>Db,MobileNetV4ImageProcessor:()=>Ib,MobileNetV4Model:()=>Ob,MobileNetV4PreTrainedModel:()=>Bb,MobileViTFeatureExtractor:()=>jb,MobileViTForImageClassification:()=>Nb,MobileViTImageProcessor:()=>Rb,MobileViTModel:()=>Vb,MobileViTPreTrainedModel:()=>zb,MobileViTV2ForImageClassification:()=>Gb,MobileViTV2Model:()=>Wb,MobileViTV2P
reTrainedModel:()=>Ub,ModelOutput:()=>$b,ModernBertDecoderForCausalLM:()=>Kb,ModernBertDecoderModel:()=>Qb,ModernBertDecoderPreTrainedModel:()=>Xb,ModernBertForMaskedLM:()=>Hb,ModernBertForSequenceClassification:()=>Jb,ModernBertForTokenClassification:()=>Yb,ModernBertModel:()=>qb,ModernBertPreTrainedModel:()=>Zb,Moondream1ForConditionalGeneration:()=>ex,MoonshineFeatureExtractor:()=>tx,MoonshineForConditionalGeneration:()=>sx,MoonshineModel:()=>rx,MoonshinePreTrainedModel:()=>ox,MoonshineProcessor:()=>ax,MptForCausalLM:()=>nx,MptModel:()=>ix,MptPreTrainedModel:()=>lx,MultiModalityCausalLM:()=>cx,MultiModalityPreTrainedModel:()=>_x,MusicgenForCausalLM:()=>dx,MusicgenForConditionalGeneration:()=>ux,MusicgenModel:()=>px,MusicgenPreTrainedModel:()=>mx,NanoChatForCausalLM:()=>hx,NanoChatModel:()=>Mx,NanoChatPreTrainedModel:()=>fx,NeoBertForMaskedLM:()=>gx,NeoBertForQuestionAnswering:()=>Px,NeoBertForSequenceClassification:()=>Tx,NeoBertForTokenClassification:()=>wx,NeoBertModel:()=>bx,NeoBertPreTrainedModel:()=>xx,NllbTokenizer:()=>vx,NoBadWordsLogitsProcessor:()=>Ex,NoRepeatNGramLogitsProcessor:()=>Fx,NomicBertModel:()=>Cx,NomicBertPreTrainedModel:()=>kx,NougatImageProcessor:()=>yx,NougatTokenizer:()=>Sx,OPTForCausalLM:()=>Ax,OPTModel:()=>Lx,OPTPreTrainedModel:()=>Dx,ObjectDetectionPipeline:()=>Ix,Olmo2ForCausalLM:()=>Ox,Olmo2Model:()=>Bx,Olmo2PreTrainedModel:()=>jx,OlmoForCausalLM:()=>Nx,OlmoModel:()=>Rx,OlmoPreTrainedModel:()=>Vx,OpenELMForCausalLM:()=>zx,OpenELMModel:()=>Gx,OpenELMPreTrainedModel:()=>Wx,OwlViTFeatureExtractor:()=>Ux,OwlViTForObjectDetection:()=>$x,OwlViTImageProcessor:()=>Kx,OwlViTModel:()=>Qx,OwlViTPreTrainedModel:()=>Xx,OwlViTProcessor:()=>Hx,Owlv2ForObjectDetection:()=>Jx,Owlv2ImageProcessor:()=>Yx,Owlv2Model:()=>qx,Owlv2PreTrainedModel:()=>Zx,PaliGemmaForConditionalGeneration:()=>ev,PaliGemmaPreTrainedModel:()=>tv,PaliGemmaProcessor:()=>sv,ParakeetFeatureExtractor:()=>rv,ParakeetForCTC:()=>ov,ParakeetPreTrainedModel:()=>av,PatchTSMixerForPredict
ion:()=>nv,PatchTSMixerModel:()=>iv,PatchTSMixerPreTrainedModel:()=>lv,PatchTSTForPrediction:()=>cv,PatchTSTModel:()=>_v,PatchTSTPreTrainedModel:()=>dv,Phi3ForCausalLM:()=>uv,Phi3Model:()=>pv,Phi3PreTrainedModel:()=>mv,Phi3VForCausalLM:()=>hv,Phi3VImageProcessor:()=>Mv,Phi3VPreTrainedModel:()=>fv,Phi3VProcessor:()=>gv,PhiForCausalLM:()=>Pv,PhiModel:()=>Tv,PhiPreTrainedModel:()=>wv,Pipeline:()=>bv,PixtralImageProcessor:()=>xv,PixtralProcessor:()=>vv,PreTrainedModel:()=>Ev,PreTrainedTokenizer:()=>Fv,PretrainedConfig:()=>Cv,PretrainedMixin:()=>kv,Processor:()=>yv,PvtForImageClassification:()=>Sv,PvtImageProcessor:()=>Av,PvtModel:()=>Lv,PvtPreTrainedModel:()=>Dv,PyAnnoteFeatureExtractor:()=>Iv,PyAnnoteForAudioFrameClassification:()=>Ov,PyAnnoteModel:()=>Bv,PyAnnotePreTrainedModel:()=>jv,PyAnnoteProcessor:()=>Nv,QuestionAnsweringModelOutput:()=>Rv,QuestionAnsweringPipeline:()=>Vv,Qwen2ForCausalLM:()=>zv,Qwen2Model:()=>Gv,Qwen2PreTrainedModel:()=>Wv,Qwen2Tokenizer:()=>Uv,Qwen2VLForConditionalGeneration:()=>$v,Qwen2VLImageProcessor:()=>Kv,Qwen2VLPreTrainedModel:()=>Qv,Qwen2VLProcessor:()=>Xv,Qwen3ForCausalLM:()=>Hv,Qwen3Model:()=>Jv,Qwen3PreTrainedModel:()=>Yv,RFDetrForObjectDetection:()=>qv,RFDetrModel:()=>Zv,RFDetrObjectDetectionOutput:()=>eE,RFDetrPreTrainedModel:()=>tE,RTDetrForObjectDetection:()=>sE,RTDetrImageProcessor:()=>rE,RTDetrModel:()=>oE,RTDetrObjectDetectionOutput:()=>aE,RTDetrPreTrainedModel:()=>nE,RTDetrV2ForObjectDetection:()=>iE,RTDetrV2Model:()=>lE,RTDetrV2ObjectDetectionOutput:()=>cE,RTDetrV2PreTrainedModel:()=>_E,RawAudio:()=>dE,RawImage:()=>uE,RawVideo:()=>pE,RawVideoFrame:()=>mE,RepetitionPenaltyLogitsProcessor:()=>hE,ResNetForImageClassification:()=>ME,ResNetModel:()=>fE,ResNetPreTrainedModel:()=>gE,RoFormerForMaskedLM:()=>PE,RoFormerForQuestionAnswering:()=>TE,RoFormerForSequenceClassification:()=>wE,RoFormerForTokenClassification:()=>bE,RoFormerModel:()=>xE,RoFormerPreTrainedModel:()=>vE,RoFormerTokenizer:()=>EE,RobertaForMaskedLM:()=>FE,RobertaFo
rQuestionAnswering:()=>CE,RobertaForSequenceClassification:()=>kE,RobertaForTokenClassification:()=>yE,RobertaModel:()=>SE,RobertaPreTrainedModel:()=>AE,RobertaTokenizer:()=>LE,Sam2ImageProcessor:()=>DE,Sam2ImageSegmentationOutput:()=>IE,Sam2Model:()=>OE,Sam2PreTrainedModel:()=>BE,Sam2Processor:()=>jE,Sam2VideoProcessor:()=>NE,Sam3ImageProcessor:()=>RE,Sam3TrackerModel:()=>VE,SamImageProcessor:()=>zE,SamImageSegmentationOutput:()=>GE,SamModel:()=>WE,SamPreTrainedModel:()=>UE,SamProcessor:()=>$E,SapiensForDepthEstimation:()=>KE,SapiensForNormalEstimation:()=>QE,SapiensForSemanticSegmentation:()=>XE,SapiensPreTrainedModel:()=>HE,SeamlessM4TFeatureExtractor:()=>JE,SegformerFeatureExtractor:()=>YE,SegformerForImageClassification:()=>qE,SegformerForSemanticSegmentation:()=>ZE,SegformerImageProcessor:()=>eF,SegformerModel:()=>tF,SegformerPreTrainedModel:()=>sF,Seq2SeqLMOutput:()=>rF,SequenceClassifierOutput:()=>oF,SiglipImageProcessor:()=>aF,SiglipModel:()=>nF,SiglipPreTrainedModel:()=>iF,SiglipTextModel:()=>lF,SiglipTokenizer:()=>cF,SiglipVisionModel:()=>_F,SmolLM3ForCausalLM:()=>dF,SmolLM3Model:()=>uF,SmolLM3PreTrainedModel:()=>pF,SmolVLMForConditionalGeneration:()=>mF,SmolVLMImageProcessor:()=>hF,SmolVLMProcessor:()=>MF,SnacDecoderModel:()=>fF,SnacEncoderModel:()=>gF,SnacFeatureExtractor:()=>PF,SnacModel:()=>TF,SnacPreTrainedModel:()=>wF,SpeechT5FeatureExtractor:()=>bF,SpeechT5ForSpeechToText:()=>xF,SpeechT5ForTextToSpeech:()=>vF,SpeechT5HifiGan:()=>EF,SpeechT5Model:()=>FF,SpeechT5PreTrainedModel:()=>CF,SpeechT5Processor:()=>kF,SpeechT5Tokenizer:()=>yF,SqueezeBertForMaskedLM:()=>SF,SqueezeBertForQuestionAnswering:()=>AF,SqueezeBertForSequenceClassification:()=>LF,SqueezeBertModel:()=>DF,SqueezeBertPreTrainedModel:()=>IF,SqueezeBertTokenizer:()=>OF,StableLmForCausalLM:()=>BF,StableLmModel:()=>jF,StableLmPreTrainedModel:()=>NF,Starcoder2ForCausalLM:()=>RF,Starcoder2Model:()=>VF,Starcoder2PreTrainedModel:()=>zF,StoppingCriteria:()=>GF,StoppingCriteriaList:()=>WF,StyleText
ToSpeech2Model:()=>UF,StyleTextToSpeech2PreTrainedModel:()=>$F,SummarizationPipeline:()=>KF,SupertonicForConditionalGeneration:()=>QF,SupertonicPreTrainedModel:()=>XF,SuppressTokensAtBeginLogitsProcessor:()=>HF,Swin2SRForImageSuperResolution:()=>JF,Swin2SRImageProcessor:()=>YF,Swin2SRModel:()=>qF,Swin2SRPreTrainedModel:()=>ZF,SwinForImageClassification:()=>eC,SwinForSemanticSegmentation:()=>tC,SwinModel:()=>sC,SwinPreTrainedModel:()=>rC,T5ForConditionalGeneration:()=>oC,T5Model:()=>aC,T5PreTrainedModel:()=>nC,T5Tokenizer:()=>iC,TableTransformerForObjectDetection:()=>lC,TableTransformerModel:()=>cC,TableTransformerObjectDetectionOutput:()=>_C,TableTransformerPreTrainedModel:()=>dC,TemperatureLogitsWarper:()=>uC,Tensor:()=>pC,Text2TextGenerationPipeline:()=>mC,TextClassificationPipeline:()=>hC,TextGenerationPipeline:()=>MC,TextStreamer:()=>fC,TextToAudioPipeline:()=>gC,TokenClassificationPipeline:()=>PC,TokenClassifierOutput:()=>TC,TokenizerModel:()=>wC,TopKLogitsWarper:()=>bC,TopPLogitsWarper:()=>xC,TrOCRForCausalLM:()=>vC,TrOCRPreTrainedModel:()=>EC,TranslationPipeline:()=>FC,UltravoxModel:()=>CC,UltravoxPreTrainedModel:()=>kC,UltravoxProcessor:()=>yC,UniSpeechForCTC:()=>SC,UniSpeechForSequenceClassification:()=>AC,UniSpeechModel:()=>LC,UniSpeechPreTrainedModel:()=>DC,UniSpeechSatForAudioFrameClassification:()=>IC,UniSpeechSatForCTC:()=>OC,UniSpeechSatForSequenceClassification:()=>BC,UniSpeechSatModel:()=>jC,UniSpeechSatPreTrainedModel:()=>NC,VLChatProcessor:()=>RC,VLMImageProcessor:()=>VC,VaultGemmaForCausalLM:()=>zC,VaultGemmaModel:()=>GC,VaultGemmaPreTrainedModel:()=>WC,ViTFeatureExtractor:()=>UC,ViTForImageClassification:()=>$C,ViTImageProcessor:()=>KC,ViTMAEModel:()=>QC,ViTMAEPreTrainedModel:()=>XC,ViTMSNForImageClassification:()=>HC,ViTMSNModel:()=>JC,ViTMSNPreTrainedModel:()=>YC,ViTModel:()=>qC,ViTPreTrainedModel:()=>ZC,VisionEncoderDecoderModel:()=>ek,VitMatteForImageMatting:()=>tk,VitMatteImageProcessor:()=>sk,VitMattePreTrainedModel:()=>rk,VitPoseForPoseEs
timation:()=>ok,VitPoseImageProcessor:()=>ak,VitPosePreTrainedModel:()=>nk,VitsModel:()=>ik,VitsModelOutput:()=>lk,VitsPreTrainedModel:()=>ck,VitsTokenizer:()=>_k,VoxtralForConditionalGeneration:()=>dk,VoxtralProcessor:()=>uk,Wav2Vec2BertForCTC:()=>pk,Wav2Vec2BertForSequenceClassification:()=>mk,Wav2Vec2BertModel:()=>hk,Wav2Vec2BertPreTrainedModel:()=>Mk,Wav2Vec2CTCTokenizer:()=>fk,Wav2Vec2FeatureExtractor:()=>gk,Wav2Vec2ForAudioFrameClassification:()=>Pk,Wav2Vec2ForCTC:()=>Tk,Wav2Vec2ForSequenceClassification:()=>wk,Wav2Vec2Model:()=>bk,Wav2Vec2PreTrainedModel:()=>xk,Wav2Vec2Processor:()=>vk,Wav2Vec2ProcessorWithLM:()=>Ek,WavLMForAudioFrameClassification:()=>Fk,WavLMForCTC:()=>Ck,WavLMForSequenceClassification:()=>kk,WavLMForXVector:()=>yk,WavLMModel:()=>Sk,WavLMPreTrainedModel:()=>Ak,WeSpeakerFeatureExtractor:()=>Lk,WeSpeakerResNetModel:()=>Dk,WeSpeakerResNetPreTrainedModel:()=>Ik,WhisperFeatureExtractor:()=>Ok,WhisperForConditionalGeneration:()=>Bk,WhisperModel:()=>jk,WhisperPreTrainedModel:()=>Nk,WhisperProcessor:()=>Rk,WhisperTextStreamer:()=>Vk,WhisperTimeStampLogitsProcessor:()=>zk,WhisperTokenizer:()=>Gk,XLMForQuestionAnswering:()=>Wk,XLMForSequenceClassification:()=>Uk,XLMForTokenClassification:()=>$k,XLMModel:()=>Kk,XLMPreTrainedModel:()=>Qk,XLMRobertaForMaskedLM:()=>Xk,XLMRobertaForQuestionAnswering:()=>Hk,XLMRobertaForSequenceClassification:()=>Jk,XLMRobertaForTokenClassification:()=>Yk,XLMRobertaModel:()=>qk,XLMRobertaPreTrainedModel:()=>Zk,XLMRobertaTokenizer:()=>ey,XLMTokenizer:()=>ty,XLMWithLMHeadModel:()=>sy,XVectorOutput:()=>ry,YolosFeatureExtractor:()=>oy,YolosForObjectDetection:()=>ay,YolosImageProcessor:()=>ny,YolosModel:()=>iy,YolosObjectDetectionOutput:()=>ly,YolosPreTrainedModel:()=>cy,ZeroShotAudioClassificationPipeline:()=>_y,ZeroShotClassificationPipeline:()=>dy,ZeroShotImageClassificationPipeline:()=>uy,ZeroShotObjectDetectionPipeline:()=>py,bankers_round:()=>my,cat:()=>hy,cos_sim:()=>My,dot:()=>fy,dynamic_time_warping:()=>gy,env:()=>Py,f
ull:()=>Ty,full_like:()=>wy,getCacheShapes:()=>by,hamming:()=>xy,hanning:()=>vy,interpolate:()=>Ey,interpolate_4d:()=>Fy,interpolate_data:()=>Cy,is_chinese_char:()=>ky,layer_norm:()=>yy,load_image:()=>Sy,load_video:()=>Ay,log_softmax:()=>Ly,magnitude:()=>Dy,matmul:()=>Iy,max:()=>Oy,mean:()=>By,mean_pooling:()=>jy,medianFilter:()=>Ny,mel_filter_bank:()=>Ry,min:()=>Vy,ones:()=>zy,ones_like:()=>Gy,permute:()=>Wy,permute_data:()=>Uy,pipeline:()=>$y,quantize_embeddings:()=>Ky,rand:()=>Qy,randn:()=>Xy,read_audio:()=>Hy,rfft:()=>Jy,round:()=>Yy,slice:()=>qy,softmax:()=>Zy,spectrogram:()=>eS,stack:()=>tS,std_mean:()=>sS,topk:()=>rS,window_function:()=>oS,zeros:()=>aS,zeros_like:()=>nS});function mt(D){var a=Ju[D];if(a!==void 0)return a.exports;var e=Ju[D]={exports:{}};return pm[D](e,e.exports,mt),e.exports}var lm,cm,_m,dm,um,iS,pm,Ju,t,mm,hm,Mm,fm,gm,Pm,Tm,wm,bm,xm,vm,Em,Fm,Cm,km,ym,Sm,Am,Lm,Dm,Im,Om,Bm,jm,Nm,Rm,Vm,zm,Gm,Wm,Um,$m,Km,Qm,Xm,Hm,Jm,Ym,qm,Zm,eh,th,sh,rh,oh,ah,nh,ih,lh,ch,_h,dh,uh,ph,mh,hh,Mh,fh,gh,Ph,Th,wh,bh,xh,vh,Eh,Fh,Ch,kh,yh,Sh,Ah,Lh,Dh,Ih,Oh,Bh,jh,Nh,Rh,Vh,zh,Gh,Wh,Uh,$h,Kh,Qh,Xh,Hh,Jh,Yh,qh,Zh,eM,tM,sM,rM,oM,aM,nM,iM,lM,cM,_M,dM,uM,pM,mM,hM,MM,fM,gM,PM,TM,wM,bM,xM,vM,EM,FM,CM,kM,yM,SM,AM,LM,DM,IM,OM,BM,jM,NM,RM,VM,zM,GM,WM,UM,$M,KM,QM,XM,HM,JM,YM,qM,ZM,ef,tf,sf,rf,of,af,nf,lf,cf,_f,df,uf,pf,mf,hf,Mf,ff,gf,Pf,Tf,wf,bf,xf,vf,Ef,Ff,Cf,kf,yf,Sf,Af,Lf,Df,If,Of,Bf,jf,Nf,Rf,Vf,zf,Gf,Wf,Uf,$f,Kf,Qf,Xf,Hf,Jf,Yf,qf,Zf,eg,tg,sg,rg,og,ag,ng,ig,lg,cg,_g,dg,ug,pg,mg,hg,Mg,fg,gg,Pg,Tg,wg,bg,xg,vg,Eg,Fg,Cg,kg,yg,Sg,Ag,Lg,Dg,Ig,Og,Bg,jg,Ng,Rg,Vg,zg,Gg,Wg,Ug,$g,Kg,Qg,Xg,Hg,Jg,Yg,qg,Zg,eP,tP,sP,rP,oP,aP,nP,iP,lP,cP,_P,dP,uP,pP,mP,hP,MP,fP,gP,PP,TP,wP,bP,xP,vP,EP,FP,CP,kP,yP,SP,AP,LP,DP,IP,OP,BP,jP,NP,RP,VP,zP,GP,WP,UP,$P,KP,QP,XP,HP,JP,YP,qP,ZP,eT,tT,sT,rT,oT,aT,nT,iT,lT,cT,_T,dT,uT,pT,mT,hT,MT,fT,gT,PT,TT,wT,bT,xT,vT,ET,FT,CT,kT,yT,ST,AT,LT,DT,IT,OT,BT,jT,NT,RT,VT,zT,GT,WT,UT,$T,KT,QT,XT,HT,JT,YT,qT,ZT,ew,tw,sw,rw,ow,aw,nw,iw,lw,cw,_w,dw,uw,pw,mw,hw,Mw,fw,gw,Pw,Tw,ww,bw,xw
,vw,Ew,Fw,Cw,kw,yw,Sw,Aw,Lw,Dw,Iw,Ow,Bw,jw,Nw,Rw,Vw,zw,Gw,Ww,Uw,$w,Kw,Qw,Xw,Hw,Jw,Yw,qw,Zw,eb,tb,sb,rb,ob,ab,nb,ib,lb,cb,_b,db,ub,pb,mb,hb,Mb,fb,gb,Pb,Tb,wb,bb,xb,vb,Eb,Fb,Cb,kb,yb,Sb,Ab,Lb,Db,Ib,Ob,Bb,jb,Nb,Rb,Vb,zb,Gb,Wb,Ub,$b,Kb,Qb,Xb,Hb,Jb,Yb,qb,Zb,ex,tx,sx,rx,ox,ax,nx,ix,lx,cx,_x,dx,ux,px,mx,hx,Mx,fx,gx,Px,Tx,wx,bx,xx,vx,Ex,Fx,Cx,kx,yx,Sx,Ax,Lx,Dx,Ix,Ox,Bx,jx,Nx,Rx,Vx,zx,Gx,Wx,Ux,$x,Kx,Qx,Xx,Hx,Jx,Yx,qx,Zx,ev,tv,sv,rv,ov,av,nv,iv,lv,cv,_v,dv,uv,pv,mv,hv,Mv,fv,gv,Pv,Tv,wv,bv,xv,vv,Ev,Fv,Cv,kv,yv,Sv,Av,Lv,Dv,Iv,Ov,Bv,jv,Nv,Rv,Vv,zv,Gv,Wv,Uv,$v,Kv,Qv,Xv,Hv,Jv,Yv,qv,Zv,eE,tE,sE,rE,oE,aE,nE,iE,lE,cE,_E,dE,uE,pE,mE,hE,ME,fE,gE,PE,TE,wE,bE,xE,vE,EE,FE,CE,kE,yE,SE,AE,LE,DE,IE,OE,BE,jE,NE,RE,VE,zE,GE,WE,UE,$E,KE,QE,XE,HE,JE,YE,qE,ZE,eF,tF,sF,rF,oF,aF,nF,iF,lF,cF,_F,dF,uF,pF,mF,hF,MF,fF,gF,PF,TF,wF,bF,xF,vF,EF,FF,CF,kF,yF,SF,AF,LF,DF,IF,OF,BF,jF,NF,RF,VF,zF,GF,WF,UF,$F,KF,QF,XF,HF,JF,YF,qF,ZF,eC,tC,sC,rC,oC,aC,nC,iC,lC,cC,_C,dC,uC,pC,mC,hC,MC,fC,gC,PC,TC,wC,bC,xC,vC,EC,FC,CC,kC,yC,SC,AC,LC,DC,IC,OC,BC,jC,NC,RC,VC,zC,GC,WC,UC,$C,KC,QC,XC,HC,JC,YC,qC,ZC,ek,tk,sk,rk,ok,ak,nk,ik,lk,ck,_k,dk,uk,pk,mk,hk,Mk,fk,gk,Pk,Tk,wk,bk,xk,vk,Ek,Fk,Ck,kk,yk,Sk,Ak,Lk,Dk,Ik,Ok,Bk,jk,Nk,Rk,Vk,zk,Gk,Wk,Uk,$k,Kk,Qk,Xk,Hk,Jk,Yk,qk,Zk,ey,ty,sy,ry,oy,ay,ny,iy,ly,cy,_y,dy,uy,py,my,hy,My,fy,gy,Py,Ty,wy,by,xy,vy,Ey,Fy,Cy,ky,yy,Sy,Ay,Ly,Dy,Iy,Oy,By,jy,Ny,Ry,Vy,zy,Gy,Wy,Uy,$y,Ky,Qy,Xy,Hy,Jy,Yy,qy,Zy,eS,tS,sS,rS,oS,aS,nS,qu=Bt(()=>{lm=dr(require("node:fs"),1),cm=dr(require("node:path"),1),_m=dr(require("node:url"),1);Hu();dm=dr(require("onnxruntime-node"),1),um=dr(require("sharp"),1),iS={},pm={"node:fs":(D=>{D.exports=lm}),"node:path":(D=>{D.exports=cm}),"node:url":(D=>{D.exports=_m}),"onnxruntime-common":(D=>{D.exports=Ka}),"onnxruntime-node":(D=>{D.exports=dm}),sharp:(D=>{D.exports=um}),"?8b6b":(()=>{}),"./node_modules/@huggingface/jinja/dist/index.js":((D,a,e)=>{e.r(a),e.d(a,{Environment:()=>qe,Interpreter:()=>Pt,Template:()=>Os,parse:()=>be,tokenize:()=>_});var 
i=Object.freeze({Text:"Text",NumericLiteral:"NumericLiteral",StringLiteral:"StringLiteral",Identifier:"Identifier",Equals:"Equals",OpenParen:"OpenParen",CloseParen:"CloseParen",OpenStatement:"OpenStatement",CloseStatement:"CloseStatement",OpenExpression:"OpenExpression",CloseExpression:"CloseExpression",OpenSquareBracket:"OpenSquareBracket",CloseSquareBracket:"CloseSquareBracket",OpenCurlyBracket:"OpenCurlyBracket",CloseCurlyBracket:"CloseCurlyBracket",Comma:"Comma",Dot:"Dot",Colon:"Colon",Pipe:"Pipe",CallOperator:"CallOperator",AdditiveBinaryOperator:"AdditiveBinaryOperator",MultiplicativeBinaryOperator:"MultiplicativeBinaryOperator",ComparisonBinaryOperator:"ComparisonBinaryOperator",UnaryOperator:"UnaryOperator",Comment:"Comment"}),d=class{constructor(n,j){this.value=n,this.type=j}};function g(n){return/\w/.test(n)}function I(n){return/[0-9]/.test(n)}function f(n){return/\s/.test(n)}var u=[["{%",i.OpenStatement],["%}",i.CloseStatement],["{{",i.OpenExpression],["}}",i.CloseExpression],["(",i.OpenParen],[")",i.CloseParen],["{",i.OpenCurlyBracket],["}",i.CloseCurlyBracket],["[",i.OpenSquareBracket],["]",i.CloseSquareBracket],[",",i.Comma],[".",i.Dot],[":",i.Colon],["|",i.Pipe],["<=",i.ComparisonBinaryOperator],[">=",i.ComparisonBinaryOperator],["==",i.ComparisonBinaryOperator],["!=",i.ComparisonBinaryOperator],["<",i.ComparisonBinaryOperator],[">",i.ComparisonBinaryOperator],["+",i.AdditiveBinaryOperator],["-",i.AdditiveBinaryOperator],["~",i.AdditiveBinaryOperator],["*",i.MultiplicativeBinaryOperator],["/",i.MultiplicativeBinaryOperator],["%",i.MultiplicativeBinaryOperator],["=",i.Equals]],m=new Map([["n",`
|
|
2
|
+
`],["t"," "],["r","\r"],["b","\b"],["f","\f"],["v","\v"],["'","'"],['"','"'],["\\","\\"]]);function T(n,j={}){return n.endsWith(`
|
|
3
|
+
`)&&(n=n.slice(0,-1)),j.lstrip_blocks&&(n=n.replace(/^[ \t]*({[#%-])/gm,"$1")),j.trim_blocks&&(n=n.replace(/([#%-]})\n/g,"$1")),n.replace(/{%\s*(end)?generation\s*%}/gs,"")}function _(n,j={}){let v=[],O=T(n,j),z=0,Z=0,ue=Oe=>{let st="";for(;Oe(O[z]);){if(O[z]==="\\"){if(++z,z>=O.length)throw new SyntaxError("Unexpected end of input");let We=O[z++],it=m.get(We);if(it===void 0)throw new SyntaxError(`Unexpected escaped character: ${We}`);st+=it;continue}if(st+=O[z++],z>=O.length)throw new SyntaxError("Unexpected end of input")}return st},Ge=()=>{let Oe=v.at(-1);Oe&&Oe.type===i.Text&&(Oe.value=Oe.value.trimEnd(),Oe.value===""&&v.pop())},Je=()=>{for(;z<O.length&&f(O[z]);)++z};e:for(;z<O.length;){let Oe=v.at(-1)?.type;if(Oe===void 0||Oe===i.CloseStatement||Oe===i.CloseExpression||Oe===i.Comment){let We="";for(;z<O.length&&!(O[z]==="{"&&(O[z+1]==="%"||O[z+1]==="{"||O[z+1]==="#"));)We+=O[z++];if(We.length>0){v.push(new d(We,i.Text));continue}}if(O[z]==="{"&&O[z+1]==="#"){z+=2;let We=O[z]==="-";We&&++z;let it="";for(;O[z]!=="#"||O[z+1]!=="}";){if(z+2>=O.length)throw new SyntaxError("Missing end of comment tag");it+=O[z++]}let gt=it.endsWith("-");gt&&(it=it.slice(0,-1)),We&&Ge(),v.push(new d(it,i.Comment)),z+=2,gt&&Je();continue}if(O.slice(z,z+3)==="{%-"){Ge(),v.push(new d("{%",i.OpenStatement)),z+=3;continue}if(O.slice(z,z+3)==="{{-"){Ge(),v.push(new d("{{",i.OpenExpression)),Z=0,z+=3;continue}if(ue(f),O.slice(z,z+3)==="-%}"){v.push(new d("%}",i.CloseStatement)),z+=3,Je();continue}if(O.slice(z,z+3)==="-}}"){v.push(new d("}}",i.CloseExpression)),z+=3,Je();continue}let st=O[z];if(st==="-"||st==="+"){let We=v.at(-1)?.type;if(We===i.Text||We===void 0)throw new SyntaxError(`Unexpected character: ${st}`);switch(We){case i.Identifier:case i.NumericLiteral:case i.StringLiteral:case i.CloseParen:case i.CloseSquareBracket:break;default:{++z;let it=ue(I);v.push(new d(`${st}${it}`,it.length>0?i.NumericLiteral:i.UnaryOperator));continue}}}for(let[We,it]of 
u){if(We==="}}"&&Z>0)continue;if(O.slice(z,z+We.length)===We){v.push(new d(We,it)),it===i.OpenExpression?Z=0:it===i.OpenCurlyBracket?++Z:it===i.CloseCurlyBracket&&--Z,z+=We.length;continue e}}if(st==="'"||st==='"'){++z;let We=ue(it=>it!==st);v.push(new d(We,i.StringLiteral)),++z;continue}if(I(st)){let We=ue(I);if(O[z]==="."&&I(O[z+1])){++z;let it=ue(I);We=`${We}.${it}`}v.push(new d(We,i.NumericLiteral));continue}if(g(st)){let We=ue(g);v.push(new d(We,i.Identifier));continue}throw new SyntaxError(`Unexpected character: ${st}`)}return v}var o=class{type="Statement"},x=class extends o{constructor(n){super(),this.body=n}type="Program"},w=class extends o{constructor(n,j,v){super(),this.test=n,this.body=j,this.alternate=v}type="If"},k=class extends o{constructor(n,j,v,O){super(),this.loopvar=n,this.iterable=j,this.body=v,this.defaultBlock=O}type="For"},G=class extends o{type="Break"},b=class extends o{type="Continue"},C=class extends o{constructor(n,j,v){super(),this.assignee=n,this.value=j,this.body=v}type="Set"},B=class extends o{constructor(n,j,v){super(),this.name=n,this.args=j,this.body=v}type="Macro"},P=class extends o{constructor(n){super(),this.value=n}type="Comment"},M=class extends o{type="Expression"},y=class extends M{constructor(n,j,v){super(),this.object=n,this.property=j,this.computed=v}type="MemberExpression"},l=class extends M{constructor(n,j){super(),this.callee=n,this.args=j}type="CallExpression"},h=class extends M{constructor(n){super(),this.value=n}type="Identifier"},F=class extends M{constructor(n){super(),this.value=n}type="Literal"},S=class extends F{type="IntegerLiteral"},V=class extends F{type="FloatLiteral"},R=class extends F{type="StringLiteral"},N=class extends F{type="ArrayLiteral"},Q=class extends F{type="TupleLiteral"},K=class extends F{type="ObjectLiteral"},J=class extends M{constructor(n,j,v){super(),this.operator=n,this.left=j,this.right=v}type="BinaryExpression"},te=class extends 
M{constructor(n,j){super(),this.operand=n,this.filter=j}type="FilterExpression"},se=class extends o{constructor(n,j){super(),this.filter=n,this.body=j}type="FilterStatement"},ce=class extends M{constructor(n,j){super(),this.lhs=n,this.test=j}type="SelectExpression"},we=class extends M{constructor(n,j,v){super(),this.operand=n,this.negate=j,this.test=v}type="TestExpression"},_e=class extends M{constructor(n,j){super(),this.operator=n,this.argument=j}type="UnaryExpression"},X=class extends M{constructor(n=void 0,j=void 0,v=void 0){super(),this.start=n,this.stop=j,this.step=v}type="SliceExpression"},L=class extends M{constructor(n,j){super(),this.key=n,this.value=j}type="KeywordArgumentExpression"},W=class extends M{constructor(n){super(),this.argument=n}type="SpreadExpression"},Y=class extends o{constructor(n,j,v){super(),this.call=n,this.callerArgs=j,this.body=v}type="CallStatement"},ae=class extends M{constructor(n,j,v){super(),this.condition=n,this.trueExpr=j,this.falseExpr=v}type="Ternary"};function be(n){let j=new x([]),v=0;function O(Fe,Se){let Ke=n[v++];if(!Ke||Ke.type!==Fe)throw new Error(`Parser Error: ${Se}. 
${Ke.type} !== ${Fe}.`);return Ke}function z(Fe){if(!Je(Fe))throw new SyntaxError(`Expected ${Fe}`);++v}function Z(){switch(n[v].type){case i.Comment:return new P(n[v++].value);case i.Text:return Oe();case i.OpenStatement:return st();case i.OpenExpression:return We();default:throw new SyntaxError(`Unexpected token type: ${n[v].type}`)}}function ue(...Fe){return v+Fe.length<=n.length&&Fe.every((Se,Ke)=>Se===n[v+Ke].type)}function Ge(...Fe){return n[v]?.type===i.OpenStatement&&n[v+1]?.type===i.Identifier&&Fe.includes(n[v+1]?.value)}function Je(...Fe){return v+Fe.length<=n.length&&Fe.every((Se,Ke)=>n[v+Ke].type==="Identifier"&&Se===n[v+Ke].value)}function Oe(){return new R(O(i.Text,"Expected text token").value)}function st(){if(O(i.OpenStatement,"Expected opening statement token"),n[v].type!==i.Identifier)throw new SyntaxError(`Unknown statement, got ${n[v].type}`);let Fe=n[v].value,Se;switch(Fe){case"set":++v,Se=it();break;case"if":++v,Se=gt(),O(i.OpenStatement,"Expected {% token"),z("endif"),O(i.CloseStatement,"Expected %} token");break;case"macro":++v,Se=Kt(),O(i.OpenStatement,"Expected {% token"),z("endmacro"),O(i.CloseStatement,"Expected %} token");break;case"for":++v,Se=ss(),O(i.OpenStatement,"Expected {% token"),z("endfor"),O(i.CloseStatement,"Expected %} token");break;case"call":{++v;let Ke=null;ue(i.OpenParen)&&(Ke=ps());let Tt=rs();if(Tt.type!=="Identifier")throw new SyntaxError("Expected identifier following call statement");let Rs=ps();O(i.CloseStatement,"Expected closing statement token");let Fs=[];for(;!Ge("endcall");)Fs.push(Z());O(i.OpenStatement,"Expected '{%'"),z("endcall"),O(i.CloseStatement,"Expected closing statement token");let Vs=new l(Tt,Rs);Se=new Y(Vs,Ke,Fs);break}case"break":++v,O(i.CloseStatement,"Expected closing statement token"),Se=new G;break;case"continue":++v,O(i.CloseStatement,"Expected closing statement token"),Se=new b;break;case"filter":{++v;let Ke=rs();Ke instanceof h&&ue(i.OpenParen)&&(Ke=ls(Ke)),O(i.CloseStatement,"Expected 
closing statement token");let Tt=[];for(;!Ge("endfilter");)Tt.push(Z());O(i.OpenStatement,"Expected '{%'"),z("endfilter"),O(i.CloseStatement,"Expected '%}'"),Se=new se(Ke,Tt);break}default:throw new SyntaxError(`Unknown statement type: ${Fe}`)}return Se}function We(){O(i.OpenExpression,"Expected opening expression token");let Fe=Qt();return O(i.CloseExpression,"Expected closing expression token"),Fe}function it(){let Fe=Nt(),Se=null,Ke=[];if(ue(i.Equals))++v,Se=Nt();else{for(O(i.CloseStatement,"Expected %} token");!Ge("endset");)Ke.push(Z());O(i.OpenStatement,"Expected {% token"),z("endset")}return O(i.CloseStatement,"Expected closing statement token"),new C(Fe,Se,Ke)}function gt(){let Fe=Qt();O(i.CloseStatement,"Expected closing statement token");let Se=[],Ke=[];for(;!Ge("elif","else","endif");)Se.push(Z());if(Ge("elif")){++v,++v;let Tt=gt();Ke.push(Tt)}else if(Ge("else"))for(++v,++v,O(i.CloseStatement,"Expected closing statement token");!Ge("endif");)Ke.push(Z());return new w(Fe,Se,Ke)}function Kt(){let Fe=rs();if(Fe.type!=="Identifier")throw new SyntaxError("Expected identifier following macro statement");let Se=ps();O(i.CloseStatement,"Expected closing statement token");let Ke=[];for(;!Ge("endmacro");)Ke.push(Z());return new B(Fe,Se,Ke)}function Nt(Fe=!1){let Se=Fe?rs:Qt,Ke=[Se()],Tt=ue(i.Comma);for(;Tt&&(++v,Ke.push(Se()),!!ue(i.Comma)););return Tt?new Q(Ke):Ke[0]}function ss(){let Fe=Nt(!0);if(!(Fe instanceof h||Fe instanceof Q))throw new SyntaxError(`Expected identifier/tuple for the loop variable, got ${Fe.type} instead`);if(!Je("in"))throw new SyntaxError("Expected `in` keyword following loop variable");++v;let Se=Qt();O(i.CloseStatement,"Expected closing statement token");let Ke=[];for(;!Ge("endfor","else");)Ke.push(Z());let Tt=[];if(Ge("else"))for(++v,++v,O(i.CloseStatement,"Expected closing statement token");!Ge("endfor");)Tt.push(Z());return new k(Fe,Se,Ke,Tt)}function Qt(){return Ps()}function Ps(){let Fe=Ts();if(Je("if")){++v;let 
Se=Ts();if(Je("else")){++v;let Ke=Ps();return new ae(Se,Fe,Ke)}else return new ce(Fe,Se)}return Fe}function Ts(){let Fe=ws();for(;Je("or");){let Se=n[v];++v;let Ke=ws();Fe=new J(Se,Fe,Ke)}return Fe}function ws(){let Fe=os();for(;Je("and");){let Se=n[v];++v;let Ke=os();Fe=new J(Se,Fe,Ke)}return Fe}function os(){let Fe;for(;Je("not");){let Se=n[v];++v;let Ke=os();Fe=new _e(Se,Ke)}return Fe??Bs()}function Bs(){let Fe=bs();for(;;){let Se;if(Je("not","in"))Se=new d("not in",i.Identifier),v+=2;else if(Je("in"))Se=n[v++];else if(ue(i.ComparisonBinaryOperator))Se=n[v++];else break;let Ke=bs();Fe=new J(Se,Fe,Ke)}return Fe}function bs(){let Fe=vs();for(;ue(i.AdditiveBinaryOperator);){let Se=n[v];++v;let Ke=vs();Fe=new J(Se,Fe,Ke)}return Fe}function js(){let Fe=xs(rs());return ue(i.OpenParen)?ls(Fe):Fe}function ls(Fe){let Se=new l(Fe,ps());return Se=xs(Se),ue(i.OpenParen)&&(Se=ls(Se)),Se}function ps(){O(i.OpenParen,"Expected opening parenthesis for arguments list");let Fe=ms();return O(i.CloseParen,"Expected closing parenthesis for arguments list"),Fe}function ms(){let Fe=[];for(;!ue(i.CloseParen);){let Se;if(n[v].type===i.MultiplicativeBinaryOperator&&n[v].value==="*"){++v;let Ke=Qt();Se=new W(Ke)}else if(Se=Qt(),ue(i.Equals)){if(++v,!(Se instanceof h))throw new SyntaxError("Expected identifier for keyword argument");let Ke=Qt();Se=new L(Se,Ke)}Fe.push(Se),ue(i.Comma)&&++v}return Fe}function Ns(){let Fe=[],Se=!1;for(;!ue(i.CloseSquareBracket);)ue(i.Colon)?(Fe.push(void 0),++v,Se=!0):(Fe.push(Qt()),ue(i.Colon)&&(++v,Se=!0));if(Fe.length===0)throw new SyntaxError("Expected at least one argument for member/slice expression");if(Se){if(Fe.length>3)throw new SyntaxError("Expected 0-3 arguments for slice expression");return new X(...Fe)}return Fe[0]}function xs(Fe){for(;ue(i.Dot)||ue(i.OpenSquareBracket);){let Se=n[v];++v;let Ke,Tt=Se.type===i.OpenSquareBracket;if(Tt)Ke=Ns(),O(i.CloseSquareBracket,"Expected closing square bracket");else if(Ke=rs(),Ke.type!=="Identifier")throw new 
SyntaxError("Expected identifier following dot operator");Fe=new y(Fe,Ke,Tt)}return Fe}function vs(){let Fe=Es();for(;ue(i.MultiplicativeBinaryOperator);){let Se=n[v++],Ke=Es();Fe=new J(Se,Fe,Ke)}return Fe}function Es(){let Fe=hs();for(;Je("is");){++v;let Se=Je("not");Se&&++v;let Ke=rs();if(!(Ke instanceof h))throw new SyntaxError("Expected identifier for the test");Fe=new we(Fe,Se,Ke)}return Fe}function hs(){let Fe=js();for(;ue(i.Pipe);){++v;let Se=rs();if(!(Se instanceof h))throw new SyntaxError("Expected identifier for the filter");ue(i.OpenParen)&&(Se=ls(Se)),Fe=new te(Fe,Se)}return Fe}function rs(){let Fe=n[v++];switch(Fe.type){case i.NumericLiteral:{let Se=Fe.value;return Se.includes(".")?new V(Number(Se)):new S(Number(Se))}case i.StringLiteral:{let Se=Fe.value;for(;ue(i.StringLiteral);)Se+=n[v++].value;return new R(Se)}case i.Identifier:return new h(Fe.value);case i.OpenParen:{let Se=Nt();return O(i.CloseParen,"Expected closing parenthesis, got ${tokens[current].type} instead."),Se}case i.OpenSquareBracket:{let Se=[];for(;!ue(i.CloseSquareBracket);)Se.push(Qt()),ue(i.Comma)&&++v;return++v,new N(Se)}case i.OpenCurlyBracket:{let Se=new Map;for(;!ue(i.CloseCurlyBracket);){let Ke=Qt();O(i.Colon,"Expected colon between key and value in object literal");let Tt=Qt();Se.set(Ke,Tt),ue(i.Comma)&&++v}return++v,new K(Se)}default:throw new SyntaxError(`Unexpected token: ${Fe.type}`)}}for(;v<n.length;)j.body.push(Z());return j}function xe(n,j,v=1){j===void 0&&(j=n,n=0);let O=[];for(let z=n;z<j;z+=v)O.push(z);return O}function Le(n,j,v,O=1){let z=Math.sign(O);z>=0?(j=(j??=0)<0?Math.max(n.length+j,0):Math.min(j,n.length),v=(v??=n.length)<0?Math.max(n.length+v,0):Math.min(v,n.length)):(j=(j??=n.length-1)<0?Math.max(n.length+j,-1):Math.min(j,n.length-1),v=(v??=-1)<-1?Math.max(n.length+v,-1):Math.min(v,n.length-1));let Z=[];for(let ue=j;z*ue<z*v;ue+=O)Z.push(n[ue]);return Z}function $e(n){return n.replace(/\b\w/g,j=>j.toUpperCase())}function ge(n){return p(new Date,n)}function 
p(n,j){let v=new Intl.DateTimeFormat(void 0,{month:"long"}),O=new Intl.DateTimeFormat(void 0,{month:"short"}),z=Z=>Z<10?"0"+Z:Z.toString();return j.replace(/%[YmdbBHM%]/g,Z=>{switch(Z){case"%Y":return n.getFullYear().toString();case"%m":return z(n.getMonth()+1);case"%d":return z(n.getDate());case"%b":return O.format(n);case"%B":return v.format(n);case"%H":return z(n.getHours());case"%M":return z(n.getMinutes());case"%%":return"%";default:return Z}})}function q(n){return n.replace(/[.*+?^${}()|[\]\\]/g,"\\$&")}function de(n,j,v,O){if(O===0)return n;let z=O==null||O<0?1/0:O,Z=j.length===0?new RegExp("(?=)","gu"):new RegExp(q(j),"gu");return n.replaceAll(Z,ue=>z>0?(--z,v):ue)}var pe=class extends Error{},Te=class extends Error{},me=class{type="RuntimeValue";value;builtins=new Map;constructor(n=void 0){this.value=n}__bool__(){return new he(!!this.value)}toString(){return String(this.value)}},ne=class extends me{type="IntegerValue"},fe=class extends me{type="FloatValue";toString(){return this.value%1===0?this.value.toFixed(1):this.value.toString()}},le=class extends me{type="StringValue";builtins=new Map([["upper",new Be(()=>new le(this.value.toUpperCase()))],["lower",new Be(()=>new le(this.value.toLowerCase()))],["strip",new Be(()=>new le(this.value.trim()))],["title",new Be(()=>new le($e(this.value)))],["capitalize",new Be(()=>new le(this.value.charAt(0).toUpperCase()+this.value.slice(1)))],["length",new ne(this.value.length)],["rstrip",new Be(()=>new le(this.value.trimEnd()))],["lstrip",new Be(()=>new le(this.value.trimStart()))],["startswith",new Be(n=>{if(n.length===0)throw new Error("startswith() requires at least one argument");let j=n[0];if(j instanceof le)return new he(this.value.startsWith(j.value));if(j instanceof Ce){for(let v of j.value){if(!(v instanceof le))throw new Error("startswith() tuple elements must be strings");if(this.value.startsWith(v.value))return new he(!0)}return new he(!1)}throw new Error("startswith() argument must be a string or tuple of 
strings")})],["endswith",new Be(n=>{if(n.length===0)throw new Error("endswith() requires at least one argument");let j=n[0];if(j instanceof le)return new he(this.value.endsWith(j.value));if(j instanceof Ce){for(let v of j.value){if(!(v instanceof le))throw new Error("endswith() tuple elements must be strings");if(this.value.endsWith(v.value))return new he(!0)}return new he(!1)}throw new Error("endswith() argument must be a string or tuple of strings")})],["split",new Be(n=>{let j=n[0]??new Re;if(!(j instanceof le||j instanceof Re))throw new Error("sep argument must be a string or null");let v=n[1]??new ne(-1);if(!(v instanceof ne))throw new Error("maxsplit argument must be a number");let O=[];if(j instanceof Re){let z=this.value.trimStart();for(let{0:Z,index:ue}of z.matchAll(/\S+/g)){if(v.value!==-1&&O.length>=v.value&&ue!==void 0){O.push(Z+z.slice(ue+Z.length));break}O.push(Z)}}else{if(j.value==="")throw new Error("empty separator");O=this.value.split(j.value),v.value!==-1&&O.length>v.value&&O.push(O.splice(v.value).join(j.value))}return new Ce(O.map(z=>new le(z)))})],["replace",new Be(n=>{if(n.length<2)throw new Error("replace() requires at least two arguments");let j=n[0],v=n[1];if(!(j instanceof le&&v instanceof le))throw new Error("replace() arguments must be strings");let O;if(n.length>2?n[2].type==="KeywordArgumentsValue"?O=n[2].value.get("count")??new Re:O=n[2]:O=new Re,!(O instanceof ne||O instanceof Re))throw new Error("replace() count argument must be a number or null");return new le(de(this.value,j.value,v.value,O.value))})]])},he=class extends me{type="BooleanValue"};function De(n,j,v,O=!0){let z=v??0;switch(n.type){case"NullValue":return"null";case"UndefinedValue":return O?"null":"undefined";case"IntegerValue":case"FloatValue":case"StringValue":case"BooleanValue":return JSON.stringify(n.value);case"ArrayValue":case"ObjectValue":{let Z=j?" ".repeat(j):"",ue=`
`+Z.repeat(z),Ge=ue+Z;if(n.type==="ArrayValue"){let Je=n.value.map(Oe=>De(Oe,j,z+1,O));return j?`[${Ge}${Je.join(`,${Ge}`)}${ue}]`:`[${Je.join(", ")}]`}else{let Je=Array.from(n.value.entries()).map(([Oe,st])=>{let We=`"${Oe}": ${De(st,j,z+1,O)}`;return j?`${Ge}${We}`:We});return j?`{${Je.join(",")}${ue}}`:`{${Je.join(", ")}}`}}default:throw new Error(`Cannot convert to JSON: ${n.type}`)}}var ve=class extends me{type="ObjectValue";__bool__(){return new he(this.value.size>0)}builtins=new Map([["get",new Be(([n,j])=>{if(!(n instanceof le))throw new Error(`Object key must be a string: got ${n.type}`);return this.value.get(n.value)??j??new Re})],["items",new Be(()=>this.items())],["keys",new Be(()=>this.keys())],["values",new Be(()=>this.values())],["dictsort",new Be(n=>{let j=new Map,v=n.filter(Ge=>Ge instanceof ye?(j=Ge.value,!1):!0),O=v.at(0)??j.get("case_sensitive")??new he(!1);if(!(O instanceof he))throw new Error("case_sensitive must be a boolean");let z=v.at(1)??j.get("by")??new le("key");if(!(z instanceof le))throw new Error("by must be a string");if(!["key","value"].includes(z.value))throw new Error("by must be either 'key' or 'value'");let Z=v.at(2)??j.get("reverse")??new he(!1);if(!(Z instanceof he))throw new Error("reverse must be a boolean");let ue=Array.from(this.value.entries()).map(([Ge,Je])=>new Ce([new le(Ge),Je])).sort((Ge,Je)=>{let Oe=z.value==="key"?0:1,st=Ge.value[Oe],We=Je.value[Oe],it=ut(st,We,O.value);return Z.value?-it:it});return new Ce(ue)})]]);items(){return new Ce(Array.from(this.value.entries()).map(([n,j])=>new Ce([new le(n),j])))}keys(){return new Ce(Array.from(this.value.keys()).map(n=>new le(n)))}values(){return new Ce(Array.from(this.value.values()))}toString(){return De(this,null,0,!1)}},ye=class extends ve{type="KeywordArgumentsValue"},Ce=class extends me{type="ArrayValue";builtins=new Map([["length",new ne(this.value.length)]]);__bool__(){return new he(this.value.length>0)}toString(){return De(this,null,0,!1)}},Qe=class extends 
Ce{type="TupleValue"},Be=class extends me{type="FunctionValue"},Re=class extends me{type="NullValue"},ke=class extends me{type="UndefinedValue"},qe=class{constructor(n){this.parent=n}variables=new Map([["namespace",new Be(n=>{if(n.length===0)return new ve(new Map);if(n.length!==1||!(n[0]instanceof ve))throw new Error("`namespace` expects either zero arguments or a single object argument");return n[0]})]]);tests=new Map([["boolean",n=>n.type==="BooleanValue"],["callable",n=>n instanceof Be],["odd",n=>{if(!(n instanceof ne))throw new Error(`cannot odd on ${n.type}`);return n.value%2!==0}],["even",n=>{if(!(n instanceof ne))throw new Error(`cannot even on ${n.type}`);return n.value%2===0}],["false",n=>n.type==="BooleanValue"&&!n.value],["true",n=>n.type==="BooleanValue"&&n.value],["none",n=>n.type==="NullValue"],["string",n=>n.type==="StringValue"],["number",n=>n instanceof ne||n instanceof fe],["integer",n=>n instanceof ne],["iterable",n=>n.type==="ArrayValue"||n.type==="StringValue"],["mapping",n=>n.type==="ObjectValue"],["lower",n=>{let j=n.value;return n.type==="StringValue"&&j===j.toLowerCase()}],["upper",n=>{let j=n.value;return n.type==="StringValue"&&j===j.toUpperCase()}],["none",n=>n.type==="NullValue"],["defined",n=>n.type!=="UndefinedValue"],["undefined",n=>n.type==="UndefinedValue"],["equalto",(n,j)=>n.value===j.value],["eq",(n,j)=>n.value===j.value]]);set(n,j){return this.declareVariable(n,jt(j))}declareVariable(n,j){if(this.variables.has(n))throw new SyntaxError(`Variable already declared: ${n}`);return this.variables.set(n,j),j}setVariable(n,j){return this.variables.set(n,j),j}resolve(n){if(this.variables.has(n))return this;if(this.parent)return this.parent.resolve(n);throw new Error(`Unknown variable: ${n}`)}lookupVariable(n){try{return this.resolve(n).variables.get(n)??new ke}catch{return new ke}}};function je(n){n.set("false",!1),n.set("true",!0),n.set("none",null),n.set("raise_exception",j=>{throw new 
Error(j)}),n.set("range",xe),n.set("strftime_now",ge),n.set("True",!0),n.set("False",!1),n.set("None",null)}function nt(n,j){let v=j.split("."),O=n;for(let z of v)if(O instanceof ve)O=O.value.get(z)??new ke;else if(O instanceof Ce){let Z=parseInt(z,10);if(!isNaN(Z)&&Z>=0&&Z<O.value.length)O=O.value[Z];else return new ke}else return new ke;return O}function ut(n,j,v=!1){if(n instanceof Re&&j instanceof Re)return 0;if(n instanceof Re||j instanceof Re)throw new Error(`Cannot compare ${n.type} with ${j.type}`);if(n instanceof ke&&j instanceof ke)return 0;if(n instanceof ke||j instanceof ke)throw new Error(`Cannot compare ${n.type} with ${j.type}`);let O=Z=>Z instanceof ne||Z instanceof fe||Z instanceof he,z=Z=>Z instanceof he?Z.value?1:0:Z.value;if(O(n)&&O(j)){let Z=z(n),ue=z(j);return Z<ue?-1:Z>ue?1:0}if(n.type!==j.type)throw new Error(`Cannot compare different types: ${n.type} and ${j.type}`);switch(n.type){case"StringValue":{let Z=n.value,ue=j.value;return v||(Z=Z.toLowerCase(),ue=ue.toLowerCase()),Z<ue?-1:Z>ue?1:0}default:throw new Error(`Cannot compare type: ${n.type}`)}}var Pt=class{global;constructor(n){this.global=n??new qe}run(n){return this.evaluate(n,this.global)}evaluateBinaryExpression(n,j){let v=this.evaluate(n.left,j);switch(n.operator.value){case"and":return v.__bool__().value?this.evaluate(n.right,j):v;case"or":return v.__bool__().value?v:this.evaluate(n.right,j)}let O=this.evaluate(n.right,j);switch(n.operator.value){case"==":return new he(v.value==O.value);case"!=":return new he(v.value!=O.value)}if(v instanceof ke||O instanceof ke){if(O instanceof ke&&["in","not in"].includes(n.operator.value))return new he(n.operator.value==="not in");throw new Error(`Cannot perform operation ${n.operator.value} on undefined values`)}else{if(v instanceof Re||O instanceof Re)throw new Error("Cannot perform operation on null values");if(n.operator.value==="~")return new le(v.value.toString()+O.value.toString());if((v instanceof ne||v instanceof fe)&&(O instanceof 
ne||O instanceof fe)){let z=v.value,Z=O.value;switch(n.operator.value){case"+":case"-":case"*":{let ue=n.operator.value==="+"?z+Z:n.operator.value==="-"?z-Z:z*Z;return v instanceof fe||O instanceof fe?new fe(ue):new ne(ue)}case"/":return new fe(z/Z);case"%":{let ue=z%Z;return v instanceof fe||O instanceof fe?new fe(ue):new ne(ue)}case"<":return new he(z<Z);case">":return new he(z>Z);case">=":return new he(z>=Z);case"<=":return new he(z<=Z)}}else if(v instanceof Ce&&O instanceof Ce)switch(n.operator.value){case"+":return new Ce(v.value.concat(O.value))}else if(O instanceof Ce){let z=O.value.find(Z=>Z.value===v.value)!==void 0;switch(n.operator.value){case"in":return new he(z);case"not in":return new he(!z)}}}if(v instanceof le||O instanceof le)switch(n.operator.value){case"+":return new le(v.value.toString()+O.value.toString())}if(v instanceof le&&O instanceof le)switch(n.operator.value){case"in":return new he(O.value.includes(v.value));case"not in":return new he(!O.value.includes(v.value))}if(v instanceof le&&O instanceof ve)switch(n.operator.value){case"in":return new he(O.value.has(v.value));case"not in":return new he(!O.value.has(v.value))}throw new SyntaxError(`Unknown operator "${n.operator.value}" between ${v.type} and ${O.type}`)}evaluateArguments(n,j){let v=[],O=new Map;for(let z of n)if(z.type==="SpreadExpression"){let Z=z,ue=this.evaluate(Z.argument,j);if(!(ue instanceof Ce))throw new Error(`Cannot unpack non-iterable type: ${ue.type}`);for(let Ge of ue.value)v.push(Ge)}else if(z.type==="KeywordArgumentExpression"){let Z=z;O.set(Z.key.value,this.evaluate(Z.value,j))}else{if(O.size>0)throw new Error("Positional arguments must come before keyword arguments");v.push(this.evaluate(z,j))}return[v,O]}applyFilter(n,j,v){if(j.type==="Identifier"){let O=j;if(O.value==="tojson")return new le(De(n));if(n instanceof Ce)switch(O.value){case"list":return n;case"first":return n.value[0];case"last":return n.value[n.value.length-1];case"length":return new 
ne(n.value.length);case"reverse":return new Ce(n.value.slice().reverse());case"sort":return new Ce(n.value.slice().sort((z,Z)=>ut(z,Z,!1)));case"join":return new le(n.value.map(z=>z.value).join(""));case"string":return new le(De(n,null,0,!1));case"unique":{let z=new Set,Z=[];for(let ue of n.value)z.has(ue.value)||(z.add(ue.value),Z.push(ue));return new Ce(Z)}default:throw new Error(`Unknown ArrayValue filter: ${O.value}`)}else if(n instanceof le)switch(O.value){case"length":case"upper":case"lower":case"title":case"capitalize":{let z=n.builtins.get(O.value);if(z instanceof Be)return z.value([],v);if(z instanceof ne)return z;throw new Error(`Unknown StringValue filter: ${O.value}`)}case"trim":return new le(n.value.trim());case"indent":return new le(n.value.split(`
|
|
5
|
+
`).map((z,Z)=>Z===0||z.length===0?z:" "+z).join(`
|
|
6
|
+
`));case"join":case"string":return n;case"int":{let z=parseInt(n.value,10);return new ne(isNaN(z)?0:z)}case"float":{let z=parseFloat(n.value);return new fe(isNaN(z)?0:z)}default:throw new Error(`Unknown StringValue filter: ${O.value}`)}else if(n instanceof ne||n instanceof fe)switch(O.value){case"abs":return n instanceof ne?new ne(Math.abs(n.value)):new fe(Math.abs(n.value));case"int":return new ne(Math.floor(n.value));case"float":return new fe(n.value);default:throw new Error(`Unknown NumericValue filter: ${O.value}`)}else if(n instanceof ve)switch(O.value){case"items":return new Ce(Array.from(n.value.entries()).map(([z,Z])=>new Ce([new le(z),Z])));case"length":return new ne(n.value.size);default:{let z=n.builtins.get(O.value);if(z)return z instanceof Be?z.value([],v):z;throw new Error(`Unknown ObjectValue filter: ${O.value}`)}}else if(n instanceof he)switch(O.value){case"bool":return new he(n.value);case"int":return new ne(n.value?1:0);case"float":return new fe(n.value?1:0);case"string":return new le(n.value?"true":"false");default:throw new Error(`Unknown BooleanValue filter: ${O.value}`)}throw new Error(`Cannot apply filter "${O.value}" to type: ${n.type}`)}else if(j.type==="CallExpression"){let O=j;if(O.callee.type!=="Identifier")throw new Error(`Unknown filter: ${O.callee.type}`);let z=O.callee.value;if(z==="tojson"){let[,Z]=this.evaluateArguments(O.args,v),ue=Z.get("indent")??new Re;if(!(ue instanceof ne||ue instanceof Re))throw new Error("If set, indent must be a number");return new le(De(n,ue.value))}else if(z==="join"){let Z;if(n instanceof le)Z=Array.from(n.value);else if(n instanceof Ce)Z=n.value.map(Oe=>Oe.value);else throw new Error(`Cannot apply filter "${z}" to type: ${n.type}`);let[ue,Ge]=this.evaluateArguments(O.args,v),Je=ue.at(0)??Ge.get("separator")??new le("");if(!(Je instanceof le))throw new Error("separator must be a string");return new le(Z.join(Je.value))}else 
if(z==="int"||z==="float"){let[Z,ue]=this.evaluateArguments(O.args,v),Ge=Z.at(0)??ue.get("default")??(z==="int"?new ne(0):new fe(0));if(n instanceof le){let Je=z==="int"?parseInt(n.value,10):parseFloat(n.value);return isNaN(Je)?Ge:z==="int"?new ne(Je):new fe(Je)}else{if(n instanceof ne||n instanceof fe)return n;if(n instanceof he)return z==="int"?new ne(n.value?1:0):new fe(n.value?1:0);throw new Error(`Cannot apply filter "${z}" to type: ${n.type}`)}}else if(z==="default"){let[Z,ue]=this.evaluateArguments(O.args,v),Ge=Z[0]??new le(""),Je=Z[1]??ue.get("boolean")??new he(!1);if(!(Je instanceof he))throw new Error("`default` filter flag must be a boolean");return n instanceof ke||Je.value&&!n.__bool__().value?Ge:n}if(n instanceof Ce){switch(z){case"sort":{let[Z,ue]=this.evaluateArguments(O.args,v),Ge=Z.at(0)??ue.get("reverse")??new he(!1);if(!(Ge instanceof he))throw new Error("reverse must be a boolean");let Je=Z.at(1)??ue.get("case_sensitive")??new he(!1);if(!(Je instanceof he))throw new Error("case_sensitive must be a boolean");let Oe=Z.at(2)??ue.get("attribute")??new Re;if(!(Oe instanceof le||Oe instanceof ne||Oe instanceof Re))throw new Error("attribute must be a string, integer, or null");let st=We=>{if(Oe instanceof Re)return We;let it=Oe instanceof ne?String(Oe.value):Oe.value;return nt(We,it)};return new Ce(n.value.slice().sort((We,it)=>{let gt=st(We),Kt=st(it),Nt=ut(gt,Kt,Je.value);return Ge.value?-Nt:Nt}))}case"selectattr":case"rejectattr":{let Z=z==="selectattr";if(n.value.some(We=>!(We instanceof ve)))throw new Error(`\`${z}\` can only be applied to array of objects`);if(O.args.some(We=>We.type!=="StringLiteral"))throw new Error(`arguments of \`${z}\` must be strings`);let[ue,Ge,Je]=O.args.map(We=>this.evaluate(We,v)),Oe;if(Ge){let We=v.tests.get(Ge.value);if(!We)throw new Error(`Unknown test: ${Ge.value}`);Oe=We}else Oe=(...We)=>We[0].__bool__().value;let st=n.value.filter(We=>{let it=We.value.get(ue.value),gt=it?Oe(it,Je):!1;return Z?gt:!gt});return new 
Ce(st)}case"map":{let[,Z]=this.evaluateArguments(O.args,v);if(Z.has("attribute")){let ue=Z.get("attribute");if(!(ue instanceof le))throw new Error("attribute must be a string");let Ge=Z.get("default"),Je=n.value.map(Oe=>{if(!(Oe instanceof ve))throw new Error("items in map must be an object");let st=nt(Oe,ue.value);return st instanceof ke?Ge??new ke:st});return new Ce(Je)}else throw new Error("`map` expressions without `attribute` set are not currently supported.")}}throw new Error(`Unknown ArrayValue filter: ${z}`)}else if(n instanceof le){switch(z){case"indent":{let[Z,ue]=this.evaluateArguments(O.args,v),Ge=Z.at(0)??ue.get("width")??new ne(4);if(!(Ge instanceof ne))throw new Error("width must be a number");let Je=Z.at(1)??ue.get("first")??new he(!1),Oe=Z.at(2)??ue.get("blank")??new he(!1),st=n.value.split(`
|
|
7
|
+
`),We=" ".repeat(Ge.value),it=st.map((gt,Kt)=>!Je.value&&Kt===0||!Oe.value&>.length===0?gt:We+gt);return new le(it.join(`
|
|
8
|
+
`))}case"replace":{let Z=n.builtins.get("replace");if(!(Z instanceof Be))throw new Error("replace filter not available");let[ue,Ge]=this.evaluateArguments(O.args,v);return Z.value([...ue,new ye(Ge)],v)}}throw new Error(`Unknown StringValue filter: ${z}`)}else if(n instanceof ve){let Z=n.builtins.get(z);if(Z&&Z instanceof Be){let[ue,Ge]=this.evaluateArguments(O.args,v);return Ge.size>0&&ue.push(new ye(Ge)),Z.value(ue,v)}throw new Error(`Unknown ObjectValue filter: ${z}`)}else throw new Error(`Cannot apply filter "${z}" to type: ${n.type}`)}throw new Error(`Unknown filter: ${j.type}`)}evaluateFilterExpression(n,j){let v=this.evaluate(n.operand,j);return this.applyFilter(v,n.filter,j)}evaluateTestExpression(n,j){let v=this.evaluate(n.operand,j),O=j.tests.get(n.test.value);if(!O)throw new Error(`Unknown test: ${n.test.value}`);let z=O(v);return new he(n.negate?!z:z)}evaluateSelectExpression(n,j){return this.evaluate(n.test,j).__bool__().value?this.evaluate(n.lhs,j):new ke}evaluateUnaryExpression(n,j){let v=this.evaluate(n.argument,j);switch(n.operator.value){case"not":return new he(!v.value);default:throw new SyntaxError(`Unknown operator: ${n.operator.value}`)}}evaluateTernaryExpression(n,j){return this.evaluate(n.condition,j).__bool__().value?this.evaluate(n.trueExpr,j):this.evaluate(n.falseExpr,j)}evalProgram(n,j){return this.evaluateBlock(n.body,j)}evaluateBlock(n,j){let v="";for(let O of n){let z=this.evaluate(O,j);z.type!=="NullValue"&&z.type!=="UndefinedValue"&&(v+=z.toString())}return new le(v)}evaluateIdentifier(n,j){return j.lookupVariable(n.value)}evaluateCallExpression(n,j){let[v,O]=this.evaluateArguments(n.args,j);O.size>0&&v.push(new ye(O));let z=this.evaluate(n.callee,j);if(z.type!=="FunctionValue")throw new Error(`Cannot call something that is not a function: got ${z.type}`);return z.value(v,j)}evaluateSliceExpression(n,j,v){if(!(n instanceof Ce||n instanceof le))throw new Error("Slice object must be an array or string");let 
O=this.evaluate(j.start,v),z=this.evaluate(j.stop,v),Z=this.evaluate(j.step,v);if(!(O instanceof ne||O instanceof ke))throw new Error("Slice start must be numeric or undefined");if(!(z instanceof ne||z instanceof ke))throw new Error("Slice stop must be numeric or undefined");if(!(Z instanceof ne||Z instanceof ke))throw new Error("Slice step must be numeric or undefined");return n instanceof Ce?new Ce(Le(n.value,O.value,z.value,Z.value)):new le(Le(Array.from(n.value),O.value,z.value,Z.value).join(""))}evaluateMemberExpression(n,j){let v=this.evaluate(n.object,j),O;if(n.computed){if(n.property.type==="SliceExpression")return this.evaluateSliceExpression(v,n.property,j);O=this.evaluate(n.property,j)}else O=new le(n.property.value);let z;if(v instanceof ve){if(!(O instanceof le))throw new Error(`Cannot access property with non-string: got ${O.type}`);z=v.value.get(O.value)??v.builtins.get(O.value)}else if(v instanceof Ce||v instanceof le)if(O instanceof ne)z=v.value.at(O.value),v instanceof le&&(z=new le(v.value.at(O.value)));else if(O instanceof le)z=v.builtins.get(O.value);else throw new Error(`Cannot access property with non-string/non-number: got ${O.type}`);else{if(!(O instanceof le))throw new Error(`Cannot access property with non-string: got ${O.type}`);z=v.builtins.get(O.value)}return z instanceof me?z:new ke}evaluateSet(n,j){let v=n.value?this.evaluate(n.value,j):this.evaluateBlock(n.body,j);if(n.assignee.type==="Identifier"){let O=n.assignee.value;j.setVariable(O,v)}else if(n.assignee.type==="TupleLiteral"){let O=n.assignee;if(!(v instanceof Ce))throw new Error(`Cannot unpack non-iterable type in set: ${v.type}`);let z=v.value;if(z.length!==O.value.length)throw new Error(`Too ${O.value.length>z.length?"few":"many"} items to unpack in set`);for(let Z=0;Z<O.value.length;++Z){let ue=O.value[Z];if(ue.type!=="Identifier")throw new Error(`Cannot unpack to non-identifier in set: ${ue.type}`);j.setVariable(ue.value,z[Z])}}else 
if(n.assignee.type==="MemberExpression"){let O=n.assignee,z=this.evaluate(O.object,j);if(!(z instanceof ve))throw new Error("Cannot assign to member of non-object");if(O.property.type!=="Identifier")throw new Error("Cannot assign to member with non-identifier property");z.value.set(O.property.value,v)}else throw new Error(`Invalid LHS inside assignment expression: ${JSON.stringify(n.assignee)}`);return new Re}evaluateIf(n,j){let v=this.evaluate(n.test,j);return this.evaluateBlock(v.__bool__().value?n.body:n.alternate,j)}evaluateFor(n,j){let v=new qe(j),O,z;if(n.iterable.type==="SelectExpression"){let Oe=n.iterable;z=this.evaluate(Oe.lhs,v),O=Oe.test}else z=this.evaluate(n.iterable,v);if(!(z instanceof Ce||z instanceof ve))throw new Error(`Expected iterable or object type in for loop: got ${z.type}`);z instanceof ve&&(z=z.keys());let Z=[],ue=[];for(let Oe=0;Oe<z.value.length;++Oe){let st=new qe(v),We=z.value[Oe],it;if(n.loopvar.type==="Identifier")it=gt=>gt.setVariable(n.loopvar.value,We);else if(n.loopvar.type==="TupleLiteral"){let gt=n.loopvar;if(We.type!=="ArrayValue")throw new Error(`Cannot unpack non-iterable type: ${We.type}`);let Kt=We;if(gt.value.length!==Kt.value.length)throw new Error(`Too ${gt.value.length>Kt.value.length?"few":"many"} items to unpack`);it=Nt=>{for(let ss=0;ss<gt.value.length;++ss){if(gt.value[ss].type!=="Identifier")throw new Error(`Cannot unpack non-identifier type: ${gt.value[ss].type}`);Nt.setVariable(gt.value[ss].value,Kt.value[ss])}}}else throw new Error(`Invalid loop variable(s): ${n.loopvar.type}`);O&&(it(st),!this.evaluate(O,st).__bool__().value)||(Z.push(We),ue.push(it))}let Ge="",Je=!0;for(let Oe=0;Oe<Z.length;++Oe){let st=new Map([["index",new ne(Oe+1)],["index0",new ne(Oe)],["revindex",new ne(Z.length-Oe)],["revindex0",new ne(Z.length-Oe-1)],["first",new he(Oe===0)],["last",new he(Oe===Z.length-1)],["length",new ne(Z.length)],["previtem",Oe>0?Z[Oe-1]:new ke],["nextitem",Oe<Z.length-1?Z[Oe+1]:new ke]]);v.setVariable("loop",new 
ve(st)),ue[Oe](v);try{let We=this.evaluateBlock(n.body,v);Ge+=We.value}catch(We){if(We instanceof Te)continue;if(We instanceof pe)break;throw We}Je=!1}if(Je){let Oe=this.evaluateBlock(n.defaultBlock,v);Ge+=Oe.value}return new le(Ge)}evaluateMacro(n,j){return j.setVariable(n.name.value,new Be((v,O)=>{let z=new qe(O);v=v.slice();let Z;v.at(-1)?.type==="KeywordArgumentsValue"&&(Z=v.pop());for(let ue=0;ue<n.args.length;++ue){let Ge=n.args[ue],Je=v[ue];if(Ge.type==="Identifier"){let Oe=Ge;if(!Je)throw new Error(`Missing positional argument: ${Oe.value}`);z.setVariable(Oe.value,Je)}else if(Ge.type==="KeywordArgumentExpression"){let Oe=Ge,st=Je??Z?.value.get(Oe.key.value)??this.evaluate(Oe.value,z);z.setVariable(Oe.key.value,st)}else throw new Error(`Unknown argument type: ${Ge.type}`)}return this.evaluateBlock(n.body,z)})),new Re}evaluateCallStatement(n,j){let v=new Be((Ge,Je)=>{let Oe=new qe(Je);if(n.callerArgs)for(let st=0;st<n.callerArgs.length;++st){let We=n.callerArgs[st];if(We.type!=="Identifier")throw new Error(`Caller parameter must be an identifier, got ${We.type}`);Oe.setVariable(We.value,Ge[st]??new ke)}return this.evaluateBlock(n.body,Oe)}),[O,z]=this.evaluateArguments(n.call.args,j);O.push(new ye(z));let Z=this.evaluate(n.call.callee,j);if(Z.type!=="FunctionValue")throw new Error(`Cannot call something that is not a function: got ${Z.type}`);let ue=new qe(j);return ue.setVariable("caller",v),Z.value(O,ue)}evaluateFilterStatement(n,j){let v=this.evaluateBlock(n.body,j);return this.applyFilter(v,n.filter,j)}evaluate(n,j){if(!n)return new ke;switch(n.type){case"Program":return this.evalProgram(n,j);case"Set":return this.evaluateSet(n,j);case"If":return this.evaluateIf(n,j);case"For":return this.evaluateFor(n,j);case"Macro":return this.evaluateMacro(n,j);case"CallStatement":return this.evaluateCallStatement(n,j);case"Break":throw new pe;case"Continue":throw new Te;case"IntegerLiteral":return new ne(n.value);case"FloatLiteral":return new 
fe(n.value);case"StringLiteral":return new le(n.value);case"ArrayLiteral":return new Ce(n.value.map(v=>this.evaluate(v,j)));case"TupleLiteral":return new Qe(n.value.map(v=>this.evaluate(v,j)));case"ObjectLiteral":{let v=new Map;for(let[O,z]of n.value){let Z=this.evaluate(O,j);if(!(Z instanceof le))throw new Error(`Object keys must be strings: got ${Z.type}`);v.set(Z.value,this.evaluate(z,j))}return new ve(v)}case"Identifier":return this.evaluateIdentifier(n,j);case"CallExpression":return this.evaluateCallExpression(n,j);case"MemberExpression":return this.evaluateMemberExpression(n,j);case"UnaryExpression":return this.evaluateUnaryExpression(n,j);case"BinaryExpression":return this.evaluateBinaryExpression(n,j);case"FilterExpression":return this.evaluateFilterExpression(n,j);case"FilterStatement":return this.evaluateFilterStatement(n,j);case"TestExpression":return this.evaluateTestExpression(n,j);case"SelectExpression":return this.evaluateSelectExpression(n,j);case"Ternary":return this.evaluateTernaryExpression(n,j);case"Comment":return new Re;default:throw new SyntaxError(`Unknown node type: ${n.type}`)}}};function jt(n){switch(typeof n){case"number":return Number.isInteger(n)?new ne(n):new fe(n);case"string":return new le(n);case"boolean":return new he(n);case"undefined":return new ke;case"object":return n===null?new Re:Array.isArray(n)?new Ce(n.map(jt)):new ve(new Map(Object.entries(n).map(([j,v])=>[j,jt(v)])));case"function":return new Be((j,v)=>{let O=n(...j.map(z=>z.value))??null;return jt(O)});default:throw new Error(`Cannot convert to runtime value: ${n}`)}}var ft=`
`,$t="{%- ",Hs=" -%}";function Js(n){switch(n.operator.type){case"MultiplicativeBinaryOperator":return 4;case"AdditiveBinaryOperator":return 3;case"ComparisonBinaryOperator":return 2;case"Identifier":return n.operator.value==="and"?1:n.operator.value==="in"||n.operator.value==="not in"?2:0}return 0}function Ys(n,j=" "){let v=typeof j=="number"?" ".repeat(j):j;return qt(n.body,0,v).replace(/\n$/,"")}function kt(...n){return $t+n.join(" ")+Hs}function qt(n,j,v){return n.map(O=>us(O,j,v)).join(ft)}function us(n,j,v){let O=v.repeat(j);switch(n.type){case"Program":return qt(n.body,j,v);case"If":return qs(n,j,v);case"For":return Ze(n,j,v);case"Set":return Ls(n,j,v);case"Macro":return Ds(n,j,v);case"Break":return O+kt("break");case"Continue":return O+kt("continue");case"CallStatement":return Is(n,j,v);case"FilterStatement":return is(n,j,v);case"Comment":return O+"{# "+n.value+" #}";default:return O+"{{- "+lt(n)+" -}}"}}function qs(n,j,v){let O=v.repeat(j),z=[],Z=n;for(;Z&&(z.push({test:Z.test,body:Z.body}),Z.alternate.length===1&&Z.alternate[0].type==="If");)Z=Z.alternate[0];let ue=O+kt("if",lt(z[0].test))+ft+qt(z[0].body,j+1,v);for(let Ge=1;Ge<z.length;++Ge)ue+=ft+O+kt("elif",lt(z[Ge].test))+ft+qt(z[Ge].body,j+1,v);return Z&&Z.alternate.length>0&&(ue+=ft+O+kt("else")+ft+qt(Z.alternate,j+1,v)),ue+=ft+O+kt("endif"),ue}function Ze(n,j,v){let O=v.repeat(j),z="";if(n.iterable.type==="SelectExpression"){let ue=n.iterable;z=`${lt(ue.lhs)} if ${lt(ue.test)}`}else z=lt(n.iterable);let Z=O+kt("for",lt(n.loopvar),"in",z)+ft+qt(n.body,j+1,v);return n.defaultBlock.length>0&&(Z+=ft+O+kt("else")+ft+qt(n.defaultBlock,j+1,v)),Z+=ft+O+kt("endfor"),Z}function Ls(n,j,v){let O=v.repeat(j),z=lt(n.assignee),Z=n.value?lt(n.value):"",ue=O+kt("set",`${z}${n.value?" 
= "+Z:""}`);return n.body.length===0?ue:ue+ft+qt(n.body,j+1,v)+ft+O+kt("endset")}function Ds(n,j,v){let O=v.repeat(j),z=n.args.map(lt).join(", ");return O+kt("macro",`${n.name.value}(${z})`)+ft+qt(n.body,j+1,v)+ft+O+kt("endmacro")}function Is(n,j,v){let O=v.repeat(j),z=n.callerArgs&&n.callerArgs.length>0?`(${n.callerArgs.map(lt).join(", ")})`:"",Z=lt(n.call),ue=O+kt(`call${z}`,Z)+ft;return ue+=qt(n.body,j+1,v)+ft,ue+=O+kt("endcall"),ue}function is(n,j,v){let O=v.repeat(j),z=n.filter.type==="Identifier"?n.filter.value:lt(n.filter),Z=O+kt("filter",z)+ft;return Z+=qt(n.body,j+1,v)+ft,Z+=O+kt("endfilter"),Z}function lt(n,j=-1){switch(n.type){case"SpreadExpression":return`*${lt(n.argument)}`;case"Identifier":return n.value;case"IntegerLiteral":return`${n.value}`;case"FloatLiteral":return`${n.value}`;case"StringLiteral":return JSON.stringify(n.value);case"BinaryExpression":{let v=n,O=Js(v),z=lt(v.left,O),Z=lt(v.right,O+1),ue=`${z} ${v.operator.value} ${Z}`;return O<j?`(${ue})`:ue}case"UnaryExpression":{let v=n;return v.operator.value+(v.operator.value==="not"?" ":"")+lt(v.argument,1/0)}case"CallExpression":{let v=n,O=v.args.map(lt).join(", ");return`${lt(v.callee)}(${O})`}case"MemberExpression":{let v=n,O=lt(v.object);["Identifier","MemberExpression","CallExpression","StringLiteral","IntegerLiteral","FloatLiteral","ArrayLiteral","TupleLiteral","ObjectLiteral"].includes(v.object.type)||(O=`(${O})`);let z=lt(v.property);return!v.computed&&v.property.type!=="Identifier"&&(z=`(${z})`),v.computed?`${O}[${z}]`:`${O}.${z}`}case"FilterExpression":{let v=n,O=lt(v.operand,1/0);return v.filter.type==="CallExpression"?`${O} | ${lt(v.filter)}`:`${O} | ${v.filter.value}`}case"SelectExpression":{let v=n;return`${lt(v.lhs)} if ${lt(v.test)}`}case"TestExpression":{let v=n;return`${lt(v.operand)} is${v.negate?" 
not":""} ${v.test.value}`}case"ArrayLiteral":case"TupleLiteral":{let v=n.value.map(lt),O=n.type==="ArrayLiteral"?"[]":"()";return`${O[0]}${v.join(", ")}${O[1]}`}case"ObjectLiteral":return`{${Array.from(n.value.entries()).map(([O,z])=>`${lt(O)}: ${lt(z)}`).join(", ")}}`;case"SliceExpression":{let v=n,O=v.start?lt(v.start):"",z=v.stop?lt(v.stop):"",Z=v.step?`:${lt(v.step)}`:"";return`${O}:${z}${Z}`}case"KeywordArgumentExpression":{let v=n;return`${v.key.value}=${lt(v.value)}`}case"Ternary":{let v=n,O=`${lt(v.trueExpr)} if ${lt(v.condition,0)} else ${lt(v.falseExpr)}`;return j>-1?`(${O})`:O}default:throw new Error(`Unknown expression type: ${n.type}`)}}var Os=class{parsed;constructor(n){let j=_(n,{lstrip_blocks:!0,trim_blocks:!0});this.parsed=be(j)}render(n){let j=new qe;if(je(j),n)for(let[z,Z]of Object.entries(n))j.set(z,Z);return new Pt(j).run(this.parsed).value}format(n){return Ys(this.parsed,n?.indent||" ")}}}),"./src/backends/onnx.js":((D,a,e)=>{var i;e.r(a),e.d(a,{Tensor:()=>f.Tensor,createInferenceSession:()=>G,deviceToExecutionProviders:()=>w,isONNXProxy:()=>y,isONNXTensor:()=>P,runInferenceSession:()=>B});var d=e("./src/env.js"),g=e("onnxruntime-node"),I=e("?8b6b"),f=e("onnxruntime-common");let u=Object.freeze({auto:null,gpu:null,cpu:"cpu",wasm:"wasm",webgpu:"webgpu",cuda:"cuda",dml:"dml",webnn:{name:"webnn",deviceType:"cpu"},"webnn-npu":{name:"webnn",deviceType:"npu"},"webnn-gpu":{name:"webnn",deviceType:"gpu"},"webnn-cpu":{name:"webnn",deviceType:"cpu"}}),m=[],T,_,o=Symbol.for("onnxruntime");if(o in globalThis)_=globalThis[o];else if(d.apis.IS_NODE_ENV){switch(_=g.default??g,process.platform){case"win32":m.push("dml");break;case"linux":process.arch==="x64"&&m.push("cuda");break;case"darwin":break}m.push("cpu"),T=["cpu"]}else _=i||(i=e.t(I,2)),d.apis.IS_WEBNN_AVAILABLE&&m.push("webnn-npu","webnn-gpu","webnn-cpu","webnn"),d.apis.IS_WEBGPU_AVAILABLE&&m.push("webgpu"),m.push("wasm"),T=["wasm"];let x=_.InferenceSession;function w(l=null){if(!l)return 
T;switch(l){case"auto":return m;case"gpu":return m.filter(h=>["webgpu","cuda","dml","webnn-gpu"].includes(h))}if(m.includes(l))return[u[l]??l];throw new Error(`Unsupported device: "${l}". Should be one of: ${m.join(", ")}.`)}let k=null;async function G(l,h,F){k&&await k;let S=x.create(l,h);k??=S;let V=await S;return V.config=F,V}let b=Promise.resolve(),C=d.apis.IS_BROWSER_ENV||d.apis.IS_WEBWORKER_ENV;async function B(l,h){let F=()=>l.run(h);return await(C?b=b.then(F):F())}function P(l){return l instanceof _.Tensor}let M=_?.env;M?.wasm&&(!(typeof ServiceWorkerGlobalScope<"u"&&self instanceof ServiceWorkerGlobalScope)&&!M.wasm.wasmPaths&&(M.wasm.wasmPaths=`https://cdn.jsdelivr.net/npm/@huggingface/transformers@${d.env.version}/dist/`),M.wasm.proxy=!1),M?.webgpu&&(M.webgpu.powerPreference="high-performance");function y(){return M?.wasm?.proxy}d.env.backends.onnx=M}),"./src/base/feature_extraction_utils.js":((D,a,e)=>{e.r(a),e.d(a,{FeatureExtractor:()=>I,validate_audio_inputs:()=>f});var i=e("./src/utils/constants.js"),d=e("./src/utils/generic.js"),g=e("./src/utils/hub.js");class I extends d.Callable{constructor(m){super(),this.config=m}static async from_pretrained(m,T={}){let _=await(0,g.getModelJSON)(m,i.FEATURE_EXTRACTOR_NAME,!0,T);return new this(_)}}function f(u,m){if(!(u instanceof Float32Array||u instanceof Float64Array))throw new Error(`${m} expects input to be a Float32Array or a Float64Array, but got ${u?.constructor?.name??typeof u} instead. 
If using the feature extractor directly, remember to use \`read_audio(url, sampling_rate)\` to obtain the raw audio data of the file/url.`)}}),"./src/base/image_processors_utils.js":((D,a,e)=>{e.r(a),e.d(a,{ImageProcessor:()=>M,center_to_corners_format:()=>o,post_process_instance_segmentation:()=>P,post_process_object_detection:()=>x,post_process_panoptic_segmentation:()=>B,post_process_semantic_segmentation:()=>w});var i=e("./src/utils/generic.js"),d=e("./src/utils/tensor.js"),g=e("./src/utils/maths.js"),I=e("./src/utils/image.js"),f=e("./src/utils/core.js"),u=e("./src/utils/hub.js"),m=e("./src/utils/constants.js");function T(y,l,h=0,F=null){let S=y/l,V=(0,g.bankers_round)(S)*l;return F!==null&&V>F&&(V=Math.floor(S)*l),V<h&&(V=Math.ceil(S)*l),V}function _([y,l],h){return[Math.max(Math.floor(y/h),1)*h,Math.max(Math.floor(l/h),1)*h]}function o([y,l,h,F]){return[y-h/2,l-F/2,y+h/2,l+F/2]}function x(y,l=.5,h=null,F=!1){let S=y.logits,V=y.pred_boxes,[R,N,Q]=S.dims;if(h!==null&&h.length!==R)throw Error("Make sure that you pass in as many target sizes as the batch dimension of the logits");let K=[];for(let J=0;J<R;++J){let te=h!==null?h[J]:null,se={boxes:[],classes:[],scores:[]},ce=S[J],we=V[J];for(let _e=0;_e<N;++_e){let X=ce[_e],L=[],W;if(F){W=X.sigmoid().data;for(let Y=0;Y<W.length;++Y)W[Y]>l&&L.push(Y)}else{let Y=(0,g.max)(X.data)[1];if(Y===Q-1||(W=(0,g.softmax)(X.data),W[Y]<l))continue;L.push(Y)}for(let Y of L){let ae=we[_e].data;ae=o(ae),te!==null&&(ae=ae.map((be,xe)=>be*te[(xe+1)%2])),se.boxes.push(ae),se.classes.push(Y),se.scores.push(W[Y])}}K.push(se)}return K}function w(y,l=null){let h=y.logits,F=h.dims[0];if(l!==null&&l.length!==F)throw Error("Make sure that you pass in as many target sizes as the batch dimension of the logits");let S=[];for(let V=0;V<F;++V){let R=l!==null?l[V]:null,N=h[V];R!==null&&(N=(0,d.interpolate)(N,R,"bilinear",!1));let[Q,K]=R??N.dims.slice(-2),J=new d.Tensor("int32",new Int32Array(Q*K),[Q,K]),te=N[0].data,se=J.data;for(let 
_e=1;_e<N.dims[0];++_e){let X=N[_e].data;for(let L=0;L<X.length;++L)X[L]>te[L]&&(te[L]=X[L],se[L]=_e)}let ce=new Array(N.dims[0]);for(let _e=0;_e<se.length;++_e){let X=se[_e];ce[X]=X}let we=ce.filter(_e=>_e!==void 0);S.push({segmentation:J,labels:we})}return S}
/**
 * Filters queries. For each row of `y` the arg-max index is taken; rows whose arg-max equals `F` are
 * dropped, and so are rows whose softmax score at that index is not greater than `h`.
 * @returns `[kept entries of l, their scores, their arg-max indices]`.
 */
function k(y,l,h,F){let S=[],V=[],R=[];for(let N=0;N<y.dims[0];++N){let Q=y[N],K=l[N],J=(0,g.max)(Q.data)[1];if(J===F)continue;let se=(0,g.softmax)(Q.data)[J];se>h&&(S.push(K),V.push(se),R.push(J))}return[S,V,R]}
/**
 * Collects the positions where `y[i] === h` and counts them (`R`); also counts the entries of
 * `l[h].data` that are at least `F` (`N`).
 * @returns `[valid, positions]`, where `valid` requires both counts to be positive and `R / N > S`.
 */
function G(y,l,h,F=.5,S=.8){let V=[],R=0,N=0,Q=l[h].data;for(let J=0;J<y.length;++J)y[J]===h&&(V.push(J),++R),Q[J]>=F&&++N;let K=R>0&&N>0;return K&&(K=R/N>S),[K,V]}
/**
 * Builds an int32 segmentation tensor and a list of segment descriptors.
 * Masks in `y` are optionally resized to `R` (bilinear), then scaled in place by their score from `l`;
 * for every position the index of the highest-scoring mask is recorded. Each mask accepted by `G`
 * receives the next segment id, which is written to its positions, and an `{id, label_id, score}` entry.
 * The parameter `V` is accepted but not read in this body.
 * @returns `[segmentation, segments]`.
 */
function b(y,l,h,F,S,V=null,R=null){let[N,Q]=R??y[0].dims,K=new d.Tensor("int32",new Int32Array(N*Q),[N,Q]),J=[];if(R!==null)for(let _e=0;_e<y.length;++_e)y[_e]=(0,d.interpolate)(y[_e],R,"bilinear",!1);let te=new Int32Array(y[0].data.length),se=new Float32Array(y[0].data.length);for(let _e=0;_e<y.length;++_e){let X=l[_e],L=y[_e].data;for(let W=0;W<L.length;++W)L[W]*=X,L[W]>se[W]&&(te[W]=_e,se[W]=L[W])}let ce=0,we=K.data;for(let _e=0;_e<h.length;++_e){let X=h[_e],[L,W]=G(te,y,_e,F,S);if(L){++ce;for(let Y of W)we[Y]=ce;J.push({id:ce,label_id:X,score:l[_e]})}}return[K,J]}
/**
 * Computes a `[height, width]` pair whose sides are multiples of `h` and whose area is steered into
 * the range `[F, S]`: sides are first rounded to the nearest multiple; when the area is above `S`
 * both sides are scaled down (floor), when it is below `F` both are scaled up (ceil).
 * @throws Error when a side is smaller than `h` or the aspect ratio exceeds 200.
 */
function C(y,l,h=28,F=3136,S=784*1280){if(y<h||l<h)throw new Error(`height:${y} or width:${l} must be larger than factor:${h}`);if(Math.max(y,l)/Math.min(y,l)>200)throw new Error(`absolute aspect ratio must be smaller than 200, got ${Math.max(y,l)/Math.min(y,l)}`);let V=Math.round(y/h)*h,R=Math.round(l/h)*h;if(V*R>S){let N=Math.sqrt(y*l/S);V=Math.floor(y/N/h)*h,R=Math.floor(l/N/h)*h}else if(V*R<F){let N=Math.sqrt(F/(y*l));V=Math.ceil(y*N/h)*h,R=Math.ceil(l*N/h)*h}return[V,R]}
/**
 * Exported as `post_process_panoptic_segmentation`.
 * Applies a sigmoid to the mask logits, filters the queries of each batch entry with `k` and either
 * emits a segmentation filled with -1 and no segments (nothing kept) or the result of `b`.
 * When `S` is null a warning is logged and an empty Set is used.
 * @throws Error when target sizes `V` are given and their length differs from the batch dimension.
 */
function B(y,l=.5,h=.5,F=.8,S=null,V=null){S===null&&(console.warn("`label_ids_to_fuse` unset. 
No instance will be fused."),S=new Set);let R=y.class_queries_logits??y.logits,Q=(y.masks_queries_logits??y.pred_masks).sigmoid(),[K,J,te]=R.dims;if(te-=1,V!==null&&V.length!==K)throw Error("Make sure that you pass in as many target sizes as the batch dimension of the logits");let se=[];for(let ce=0;ce<K;++ce){let we=V!==null?V[ce]:null,_e=R[ce],X=Q[ce],[L,W,Y]=k(_e,X,l,te);if(Y.length===0){let[xe,Le]=we??X.dims.slice(-2),$e=new d.Tensor("int32",new Int32Array(xe*Le).fill(-1),[xe,Le]);se.push({segmentation:$e,segments_info:[]});continue}let[ae,be]=b(L,W,Y,h,F,S,we);se.push({segmentation:ae,segments_info:be})}return se}
/** Exported as `post_process_instance_segmentation`; always throws because it is not implemented. */
function P(y,l=.5,h=null){throw new Error("`post_process_instance_segmentation` is not yet implemented.")}
/**
 * Exported as `ImageProcessor`.
 * The constructor copies preprocessing options from the config `l` with these fallbacks:
 * `image_mean`/`image_std` fall back to `mean`/`std`, `resample` to 2, `do_rescale` to true,
 * `rescale_factor` to 1/255, `size` to `image_size`, `do_resize` to "a size is configured",
 * `size_divisibility` to `size_divisor`, `do_convert_rgb` to true, `do_flip_channel_order` to false.
 * When padding is enabled without a `pad_size` and `size` has both width and height, `pad_size` becomes `size`.
 */
class M extends i.Callable{constructor(l){super(),this.image_mean=l.image_mean??l.mean,this.image_std=l.image_std??l.std,this.resample=l.resample??2,this.do_rescale=l.do_rescale??!0,this.rescale_factor=l.rescale_factor??1/255,this.do_normalize=l.do_normalize,this.do_thumbnail=l.do_thumbnail,this.size=l.size??l.image_size,this.do_resize=l.do_resize??this.size!==void 0,this.size_divisibility=l.size_divisibility??l.size_divisor,this.do_center_crop=l.do_center_crop,this.crop_size=l.crop_size,this.do_convert_rgb=l.do_convert_rgb??!0,this.do_crop_margin=l.do_crop_margin,this.pad_size=l.pad_size,this.do_pad=l.do_pad,this.min_pixels=l.min_pixels,this.max_pixels=l.max_pixels,this.do_pad&&!this.pad_size&&this.size&&this.size.width!==void 0&&this.size.height!==void 0&&(this.pad_size=this.size),this.do_flip_channel_order=l.do_flip_channel_order??!1,this.config=l}
/**
 * Returns `l` unchanged when neither of its sides exceeds the bounds in `h` ({height, width});
 * otherwise recomputes one side from the other to keep the aspect ratio and resizes with resample `F`.
 */
async thumbnail(l,h,F=2){let S=l.height,V=l.width,R=h.height,N=h.width,Q=Math.min(S,R),K=Math.min(V,N);return Q===S&&K===V?l:(S>V?K=Math.floor(V*Q/S):V>S&&(Q=Math.floor(S*K/V)),await l.resize(K,Q,{resample:F}))}
/**
 * Crops `l` to the bounding box of the pixels whose min-max normalised grayscale value is below `h / 255`.
 * Returns `l` untouched when the grayscale copy has a single value everywhere.
 */
async crop_margin(l,h=200){let F=l.clone().grayscale(),S=(0,g.min)(F.data)[0],R=(0,g.max)(F.data)[0]-S;if(R===0)return l;let N=h/255,Q=F.width,K=F.height,J=0,te=0,se=F.data;for(let 
ce=0;ce<F.height;++ce){let we=ce*F.width;for(let _e=0;_e<F.width;++_e)(se[we+_e]-S)/R<N&&(Q=Math.min(Q,_e),K=Math.min(K,ce),J=Math.max(J,_e),te=Math.max(te,ce))}return l=await l.crop([Q,K,J,te]),l}
/**
 * Pads flat pixel data `l` with dimensions `h` = [height, width, channels] up to the size `F`,
 * which may be a number (used for both sides), the string "square" (larger of height and width)
 * or an object with `width` and `height`.
 * Options: `mode` ("constant" by default, or "symmetric" to fill the padding by reflection via
 * `calculateReflectOffset`), `center` (place the image in the middle instead of the top-left corner)
 * and `constant_values` (a number, or an array indexed per channel).
 * @returns `[data, dims]`; the inputs are returned as they are when the size already matches.
 * @throws Error when `center` is combined with the "symmetric" mode.
 */
pad_image(l,h,F,{mode:S="constant",center:V=!1,constant_values:R=0}={}){let[N,Q,K]=h,J,te;if(typeof F=="number"?(J=F,te=F):F==="square"?J=te=Math.max(N,Q):(J=F.width,te=F.height),J!==Q||te!==N){let se=new Float32Array(J*te*K);if(Array.isArray(R))for(let _e=0;_e<se.length;++_e)se[_e]=R[_e%K];else R!==0&&se.fill(R);let[ce,we]=V?[Math.floor((J-Q)/2),Math.floor((te-N)/2)]:[0,0];for(let _e=0;_e<N;++_e){let X=(_e+we)*J,L=_e*Q;for(let W=0;W<Q;++W){let Y=(X+W+ce)*K,ae=(L+W)*K;for(let be=0;be<K;++be)se[Y+be]=l[ae+be]}}if(S==="symmetric"){if(V)throw new Error("`center` padding is not supported when `mode` is set to `symmetric`.");let _e=N-1,X=Q-1;for(let L=0;L<te;++L){let W=L*J,Y=(0,f.calculateReflectOffset)(L,_e)*Q;for(let ae=0;ae<J;++ae){if(L<N&&ae<Q)continue;let be=(W+ae)*K,xe=(Y+(0,f.calculateReflectOffset)(ae,X))*K;for(let Le=0;Le<K;++Le)se[be+Le]=l[xe+Le]}}}l=se,h=[te,J,K]}return[l,h]}
/** Multiplies every element of `l` in place by `this.rescale_factor`. */
rescale(l){for(let h=0;h<l.length;++h)l[h]=this.rescale_factor*l[h]}
/**
 * Computes the `[width, height]` the image `l` should be resized to for the size specification `h`.
 * Handled forms, in order: thumbnail mode (shortest edge = smaller of `h.height` and `h.width`),
 * an integer (shortest edge, with `config.max_size` as longest edge when set), `shortest_edge` /
 * `longest_edge`, an explicit `width`/`height` (optionally aspect-preserving with
 * `config.keep_aspect_ratio` and `config.ensure_multiple_of`), `size_divisibility`, and finally
 * `min_pixels`/`max_pixels`; anything else throws.
 */
get_resize_output_image_size(l,h){let[F,S]=l.size,V,R;if(this.do_thumbnail){let{height:N,width:Q}=h;V=Math.min(N,Q)}else Number.isInteger(h)?(V=h,R=this.config.max_size??V):h!==void 0&&(V=h.shortest_edge,R=h.longest_edge);if(V!==void 0||R!==void 0){let N=V===void 0?1:Math.max(V/F,V/S),Q=F*N,K=S*N,J=R===void 0?1:Math.min(R/Q,R/K),te=Math.floor(Number((Q*J).toFixed(2))),se=Math.floor(Number((K*J).toFixed(2)));return this.size_divisibility!==void 0&&([te,se]=_([te,se],this.size_divisibility)),[te,se]}else if(h!==void 0&&h.width!==void 0&&h.height!==void 0){let N=h.width,Q=h.height;if(this.config.keep_aspect_ratio&&this.config.ensure_multiple_of){let K=Q/S,J=N/F;Math.abs(1-J)<Math.abs(1-K)?K=J:J=K,Q=T(K*S,this.config.ensure_multiple_of),N=T(J*F,this.config.ensure_multiple_of)}return[N,Q]}else{if(this.size_divisibility!==void 
0)return _([F,S],this.size_divisibility);if(this.min_pixels!==void 0&&this.max_pixels!==void 0){let N=this.config.patch_size*this.config.merge_size;return C(S,F,N,this.min_pixels,this.max_pixels)}else throw new Error(`Could not resize image due to unsupported \`this.size\` option in config: ${JSON.stringify(h)}`)}}
/** Resizes `l` to the size computed by `get_resize_output_image_size(l, this.size)` using `this.resample`. */
async resize(l){let[h,F]=this.get_resize_output_image_size(l,this.size);return await l.resize(h,F,{resample:this.resample})}
/**
 * Preprocesses a single image. Steps, each applied only when enabled: margin crop, RGB conversion
 * (or grayscale when RGB conversion is off and `do_convert_grayscale` is set), resize, thumbnail,
 * centre crop; the pixels are then copied into a Float32Array and optionally rescaled, normalised
 * with per-channel mean/std, padded (to `pad_size`, or to a multiple of `size_divisibility`) and have
 * channels 0 and 2 swapped.
 * The per-call options override the matching instance flags when they are not null/undefined.
 * @returns `{original_size, reshaped_input_size, pixel_values}`; `pixel_values` is a float32 tensor permuted with (2, 0, 1).
 * @throws Error when mean/std array lengths differ from the channel count, or when a channel flip is requested for data without exactly 3 channels.
 */
async preprocess(l,{do_normalize:h=null,do_pad:F=null,do_convert_rgb:S=null,do_convert_grayscale:V=null,do_flip_channel_order:R=null}={}){this.do_crop_margin&&(l=await this.crop_margin(l));let[N,Q]=l.size;if(S??this.do_convert_rgb?l=l.rgb():V&&(l=l.grayscale()),this.do_resize&&(l=await this.resize(l)),this.do_thumbnail&&(l=await this.thumbnail(l,this.size,this.resample)),this.do_center_crop){let ce,we;Number.isInteger(this.crop_size)?(ce=this.crop_size,we=this.crop_size):(ce=this.crop_size.width,we=this.crop_size.height),l=await l.center_crop(ce,we)}let K=[l.height,l.width],J=Float32Array.from(l.data),te=[l.height,l.width,l.channels];if(this.do_rescale&&this.rescale(J),h??this.do_normalize){let ce=this.image_mean;Array.isArray(this.image_mean)||(ce=new Array(l.channels).fill(ce));let we=this.image_std;if(Array.isArray(this.image_std)||(we=new Array(l.channels).fill(we)),ce.length!==l.channels||we.length!==l.channels)throw new Error(`When set to arrays, the length of \`image_mean\` (${ce.length}) and \`image_std\` (${we.length}) must match the number of channels in the image (${l.channels}).`);for(let _e=0;_e<J.length;_e+=l.channels)for(let X=0;X<l.channels;++X)J[_e+X]=(J[_e+X]-ce[X])/we[X]}if(F??this.do_pad){if(this.pad_size)[J,te]=this.pad_image(J,[l.height,l.width,l.channels],this.pad_size);else if(this.size_divisibility){let[ce,we]=_([te[1],te[0]],this.size_divisibility);[J,te]=this.pad_image(J,te,{width:ce,height:we})}}if(R??this.do_flip_channel_order){if(te[2]!==3)throw new Error("Flipping channel order is only supported for RGB 
images.");for(let ce=0;ce<J.length;ce+=3){let we=J[ce];J[ce]=J[ce+2],J[ce+2]=we}}let se=new d.Tensor("float32",J,te).permute(2,0,1);return{original_size:[Q,N],reshaped_input_size:K,pixel_values:se}}
/**
 * Preprocesses one image or an array of images (the extra arguments `h` are not used) and stacks
 * the resulting `pixel_values` along dimension 0.
 * @returns `{pixel_values, original_sizes, reshaped_input_sizes}`.
 */
async _call(l,...h){Array.isArray(l)||(l=[l]);let F=await Promise.all(l.map(V=>this.preprocess(V)));return{pixel_values:(0,d.stack)(F.map(V=>V.pixel_values),0),original_sizes:F.map(V=>V.original_size),reshaped_input_sizes:F.map(V=>V.reshaped_input_size)}}
/** Loads the JSON named by `IMAGE_PROCESSOR_NAME` through `getModelJSON` and instantiates the class with it. */
static async from_pretrained(l,h={}){let F=await(0,u.getModelJSON)(l,m.IMAGE_PROCESSOR_NAME,!0,h);return new this(F)}}}),"./src/base/processing_utils.js":((D,a,e)=>{e.r(a),e.d(a,{Processor:()=>I});var i=e("./src/utils/constants.js"),d=e("./src/utils/generic.js"),g=e("./src/utils/hub.js");
/**
 * Exported as `Processor`. Holds a config, a `components` object (read through the
 * `image_processor`, `tokenizer` and `feature_extractor` getters) and an optional chat template.
 * `apply_chat_template`, `batch_decode` and `decode` forward to the tokenizer and throw when there is none;
 * `apply_chat_template` defaults `tokenize` to false and passes the stored chat template.
 */
class I extends d.Callable{static classes=["image_processor_class","tokenizer_class","feature_extractor_class"];static uses_processor_config=!1;static uses_chat_template_file=!1;constructor(u,m,T){super(),this.config=u,this.components=m,this.chat_template=T}get image_processor(){return this.components.image_processor}get tokenizer(){return this.components.tokenizer}get feature_extractor(){return this.components.feature_extractor}apply_chat_template(u,m={}){if(!this.tokenizer)throw new Error("Unable to apply chat template without a tokenizer.");return this.tokenizer.apply_chat_template(u,{tokenize:!1,chat_template:this.chat_template??void 0,...m})}batch_decode(...u){if(!this.tokenizer)throw new Error("Unable to decode without a tokenizer.");return this.tokenizer.batch_decode(...u)}decode(...u){if(!this.tokenizer)throw new Error("Unable to decode without a tokenizer.");return this.tokenizer.decode(...u)}
/** Calls the first available component, tried in the order image processor, feature extractor, tokenizer; throws when none exists. */
async _call(u,...m){for(let T of[this.image_processor,this.feature_extractor,this.tokenizer])if(T)return T(u,...m);throw new Error("No image processor, feature extractor, or tokenizer found.")}
/**
 * Loads, in parallel, the processor config (only when `uses_processor_config`), every component whose
 * `*_class` name from `classes` exists as a static property, and the chat template text (only when
 * `uses_chat_template_file`), then instantiates the class with the three results.
 */
static async from_pretrained(u,m={}){let[T,_,o]=await 
Promise.all([this.uses_processor_config?(0,g.getModelJSON)(u,i.PROCESSOR_NAME,!0,m):{},Promise.all(this.classes.filter(x=>x in this).map(async x=>{let w=await this[x].from_pretrained(u,m);return[x.replace(/_class$/,""),w]})).then(Object.fromEntries),this.uses_chat_template_file?(0,g.getModelText)(u,i.CHAT_TEMPLATE_NAME,!0,m):null]);return new this(T,_,o)}}}),"./src/configs.js":((D,a,e)=>{e.r(a),e.d(a,{AutoConfig:()=>T,PretrainedConfig:()=>m,getCacheShapes:()=>f});var i=e("./src/utils/core.js"),d=e("./src/utils/hub.js");
/** Fetches `config.json` for `_` through `getModelJSON`, passing the options `o`. */
async function g(_,o){return await(0,d.getModelJSON)(_,"config.json",!0,o)}
/**
 * Builds a normalised view of the config `_`, selected by `_.model_type`.
 * `o` maps normalised names (num_heads, num_layers, hidden_size, dim_kv, num_attention_heads and the
 * encoder_ / decoder_ variants) to the config keys that hold them for the given model type.
 * For the model types in the first cases the function recurses into a nested config
 * (`text_config`, `phi_config`, `decoder`, `language_config`) and keeps that result in `x`.
 */
function I(_){let o={},x={};switch(_.model_type){case"llava":case"paligemma":case"gemma3":case"florence2":case"llava_onevision":case"idefics3":case"ultravox":case"voxtral":case"smolvlm":case"gemma3n":case"mistral3":x=I(_.text_config);break;case"moondream1":x=I(_.phi_config);break;case"musicgen":x=I(_.decoder);break;case"multi_modality":x=I(_.language_config);break;case"gpt2":case"gptj":case"jais":case"codegen":case"gpt_bigcode":o.num_heads="n_head",o.num_layers="n_layer",o.hidden_size="n_embd";break;case"gpt_neox":case"stablelm":case"opt":case"falcon":case"modernbert-decoder":o.num_heads="num_attention_heads",o.num_layers="num_hidden_layers",o.hidden_size="hidden_size";break;case"llama":case"llama4_text":case"nanochat":case"arcee":case"lfm2":case"smollm3":case"olmo":case"olmo2":case"mobilellm":case"granite":case"granitemoehybrid":case"cohere":case"mistral":case"starcoder2":case"qwen2":case"qwen2_vl":case"phi":case"phi3":case"phi3_v":case"llava_qwen2":o.num_heads="num_key_value_heads",o.num_layers="num_hidden_layers",o.hidden_size="hidden_size",o.num_attention_heads="num_attention_heads",o.dim_kv="head_dim";break;case"qwen3":case"gemma":case"gemma2":case"vaultgemma":case"gemma3_text":case"gemma3n_text":case"glm":case"helium":case"ernie4_5":case"ministral":case"ministral3":o.num_heads="num_key_value_heads",o.num_layers="num_hidden_layers",o.dim_kv="head_dim";break;case"openelm":o
.num_heads="num_kv_heads",o.num_layers="num_transformer_layers",o.dim_kv="head_dim";break;case"gpt_neo":case"donut-swin":o.num_heads="num_heads",o.num_layers="num_layers",o.hidden_size="hidden_size";break;case"bloom":o.num_heads="n_head",o.num_layers="n_layer",o.hidden_size="hidden_size";break;case"mpt":o.num_heads="n_heads",o.num_layers="n_layers",o.hidden_size="d_model";break;case"exaone":o.num_heads="num_key_value_heads",o.num_layers="num_layers",o.dim_kv="head_dim",o.num_attention_heads="num_attention_heads";break;
/* The cases from here to "moonshine" map separate encoder_* and decoder_* names instead of a single set. */
case"t5":case"mt5":case"longt5":o.num_decoder_layers="num_decoder_layers",o.num_decoder_heads="num_heads",o.decoder_dim_kv="d_kv",o.num_encoder_layers="num_layers",o.num_encoder_heads="num_heads",o.encoder_dim_kv="d_kv";break;case"bart":case"mbart":case"marian":case"whisper":case"lite-whisper":case"m2m_100":case"blenderbot":case"blenderbot-small":case"florence2_language":o.num_decoder_layers="decoder_layers",o.num_decoder_heads="decoder_attention_heads",o.decoder_hidden_size="d_model",o.num_encoder_layers="encoder_layers",o.num_encoder_heads="encoder_attention_heads",o.encoder_hidden_size="d_model";break;case"speecht5":o.num_decoder_layers="decoder_layers",o.num_decoder_heads="decoder_attention_heads",o.decoder_hidden_size="hidden_size",o.num_encoder_layers="encoder_layers",o.num_encoder_heads="encoder_attention_heads",o.encoder_hidden_size="hidden_size";break;case"trocr":o.num_encoder_layers=o.num_decoder_layers="decoder_layers",o.num_encoder_heads=o.num_decoder_heads="decoder_attention_heads",o.encoder_hidden_size=o.decoder_hidden_size="d_model";break;case"musicgen_decoder":o.num_encoder_layers=o.num_decoder_layers="num_hidden_layers",o.num_encoder_heads=o.num_decoder_heads="num_attention_heads",o.encoder_hidden_size=o.decoder_hidden_size="hidden_size";break;case"moonshine":o.num_decoder_layers="decoder_num_hidden_layers",o.num_decoder_heads="decoder_num_key_value_heads",o.num_encoder_layers="encoder_num_hidden_layers",o.num_encoder_heads="encoder_nu
m_key_value_heads",o.encoder_hidden_size=o.decoder_hidden_size="hidden_size";break;case"vision-encoder-decoder":let k=I(_.decoder),G="num_decoder_layers"in k,b=(0,i.pick)(_,["model_type","is_encoder_decoder"]);return G?(b.num_decoder_layers=k.num_decoder_layers,b.num_decoder_heads=k.num_decoder_heads,b.decoder_hidden_size=k.decoder_hidden_size,b.num_encoder_layers=k.num_encoder_layers,b.num_encoder_heads=k.num_encoder_heads,b.encoder_hidden_size=k.encoder_hidden_size):(b.num_layers=k.num_layers,b.num_heads=k.num_heads,b.hidden_size=k.hidden_size),b}
/* Start from the nested-config result `x`, add the picked top-level fields, then read every mapped key from `_`. */
let w={...x,...(0,i.pick)(_,["model_type","multi_query","is_encoder_decoder"])};for(let k in o)w[k]=_[o[k]];return w}
/**
 * Exported as `getCacheShapes`.
 * For `model_type === "lfm2"` it builds one entry per layer from `layer_types`: "full_attention"
 * layers get key and value shapes `[batch, num_key_value_heads, 0, hidden_size / num_attention_heads]`,
 * "conv" layers get `[batch, hidden_size, conv_L_cache]`, anything else throws.
 * `o.prefix` defaults to "past_key_values" and `o.batch_size` to 1.
 * Every other model type is delegated to `u`.
 */
function f(_,o){if(_.model_type==="lfm2"){let x=o?.prefix??"past_key_values",w=x==="present"?"present":"past",k={},{layer_types:G,num_attention_heads:b,num_key_value_heads:C,hidden_size:B,conv_L_cache:P}=_,M=B/b,y=o?.batch_size??1;for(let l=0;l<G.length;++l)if(G[l]==="full_attention")for(let h of["key","value"])k[`${x}.${l}.${h}`]=[y,C,0,M];else if(G[l]==="conv")k[`${w}_conv.${l}`]=[y,B,P];else throw new Error(`Unsupported layer type: ${G[l]}`);return k}return u(_,o)}
/**
 * Builds a map from cache entry names (`<prefix>.<layer>...`) to shape arrays using
 * `_.normalized_config`. Encoder-decoder configs get encoder and decoder key/value entries per
 * decoder layer; otherwise the layout depends on the model type ("falcon", `multi_query`, "bloom",
 * "openelm") with a generic `[batch, heads, 0, dim]` fallback.
 * The per-head dimension is `dim_kv` when present, else the hidden size divided by the head count.
 */
function u(_,{prefix:o="past_key_values",batch_size:x=1}={}){let w={},k=_.normalized_config;if(k.is_encoder_decoder&&"num_encoder_heads"in k&&"num_decoder_heads"in k){let G=k.encoder_dim_kv??k.encoder_hidden_size/k.num_encoder_heads,b=k.decoder_dim_kv??k.decoder_hidden_size/k.num_decoder_heads,C=[x,k.num_encoder_heads,0,G],B=[x,k.num_decoder_heads,0,b];for(let P=0;P<k.num_decoder_layers;++P)w[`${o}.${P}.encoder.key`]=C,w[`${o}.${P}.encoder.value`]=C,w[`${o}.${P}.decoder.key`]=B,w[`${o}.${P}.decoder.value`]=B}else{let G=k.num_heads,b=k.num_layers,C=k.dim_kv??k.hidden_size/(k.num_attention_heads??G);if(k.model_type==="falcon"){let B=[x*G,0,C];for(let P=0;P<b;++P)w[`${o}.${P}.key`]=B,w[`${o}.${P}.value`]=B}else if(k.multi_query){let B=[x*G,0,2*C];for(let P=0;P<b;++P)w[`${o}.${P}.key_value`]=B}else if(k.model_type==="bloom"){let 
B=[x*G,C,0],P=[x*G,0,C];for(let M=0;M<b;++M)w[`${o}.${M}.key`]=B,w[`${o}.${M}.value`]=P}else if(k.model_type==="openelm")for(let B=0;B<b;++B){let P=[x,G[B],0,C];w[`${o}.${B}.key`]=P,w[`${o}.${B}.value`]=P}else{let B=[x,G,0,C];for(let P=0;P<b;++P)w[`${o}.${P}.key`]=B,w[`${o}.${P}.value`]=B}}return w}
/**
 * Exported as `PretrainedConfig`. The constructor copies every field of `o` onto the instance and
 * stores the result of `I(this)` as `normalized_config`.
 * `from_pretrained` uses the supplied `config` option (wrapped in this class when it is a plain
 * object) or, when none is given, loads `config.json` through `g`.
 */
class m{model_type=null;is_encoder_decoder=!1;max_position_embeddings;"transformers.js_config";constructor(o){Object.assign(this,o),this.normalized_config=I(this)}static async from_pretrained(o,{progress_callback:x=null,config:w=null,cache_dir:k=null,local_files_only:G=!1,revision:b="main"}={}){w&&!(w instanceof m)&&(w=new m(w));let C=w??await g(o,{progress_callback:x,config:w,cache_dir:k,local_files_only:G,revision:b});return new this(C)}}
/** Exported as `AutoConfig`; `from_pretrained` forwards all arguments to `m.from_pretrained`. */
class T{static async from_pretrained(...o){return m.from_pretrained(...o)}}}),"./src/env.js":((D,a,e)=>{e.r(a),e.d(a,{apis:()=>C,env:()=>h});var i=e("node:fs"),d=e("node:path"),g=e("node:url");
/*
 * Environment probes: `f` window with document, `u` worker global scope (matched by constructor name),
 * `m` `caches` present on self, `T` `gpu` on navigator, `_` `ml` on navigator, `o` process defined,
 * `x` process release name is "node", `w` / `k` the fs / path modules are non-empty objects,
 * `G` Deno global, `b` Bun global. `C` is the frozen object exported as `apis`.
 */
let I="3.8.1",f=typeof window<"u"&&typeof window.document<"u",u=typeof self<"u"&&["DedicatedWorkerGlobalScope","ServiceWorkerGlobalScope","SharedWorkerGlobalScope"].includes(self.constructor?.name),m=typeof self<"u"&&"caches"in self,T=typeof navigator<"u"&&"gpu"in navigator,_=typeof navigator<"u"&&"ml"in navigator,o=typeof process<"u",x=o&&process?.release?.name==="node",w=!F(i.default),k=!F(d.default),G=typeof globalThis.Deno<"u",b=typeof globalThis.Bun<"u",C=Object.freeze({IS_BROWSER_ENV:f,IS_WEBWORKER_ENV:u,IS_WEB_CACHE_AVAILABLE:m,IS_WEBGPU_AVAILABLE:T,IS_WEBNN_AVAILABLE:_,IS_PROCESS_AVAILABLE:o,IS_NODE_ENV:x,IS_FS_AVAILABLE:w,IS_PATH_AVAILABLE:k}),B=w&&k,P="./";
/*
 * With fs and path available, derive the base directory `P`: two directory levels above the file URL
 * found in `Object(iS).url` when present, otherwise the parent of `__dirname` when that is defined.
 * NOTE(review): `iS` is defined outside this excerpt; presumably the bundler's stand-in for import.meta - confirm.
 */
if(B){let S=Object(iS).url;S?P=d.default.dirname(d.default.dirname(g.default.fileURLToPath(S))):typeof __dirname<"u"&&(P=d.default.dirname(__dirname))}let 
M=B?d.default.join(P,"/.cache/"):null,y="/models/",l=B?d.default.join(P,y):y,
/*
 * `h` is the object exported as `env`: library version, backend settings, remote host and path
 * template, local model path, and cache switches derived from the probes above.
 * Local models are allowed unless running in a browser window or worker.
 */
h={version:I,backends:{onnx:{}},allowRemoteModels:!0,remoteHost:"https://huggingface.co/",remotePathTemplate:"{model}/resolve/{revision}/",allowLocalModels:!(f||u),localModelPath:l,useFS:w,useBrowserCache:m&&!G,useFSCache:w,cacheDir:M,useCustomCache:!1,customCache:null};
/** Returns true when `S` has no own enumerable string keys. */
function F(S){return Object.keys(S).length===0}}),"./src/generation/configuration_utils.js":((D,a,e)=>{e.r(a),e.d(a,{GenerationConfig:()=>d});var i=e("./src/utils/core.js");
/**
 * Exported as `GenerationConfig`. The class fields are the default generation parameters.
 * The constructor copies from `I` only the properties whose names already exist as own properties
 * of the instance (selected with `pick` and `Object.getOwnPropertyNames(this)`).
 */
class d{max_length=20;max_new_tokens=null;min_length=0;min_new_tokens=null;early_stopping=!1;max_time=null;do_sample=!1;num_beams=1;num_beam_groups=1;penalty_alpha=null;use_cache=!0;temperature=1;top_k=50;top_p=1;typical_p=1;epsilon_cutoff=0;eta_cutoff=0;diversity_penalty=0;repetition_penalty=1;encoder_repetition_penalty=1;length_penalty=1;no_repeat_ngram_size=0;bad_words_ids=null;force_words_ids=null;renormalize_logits=!1;constraints=null;forced_bos_token_id=null;forced_eos_token_id=null;remove_invalid_values=!1;exponential_decay_length_penalty=null;suppress_tokens=null;streamer=null;begin_suppress_tokens=null;forced_decoder_ids=null;guidance_scale=null;num_return_sequences=1;output_attentions=!1;output_hidden_states=!1;output_scores=!1;return_dict_in_generate=!1;pad_token_id=null;bos_token_id=null;eos_token_id=null;encoder_no_repeat_ngram_size=0;decoder_start_token_id=null;generation_kwargs={};constructor(I){Object.assign(this,(0,i.pick)(I,Object.getOwnPropertyNames(this)))}}}),"./src/generation/logits_process.js":((D,a,e)=>{e.r(a),e.d(a,{ClassifierFreeGuidanceLogitsProcessor:()=>C,ForcedBOSTokenLogitsProcessor:()=>m,ForcedEOSTokenLogitsProcessor:()=>T,LogitsProcessor:()=>I,LogitsProcessorList:()=>u,LogitsWarper:()=>f,MinLengthLogitsProcessor:()=>k,MinNewTokensLengthLogitsProcessor:()=>G,NoBadWordsLogitsProcessor:()=>b,NoRepeatNGramLogitsProcessor:()=>x,RepetitionPenaltyLogitsProcessor:()=>w,SuppressTokensAtBeginLogitsProcessor:()=>_,TemperatureLogitsWa
rper:()=>B,TopKLogitsWarper:()=>M,TopPLogitsWarper:()=>P,WhisperTimeStampLogitsProcessor:()=>o});var i=e("./src/utils/generic.js"),d=e("./src/utils/tensor.js"),g=e("./src/utils/maths.js");
/** Exported as `LogitsProcessor`: base class whose `_call(l, h)` throws until a subclass overrides it. */
class I extends i.Callable{_call(l,h){throw Error("`_call` should be implemented in a subclass")}}
/** Exported as `LogitsWarper`: base class whose `_call(l, h)` throws until a subclass overrides it. */
class f extends i.Callable{_call(l,h){throw Error("`_call` should be implemented in a subclass")}}
/**
 * Exported as `LogitsProcessorList`: an ordered, iterable list of processors.
 * `_call(l, h)` feeds `h` through every processor in insertion order, passing `l` unchanged each time,
 * and returns the final value.
 */
class u extends i.Callable{constructor(){super(),this.processors=[]}push(l){this.processors.push(l)}extend(l){this.processors.push(...l)}_call(l,h){let F=h;for(let S of this.processors)F=S(l,F);return F}[Symbol.iterator](){return this.processors.values()}}
/** Exported as `ForcedBOSTokenLogitsProcessor`: for sequences of length 1, sets every score to -Infinity except `bos_token_id`, which becomes 0. */
class m extends I{constructor(l){super(),this.bos_token_id=l}_call(l,h){for(let F=0;F<l.length;++F)if(l[F].length===1){let S=h[F].data;S.fill(-1/0),S[this.bos_token_id]=0}return h}}
/** Exported as `ForcedEOSTokenLogitsProcessor`: for sequences of length `max_length - 1`, sets every score to -Infinity except the EOS id(s), which become 0. */
class T extends I{constructor(l,h){super(),this.max_length=l,this.eos_token_id=Array.isArray(h)?h:[h]}_call(l,h){for(let F=0;F<l.length;++F)if(l[F].length===this.max_length-1){let S=h[F].data;S.fill(-1/0);for(let V of this.eos_token_id)S[V]=0}return h}}
/** Exported as `SuppressTokensAtBeginLogitsProcessor`: for sequences whose length equals `begin_index`, sets the scores of `begin_suppress_tokens` to -Infinity. */
class _ extends I{constructor(l,h){super(),this.begin_suppress_tokens=l,this.begin_index=h}_call(l,h){for(let F=0;F<l.length;++F)if(l[F].length===this.begin_index){let S=h[F].data;for(let V of this.begin_suppress_tokens)S[V]=-1/0}return h}}
/**
 * Exported as `WhisperTimeStampLogitsProcessor`.
 * Constructor: takes the first EOS id when an array is given, sets `timestamp_begin` to
 * `no_timestamps_token_id + 1`, and sets `begin_index` to the length of `h`, reduced by one when
 * `h` ends with the no-timestamps token.
 * `_call` always masks the no-timestamps token; for a sequence of length `begin_index - 1` it forces
 * the `timestamp_begin` token and moves on to the next sequence.
 */
class o extends I{constructor(l,h){super(),this.eos_token_id=Array.isArray(l.eos_token_id)?l.eos_token_id[0]:l.eos_token_id,this.no_timestamps_token_id=l.no_timestamps_token_id,this.timestamp_begin=this.no_timestamps_token_id+1,this.begin_index=h.length,h.at(-1)===this.no_timestamps_token_id&&(this.begin_index-=1),this.max_initial_timestamp_index=l.max_initial_timestamp_index}_call(l,h){for(let F=0;F<l.length;++F){let S=h[F].data;if(S[this.no_timestamps_token_id]=-1/0,l[F].length===this.begin_index-1){S.fill(-1/0),S[this.timestamp_begin]=0;continue}let 
V=l[F].slice(this.begin_index),R=V.length>=1&&V[V.length-1]>=this.timestamp_begin,N=V.length<2||V[V.length-2]>=this.timestamp_begin;if(R&&(N?S.subarray(this.timestamp_begin).fill(-1/0):S.subarray(0,this.eos_token_id).fill(-1/0)),l[F].length===this.begin_index&&this.max_initial_timestamp_index!==null){let te=this.timestamp_begin+this.max_initial_timestamp_index;S.subarray(te+1).fill(-1/0)}let Q=(0,g.log_softmax)(S),K=Math.log(Q.subarray(this.timestamp_begin).map(Math.exp).reduce((te,se)=>te+se)),J=(0,g.max)(Q.subarray(0,this.timestamp_begin))[0];K>J&&S.subarray(0,this.timestamp_begin).fill(-1/0)}return h}}class x extends I{constructor(l){super(),this.no_repeat_ngram_size=l}getNgrams(l){let h=l.length,F=[];for(let V=0;V<h+1-this.no_repeat_ngram_size;++V){let R=[];for(let N=0;N<this.no_repeat_ngram_size;++N)R.push(l[V+N]);F.push(R.map(Number))}let S=new Map;for(let V of F){let R=V.slice(0,V.length-1),N=JSON.stringify(R),Q=S.get(N)??[];Q.push(V[V.length-1]),S.set(N,Q)}return S}getGeneratedNgrams(l,h){let F=h.slice(h.length+1-this.no_repeat_ngram_size,h.length);return l.get(JSON.stringify(F.map(Number)))??[]}calcBannedNgramTokens(l){let h=[];if(l.length+1<this.no_repeat_ngram_size)return h;{let F=this.getNgrams(l);return this.getGeneratedNgrams(F,l)}}_call(l,h){for(let F=0;F<l.length;++F){let S=h[F].data,V=this.calcBannedNgramTokens(l[F]);for(let R of V)S[R]=-1/0}return h}}class w extends I{constructor(l){super(),this.penalty=l}_call(l,h){for(let F=0;F<l.length;++F){let S=h[F].data;for(let V of new Set(l[F])){let R=Number(V);S[R]<0?S[R]*=this.penalty:S[R]/=this.penalty}}return h}}class k extends I{constructor(l,h){super(),this.min_length=l,this.eos_token_id=Array.isArray(h)?h:[h]}_call(l,h){for(let F=0;F<l.length;++F)if(l[F].length<this.min_length){let S=h[F].data;for(let V of this.eos_token_id)S[V]=-1/0}return h}}class G extends I{constructor(l,h,F){super(),this.prompt_length_to_skip=l,this.min_new_tokens=h,this.eos_token_id=Array.isArray(F)?F:[F]}_call(l,h){for(let 
F=0;F<l.length;++F)if(l[F].length-this.prompt_length_to_skip<this.min_new_tokens){let V=h[F].data;for(let R of this.eos_token_id)V[R]=-1/0}return h}}class b extends I{constructor(l,h){super(),this.bad_words_ids=l,this.eos_token_id=Array.isArray(h)?h:[h]}_call(l,h){for(let F=0;F<l.length;++F){let S=h[F].data,V=l[F];for(let R of this.bad_words_ids){if(V.length<R.length-1)continue;let N=!0;for(let Q=1;Q<=R.length-1;++Q)if(R.at(-Q-1)!=V.at(-Q)){N=!1;break}N&&(S[R.at(-1)]=-1/0)}}return h}}class C extends I{constructor(l){if(super(),l<=1)throw new Error(`Require guidance scale >1 to use the classifier free guidance processor, got guidance scale ${l}.`);this.guidance_scale=l}_call(l,h){if(h.dims[0]!==2*l.length)throw new Error(`Logits should have twice the batch size of the input ids, the first half of batches corresponding to the conditional inputs, and the second half of batches corresponding to the unconditional inputs. Got batch size ${h.dims[0]} for the logits and ${l.length} for the input ids.`);let F=l.length,S=h.slice([0,F],null),V=h.slice([F,h.dims[0]],null);for(let R=0;R<V.data.length;++R)V.data[R]+=(S.data[R]-V.data[R])*this.guidance_scale;return V}}class B extends f{constructor(l){if(super(),typeof l!="number"||l<=0){let h=`\`temperature\` (=${l}) must be a strictly positive float, otherwise your next token scores will be invalid.`;l===0&&(h+=" If you're looking for greedy decoding strategies, set `do_sample=false`.")}this.temperature=l}_call(l,h){let F=h.data;for(let S=0;S<F.length;++S)F[S]/=this.temperature;return h}}class P extends f{constructor(l,{filter_value:h=-1/0,min_tokens_to_keep:F=1}={}){if(super(),l<0||l>1)throw new Error(`\`top_p\` must be a float > 0 and < 1, but is ${l}`);if(!Number.isInteger(F)||F<1)throw new Error(`\`min_tokens_to_keep\` must be a positive integer, but is ${F}`);this.top_p=l,this.filter_value=h,this.min_tokens_to_keep=F}}class M extends 
f{constructor(l,{filter_value:h=-1/0,min_tokens_to_keep:F=1}={}){if(super(),!Number.isInteger(l)||l<0)throw new Error(`\`top_k\` must be a positive integer, but is ${l}`);this.top_k=Math.max(l,F),this.filter_value=h}}}),"./src/generation/logits_sampler.js":((D,a,e)=>{e.r(a),e.d(a,{LogitsSampler:()=>f});var i=e("./src/utils/generic.js"),d=e("./src/utils/tensor.js"),g=e("./src/utils/maths.js"),I=e("./src/generation/configuration_utils.js");
/**
 * Exported as `LogitsSampler`: base class that keeps the generation config; calling an instance
 * runs `sample`, which subclasses must implement.
 * `getLogits(o, x)` returns the slice of `o.data` for row `x` (the last row for -1), with the row
 * length taken from the last dimension.
 * `randomSelect(o)` draws an index with probability proportional to the weights in `o`, returning 0
 * when the running subtraction never reaches zero.
 * `getSampler(o)` picks the sampler: `m` when `do_sample` is set, `T` when `num_beams > 1`, else `u`;
 * it throws when more than one return sequence is requested for the last case.
 */
class f extends i.Callable{constructor(o){super(),this.generation_config=o}async _call(o){return this.sample(o)}async sample(o){throw Error("sample should be implemented in subclasses.")}getLogits(o,x){let w=o.dims.at(-1),k=o.data;if(x===-1)k=k.slice(-w);else{let G=x*w;k=k.slice(G,G+w)}return k}randomSelect(o){let x=0;for(let k=0;k<o.length;++k)x+=o[k];let w=Math.random()*x;for(let k=0;k<o.length;++k)if(w-=o[k],w<=0)return k;return 0}static getSampler(o){if(o.do_sample)return new m(o);if(o.num_beams>1)return new T(o);if(o.num_return_sequences>1)throw Error(`num_return_sequences has to be 1 when doing greedy search, but is ${o.num_return_sequences}.`);return new u(o)}}
/** Sampler returned by `getSampler` as the default: yields the arg-max index as a BigInt paired with a score of 0. */
class u extends f{async sample(o){let x=(0,g.max)(o.data)[1];return[[BigInt(x),0]]}}
/**
 * Sampler used when `do_sample` is set: keeps the top `top_k` entries (all entries when `top_k` is
 * not positive), applies softmax to them and draws `num_beams` random picks, each returned as
 * `[token id, log probability]`.
 */
class m extends f{async sample(o){let x=o.dims.at(-1);this.generation_config.top_k>0&&(x=Math.min(this.generation_config.top_k,x));let[w,k]=await(0,d.topk)(o,x),G=(0,g.softmax)(w.data);return Array.from({length:this.generation_config.num_beams},()=>{let b=this.randomSelect(G);return[k.data[b],Math.log(G[b])]})}}
/**
 * Sampler used when `num_beams > 1` without sampling: same top-k and softmax step, but returns the
 * first `num_beams` entries of the top-k result instead of drawing at random.
 */
class T extends f{async sample(o){let x=o.dims.at(-1);this.generation_config.top_k>0&&(x=Math.min(this.generation_config.top_k,x));let[w,k]=await(0,d.topk)(o,x),G=(0,g.softmax)(w.data);return 
Array.from({length:this.generation_config.num_beams},(b,C)=>[k.data[C],Math.log(G[C])])}}}),"./src/generation/stopping_criteria.js":((D,a,e)=>{e.r(a),e.d(a,{EosTokenCriteria:()=>f,InterruptableStoppingCriteria:()=>u,MaxLengthCriteria:()=>I,StoppingCriteria:()=>d,StoppingCriteriaList:()=>g});var i=e("./src/utils/generic.js");
/** Exported as `StoppingCriteria`: base class whose `_call` throws until subclassed. */
class d extends i.Callable{_call(T,_){throw Error("StoppingCriteria needs to be subclassed")}}
/**
 * Exported as `StoppingCriteriaList`: an iterable list of criteria.
 * `extend` accepts another list, a single criterion or an iterable of criteria.
 * `_call(T, _)` returns one boolean per entry of `T`, true as soon as any criterion reports a truthy value for it.
 */
class g extends i.Callable{constructor(){super(),this.criteria=[]}push(T){this.criteria.push(T)}extend(T){T instanceof g?T=T.criteria:T instanceof d&&(T=[T]),this.criteria.push(...T)}_call(T,_){let o=new Array(T.length).fill(!1);for(let x of this.criteria){let w=x(T,_);for(let k=0;k<o.length;++k)o[k]||=w[k]}return o}[Symbol.iterator](){return this.criteria.values()}}
/** Exported as `MaxLengthCriteria`: reports true for every sequence whose length has reached `max_length`. `max_position_embeddings` is stored but not read here. */
class I extends d{constructor(T,_=null){super(),this.max_length=T,this.max_position_embeddings=_}_call(T){return T.map(_=>_.length>=this.max_length)}}
/** Exported as `EosTokenCriteria`: reports true for every sequence whose last token loosely equals one of the EOS ids (a single id is wrapped in an array). */
class f extends d{constructor(T){super(),Array.isArray(T)||(T=[T]),this.eos_token_id=T}_call(T,_){return T.map(o=>{let x=o.at(-1);return this.eos_token_id.some(w=>x==w)})}}
/** Exported as `InterruptableStoppingCriteria`: reports the current `interrupted` flag for every sequence; `interrupt()` sets the flag and `reset()` clears it. */
class u extends d{constructor(){super(),this.interrupted=!1}interrupt(){this.interrupted=!0}reset(){this.interrupted=!1}_call(T,_){return new Array(T.length).fill(this.interrupted)}}}),"./src/generation/streamers.js":((D,a,e)=>{e.r(a),e.d(a,{BaseStreamer:()=>I,TextStreamer:()=>u,WhisperTextStreamer:()=>m});var i=e("./src/utils/core.js"),d=e("./src/tokenizers.js"),g=e("./src/env.js");
/** Exported as `BaseStreamer`: `put` and `end` throw until implemented by a subclass. */
class I{put(_){throw Error("Not implemented")}end(){throw Error("Not implemented")}}
/* Default text sink: `process.stdout.write` when a process object is available, otherwise `console.log`. */
let f=g.apis.IS_PROCESS_AVAILABLE?T=>process.stdout.write(T):T=>console.log(T);class u extends 
I{constructor(_,{skip_prompt:o=!1,callback_function:x=null,token_callback_function:w=null,skip_special_tokens:k=!0,decode_kwargs:G={},...b}={}){super(),this.tokenizer=_,this.skip_prompt=o,this.callback_function=x??f,this.token_callback_function=w,this.decode_kwargs={skip_special_tokens:k,...G,...b},this.token_cache=[],this.print_len=0,this.next_tokens_are_prompt=!0}put(_){if(_.length>1)throw Error("TextStreamer only supports batch size of 1");let o=this.next_tokens_are_prompt;if(o&&(this.next_tokens_are_prompt=!1,this.skip_prompt))return;let x=_[0];this.token_callback_function?.(x),this.token_cache=(0,i.mergeArrays)(this.token_cache,x);let w=this.tokenizer.decode(this.token_cache,this.decode_kwargs),k;o||w.endsWith(`
|
|
10
|
+
`)?(k=w.slice(this.print_len),this.token_cache=[],this.print_len=0):w.length>0&&(0,d.is_chinese_char)(w.charCodeAt(w.length-1))?(k=w.slice(this.print_len),this.print_len+=k.length):(k=w.slice(this.print_len,w.lastIndexOf(" ")+1),this.print_len+=k.length),this.on_finalized_text(k,!1)}end(){let _;this.token_cache.length>0?(_=this.tokenizer.decode(this.token_cache,this.decode_kwargs).slice(this.print_len),this.token_cache=[],this.print_len=0):_="",this.next_tokens_are_prompt=!0,this.on_finalized_text(_,!0)}on_finalized_text(_,o){_.length>0&&this.callback_function?.(_),o&&this.callback_function===f&&g.apis.IS_PROCESS_AVAILABLE&&this.callback_function?.(`
|
|
11
|
+
`)}}class m extends u{constructor(_,{skip_prompt:o=!1,callback_function:x=null,token_callback_function:w=null,on_chunk_start:k=null,on_chunk_end:G=null,on_finalize:b=null,time_precision:C=.02,skip_special_tokens:B=!0,decode_kwargs:P={}}={}){super(_,{skip_prompt:o,skip_special_tokens:B,callback_function:x,token_callback_function:w,decode_kwargs:P}),this.timestamp_begin=_.timestamp_begin,this.on_chunk_start=k,this.on_chunk_end=G,this.on_finalize=b,this.time_precision=C,this.waiting_for_timestamp=!1}put(_){if(_.length>1)throw Error("WhisperTextStreamer only supports batch size of 1");let o=_[0];if(o.length===1){let x=Number(o[0])-this.timestamp_begin;if(x>=0){let w=x*this.time_precision;this.waiting_for_timestamp?this.on_chunk_end?.(w):this.on_chunk_start?.(w),this.waiting_for_timestamp=!this.waiting_for_timestamp,this.token_callback_function?.(o);return}}return super.put(_)}end(){super.end(),this.on_finalize?.()}}}),"./src/models.js":((D,a,e)=>{e.r(a),e.d(a,{ASTForAudioClassification:()=>fn,ASTModel:()=>Mn,ASTPreTrainedModel:()=>$r,AlbertForMaskedLM:()=>Ie,AlbertForQuestionAnswering:()=>ze,AlbertForSequenceClassification:()=>Ve,AlbertModel:()=>Ne,AlbertPreTrainedModel:()=>Pe,ArceeForCausalLM:()=>di,ArceeModel:()=>_i,ArceePreTrainedModel:()=>po,AutoModel:()=>hp,AutoModelForAudioClassification:()=>Ip,AutoModelForAudioFrameClassification:()=>Bp,AutoModelForAudioTextToText:()=>$p,AutoModelForCTC:()=>Dp,AutoModelForCausalLM:()=>bp,AutoModelForDepthEstimation:()=>Vp,AutoModelForDocumentQuestionAnswering:()=>jp,AutoModelForImageClassification:()=>Fp,AutoModelForImageFeatureExtraction:()=>Wp,AutoModelForImageMatting:()=>Np,AutoModelForImageSegmentation:()=>Cp,AutoModelForImageTextToText:()=>Up,AutoModelForImageToImage:()=>Rp,AutoModelForMaskGeneration:()=>Lp,AutoModelForMaskedLM:()=>xp,AutoModelForNormalEstimation:()=>zp,AutoModelForObjectDetection:()=>Sp,AutoModelForPoseEstimation:()=>Gp,AutoModelForQuestionAnswering:()=>vp,AutoModelForSemanticSegmentation:()=>kp,AutoModelFo
rSeq2SeqLM:()=>gp,AutoModelForSequenceClassification:()=>Mp,AutoModelForSpeechSeq2Seq:()=>Pp,AutoModelForTextToSpectrogram:()=>Tp,AutoModelForTextToWaveform:()=>wp,AutoModelForTokenClassification:()=>fp,AutoModelForUniversalSegmentation:()=>yp,AutoModelForVision2Seq:()=>Ep,AutoModelForXVector:()=>Op,AutoModelForZeroShotObjectDetection:()=>Ap,BartForConditionalGeneration:()=>vt,BartForSequenceClassification:()=>Ut,BartModel:()=>Cs,BartPretrainedModel:()=>Xt,BaseModelOutput:()=>de,BeitForImageClassification:()=>Dl,BeitModel:()=>Ll,BeitPreTrainedModel:()=>Ko,BertForMaskedLM:()=>me,BertForQuestionAnswering:()=>le,BertForSequenceClassification:()=>ne,BertForTokenClassification:()=>fe,BertModel:()=>Te,BertPreTrainedModel:()=>pe,BlenderbotForConditionalGeneration:()=>Dt,BlenderbotModel:()=>At,BlenderbotPreTrainedModel:()=>zt,BlenderbotSmallForConditionalGeneration:()=>Zs,BlenderbotSmallModel:()=>as,BlenderbotSmallPreTrainedModel:()=>Lt,BloomForCausalLM:()=>tl,BloomModel:()=>el,BloomPreTrainedModel:()=>Io,CLIPModel:()=>An,CLIPPreTrainedModel:()=>Gs,CLIPSegForImageSegmentation:()=>Wn,CLIPSegModel:()=>Gn,CLIPSegPreTrainedModel:()=>so,CLIPTextModel:()=>ep,CLIPTextModelWithProjection:()=>Ln,CLIPVisionModel:()=>tp,CLIPVisionModelWithProjection:()=>Dn,CamembertForMaskedLM:()=>Z,CamembertForQuestionAnswering:()=>Je,CamembertForSequenceClassification:()=>ue,CamembertForTokenClassification:()=>Ge,CamembertModel:()=>z,CamembertPreTrainedModel:()=>O,CausalLMOutput:()=>Ss,CausalLMOutputWithPast:()=>Qp,ChineseCLIPModel:()=>Nn,ChineseCLIPPreTrainedModel:()=>jn,ClapAudioModelWithProjection:()=>J_,ClapModel:()=>X_,ClapPreTrainedModel:()=>Er,ClapTextModelWithProjection:()=>H_,CodeGenForCausalLM:()=>ri,CodeGenModel:()=>si,CodeGenPreTrainedModel:()=>co,CohereForCausalLM:()=>Di,CohereModel:()=>Li,CoherePreTrainedModel:()=>vo,ConvBertForMaskedLM:()=>Ze,ConvBertForQuestionAnswering:()=>Is,ConvBertForSequenceClassification:()=>Ls,ConvBertForTokenClassification:()=>Ds,ConvBertModel:()=>qs,ConvBert
PreTrainedModel:()=>us,ConvNextForImageClassification:()=>Cc,ConvNextModel:()=>Fc,ConvNextPreTrainedModel:()=>ia,ConvNextV2ForImageClassification:()=>yc,ConvNextV2Model:()=>kc,ConvNextV2PreTrainedModel:()=>la,DFineForObjectDetection:()=>Kl,DFineModel:()=>$l,DFinePreTrainedModel:()=>qo,DINOv3ConvNextModel:()=>jc,DINOv3ConvNextPreTrainedModel:()=>Bc,DINOv3ViTModel:()=>Oc,DINOv3ViTPreTrainedModel:()=>Ic,DPTForDepthEstimation:()=>lc,DPTModel:()=>ic,DPTPreTrainedModel:()=>oa,DacDecoderModel:()=>Nd,DacDecoderOutput:()=>Od,DacEncoderModel:()=>jd,DacEncoderOutput:()=>Id,DacModel:()=>Bd,DacPreTrainedModel:()=>Lr,DebertaForMaskedLM:()=>We,DebertaForQuestionAnswering:()=>Kt,DebertaForSequenceClassification:()=>it,DebertaForTokenClassification:()=>gt,DebertaModel:()=>st,DebertaPreTrainedModel:()=>Oe,DebertaV2ForMaskedLM:()=>Qt,DebertaV2ForQuestionAnswering:()=>ws,DebertaV2ForSequenceClassification:()=>Ps,DebertaV2ForTokenClassification:()=>Ts,DebertaV2Model:()=>ss,DebertaV2PreTrainedModel:()=>Nt,DecisionTransformerModel:()=>fd,DecisionTransformerPreTrainedModel:()=>Md,DeiTForImageClassification:()=>Yl,DeiTModel:()=>Jl,DeiTPreTrainedModel:()=>ea,DepthAnythingForDepthEstimation:()=>_c,DepthAnythingPreTrainedModel:()=>cc,DepthProForDepthEstimation:()=>hc,DepthProPreTrainedModel:()=>mc,DetrForObjectDetection:()=>Ol,DetrForSegmentation:()=>Qo,DetrModel:()=>Il,DetrObjectDetectionOutput:()=>Xo,DetrPreTrainedModel:()=>gr,DetrSegmentationOutput:()=>Bl,Dinov2ForImageClassification:()=>Ac,Dinov2Model:()=>Sc,Dinov2PreTrainedModel:()=>ca,Dinov2WithRegistersForImageClassification:()=>Dc,Dinov2WithRegistersModel:()=>Lc,Dinov2WithRegistersPreTrainedModel:()=>_a,DistilBertForMaskedLM:()=>ps,DistilBertForQuestionAnswering:()=>ls,DistilBertForSequenceClassification:()=>bs,DistilBertForTokenClassification:()=>js,DistilBertModel:()=>Bs,DistilBertPreTrainedModel:()=>os,DonutSwinModel:()=>Ec,DonutSwinPreTrainedModel:()=>vc,EdgeTamModel:()=>Xc,EfficientNetForImageClassification:()=>rd,EfficientNetMode
l:()=>sd,EfficientNetPreTrainedModel:()=>va,ElectraForMaskedLM:()=>Os,ElectraForQuestionAnswering:()=>v,ElectraForSequenceClassification:()=>n,ElectraForTokenClassification:()=>j,ElectraModel:()=>lt,ElectraPreTrainedModel:()=>is,Ernie4_5ForCausalLM:()=>W_,Ernie4_5Model:()=>G_,Ernie4_5PreTrainedModel:()=>Pa,EsmForMaskedLM:()=>xs,EsmForSequenceClassification:()=>vs,EsmForTokenClassification:()=>Es,EsmModel:()=>Ns,EsmPreTrainedModel:()=>ms,ExaoneForCausalLM:()=>wi,ExaoneModel:()=>Ti,ExaonePreTrainedModel:()=>go,FalconForCausalLM:()=>Q_,FalconModel:()=>K_,FalconPreTrainedModel:()=>wa,FastViTForImageClassification:()=>wl,FastViTModel:()=>Tl,FastViTPreTrainedModel:()=>zo,Florence2ForConditionalGeneration:()=>vn,Florence2PreTrainedModel:()=>xn,GLPNForDepthEstimation:()=>xc,GLPNModel:()=>bc,GLPNPreTrainedModel:()=>na,GPT2LMHeadModel:()=>$n,GPT2Model:()=>Un,GPT2PreTrainedModel:()=>ro,GPTBigCodeForCausalLM:()=>ti,GPTBigCodeModel:()=>ei,GPTBigCodePreTrainedModel:()=>lo,GPTJForCausalLM:()=>Zn,GPTJModel:()=>qn,GPTJPreTrainedModel:()=>io,GPTNeoForCausalLM:()=>Hn,GPTNeoModel:()=>Xn,GPTNeoPreTrainedModel:()=>ao,GPTNeoXForCausalLM:()=>Yn,GPTNeoXModel:()=>Jn,GPTNeoXPreTrainedModel:()=>no,Gemma2ForCausalLM:()=>ji,Gemma2Model:()=>Bi,Gemma2PreTrainedModel:()=>Fo,Gemma3ForCausalLM:()=>zi,Gemma3Model:()=>Vi,Gemma3PreTrainedModel:()=>ko,Gemma3nForConditionalGeneration:()=>qr,Gemma3nPreTrainedModel:()=>kn,GemmaForCausalLM:()=>Oi,GemmaModel:()=>Ii,GemmaPreTrainedModel:()=>Eo,GlmForCausalLM:()=>Pi,GlmModel:()=>gi,GlmPreTrainedModel:()=>fo,GraniteForCausalLM:()=>yi,GraniteModel:()=>ki,GraniteMoeHybridForCausalLM:()=>Ai,GraniteMoeHybridModel:()=>Si,GraniteMoeHybridPreTrainedModel:()=>xo,GranitePreTrainedModel:()=>bo,GroundingDinoForObjectDetection:()=>Rc,GroundingDinoPreTrainedModel:()=>Nc,GroupViTModel:()=>Pl,GroupViTPreTrainedModel:()=>gl,HeliumForCausalLM:()=>fi,HeliumModel:()=>Mi,HeliumPreTrainedModel:()=>Mo,HieraForImageClassification:()=>Zl,HieraModel:()=>ql,HieraPreTrainedModel:()=>ta,Hu
bertForCTC:()=>w_,HubertForSequenceClassification:()=>b_,HubertModel:()=>T_,HubertPreTrainedModel:()=>sp,IJepaForImageClassification:()=>cl,IJepaModel:()=>ll,IJepaPreTrainedModel:()=>No,Idefics3ForConditionalGeneration:()=>Mr,Idefics3PreTrainedModel:()=>yn,ImageMattingOutput:()=>hu,JAISLMHeadModel:()=>Qn,JAISModel:()=>Kn,JAISPreTrainedModel:()=>oo,JinaCLIPModel:()=>Rn,JinaCLIPPreTrainedModel:()=>fr,JinaCLIPTextModel:()=>Vn,JinaCLIPVisionModel:()=>zn,Lfm2ForCausalLM:()=>pi,Lfm2Model:()=>ui,Lfm2PreTrainedModel:()=>mo,LiteWhisperForConditionalGeneration:()=>Pn,Llama4ForCausalLM:()=>ii,Llama4PreTrainedModel:()=>ni,LlamaForCausalLM:()=>ai,LlamaModel:()=>oi,LlamaPreTrainedModel:()=>_o,LlavaForConditionalGeneration:()=>hr,LlavaOnevisionForConditionalGeneration:()=>wn,LlavaPreTrainedModel:()=>Jr,LlavaQwen2ForCausalLM:()=>Yr,LongT5ForConditionalGeneration:()=>Zt,LongT5Model:()=>yt,LongT5PreTrainedModel:()=>Rt,M2M100ForConditionalGeneration:()=>Zc,M2M100Model:()=>qc,M2M100PreTrainedModel:()=>pa,MBartForCausalLM:()=>fs,MBartForConditionalGeneration:()=>gs,MBartForSequenceClassification:()=>es,MBartModel:()=>Ms,MBartPreTrainedModel:()=>Ht,MPNetForMaskedLM:()=>Fs,MPNetForQuestionAnswering:()=>ee,MPNetForSequenceClassification:()=>Vs,MPNetForTokenClassification:()=>mr,MPNetModel:()=>Rs,MPNetPreTrainedModel:()=>Tt,MT5ForConditionalGeneration:()=>zs,MT5Model:()=>cs,MT5PreTrainedModel:()=>Vt,MarianMTModel:()=>Yc,MarianModel:()=>Jc,MarianPreTrainedModel:()=>ua,MaskFormerForInstanceSegmentation:()=>wc,MaskFormerModel:()=>Tc,MaskFormerPreTrainedModel:()=>aa,MaskedLMOutput:()=>Gt,Metric3DForDepthEstimation:()=>fc,Metric3DPreTrainedModel:()=>Mc,Metric3Dv2ForDepthEstimation:()=>Pc,Metric3Dv2PreTrainedModel:()=>gc,MgpstrForSceneTextRecognition:()=>bd,MgpstrModelOutput:()=>Td,MgpstrPreTrainedModel:()=>wd,MimiDecoderModel:()=>Dd,MimiDecoderOutput:()=>Sd,MimiEncoderModel:()=>Ld,MimiEncoderOutput:()=>yd,MimiModel:()=>Ad,MimiPreTrainedModel:()=>Ar,Ministral3ForCausalLM:()=>z_,Ministral3Model:()
=>V_,Ministral3PreTrainedModel:()=>ga,MinistralForCausalLM:()=>R_,MinistralModel:()=>N_,MinistralPreTrainedModel:()=>fa,Mistral3ForConditionalGeneration:()=>Cn,MistralForCausalLM:()=>j_,MistralModel:()=>B_,MistralPreTrainedModel:()=>Ma,MobileBertForMaskedLM:()=>Fe,MobileBertForQuestionAnswering:()=>Ke,MobileBertForSequenceClassification:()=>Se,MobileBertModel:()=>rs,MobileBertPreTrainedModel:()=>hs,MobileLLMForCausalLM:()=>xi,MobileLLMModel:()=>bi,MobileLLMPreTrainedModel:()=>Po,MobileNetV1ForImageClassification:()=>ad,MobileNetV1ForSemanticSegmentation:()=>nd,MobileNetV1Model:()=>od,MobileNetV1PreTrainedModel:()=>Cr,MobileNetV2ForImageClassification:()=>ld,MobileNetV2ForSemanticSegmentation:()=>cd,MobileNetV2Model:()=>id,MobileNetV2PreTrainedModel:()=>kr,MobileNetV3ForImageClassification:()=>dd,MobileNetV3ForSemanticSegmentation:()=>ud,MobileNetV3Model:()=>_d,MobileNetV3PreTrainedModel:()=>yr,MobileNetV4ForImageClassification:()=>md,MobileNetV4ForSemanticSegmentation:()=>hd,MobileNetV4Model:()=>pd,MobileNetV4PreTrainedModel:()=>Sr,MobileViTForImageClassification:()=>El,MobileViTModel:()=>vl,MobileViTPreTrainedModel:()=>Go,MobileViTV2ForImageClassification:()=>Cl,MobileViTV2Model:()=>Fl,MobileViTV2PreTrainedModel:()=>Wo,ModelOutput:()=>q,ModernBertDecoderForCausalLM:()=>Pt,ModernBertDecoderModel:()=>ut,ModernBertDecoderPreTrainedModel:()=>nt,ModernBertForMaskedLM:()=>ke,ModernBertForSequenceClassification:()=>qe,ModernBertForTokenClassification:()=>je,ModernBertModel:()=>Re,ModernBertPreTrainedModel:()=>Be,Moondream1ForConditionalGeneration:()=>bn,MoonshineForConditionalGeneration:()=>Tn,MoonshineModel:()=>Zu,MoonshinePreTrainedModel:()=>Xr,MptForCausalLM:()=>rl,MptModel:()=>sl,MptPreTrainedModel:()=>Oo,MultiModalityCausalLM:()=>Pd,MultiModalityPreTrainedModel:()=>gd,MusicgenForCausalLM:()=>np,MusicgenForConditionalGeneration:()=>Fa,MusicgenModel:()=>ap,MusicgenPreTrainedModel:()=>Ea,NanoChatForCausalLM:()=>ci,NanoChatModel:()=>li,NanoChatPreTrainedModel:()=>uo,NeoB
ertForMaskedLM:()=>ve,NeoBertForQuestionAnswering:()=>Qe,NeoBertForSequenceClassification:()=>ye,NeoBertForTokenClassification:()=>Ce,NeoBertModel:()=>De,NeoBertPreTrainedModel:()=>he,NomicBertModel:()=>ft,NomicBertPreTrainedModel:()=>jt,OPTForCausalLM:()=>al,OPTModel:()=>ol,OPTPreTrainedModel:()=>Bo,Olmo2ForCausalLM:()=>Ci,Olmo2Model:()=>Fi,Olmo2PreTrainedModel:()=>wo,OlmoForCausalLM:()=>Ei,OlmoModel:()=>vi,OlmoPreTrainedModel:()=>To,OpenELMForCausalLM:()=>Wi,OpenELMModel:()=>Gi,OpenELMPreTrainedModel:()=>yo,OwlViTForObjectDetection:()=>yl,OwlViTModel:()=>kl,OwlViTPreTrainedModel:()=>Uo,Owlv2ForObjectDetection:()=>Al,Owlv2Model:()=>Sl,Owlv2PreTrainedModel:()=>$o,PaliGemmaForConditionalGeneration:()=>Fn,PaliGemmaPreTrainedModel:()=>En,ParakeetForCTC:()=>a_,ParakeetPreTrainedModel:()=>o_,PatchTSMixerForPrediction:()=>Fd,PatchTSMixerModel:()=>Ed,PatchTSMixerPreTrainedModel:()=>ka,PatchTSTForPrediction:()=>vd,PatchTSTModel:()=>xd,PatchTSTPreTrainedModel:()=>Ca,Phi3ForCausalLM:()=>Zi,Phi3Model:()=>qi,Phi3PreTrainedModel:()=>Do,Phi3VForCausalLM:()=>eo,Phi3VPreTrainedModel:()=>Sn,PhiForCausalLM:()=>Yi,PhiModel:()=>Ji,PhiPreTrainedModel:()=>Lo,PreTrainedModel:()=>p,PretrainedMixin:()=>ht,PvtForImageClassification:()=>pl,PvtModel:()=>ul,PvtPreTrainedModel:()=>Ro,PyAnnoteForAudioFrameClassification:()=>i_,PyAnnoteModel:()=>n_,PyAnnotePreTrainedModel:()=>ma,QuestionAnsweringModelOutput:()=>Jt,Qwen2ForCausalLM:()=>$i,Qwen2Model:()=>Ui,Qwen2PreTrainedModel:()=>So,Qwen2VLForConditionalGeneration:()=>Hi,Qwen2VLPreTrainedModel:()=>Xi,Qwen3ForCausalLM:()=>Qi,Qwen3Model:()=>Ki,Qwen3PreTrainedModel:()=>Ao,RFDetrForObjectDetection:()=>Wl,RFDetrModel:()=>Gl,RFDetrObjectDetectionOutput:()=>Ul,RFDetrPreTrainedModel:()=>Yo,RTDetrForObjectDetection:()=>Nl,RTDetrModel:()=>jl,RTDetrObjectDetectionOutput:()=>lr,RTDetrPreTrainedModel:()=>Ho,RTDetrV2ForObjectDetection:()=>Vl,RTDetrV2Model:()=>Rl,RTDetrV2ObjectDetectionOutput:()=>zl,RTDetrV2PreTrainedModel:()=>Jo,ResNetForImageClassification:()=
>tc,ResNetModel:()=>ec,ResNetPreTrainedModel:()=>sa,RoFormerForMaskedLM:()=>Js,RoFormerForQuestionAnswering:()=>qt,RoFormerForSequenceClassification:()=>Ys,RoFormerForTokenClassification:()=>kt,RoFormerModel:()=>Hs,RoFormerPreTrainedModel:()=>$t,RobertaForMaskedLM:()=>tn,RobertaForQuestionAnswering:()=>on,RobertaForSequenceClassification:()=>sn,RobertaForTokenClassification:()=>rn,RobertaModel:()=>en,RobertaPreTrainedModel:()=>ks,Sam2ImageSegmentationOutput:()=>Kc,Sam2Model:()=>wr,Sam2PreTrainedModel:()=>Qc,Sam3TrackerModel:()=>Hc,SamImageSegmentationOutput:()=>$c,SamModel:()=>Uc,SamPreTrainedModel:()=>Wc,SapiensForDepthEstimation:()=>uc,SapiensForNormalEstimation:()=>pc,SapiensForSemanticSegmentation:()=>dc,SapiensPreTrainedModel:()=>Tr,SegformerForImageClassification:()=>q_,SegformerForSemanticSegmentation:()=>Z_,SegformerModel:()=>op,SegformerPreTrainedModel:()=>Fr,Seq2SeqLMOutput:()=>Kp,SequenceClassifierOutput:()=>rt,SiglipModel:()=>In,SiglipPreTrainedModel:()=>to,SiglipTextModel:()=>On,SiglipVisionModel:()=>Bn,SmolLM3ForCausalLM:()=>hi,SmolLM3Model:()=>mi,SmolLM3PreTrainedModel:()=>ho,SmolVLMForConditionalGeneration:()=>Zr,SnacDecoderModel:()=>zd,SnacEncoderModel:()=>Vd,SnacModel:()=>Rd,SnacPreTrainedModel:()=>Dr,SpeechT5ForSpeechToText:()=>S_,SpeechT5ForTextToSpeech:()=>A_,SpeechT5HifiGan:()=>L_,SpeechT5Model:()=>rp,SpeechT5PreTrainedModel:()=>vr,SqueezeBertForMaskedLM:()=>U,SqueezeBertForQuestionAnswering:()=>ie,SqueezeBertForSequenceClassification:()=>$,SqueezeBertModel:()=>A,SqueezeBertPreTrainedModel:()=>c,StableLmForCausalLM:()=>td,StableLmModel:()=>ed,StableLmPreTrainedModel:()=>xa,Starcoder2ForCausalLM:()=>$_,Starcoder2Model:()=>U_,Starcoder2PreTrainedModel:()=>Ta,StyleTextToSpeech2Model:()=>y_,StyleTextToSpeech2PreTrainedModel:()=>k_,SupertonicForConditionalGeneration:()=>ha,SupertonicPreTrainedModel:()=>D_,Swin2SRForImageSuperResolution:()=>nc,Swin2SRModel:()=>ac,Swin2SRPreTrainedModel:()=>ra,SwinForImageClassification:()=>rc,SwinForSemanticSegmentat
ion:()=>oc,SwinModel:()=>sc,SwinPreTrainedModel:()=>Pr,T5ForConditionalGeneration:()=>Ft,T5Model:()=>ot,T5PreTrainedModel:()=>_t,TableTransformerForObjectDetection:()=>Xl,TableTransformerModel:()=>Ql,TableTransformerObjectDetectionOutput:()=>Hl,TableTransformerPreTrainedModel:()=>Zo,TokenClassifierOutput:()=>It,TrOCRForCausalLM:()=>O_,TrOCRPreTrainedModel:()=>I_,UltravoxModel:()=>ya,UltravoxPreTrainedModel:()=>Cd,UniSpeechForCTC:()=>d_,UniSpeechForSequenceClassification:()=>u_,UniSpeechModel:()=>__,UniSpeechPreTrainedModel:()=>br,UniSpeechSatForAudioFrameClassification:()=>M_,UniSpeechSatForCTC:()=>m_,UniSpeechSatForSequenceClassification:()=>h_,UniSpeechSatModel:()=>p_,UniSpeechSatPreTrainedModel:()=>cr,VaultGemmaForCausalLM:()=>Ri,VaultGemmaModel:()=>Ni,VaultGemmaPreTrainedModel:()=>Co,ViTForImageClassification:()=>il,ViTMAEModel:()=>hl,ViTMAEPreTrainedModel:()=>ml,ViTMSNForImageClassification:()=>fl,ViTMSNModel:()=>Ml,ViTMSNPreTrainedModel:()=>Vo,ViTModel:()=>nl,ViTPreTrainedModel:()=>jo,VisionEncoderDecoderModel:()=>Hr,VitMatteForImageMatting:()=>xl,VitMattePreTrainedModel:()=>bl,VitPoseForPoseEstimation:()=>dl,VitPosePreTrainedModel:()=>_l,VitsModel:()=>ba,VitsModelOutput:()=>Mu,VitsPreTrainedModel:()=>Y_,VoxtralForConditionalGeneration:()=>kd,Wav2Vec2BertForCTC:()=>g_,Wav2Vec2BertForSequenceClassification:()=>P_,Wav2Vec2BertModel:()=>f_,Wav2Vec2BertPreTrainedModel:()=>xr,Wav2Vec2ForAudioFrameClassification:()=>r_,Wav2Vec2ForCTC:()=>t_,Wav2Vec2ForSequenceClassification:()=>s_,Wav2Vec2Model:()=>e_,Wav2Vec2PreTrainedModel:()=>ys,WavLMForAudioFrameClassification:()=>C_,WavLMForCTC:()=>v_,WavLMForSequenceClassification:()=>E_,WavLMForXVector:()=>F_,WavLMModel:()=>x_,WavLMPreTrainedModel:()=>sr,WeSpeakerResNetModel:()=>c_,WeSpeakerResNetPreTrainedModel:()=>l_,WhisperForConditionalGeneration:()=>Qr,WhisperModel:()=>gn,WhisperPreTrainedModel:()=>Kr,XLMForQuestionAnswering:()=>_n,XLMForSequenceClassification:()=>ln,XLMForTokenClassification:()=>cn,XLMModel:()=>an,XLMPr
/**
 * Resolve everything needed to create an inference session for one model file.
 *
 * Steps, in order: pick the device, merge per-device config overrides, pick and
 * validate the dtype, validate the KV-cache dtype, build the `.onnx` file name,
 * assemble the session options, start loading the model file, load any external
 * data chunks, and (on WebGPU) request GPU-resident outputs for cache tensors.
 *
 * Fix over the previous version: external data chunks were loaded through
 * `new Promise(async (resolve) => ...)`. When `getModelFile` rejected inside that
 * executor, the outer promise never settled, so `Promise.all` waited forever.
 * Each chunk is now loaded by a directly invoked async function, so a failed
 * download rejects this function instead of hanging it.
 *
 * @param {string} modelId Model identifier/path passed through to `getModelFile`.
 * @param {string} fileName Base name of the model file (without dtype suffix or extension).
 * @param {object} options Loading options (`config`, `device`, `dtype`, `subfolder`,
 *   `session_options`, `use_external_data_format`, ...).
 * @returns {Promise<{buffer_or_path: *, session_options: object, session_config: object}>}
 * @throws {Error} On an invalid dtype, unsupported fp16 on WebGPU, an invalid
 *   `kv_cache_dtype`, too many external data chunks, or a failed file load.
 */
async function h(modelId, fileName, options) {
  const getModelFile = u.getModelFile;

  let customConfig = options.config?.["transformers.js_config"] ?? {};

  // --- device -------------------------------------------------------------
  let requestedDevice = options.device ?? customConfig.device;
  if (requestedDevice && typeof requestedDevice !== "string") {
    // Per-file device map: look up this file, otherwise fall back to the default.
    if (requestedDevice.hasOwnProperty(fileName)) {
      requestedDevice = requestedDevice[fileName];
    } else {
      console.warn(`device not specified for "${fileName}". Using the default device.`);
      requestedDevice = null;
    }
  }
  const device = requestedDevice ?? (b.apis.IS_NODE_ENV ? "cpu" : "wasm");
  const executionProviders = (0, d.deviceToExecutionProviders)(device);

  // Per-device overrides are layered on top of the base custom config.
  const deviceConfig = customConfig.device_config ?? {};
  if (deviceConfig.hasOwnProperty(device)) {
    customConfig = { ...customConfig, ...deviceConfig[device] };
  }

  // --- dtype --------------------------------------------------------------
  let dtype = options.dtype ?? customConfig.dtype;
  if (typeof dtype !== "string") {
    if (dtype && dtype.hasOwnProperty(fileName)) {
      dtype = dtype[fileName];
    } else {
      dtype = g.DEFAULT_DEVICE_DTYPE_MAPPING[device] ?? g.DATA_TYPES.fp32;
      console.warn(`dtype not specified for "${fileName}". Using the default dtype (${dtype}) for this device (${device}).`);
    }
  }
  if (dtype === g.DATA_TYPES.auto) {
    // "auto": prefer a concrete dtype from the config, else the device default.
    let configDtype = customConfig.dtype;
    if (typeof configDtype !== "string") {
      configDtype = configDtype?.[fileName];
    }
    if (configDtype && configDtype !== g.DATA_TYPES.auto && g.DATA_TYPES.hasOwnProperty(configDtype)) {
      dtype = configDtype;
    } else {
      dtype = g.DEFAULT_DEVICE_DTYPE_MAPPING[device] ?? g.DATA_TYPES.fp32;
    }
  }

  if (!g.DEFAULT_DTYPE_SUFFIX_MAPPING.hasOwnProperty(dtype)) {
    throw new Error(`Invalid dtype: ${dtype}. Should be one of: ${Object.keys(g.DATA_TYPES).join(", ")}`);
  }
  if (dtype === g.DATA_TYPES.fp16 && device === "webgpu" && !(await (0, g.isWebGpuFp16Supported)())) {
    throw new Error(`The device (${device}) does not support fp16.`);
  }

  // --- kv cache dtype -----------------------------------------------------
  const kvCacheSetting = customConfig.kv_cache_dtype;
  let kvCacheDtype;
  if (kvCacheSetting) {
    kvCacheDtype = typeof kvCacheSetting === "string" ? kvCacheSetting : kvCacheSetting[dtype] ?? "float32";
  }
  if (kvCacheDtype && !["float32", "float16"].includes(kvCacheDtype)) {
    throw new Error(`Invalid kv_cache_dtype: ${kvCacheDtype}. Should be one of: float32, float16`);
  }

  const sessionConfig = { dtype, kv_cache_dtype: kvCacheDtype, device };

  // --- file names and session options --------------------------------------
  const suffix = g.DEFAULT_DTYPE_SUFFIX_MAPPING[dtype];
  const onnxFileName = `${fileName}${suffix}.onnx`;
  const onnxFilePath = `${options.subfolder ?? ""}/${onnxFileName}`;

  const sessionOptions = { ...options.session_options };
  sessionOptions.executionProviders ??= executionProviders;

  const freeDimensionOverrides = customConfig.free_dimension_overrides;
  if (freeDimensionOverrides) {
    sessionOptions.freeDimensionOverrides ??= freeDimensionOverrides;
  } else if (device.startsWith("webnn") && !sessionOptions.freeDimensionOverrides) {
    console.warn(`WebNN does not currently support dynamic shapes and requires 'free_dimension_overrides' to be set in config.json, preferably as a field within config["transformers.js_config"]["device_config"]["${device}"]. When 'free_dimension_overrides' is not set, you may experience significant performance degradation.`);
  }

  // --- model file (started now, awaited at the very end) --------------------
  const returnPath = b.apis.IS_NODE_ENV && b.env.useFSCache;
  const modelFilePromise = getModelFile(modelId, onnxFilePath, true, options, returnPath);

  // --- external data --------------------------------------------------------
  const externalDataFormat = options.use_external_data_format ?? customConfig.use_external_data_format;
  let externalDataPromises = [];
  if (externalDataFormat) {
    let chunkSetting;
    if (typeof externalDataFormat === "object") {
      if (externalDataFormat.hasOwnProperty(onnxFileName)) {
        chunkSetting = externalDataFormat[onnxFileName];
      } else if (externalDataFormat.hasOwnProperty(fileName)) {
        chunkSetting = externalDataFormat[fileName];
      } else {
        chunkSetting = false;
      }
    } else {
      chunkSetting = externalDataFormat;
    }

    // `true` => 1 chunk, `false` => 0 chunks, a number => that many chunks.
    const chunkCount = +chunkSetting;
    if (chunkCount > u.MAX_EXTERNAL_DATA_CHUNKS) {
      throw new Error(`The number of external data chunks (${chunkCount}) exceeds the maximum allowed value (${u.MAX_EXTERNAL_DATA_CHUNKS}).`);
    }

    for (let chunkIndex = 0; chunkIndex < chunkCount; ++chunkIndex) {
      const chunkName = `${onnxFileName}_data${chunkIndex === 0 ? "" : "_" + chunkIndex}`;
      const chunkPath = `${options.subfolder ?? ""}/${chunkName}`;
      // Invoked immediately; a rejection from getModelFile rejects this promise
      // (and therefore Promise.all below) instead of being lost.
      externalDataPromises.push(
        (async () => {
          const data = await getModelFile(modelId, chunkPath, true, options, returnPath);
          return data instanceof Uint8Array ? { path: chunkName, data } : chunkName;
        })(),
      );
    }
  } else if (sessionOptions.externalData !== undefined) {
    // Caller-supplied external data: resolve string `data` entries to file contents.
    externalDataPromises = sessionOptions.externalData.map(async (entry) => {
      if (typeof entry.data === "string") {
        const data = await getModelFile(modelId, entry.data, true, options);
        return { ...entry, data };
      }
      return entry;
    });
  }

  if (externalDataPromises.length > 0) {
    const externalData = await Promise.all(externalDataPromises);
    // Outside Node the loaded chunks are handed to the session explicitly.
    if (!b.apis.IS_NODE_ENV) {
      sessionOptions.externalData = externalData;
    }
  }

  // --- WebGPU: keep cache outputs on the GPU ---------------------------------
  if (device === "webgpu") {
    const cacheShapes = (0, i.getCacheShapes)(options.config, { prefix: "present" });
    if (Object.keys(cacheShapes).length > 0 && !(0, d.isONNXProxy)()) {
      const preferredOutputLocation = {};
      for (const key in cacheShapes) {
        preferredOutputLocation[key] = "gpu-buffer";
      }
      sessionOptions.preferredOutputLocation = preferredOutputLocation;
    }
  }

  return {
    buffer_or_path: await modelFilePromise,
    session_options: sessionOptions,
    session_config: sessionConfig,
  };
}
/**
 * Convert token ids into an int64 tensor.
 *
 * - An existing `o.Tensor` is returned unchanged.
 * - A nested array (batch of sequences) becomes a `[batch, length]` tensor; all
 *   rows must have the same length.
 * - A flat array becomes a `[1, length]` tensor.
 *
 * @param {*} s Tensor, flat array, or array of equally sized arrays.
 * @returns {*} An `o.Tensor` of type "int64".
 * @throws {Error} If `s` is empty or its rows differ in length.
 */
function Q(s) {
  if (s instanceof o.Tensor) {
    return s;
  }
  if (s.length === 0) {
    throw Error("items must be non-empty");
  }

  const isBatched = Array.isArray(s[0]);
  if (isBatched) {
    const rowsAligned = s.every((row) => row.length === s[0].length);
    if (!rowsAligned) {
      throw Error("Unable to create tensor, you should probably activate truncation and/or padding with 'padding=True' and/or 'truncation=True' to have batched tensors with the same length.");
    }
  }

  const values = isBatched ? s.flat() : s;
  const dims = isBatched ? [s.length, s[0].length] : [1, s.length];
  const data = BigInt64Array.from(values.map((value) => BigInt(value)));
  return new o.Tensor("int64", data, dims);
}
/**
 * Copy modality features (e.g. image or audio embeddings) into the embedding
 * slots whose input id equals `modality_token_id`.
 *
 * Features are consumed in order: the first matching token of the first batch
 * row receives `modality_features[0]`, the next one `modality_features[1]`, and
 * so on. The embeddings are modified in place through `.data.set(...)`.
 *
 * @param {object} args
 * @param {*} args.modality_token_id Token id marking a placeholder position
 *   (compared with `==`, so a number matches a BigInt id of equal value).
 * @param {*} args.inputs_embeds Indexable as `inputs_embeds[batch][position].data`.
 * @param {*} args.modality_features Indexable as `modality_features[k].data`, with `dims[0]` = feature count.
 * @param {*} args.input_ids Object exposing `tolist()` returning one id array per batch row.
 * @param {*} args.attention_mask Returned untouched.
 * @returns {{inputs_embeds: *, attention_mask: *}}
 * @throws {Error} If the number of placeholder tokens differs from `modality_features.dims[0]`.
 */
function we({ modality_token_id, inputs_embeds, modality_features, input_ids, attention_mask }) {
  // For every batch row, collect the positions holding the placeholder token.
  const placeholderPositions = [];
  for (const row of input_ids.tolist()) {
    const positions = [];
    row.forEach((tokenId, position) => {
      // Loose equality on purpose: ids may be BigInt while the marker is a number.
      if (tokenId == modality_token_id) {
        positions.push(position);
      }
    });
    placeholderPositions.push(positions);
  }

  let tokenCount = 0;
  for (const positions of placeholderPositions) {
    tokenCount += positions.length;
  }

  const featureCount = modality_features.dims[0];
  if (tokenCount !== featureCount) {
    throw new Error(`Number of tokens and features do not match: tokens: ${tokenCount}, features ${featureCount}`);
  }

  let nextFeature = 0;
  placeholderPositions.forEach((positions, batchIndex) => {
    const rowEmbeds = inputs_embeds[batchIndex];
    for (const position of positions) {
      rowEmbeds[position].data.set(modality_features[nextFeature++].data);
    }
  });

  return { inputs_embeds, attention_mask };
}
/**
 * Derive position ids from a 2-D attention mask.
 *
 * Each row is processed independently with a running counter that starts at
 * `r`. Where the mask value is `0n` the position is set to `1n`; otherwise the
 * position is the current counter, which is then advanced by the mask value.
 *
 * @param {{dims: number[], data: BigInt64Array}} s Mask with `dims = [rows, cols]`
 *   and BigInt values in `data`.
 * @param {number} [r=0] Starting position for every row.
 * @returns {{data: BigInt64Array, dims: number[]}} Position ids with the same `dims` as `s`.
 */
function ae(s, r = 0) {
  const [rowCount, colCount] = s.dims;
  const mask = s.data;
  const positions = new BigInt64Array(mask.length);

  for (let row = 0; row < rowCount; ++row) {
    const rowStart = row * colCount;
    const rowEnd = rowStart + colCount;
    let running = BigInt(r);

    for (let index = rowStart; index < rowEnd; ++index) {
      if (mask[index] === 0n) {
        // Masked-out slots get a fixed position of 1.
        positions[index] = BigInt(1);
      } else {
        positions[index] = running;
        running += mask[index];
      }
    }
  }

  return { data: positions, dims: s.dims };
}
/**
 * Prepare generation inputs for the MultiModality model type.
 *
 * - With `guidance_scale > 1` the batch is doubled: on later steps (a cache is
 *   present) `input_ids` is concatenated with itself; on the first step it is
 *   concatenated with a pad-token-filled copy and the attention mask is
 *   extended with zeros.
 * - When a cache is present or no `pixel_values` were given, `pixel_values` is
 *   replaced by a `[0, 0, 3, 384, 384]` tensor filled with 1.
 * - When a cache is present, `images_seq_mask` / `images_emb_mask` are set to
 *   fixed boolean tensors.
 *
 * @param {*} s Model instance (unused here).
 * @param {*} r Generated ids so far (unused here).
 * @param {object} E Model inputs; modified in place and returned.
 * @param {object} H Generation config (`guidance_scale`, `pad_token_id`).
 * @returns {object} The same `E` object.
 */
function ge(s, r, E, H) {
  const { cat, full, full_like, Tensor } = o;
  const hasPast = Boolean(E.past_key_values);
  const usesGuidance = H.guidance_scale !== null && H.guidance_scale > 1;

  if (usesGuidance) {
    if (hasPast) {
      E.input_ids = cat([E.input_ids, E.input_ids], 0);
    } else {
      const padding = full_like(E.input_ids, BigInt(H.pad_token_id));
      E.input_ids = cat([E.input_ids, padding], 0);

      const maskPadding = full_like(E.attention_mask, 0n);
      E.attention_mask = cat([E.attention_mask, maskPadding], 0);
    }
  }

  if (hasPast || !E.pixel_values) {
    E.pixel_values = full([0, 0, 3, 384, 384], 1);
  }

  if (hasPast) {
    // Single `false` entry, shape [1, 1].
    E.images_seq_mask = new Tensor("bool", [false], [1, 1]);
    // No entries, shape [1, 1, 0].
    E.images_emb_mask = new Tensor("bool", [], [1, 1, 0]);
  }

  return E;
}
P.AudioTextToText:this.can_generate=!0,this._forward=W,this._prepare_inputs_for_generation=$e;break;case P.Phi3V:case P.ImageAudioTextToText:this.can_generate=!0,this._prepare_inputs_for_generation=$e;break;case P.MultiModality:this.can_generate=!0,this._prepare_inputs_for_generation=ge;break;case P.AutoEncoder:this._forward=se;break;default:this._forward=te;break}this.can_generate&&this.forward_params.push("past_key_values"),this.custom_config=this.config["transformers.js_config"]??{}}async dispose(){let r=[];for(let E of Object.values(this.sessions))E?.handler?.dispose&&r.push(E.handler.dispose());return await Promise.all(r)}static async from_pretrained(r,{progress_callback:E=null,config:H=null,cache_dir:re=null,local_files_only:oe=!1,revision:Me="main",model_file_name:Ee=null,subfolder:Ae="onnx",device:Ue=null,dtype:et=null,use_external_data_format:tt=null,session_options:at={}}={}){let He={progress_callback:E,config:H,cache_dir:re,local_files_only:oe,revision:Me,model_file_name:Ee,subfolder:Ae,device:Ue,dtype:et,use_external_data_format:tt,session_options:at},pt=l.get(this),Ye=M.get(pt);H=He.config=await i.AutoConfig.from_pretrained(r,He);let Xe;if(Ye===P.DecoderOnly)Xe=await Promise.all([F(r,{model:He.model_file_name??"model"},He),S(r,{generation_config:"generation_config.json"},He)]);else if(Ye===P.Seq2Seq||Ye===P.Vision2Seq)Xe=await Promise.all([F(r,{model:"encoder_model",decoder_model_merged:"decoder_model_merged"},He),S(r,{generation_config:"generation_config.json"},He)]);else if(Ye===P.MaskGeneration)Xe=await Promise.all([F(r,{model:"vision_encoder",prompt_encoder_mask_decoder:"prompt_encoder_mask_decoder"},He)]);else if(Ye===P.EncoderDecoder)Xe=await Promise.all([F(r,{model:"encoder_model",decoder_model_merged:"decoder_model_merged"},He)]);else if(Ye===P.ImageTextToText){let dt={embed_tokens:"embed_tokens",vision_encoder:"vision_encoder",decoder_model_merged:"decoder_model_merged"};H.is_encoder_decoder&&(dt.model="encoder_model"),Xe=await 
Promise.all([F(r,dt,He),S(r,{generation_config:"generation_config.json"},He)])}else if(Ye===P.AudioTextToText){let dt={embed_tokens:"embed_tokens",audio_encoder:"audio_encoder",decoder_model_merged:"decoder_model_merged"};Xe=await Promise.all([F(r,dt,He),S(r,{generation_config:"generation_config.json"},He)])}else if(Ye===P.ImageAudioTextToText){let dt={embed_tokens:"embed_tokens",audio_encoder:"audio_encoder",vision_encoder:"vision_encoder",decoder_model_merged:"decoder_model_merged"};Xe=await Promise.all([F(r,dt,He),S(r,{generation_config:"generation_config.json"},He)])}else if(Ye===P.Musicgen)Xe=await Promise.all([F(r,{model:"text_encoder",decoder_model_merged:"decoder_model_merged",encodec_decode:"encodec_decode"},He),S(r,{generation_config:"generation_config.json"},He)]);else if(Ye===P.MultiModality)Xe=await Promise.all([F(r,{prepare_inputs_embeds:"prepare_inputs_embeds",model:"language_model",lm_head:"lm_head",gen_head:"gen_head",gen_img_embeds:"gen_img_embeds",image_decode:"image_decode"},He),S(r,{generation_config:"generation_config.json"},He)]);else if(Ye===P.Phi3V)Xe=await Promise.all([F(r,{prepare_inputs_embeds:"prepare_inputs_embeds",model:"model",vision_encoder:"vision_encoder"},He),S(r,{generation_config:"generation_config.json"},He)]);else if(Ye===P.AutoEncoder)Xe=await Promise.all([F(r,{encoder_model:"encoder_model",decoder_model:"decoder_model"},He)]);else if(Ye===P.Supertonic)Xe=await Promise.all([F(r,{text_encoder:"text_encoder",latent_denoiser:"latent_denoiser",voice_decoder:"voice_decoder"},He)]);else{if(Ye!==P.EncoderOnly){let dt=pt??H?.model_type;dt!=="custom"&&console.warn(`Model type for '${dt}' not found, assuming encoder-only architecture. 
Please report this at ${m.GITHUB_ISSUE_URL}.`)}Xe=await Promise.all([F(r,{model:He.model_file_name??"model"},He)])}return new this(H,...Xe)}async _call(r){return await this.forward(r)}async forward(r){return await this._forward(this,r)}get generation_config(){return this.configs?.generation_config??null}_get_logits_processor(r,E,H=null){let re=new T.LogitsProcessorList;if(r.repetition_penalty!==null&&r.repetition_penalty!==1&&re.push(new T.RepetitionPenaltyLogitsProcessor(r.repetition_penalty)),r.no_repeat_ngram_size!==null&&r.no_repeat_ngram_size>0&&re.push(new T.NoRepeatNGramLogitsProcessor(r.no_repeat_ngram_size)),r.bad_words_ids!==null&&re.push(new T.NoBadWordsLogitsProcessor(r.bad_words_ids,r.eos_token_id)),r.min_length!==null&&r.eos_token_id!==null&&r.min_length>0&&re.push(new T.MinLengthLogitsProcessor(r.min_length,r.eos_token_id)),r.min_new_tokens!==null&&r.eos_token_id!==null&&r.min_new_tokens>0&&re.push(new T.MinNewTokensLengthLogitsProcessor(E,r.min_new_tokens,r.eos_token_id)),r.forced_bos_token_id!==null&&re.push(new T.ForcedBOSTokenLogitsProcessor(r.forced_bos_token_id)),r.forced_eos_token_id!==null&&re.push(new T.ForcedEOSTokenLogitsProcessor(r.max_length,r.forced_eos_token_id)),r.begin_suppress_tokens!==null){let oe=E>1||r.forced_bos_token_id===null?E:E+1;re.push(new T.SuppressTokensAtBeginLogitsProcessor(r.begin_suppress_tokens,oe))}return r.guidance_scale!==null&&r.guidance_scale>1&&re.push(new T.ClassifierFreeGuidanceLogitsProcessor(r.guidance_scale)),r.temperature===0&&r.do_sample&&(console.warn("`do_sample` changed to false because `temperature: 0` implies greedy sampling (always selecting the most likely token), which is incompatible with `do_sample: true`."),r.do_sample=!1),r.do_sample&&r.temperature!==null&&r.temperature!==1&&re.push(new T.TemperatureLogitsWarper(r.temperature)),H!==null&&re.extend(H),re}_prepare_generation_config(r,E,H=_.GenerationConfig){let re={...this.config};for(let Me of["decoder","generator","text_config"])Me in 
re&&Object.assign(re,re[Me]);let oe=new H(re);return Object.assign(oe,this.generation_config??{}),r&&Object.assign(oe,r),E&&Object.assign(oe,(0,f.pick)(E,Object.getOwnPropertyNames(oe))),oe}_get_stopping_criteria(r,E=null){let H=new k.StoppingCriteriaList;return r.max_length!==null&&H.push(new k.MaxLengthCriteria(r.max_length,this.config.max_position_embeddings??null)),r.eos_token_id!==null&&H.push(new k.EosTokenCriteria(r.eos_token_id)),E&&H.extend(E),H}_validate_model_class(){if(!this.can_generate){let r=[La,Da,Aa,Sa],E=l.get(this.constructor),H=new Set,re=this.config.model_type;for(let Me of r){let Ee=Me.get(re);Ee&&H.add(Ee[0])}let oe=`The current model class (${E}) is not compatible with \`.generate()\`, as it doesn't have a language model head.`;throw H.size>0&&(oe+=` Please use the following class instead: ${[...H].join(", ")}`),Error(oe)}}prepare_inputs_for_generation(...r){return this._prepare_inputs_for_generation(this,...r)}_update_model_kwargs_for_generation({generated_input_ids:r,outputs:E,model_inputs:H,is_encoder_decoder:re}){return H.past_key_values=this.getPastKeyValues(E,H.past_key_values),H.input_ids=new o.Tensor("int64",r.flat(),[r.length,1]),re?"decoder_attention_mask"in H:H.attention_mask=(0,o.cat)([H.attention_mask,(0,o.ones)([H.attention_mask.dims[0],1])],1),H.position_ids=null,H}_prepare_model_inputs({inputs:r,bos_token_id:E,model_kwargs:H}){let re=(0,f.pick)(H,this.forward_params),oe=this.main_input_name;if(oe in re){if(r)throw new Error("`inputs`: {inputs}` were passed alongside {input_name} which is not allowed. 
Make sure to either pass {inputs} or {input_name}=...")}else re[oe]=r;return{inputs_tensor:re[oe],model_inputs:re,model_input_name:oe}}async _prepare_encoder_decoder_kwargs_for_generation({inputs_tensor:r,model_inputs:E,model_input_name:H,generation_config:re}){if(this.sessions.model.inputNames.includes("inputs_embeds")&&!E.inputs_embeds&&"_prepare_inputs_embeds"in this){let{input_ids:Me,pixel_values:Ee,attention_mask:Ae,...Ue}=E,et=await this._prepare_inputs_embeds(E);E={...Ue,...(0,f.pick)(et,["inputs_embeds","attention_mask"])}}let{last_hidden_state:oe}=await te(this,E);if(re.guidance_scale!==null&&re.guidance_scale>1)oe=(0,o.cat)([oe,(0,o.full_like)(oe,0)],0),"attention_mask"in E&&(E.attention_mask=(0,o.cat)([E.attention_mask,(0,o.zeros_like)(E.attention_mask)],0));else if(E.decoder_input_ids){let Me=Q(E.decoder_input_ids).dims[0];if(Me!==oe.dims[0]){if(oe.dims[0]!==1)throw new Error(`The encoder outputs have a different batch size (${oe.dims[0]}) than the decoder inputs (${Me}).`);oe=(0,o.cat)(Array.from({length:Me},()=>oe),0)}}return E.encoder_outputs=oe,E}_prepare_decoder_input_ids_for_generation({batch_size:r,model_input_name:E,model_kwargs:H,decoder_start_token_id:re,bos_token_id:oe,generation_config:Me}){let{decoder_input_ids:Ee,...Ae}=H;if(!(Ee instanceof o.Tensor)){if(Ee)Array.isArray(Ee[0])||(Ee=Array.from({length:r},()=>Ee));else if(re??=oe,this.config.model_type==="musicgen")Ee=Array.from({length:r*this.config.decoder.num_codebooks},()=>[re]);else if(Array.isArray(re)){if(re.length!==r)throw new Error(`\`decoder_start_token_id\` expcted to have length ${r} but got ${re.length}`);Ee=re}else Ee=Array.from({length:r},()=>[re]);Ee=Q(Ee)}return H.decoder_attention_mask=(0,o.ones_like)(Ee),{input_ids:Ee,model_inputs:Ae}}async 
generate({inputs:r=null,generation_config:E=null,logits_processor:H=null,stopping_criteria:re=null,streamer:oe=null,...Me}){this._validate_model_class(),E=this._prepare_generation_config(E,Me);let{inputs_tensor:Ee,model_inputs:Ae,model_input_name:Ue}=this._prepare_model_inputs({inputs:r,model_kwargs:Me}),et=this.config.is_encoder_decoder;et&&("encoder_outputs"in Ae||(Ae=await this._prepare_encoder_decoder_kwargs_for_generation({inputs_tensor:Ee,model_inputs:Ae,model_input_name:Ue,generation_config:E})));let tt;et?{input_ids:tt,model_inputs:Ae}=this._prepare_decoder_input_ids_for_generation({batch_size:Ae[Ue].dims.at(0),model_input_name:Ue,model_kwargs:Ae,decoder_start_token_id:E.decoder_start_token_id,bos_token_id:E.bos_token_id,generation_config:E}):tt=Ae[Ue];let at=tt.dims.at(-1);E.max_new_tokens!==null&&(E.max_length=at+E.max_new_tokens);let He=this._get_logits_processor(E,at,H),pt=this._get_stopping_criteria(E,re),Ye=Ae[Ue].dims.at(0),Xe=G.LogitsSampler.getSampler(E),dt=new Array(Ye).fill(0),Mt=tt.tolist();oe&&oe.put(Mt);let wt,xt={};for(;;){if(Ae=this.prepare_inputs_for_generation(Mt,Ae,E),wt=await this.forward(Ae),E.output_attentions&&E.return_dict_in_generate){let ts=this.getAttentions(wt);for(let _s in ts)_s in xt||(xt[_s]=[]),xt[_s].push(ts[_s])}let ct=wt.logits.slice(null,-1,null),Et=He(Mt,ct),Wt=[];for(let ts=0;ts<Et.dims.at(0);++ts){let _s=Et[ts],or=await Xe(_s);for(let[ar,Ir]of or){let _r=BigInt(ar);dt[ts]+=Ir,Mt[ts].push(_r),Wt.push([_r]);break}}if(oe&&oe.put(Wt),pt(Mt).every(ts=>ts))break;Ae=this._update_model_kwargs_for_generation({generated_input_ids:Wt,outputs:wt,model_inputs:Ae,is_encoder_decoder:et})}oe&&oe.end();let Ct=this.getPastKeyValues(wt,Ae.past_key_values,!0),St=new o.Tensor("int64",Mt.flat(),[Mt.length,Mt[0].length]);if(E.return_dict_in_generate)return{sequences:St,past_key_values:Ct,...xt};for(let ct of Object.values(wt))ct.location==="gpu-buffer"&&ct.dispose();return St}getPastKeyValues(r,E,H=!1){let re=Object.create(null);for(let oe 
in r)if(oe.startsWith("present")){let Me=oe.replace("present_conv","past_conv").replace("present","past_key_values"),Ee=oe.includes("encoder");if(Ee&&E?re[Me]=E[Me]:re[Me]=r[oe],E&&(!Ee||H)){let Ae=E[Me];Ae.location==="gpu-buffer"&&Ae.dispose()}}return re}getAttentions(r){let E={};for(let H of["cross_attentions","encoder_attentions","decoder_attentions"])for(let re in r)re.startsWith(H)&&(H in E||(E[H]=[]),E[H].push(r[re]));return E}addPastKeyValues(r,E){if(E)Object.assign(r,E);else{let H=this.sessions.decoder_model_merged??this.sessions.model,re=(r[this.main_input_name]??r.attention_mask)?.dims?.[0]??1,oe=H?.config?.kv_cache_dtype??"float32",Me=oe==="float16"?o.DataTypeMap.float16:o.DataTypeMap.float32,Ee=(0,i.getCacheShapes)(this.config,{batch_size:re});for(let Ae in Ee){let Ue=Ee[Ae].reduce((et,tt)=>et*tt,1);r[Ae]=new o.Tensor(oe,new Me(Ue),Ee[Ae])}}}async encode_image({pixel_values:r}){return(await R(this.sessions.vision_encoder,{pixel_values:r})).image_features}async encode_text({input_ids:r}){return(await R(this.sessions.embed_tokens,{input_ids:r})).inputs_embeds}async encode_audio({audio_values:r}){return(await R(this.sessions.audio_encoder,{audio_values:r})).audio_features}}class q{}class de extends q{constructor({last_hidden_state:r,hidden_states:E=null,attentions:H=null}){super(),this.last_hidden_state=r,this.hidden_states=E,this.attentions=H}}class pe extends p{}class Te extends pe{}class me extends pe{async _call(r){return new Gt(await super._call(r))}}class ne extends pe{async _call(r){return new rt(await super._call(r))}}class fe extends pe{async _call(r){return new It(await super._call(r))}}class le extends pe{async _call(r){return new Jt(await super._call(r))}}class he extends p{}class De extends he{}class ve extends he{async _call(r){return new Gt(await super._call(r))}}class ye extends he{async _call(r){return new rt(await super._call(r))}}class Ce extends he{async _call(r){return new It(await super._call(r))}}class Qe extends he{async 
_call(r){return new Jt(await super._call(r))}}class Be extends p{}class Re extends Be{}class ke extends Be{async _call(r){return new Gt(await super._call(r))}}class qe extends Be{async _call(r){return new rt(await super._call(r))}}class je extends Be{async _call(r){return new It(await super._call(r))}}class nt extends p{}class ut extends nt{}class Pt extends nt{}class jt extends p{}class ft extends jt{}class $t extends p{}class Hs extends $t{}class Js extends $t{async _call(r){return new Gt(await super._call(r))}}class Ys extends $t{async _call(r){return new rt(await super._call(r))}}class kt extends $t{async _call(r){return new It(await super._call(r))}}class qt extends $t{async _call(r){return new Jt(await super._call(r))}}class us extends p{}class qs extends us{}class Ze extends us{async _call(r){return new Gt(await super._call(r))}}class Ls extends us{async _call(r){return new rt(await super._call(r))}}class Ds extends us{async _call(r){return new It(await super._call(r))}}class Is extends us{async _call(r){return new Jt(await super._call(r))}}class is extends p{}class lt extends is{}class Os extends is{async _call(r){return new Gt(await super._call(r))}}class n extends is{async _call(r){return new rt(await super._call(r))}}class j extends is{async _call(r){return new It(await super._call(r))}}class v extends is{async _call(r){return new Jt(await super._call(r))}}class O extends p{}class z extends O{}class Z extends O{async _call(r){return new Gt(await super._call(r))}}class ue extends O{async _call(r){return new rt(await super._call(r))}}class Ge extends O{async _call(r){return new It(await super._call(r))}}class Je extends O{async _call(r){return new Jt(await super._call(r))}}class Oe extends p{}class st extends Oe{}class We extends Oe{async _call(r){return new Gt(await super._call(r))}}class it extends Oe{async _call(r){return new rt(await super._call(r))}}class gt extends Oe{async _call(r){return new It(await super._call(r))}}class Kt extends Oe{async 
_call(r){return new Jt(await super._call(r))}}class Nt extends p{}class ss extends Nt{}class Qt extends Nt{async _call(r){return new Gt(await super._call(r))}}class Ps extends Nt{async _call(r){return new rt(await super._call(r))}}class Ts extends Nt{async _call(r){return new It(await super._call(r))}}class ws extends Nt{async _call(r){return new Jt(await super._call(r))}}class os extends p{}class Bs extends os{}class bs extends os{async _call(r){return new rt(await super._call(r))}}class js extends os{async _call(r){return new It(await super._call(r))}}class ls extends os{async _call(r){return new Jt(await super._call(r))}}class ps extends os{async _call(r){return new Gt(await super._call(r))}}class ms extends p{}class Ns extends ms{}class xs extends ms{async _call(r){return new Gt(await super._call(r))}}class vs extends ms{async _call(r){return new rt(await super._call(r))}}class Es extends ms{async _call(r){return new It(await super._call(r))}}class hs extends p{}class rs extends hs{}class Fe extends hs{async _call(r){return new Gt(await super._call(r))}}class Se extends hs{async _call(r){return new rt(await super._call(r))}}class Ke extends hs{async _call(r){return new Jt(await super._call(r))}}class Tt extends p{}class Rs extends Tt{}class Fs extends Tt{async _call(r){return new Gt(await super._call(r))}}class Vs extends Tt{async _call(r){return new rt(await super._call(r))}}class mr extends Tt{async _call(r){return new It(await super._call(r))}}class ee extends Tt{async _call(r){return new Jt(await super._call(r))}}class c extends p{}class A extends c{}class U extends c{async _call(r){return new Gt(await super._call(r))}}class $ extends c{async _call(r){return new rt(await super._call(r))}}class ie extends c{async _call(r){return new Jt(await super._call(r))}}class Pe extends p{}class Ne extends Pe{}class Ve extends Pe{async _call(r){return new rt(await super._call(r))}}class ze extends Pe{async _call(r){return new Jt(await super._call(r))}}class Ie extends 
Pe{async _call(r){return new Gt(await super._call(r))}}class _t extends p{forward_params=["input_ids","attention_mask","encoder_outputs","decoder_input_ids","decoder_attention_mask","past_key_values"]}class ot extends _t{}class Ft extends _t{}class Rt extends p{}class yt extends Rt{}class Zt extends Rt{}class Vt extends p{}class cs extends Vt{}class zs extends Vt{}class Xt extends p{}class Cs extends Xt{}class vt extends Xt{}class Ut extends Xt{async _call(r){return new rt(await super._call(r))}}class Ht extends p{}class Ms extends Ht{}class gs extends Ht{}class es extends Ht{async _call(r){return new rt(await super._call(r))}}class fs extends Ht{}class zt extends p{}class At extends zt{}class Dt extends zt{}class Lt extends p{}class as extends Lt{}class Zs extends Lt{}class ks extends p{}class en extends ks{}class tn extends ks{async _call(r){return new Gt(await super._call(r))}}class sn extends ks{async _call(r){return new rt(await super._call(r))}}class rn extends ks{async _call(r){return new It(await super._call(r))}}class on extends ks{async _call(r){return new Jt(await super._call(r))}}class er extends p{}class an extends er{}class nn extends er{async _call(r){return new Gt(await super._call(r))}}class ln extends er{async _call(r){return new rt(await super._call(r))}}class cn extends er{async _call(r){return new It(await super._call(r))}}class _n extends er{async _call(r){return new Jt(await super._call(r))}}class tr extends p{}class dn extends tr{}class un extends tr{async _call(r){return new Gt(await super._call(r))}}class pn extends tr{async _call(r){return new rt(await super._call(r))}}class mn extends tr{async _call(r){return new It(await super._call(r))}}class hn extends tr{async _call(r){return new Jt(await super._call(r))}}class $r extends p{}class Mn extends $r{}class fn extends $r{}class Kr extends 
p{requires_attention_mask=!1;main_input_name="input_features";forward_params=["input_features","attention_mask","decoder_input_ids","decoder_attention_mask","past_key_values"]}class gn extends Kr{}class Qr extends Kr{_prepare_generation_config(r,E){return super._prepare_generation_config(r,E,C.WhisperGenerationConfig)}_retrieve_init_tokens(r){let E=[r.decoder_start_token_id],H=r.language,re=r.task;if(r.is_multilingual){H||(console.warn("No language specified - defaulting to English (en)."),H="en");let Me=`<|${(0,B.whisper_language_to_code)(H)}|>`;E.push(r.lang_to_id[Me]),E.push(r.task_to_id[re??"transcribe"])}else if(H||re)throw new Error("Cannot specify `task` or `language` for an English-only model. If the model is intended to be multilingual, pass `is_multilingual=true` to generate, or update the generation config.");return!r.return_timestamps&&r.no_timestamps_token_id&&E.at(-1)!==r.no_timestamps_token_id?E.push(r.no_timestamps_token_id):r.return_timestamps&&E.at(-1)===r.no_timestamps_token_id&&(console.warn("<|notimestamps|> prompt token is removed from generation_config since `return_timestamps` is set to `true`."),E.pop()),E.filter(oe=>oe!=null)}async generate({inputs:r=null,generation_config:E=null,logits_processor:H=null,stopping_criteria:re=null,...oe}){E=this._prepare_generation_config(E,oe);let Me=oe.decoder_input_ids??this._retrieve_init_tokens(E);if(E.return_timestamps&&(H??=new T.LogitsProcessorList,H.push(new T.WhisperTimeStampLogitsProcessor(E,Me))),E.begin_suppress_tokens&&(H??=new T.LogitsProcessorList,H.push(new T.SuppressTokensAtBeginLogitsProcessor(E.begin_suppress_tokens,Me.length))),E.return_token_timestamps){if(!E.alignment_heads)throw new Error("Model generation config has no `alignment_heads`, token-level timestamps not available. 
See https://gist.github.com/hollance/42e32852f24243b748ae6bc1f985b13a on how to add this property to the generation config.");E.task==="translate"&&console.warn("Token-level timestamps may not be reliable for task 'translate'."),E.output_attentions=!0,E.return_dict_in_generate=!0}let Ee=await super.generate({inputs:r,generation_config:E,logits_processor:H,decoder_input_ids:Me,...oe});return E.return_token_timestamps&&(Ee.token_timestamps=this._extract_token_timestamps(Ee,E.alignment_heads,E.num_frames)),Ee}_extract_token_timestamps(r,E,H=null,re=.02){if(!r.cross_attentions)throw new Error("Model outputs must contain cross attentions to extract timestamps. This is most likely because the model was not exported with `output_attentions=True`.");H==null&&console.warn("`num_frames` has not been set, meaning the entire audio will be analyzed. This may lead to inaccurate token-level timestamps for short audios (< 30 seconds).");let oe=this.config.median_filter_width;oe===void 0&&(console.warn("Model config has no `median_filter_width`, using default value of 7."),oe=7);let Me=r.cross_attentions,Ee=Array.from({length:this.config.decoder_layers},(Ye,Xe)=>(0,o.cat)(Me.map(dt=>dt[Xe]),2)),Ae=(0,o.stack)(E.map(([Ye,Xe])=>{if(Ye>=Ee.length)throw new Error(`Layer index ${Ye} is out of bounds for cross attentions (length ${Ee.length}).`);return H?Ee[Ye].slice(null,Xe,null,[0,H]):Ee[Ye].slice(null,Xe)})).transpose(1,0,2,3),[Ue,et]=(0,o.std_mean)(Ae,-2,0,!0),tt=Ae.clone();for(let Ye=0;Ye<tt.dims[0];++Ye){let Xe=tt[Ye];for(let dt=0;dt<Xe.dims[0];++dt){let Mt=Xe[dt],wt=Ue[Ye][dt][0].data,xt=et[Ye][dt][0].data;for(let Ct=0;Ct<Mt.dims[0];++Ct){let St=Mt[Ct].data;for(let ct=0;ct<St.length;++ct)St[ct]=(St[ct]-xt[ct])/wt[ct];St.set((0,w.medianFilter)(St,oe))}}}let at=[(0,o.mean)(tt,1)],He=r.sequences.dims,pt=new o.Tensor("float32",new Float32Array(He[0]*He[1]),He);for(let Ye=0;Ye<He[0];++Ye){let 
Xe=at[Ye].neg().squeeze_(0),[dt,Mt]=(0,w.dynamic_time_warping)(Xe.tolist()),wt=Array.from({length:dt.length-1},(St,ct)=>dt[ct+1]-dt[ct]),xt=(0,f.mergeArrays)([1],wt).map(St=>!!St),Ct=[];for(let St=0;St<xt.length;++St)xt[St]&&Ct.push(Mt[St]*re);pt[Ye].data.set(Ct,1)}return pt}}class Pn extends Qr{}class Xr extends p{requires_attention_mask=!1;main_input_name="input_values";forward_params=["input_values","decoder_input_ids","past_key_values"]}class Zu extends Xr{}class Tn extends Xr{}class Hr extends p{main_input_name="pixel_values";forward_params=["pixel_values","decoder_input_ids","encoder_hidden_states","past_key_values"]}class Jr extends p{forward_params=["input_ids","attention_mask","pixel_values","position_ids","past_key_values"]}class hr extends Jr{_merge_input_ids_with_image_features(r){let E=r.image_features.dims.at(-1),H=r.image_features.view(-1,E);return _e({image_token_id:this.config.image_token_index,...r,image_features:H})}}class wn extends hr{}class bn extends hr{}class xn extends p{forward_params=["input_ids","inputs_embeds","attention_mask","pixel_values","encoder_outputs","decoder_input_ids","decoder_inputs_embeds","decoder_attention_mask","past_key_values"];main_input_name="inputs_embeds"}class vn extends xn{_merge_input_ids_with_image_features({inputs_embeds:r,image_features:E,input_ids:H,attention_mask:re}){return{inputs_embeds:(0,o.cat)([E,r],1),attention_mask:(0,o.cat)([(0,o.ones)(E.dims.slice(0,2)),re],1)}}async _prepare_inputs_embeds({input_ids:r,pixel_values:E,inputs_embeds:H,attention_mask:re}){if(!r&&!E)throw new Error("Either `input_ids` or `pixel_values` should be provided.");let oe,Me;return r&&(oe=await this.encode_text({input_ids:r})),E&&(Me=await this.encode_image({pixel_values:E})),oe&&Me?{inputs_embeds:H,attention_mask:re}=this._merge_input_ids_with_image_features({inputs_embeds:oe,image_features:Me,input_ids:r,attention_mask:re}):H=oe||Me,{inputs_embeds:H,attention_mask:re}}async 
forward({input_ids:r,pixel_values:E,attention_mask:H,decoder_input_ids:re,decoder_attention_mask:oe,encoder_outputs:Me,past_key_values:Ee,inputs_embeds:Ae,decoder_inputs_embeds:Ue}){if(Ae||({inputs_embeds:Ae,attention_mask:H}=await this._prepare_inputs_embeds({input_ids:r,pixel_values:E,inputs_embeds:Ae,attention_mask:H})),!Me){let{last_hidden_state:at}=await te(this,{inputs_embeds:Ae,attention_mask:H});Me=at}if(!Ue){if(!re)throw new Error("Either `decoder_input_ids` or `decoder_inputs_embeds` should be provided.");Ue=await this.encode_text({input_ids:re})}return await ce(this,{inputs_embeds:Ue,attention_mask:oe,encoder_attention_mask:H,encoder_hidden_states:Me,past_key_values:Ee},!0)}}class En extends p{forward_params=["input_ids","attention_mask","pixel_values","position_ids","past_key_values"]}class Fn extends En{_merge_input_ids_with_image_features(r){let E=r.image_features.dims.at(-1),H=r.image_features.view(-1,E);return _e({image_token_id:this.config.image_token_index,...r,image_features:H})}}class Yr extends Jr{_merge_input_ids_with_image_features(r){let E=r.image_features.dims.at(-1),H=r.image_features.view(-1,E);return _e({image_token_id:this.config.image_token_index,...r,image_features:H})}}class Cn extends Yr{}class kn extends p{forward_params=["input_ids","attention_mask","inputs_embeds","per_layer_inputs","position_ids","pixel_values","input_features","input_features_mask","past_key_values"]}class qr extends kn{async forward({input_ids:r=null,attention_mask:E=null,pixel_values:H=null,input_features:re=null,input_features_mask:oe=null,position_ids:Me=null,inputs_embeds:Ee=null,per_layer_inputs:Ae=null,past_key_values:Ue=null,generation_config:et=null,logits_processor:tt=null,...at}){if((!Ee||!Ae)&&({inputs_embeds:Ee,per_layer_inputs:Ae}=await R(this.sessions.embed_tokens,{input_ids:r}),r.dims[1]!==1)){if(H){let{image_features:pt}=await 
R(this.sessions.vision_encoder,{pixel_values:H});({inputs_embeds:Ee,attention_mask:E}=this._merge_input_ids_with_image_features({image_features:pt,inputs_embeds:Ee,input_ids:r,attention_mask:E}))}if(re){let{audio_features:pt}=await R(this.sessions.audio_encoder,{input_features:re,input_features_mask:oe});({inputs_embeds:Ee,attention_mask:E}=this._merge_input_ids_with_audio_features({audio_features:pt,inputs_embeds:Ee,input_ids:r,attention_mask:E}))}}return await ce(this,{inputs_embeds:Ee,per_layer_inputs:Ae,past_key_values:Ue,attention_mask:E,position_ids:Me,generation_config:et,logits_processor:tt},!0)}_merge_input_ids_with_image_features(r){let E=r.image_features.dims.at(-1),H=r.image_features.view(-1,E);return _e({image_token_id:this.config.image_token_id,...r,image_features:H})}_merge_input_ids_with_audio_features(r){let E=r.audio_features.dims.at(-1),H=r.audio_features.view(-1,E);return X({audio_token_id:this.config.audio_token_id,...r,audio_features:H})}}class yn extends p{forward_params=["input_ids","attention_mask","pixel_values","pixel_attention_mask","position_ids","past_key_values"]}class Mr extends yn{async encode_image({pixel_values:r,pixel_attention_mask:E}){return(await R(this.sessions.vision_encoder,{pixel_values:r,pixel_attention_mask:E})).image_features}_merge_input_ids_with_image_features(r){let E=r.image_features.dims.at(-1),H=r.image_features.view(-1,E);return _e({image_token_id:this.config.image_token_id,...r,image_features:H})}}class Zr extends Mr{}class Sn extends p{forward_params=["input_ids","inputs_embeds","attention_mask","position_ids","pixel_values","image_sizes","past_key_values"]}class eo extends Sn{async forward({input_ids:r=null,attention_mask:E=null,pixel_values:H=null,image_sizes:re=null,position_ids:oe=null,inputs_embeds:Me=null,past_key_values:Ee=null,generation_config:Ae=null,logits_processor:Ue=null,...et}){if(!Me){let at;if(H&&r.dims[1]!==1){if(!re)throw new Error("`image_sizes` must be provided when `pixel_values` is 
provided.");({image_features:at}=await R(this.sessions.vision_encoder,{pixel_values:H,image_sizes:re}))}else{let He=this.config.normalized_config.hidden_size;at=new o.Tensor("float32",[],[0,He])}({inputs_embeds:Me}=await R(this.sessions.prepare_inputs_embeds,{input_ids:r,image_features:at}))}return await ce(this,{inputs_embeds:Me,past_key_values:Ee,attention_mask:E,position_ids:oe,generation_config:Ae,logits_processor:Ue},!1)}}class Gs extends p{}class An extends Gs{}class ep extends Gs{static async from_pretrained(r,E={}){return super.from_pretrained(r,{...E,model_file_name:E.model_file_name??"text_model"})}}class Ln extends Gs{static async from_pretrained(r,E={}){return super.from_pretrained(r,{...E,model_file_name:E.model_file_name??"text_model"})}}class tp extends Gs{static async from_pretrained(r,E={}){return super.from_pretrained(r,{...E,model_file_name:E.model_file_name??"vision_model"})}}class Dn extends Gs{static async from_pretrained(r,E={}){return super.from_pretrained(r,{...E,model_file_name:E.model_file_name??"vision_model"})}}class to extends p{}class In extends to{}class On extends to{static async from_pretrained(r,E={}){return super.from_pretrained(r,{...E,model_file_name:E.model_file_name??"text_model"})}}class Bn extends Gs{static async from_pretrained(r,E={}){return super.from_pretrained(r,{...E,model_file_name:E.model_file_name??"vision_model"})}}class jn extends p{}class Nn extends jn{}class fr extends p{}class Rn extends fr{async forward(r){let E=!r.input_ids,H=!r.pixel_values;if(E&&H)throw new Error("Either `input_ids` or `pixel_values` should be provided.");if(E&&(r.input_ids=(0,o.ones)([r.pixel_values.dims[0],1])),H){let{image_size:Ue}=this.config.vision_config;r.pixel_values=(0,o.full)([0,3,Ue,Ue],0)}let{text_embeddings:re,image_embeddings:oe,l2norm_text_embeddings:Me,l2norm_image_embeddings:Ee}=await super.forward(r),Ae={};return 
E||(Ae.text_embeddings=re,Ae.l2norm_text_embeddings=Me),H||(Ae.image_embeddings=oe,Ae.l2norm_image_embeddings=Ee),Ae}}class Vn extends fr{static async from_pretrained(r,E={}){return super.from_pretrained(r,{...E,model_file_name:E.model_file_name??"text_model"})}}class zn extends fr{static async from_pretrained(r,E={}){return super.from_pretrained(r,{...E,model_file_name:E.model_file_name??"vision_model"})}}class so extends p{}class Gn extends so{}class Wn extends so{}class ro extends p{}class Un extends ro{}class $n extends ro{}class oo extends p{}class Kn extends oo{}class Qn extends oo{}class ao extends p{}class Xn extends ao{}class Hn extends ao{}class no extends p{}class Jn extends no{}class Yn extends no{}class io extends p{}class qn extends io{}class Zn extends io{}class lo extends p{}class ei extends lo{}class ti extends lo{}class co extends p{}class si extends co{}class ri extends co{}class _o extends p{}class oi extends _o{}class ai extends _o{}class ni extends p{}class ii extends ni{}class uo extends p{}class li extends uo{}class ci extends uo{}class po extends p{}class _i extends po{}class di extends po{}class mo extends p{}class ui extends mo{}class pi extends mo{}class ho extends p{}class mi extends ho{}class hi extends ho{}class Mo extends p{}class Mi extends Mo{}class fi extends Mo{}class fo extends p{}class gi extends fo{}class Pi extends fo{}class go extends p{}class Ti extends go{}class wi extends go{}class Po extends p{}class bi extends Po{}class xi extends Po{}class To extends p{}class vi extends To{}class Ei extends To{}class wo extends p{}class Fi extends wo{}class Ci extends wo{}class bo extends p{}class ki extends bo{}class yi extends bo{}class xo extends p{}class Si extends xo{}class Ai extends xo{}class vo extends p{}class Li extends vo{}class Di extends vo{}class Eo extends p{}class Ii extends Eo{}class Oi extends Eo{}class Fo extends p{}class Bi extends Fo{}class ji extends Fo{}class Co extends p{}class Ni extends Co{}class Ri extends 
Co{}class ko extends p{}class Vi extends ko{}class zi extends ko{}class yo extends p{}class Gi extends yo{}class Wi extends yo{}class So extends p{}class Ui extends So{}class $i extends So{}class Ao extends p{}class Ki extends Ao{}class Qi extends Ao{}class Xi extends p{forward_params=["input_ids","attention_mask","position_ids","past_key_values","pixel_values","image_grid_thw"]}class Hi extends Xi{get_rope_index(r,E,H,re){let{vision_config:oe,image_token_id:Me,video_token_id:Ee,vision_start_token_id:Ae}=this.config,Ue=oe.spatial_merge_size??2,et=[];if(E||H){let tt=r.tolist();re||(re=(0,o.ones_like)(r));let at=re.tolist(),He=Array.from({length:3},Mt=>Array.from({length:r.dims[0]},wt=>Array.from({length:r.dims[1]},xt=>1))),pt=E?E.tolist():[],Ye=H?H.tolist():[],Xe=0,dt=0;for(let Mt=0;Mt<tt.length;++Mt){let wt=tt[Mt].filter((bt,Ot)=>at[Mt][Ot]==1),Ct=wt.reduce((bt,Ot,As)=>(Ot==Ae&&bt.push(As),bt),[]).map(bt=>wt[bt+1]),St=Ct.filter(bt=>bt==Me).length,ct=Ct.filter(bt=>bt==Ee).length,Et=[],Wt=0,Ws=St,ts=ct;for(let bt=0;bt<Ct.length;++bt){let Ot=wt.findIndex(($s,ds)=>ds>Wt&&$s==Me),As=wt.findIndex(($s,ds)=>ds>Wt&&$s==Ee),Us=Ws>0&&Ot!==-1?Ot:wt.length+1,nr=ts>0&&As!==-1?As:wt.length+1,Or,Ia,Oa,Ba;Us<nr?([Ia,Oa,Ba]=pt[Xe],++Xe,--Ws,Or=Us):([Ia,Oa,Ba]=Ye[dt],++dt,--ts,Or=nr);let[Hp,ja,Br]=[Number(Ia),Math.floor(Number(Oa)/Ue),Math.floor(Number(Ba)/Ue)],Na=Or-Wt,fu=Et.length>0?(0,w.max)(Et.at(-1))[0]+1:0;Et.push(Array.from({length:3*Na},($s,ds)=>fu+ds%Na));let Ra=Na+fu,jr=Hp*ja*Br,Jp=Array.from({length:jr},($s,ds)=>Ra+Math.floor(ds/(ja*Br))),Yp=Array.from({length:jr},($s,ds)=>Ra+Math.floor(ds/Br)%ja),qp=Array.from({length:jr},($s,ds)=>Ra+ds%Br);Et.push([Jp,Yp,qp].flat()),Wt=Or+jr}if(Wt<wt.length){let bt=Et.length>0?(0,w.max)(Et.at(-1))[0]+1:0,Ot=wt.length-Wt;Et.push(Array.from({length:3*Ot},(As,Us)=>bt+Us%Ot))}let _s=Et.reduce((bt,Ot)=>bt+Ot.length,0),or=new Array(_s),ar=0;for(let bt=0;bt<3;++bt)for(let Ot=0;Ot<Et.length;++Ot){let As=Et[Ot],Us=As.length/3;for(let 
nr=bt*Us;nr<(bt+1)*Us;++nr)or[ar++]=As[nr]}let Ir=0,_r=at[Mt];for(let bt=0;bt<_r.length;++bt)if(_r[bt]==1){for(let Ot=0;Ot<3;++Ot)He[Ot][Mt][bt]=or[Ot*_s/3+Ir];++Ir}let Xp=(0,w.max)(or)[0];et.push(Xp+1-tt[Mt].length)}return[new o.Tensor("int64",He.flat(1/0),[3,r.dims[0],r.dims[1]]),new o.Tensor("int64",et,[et.length,1])]}else if(re){let{data:tt,dims:at}=ae(re),He=BigInt64Array.from({length:3*tt.length},(Ye,Xe)=>tt[Xe%tt.length]),pt=Array.from({length:at[0]},(Ye,Xe)=>(0,w.max)(tt.subarray(at[1]*Xe,at[1]*(Xe+1)))[0]+1n+BigInt(at[1]));return[new o.Tensor("int64",He,[3,...at]),new o.Tensor("int64",pt,[pt.length,1])]}else{let[tt,at]=r.dims,He=BigInt64Array.from({length:3*tt*at},(pt,Ye)=>BigInt(Math.floor(Ye%at/tt)));return[new o.Tensor("int64",He,[3,...r.dims]),(0,o.zeros)([tt,1])]}}async encode_image({pixel_values:r,image_grid_thw:E}){return(await R(this.sessions.vision_encoder,{pixel_values:r,grid_thw:E})).image_features}_merge_input_ids_with_image_features(r){return _e({image_token_id:this.config.image_token_id,...r})}prepare_inputs_for_generation(r,E,H){if(E.attention_mask&&!E.position_ids)if(!E.past_key_values)[E.position_ids,E.rope_deltas]=this.get_rope_index(E.input_ids,E.image_grid_thw,E.video_grid_thw,E.attention_mask);else{E.pixel_values=null;let re=BigInt(Object.values(E.past_key_values)[0].dims.at(-2)),oe=E.rope_deltas.map(Me=>re+Me);E.position_ids=(0,o.stack)([oe,oe,oe],0)}return E}}class Lo extends p{}class Ji extends Lo{}class Yi extends Lo{}class Do extends p{}class qi extends Do{}class Zi extends Do{}class Io extends p{}class el extends Io{}class tl extends Io{}class Oo extends p{}class sl extends Oo{}class rl extends Oo{}class Bo extends p{}class ol extends Bo{}class al extends Bo{}class jo extends p{}class nl extends jo{}class il extends jo{async _call(r){return new rt(await super._call(r))}}class No extends p{}class ll extends No{}class cl extends No{async _call(r){return new rt(await super._call(r))}}class _l extends p{}class dl extends _l{}class Ro 
extends p{}class ul extends Ro{}class pl extends Ro{async _call(r){return new rt(await super._call(r))}}class ml extends p{}class hl extends ml{}class Vo extends p{}class Ml extends Vo{}class fl extends Vo{async _call(r){return new rt(await super._call(r))}}class gl extends p{}class Pl extends gl{}class zo extends p{}class Tl extends zo{}class wl extends zo{async _call(r){return new rt(await super._call(r))}}class bl extends p{}class xl extends bl{async _call(r){return new hu(await super._call(r))}}class Go extends p{}class vl extends Go{}class El extends Go{async _call(r){return new rt(await super._call(r))}}class Wo extends p{}class Fl extends Wo{}class Cl extends Wo{async _call(r){return new rt(await super._call(r))}}class Uo extends p{}class kl extends Uo{}class yl extends Uo{}class $o extends p{}class Sl extends $o{}class Al extends $o{}class Ko extends p{}class Ll extends Ko{}class Dl extends Ko{async _call(r){return new rt(await super._call(r))}}class gr extends p{}class Il extends gr{}class Ol extends gr{async _call(r){return new Xo(await super._call(r))}}class Qo extends gr{async _call(r){return new Bl(await super._call(r))}}class Xo extends q{constructor({logits:r,pred_boxes:E}){super(),this.logits=r,this.pred_boxes=E}}class Bl extends q{constructor({logits:r,pred_boxes:E,pred_masks:H}){super(),this.logits=r,this.pred_boxes=E,this.pred_masks=H}}class Ho extends p{}class jl extends Ho{}class Nl extends Ho{async _call(r){return new lr(await super._call(r))}}class lr extends q{constructor({logits:r,pred_boxes:E}){super(),this.logits=r,this.pred_boxes=E}}class Jo extends p{}class Rl extends Jo{}class Vl extends Jo{async _call(r){return new zl(await super._call(r))}}class zl extends lr{}class Yo extends p{}class Gl extends Yo{}class Wl extends Yo{async _call(r){return new Ul(await super._call(r))}}class Ul extends lr{}class qo extends p{}class $l extends qo{}class Kl extends qo{async _call(r){return new lr(await super._call(r))}}class Zo extends p{}class Ql 
extends Zo{}class Xl extends Zo{async _call(r){return new Hl(await super._call(r))}}class Hl extends Xo{}class ea extends p{}class Jl extends ea{}class Yl extends ea{async _call(r){return new rt(await super._call(r))}}class ta extends p{}class ql extends ta{}class Zl extends ta{async _call(r){return new rt(await super._call(r))}}class sa extends p{}class ec extends sa{}class tc extends sa{async _call(r){return new rt(await super._call(r))}}class Pr extends p{}class sc extends Pr{}class rc extends Pr{async _call(r){return new rt(await super._call(r))}}class oc extends Pr{}class ra extends p{}class ac extends ra{}class nc extends ra{}class oa extends p{}class ic extends oa{}class lc extends oa{}class cc extends p{}class _c extends cc{}class Tr extends p{}class dc extends Tr{}class uc extends Tr{}class pc extends Tr{}class mc extends p{}class hc extends mc{}class Mc extends p{}class fc extends Mc{}class gc extends p{}class Pc extends gc{}class aa extends p{}class Tc extends aa{}class wc extends aa{}class na extends p{}class bc extends na{}class xc extends na{}class vc extends p{}class Ec extends vc{}class ia extends p{}class Fc extends ia{}class Cc extends ia{async _call(r){return new rt(await super._call(r))}}class la extends p{}class kc extends la{}class yc extends la{async _call(r){return new rt(await super._call(r))}}class ca extends p{}class Sc extends ca{}class Ac extends ca{async _call(r){return new rt(await super._call(r))}}class _a extends p{}class Lc extends _a{}class Dc extends _a{async _call(r){return new rt(await super._call(r))}}class Ic extends p{}class Oc extends Ic{}class Bc extends p{}class jc extends Bc{}class Nc extends p{}class Rc extends Nc{}class da extends p{}class Vc extends da{}class zc extends da{async _call(r){return new Gc(await super._call(r))}}class Gc extends q{constructor({logits:r,pred_boxes:E}){super(),this.logits=r,this.pred_boxes=E}}class Wc extends p{}class Uc extends Wc{async get_image_embeddings({pixel_values:r}){return await 
te(this,{pixel_values:r})}async forward(r){!r.image_embeddings||!r.image_positional_embeddings?r={...r,...await this.get_image_embeddings(r)}:r={...r},r.input_labels??=(0,o.ones)(r.input_points.dims.slice(0,-1));let E={image_embeddings:r.image_embeddings,image_positional_embeddings:r.image_positional_embeddings};return r.input_points&&(E.input_points=r.input_points),r.input_labels&&(E.input_labels=r.input_labels),r.input_boxes&&(E.input_boxes=r.input_boxes),await R(this.sessions.prompt_encoder_mask_decoder,E)}async _call(r){return new $c(await super._call(r))}}class $c extends q{constructor({iou_scores:r,pred_masks:E}){super(),this.iou_scores=r,this.pred_masks=E}}class Kc extends q{constructor({iou_scores:r,pred_masks:E,object_score_logits:H}){super(),this.iou_scores=r,this.pred_masks=E,this.object_score_logits=H}}class Qc extends p{}class wr extends Qc{async get_image_embeddings({pixel_values:r}){return await te(this,{pixel_values:r})}async forward(r){let{num_feature_levels:E}=this.config.vision_config;if(Array.from({length:E},(Me,Ee)=>`image_embeddings.${Ee}`).some(Me=>!r[Me])?r={...r,...await this.get_image_embeddings(r)}:r={...r},r.input_points){if(r.input_boxes&&r.input_boxes.dims[1]!==1)throw new Error("When both `input_points` and `input_boxes` are provided, the number of boxes per image must be 1.");let Me=r.input_points.dims;r.input_labels??=(0,o.ones)(Me.slice(0,-1)),r.input_boxes??=(0,o.full)([Me[0],0,4],0)}else if(r.input_boxes){let Me=r.input_boxes.dims;r.input_labels=(0,o.full)([Me[0],Me[1],0],-1n),r.input_points=(0,o.full)([Me[0],1,0,2],0)}else throw new Error("At least one of `input_points` or `input_boxes` must be provided.");let re=this.sessions.prompt_encoder_mask_decoder,oe=(0,f.pick)(r,re.inputNames);return await R(re,oe)}async _call(r){return new Kc(await super._call(r))}}class Xc extends wr{}class Hc extends wr{}class ua extends p{}class Jc extends ua{}class Yc extends ua{}class pa extends p{}class qc extends pa{}class Zc extends pa{}class ys 
extends p{}class e_ extends ys{}class t_ extends ys{async _call(r){return new Ss(await super._call(r))}}class s_ extends ys{async _call(r){return new rt(await super._call(r))}}class r_ extends ys{async _call(r){return new It(await super._call(r))}}class o_ extends p{}class a_ extends o_{async _call(r){return new Ss(await super._call(r))}}class ma extends p{}class n_ extends ma{}class i_ extends ma{async _call(r){return new It(await super._call(r))}}class l_ extends p{}class c_ extends l_{}class br extends p{}class __ extends br{}class d_ extends br{async _call(r){return new Ss(await super._call(r))}}class u_ extends br{async _call(r){return new rt(await super._call(r))}}class cr extends p{}class p_ extends cr{}class m_ extends cr{async _call(r){return new Ss(await super._call(r))}}class h_ extends cr{async _call(r){return new rt(await super._call(r))}}class M_ extends cr{async _call(r){return new It(await super._call(r))}}class xr extends p{}class f_ extends xr{}class g_ extends xr{async _call(r){return new Ss(await super._call(r))}}class P_ extends xr{async _call(r){return new rt(await super._call(r))}}class sp extends p{}class T_ extends ys{}class w_ extends ys{async _call(r){return new Ss(await super._call(r))}}class b_ extends ys{async _call(r){return new rt(await super._call(r))}}class sr extends p{}class x_ extends sr{}class v_ extends sr{async _call(r){return new Ss(await super._call(r))}}class E_ extends sr{async _call(r){return new rt(await super._call(r))}}class F_ extends sr{async _call(r){return new mu(await super._call(r))}}class C_ extends sr{async _call(r){return new It(await super._call(r))}}class k_ extends p{}class y_ extends k_{}class vr extends p{}class rp extends vr{}class S_ extends vr{}class A_ extends vr{async generate_speech(r,E,{threshold:H=.5,minlenratio:re=0,maxlenratio:oe=20,vocoder:Me=null}={}){let Ee={input_ids:r},{encoder_outputs:Ae,encoder_attention_mask:Ue}=await 
te(this,Ee),et=Ae.dims[1]/this.config.reduction_factor,tt=Math.floor(et*oe),at=Math.floor(et*re),He=this.config.num_mel_bins,pt=[],Ye=null,Xe=null,dt=0;for(;;){++dt;let xt=K(!!Xe),Ct;Xe?Ct=Xe.output_sequence_out:Ct=new o.Tensor("float32",new Float32Array(He),[1,1,He]);let St={use_cache_branch:xt,output_sequence:Ct,encoder_attention_mask:Ue,speaker_embeddings:E,encoder_hidden_states:Ae};this.addPastKeyValues(St,Ye),Xe=await R(this.sessions.decoder_model_merged,St),Ye=this.getPastKeyValues(Xe,Ye);let{prob:ct,spectrum:Et}=Xe;if(pt.push(Et),dt>=at&&(Array.from(ct.data).filter(Wt=>Wt>=H).length>0||dt>=tt))break}let Mt=(0,o.cat)(pt),{waveform:wt}=await R(Me.sessions.model,{spectrogram:Mt});return{spectrogram:Mt,waveform:wt}}}class L_ extends p{main_input_name="spectrogram"}class D_ extends p{}class ha extends D_{async generate_speech({input_ids:r,attention_mask:E,style:H,num_inference_steps:re=5,speed:oe=1.05}){let{sampling_rate:Me,chunk_compress_factor:Ee,base_chunk_size:Ae,latent_dim:Ue}=this.config,{last_hidden_state:et,durations:tt}=await R(this.sessions.text_encoder,{input_ids:r,attention_mask:E,style:H});tt.div_(oe);let at=tt.max().item()*Me,He=Ae*Ee,pt=Math.floor((at+He-1)/He),Ye=r.dims[0],Xe=(0,o.ones)([Ye,pt]),dt=(0,o.full)([Ye],re),Mt=(0,o.randn)([Ye,Ue*Ee,pt]);for(let xt=0;xt<re;++xt){let Ct=(0,o.full)([Ye],xt);({denoised_latents:Mt}=await R(this.sessions.latent_denoiser,{style:H,noisy_latents:Mt,latent_mask:Xe,encoder_outputs:et,attention_mask:E,timestep:Ct,num_inference_steps:dt}))}let{waveform:wt}=await R(this.sessions.voice_decoder,{latents:Mt});return{waveform:wt,durations:tt}}}class I_ extends p{}class O_ extends I_{}class Ma extends p{}class B_ extends Ma{}class j_ extends Ma{}class fa extends p{}class N_ extends fa{}class R_ extends fa{}class ga extends p{}class V_ extends ga{}class z_ extends ga{}class Pa extends p{}class G_ extends Pa{}class W_ extends Pa{}class Ta extends p{}class U_ extends Ta{}class $_ extends Ta{}class wa extends p{}class K_ 
extends wa{}class Q_ extends wa{}class Er extends p{}class X_ extends Er{}
/* Registered as "ClapTextModelWithProjection": loads the "text_model" file unless the caller supplies `model_file_name`. */
class H_ extends Er{static async from_pretrained(r,E={}){return super.from_pretrained(r,{...E,model_file_name:E.model_file_name??"text_model"})}}
/* Registered as "ClapAudioModelWithProjection": loads the "audio_model" file unless the caller supplies `model_file_name`. */
class J_ extends Er{static async from_pretrained(r,E={}){return super.from_pretrained(r,{...E,model_file_name:E.model_file_name??"audio_model"})}}class Y_ extends p{}
/* Registered as "VitsModel"; wraps the parent `_call` result in the `Mu` output class (waveform, spectrogram). */
class ba extends Y_{async _call(r){return new Mu(await super._call(r))}}class Fr extends p{}class op extends Fr{}class q_ extends Fr{}class Z_ extends Fr{}class xa extends p{}class ed extends xa{}class td extends xa{}class va extends p{}class sd extends va{}class rd extends va{async _call(r){return new rt(await super._call(r))}}class Ea extends p{}class ap extends Ea{}class np extends Ea{}
/* Registered as "MusicgenForConditionalGeneration". */
class Fa extends p{forward_params=["input_ids","attention_mask","encoder_outputs","decoder_input_ids","decoder_attention_mask","past_key_values"];
/*
 * Filters a 2-D tensor `r` (dims [rows, cols]) and returns a new 3-D tensor.
 * Values equal to `config.decoder.pad_token_id` are skipped. A value is kept
 * only when (column index - (row index % num_codebooks)) lies in
 * (0, cols - num_codebooks]. Kept values are compacted towards the front of
 * `r.data` IN PLACE, so the caller's tensor data is overwritten. The result has
 * dims [floor(rows / num_codebooks), num_codebooks, kept / (that product)].
 */
_apply_and_filter_by_delay_pattern_mask(r){let[E,H]=r.dims,re=this.config.decoder.num_codebooks,oe=H-re,Me=0;for(let Ue=0;Ue<r.size;++Ue){if(r.data[Ue]===this.config.decoder.pad_token_id)continue;let et=Ue%H,tt=Math.floor(Ue/H)%re,at=et-tt;at>0&&at<=oe&&(r.data[Me++]=r.data[Ue])}let Ee=Math.floor(E/re),Ae=Me/(Ee*re);return new o.Tensor(r.type,r.data.slice(0,Me),[Ee,re,Ae])}
/*
 * Works on a deep clone of `r` (an array of rows). Position [i][j] is
 * overwritten with BigInt(pad_token_id) whenever i % num_codebooks >= j.
 * When `H.guidance_scale` is non-null and > 1 the rows are duplicated
 * (concatenated with themselves) before delegating to the parent.
 */
prepare_inputs_for_generation(r,E,H){let re=structuredClone(r);for(let Me=0;Me<re.length;++Me)for(let Ee=0;Ee<re[Me].length;++Ee)Me%this.config.decoder.num_codebooks>=Ee&&(re[Me][Ee]=BigInt(this.config.decoder.pad_token_id));return H.guidance_scale!==null&&H.guidance_scale>1&&(re=re.concat(re)),super.prepare_inputs_for_generation(re,E,H)}
/*
 * Runs the parent `generate`, filters the result with the delay-pattern mask,
 * adds a leading dimension, and runs the `encodec_decode` session on it.
 * Returns the session's `audio_values`.
 */
async generate(r){let E=await super.generate(r),H=this._apply_and_filter_by_delay_pattern_mask(E).unsqueeze_(0),{audio_values:re}=await R(this.sessions.encodec_decode,{audio_codes:H});return re}}class Cr extends p{}class od extends Cr{}class ad extends Cr{async _call(r){return new rt(await super._call(r))}}class nd extends Cr{}class kr extends p{}class id
extends kr{}class ld extends kr{async _call(r){return new rt(await super._call(r))}}class cd extends kr{}class yr extends p{}class _d extends yr{}class dd extends yr{async _call(r){return new rt(await super._call(r))}}class ud extends yr{}class Sr extends p{}class pd extends Sr{}class md extends Sr{async _call(r){return new rt(await super._call(r))}}class hd extends Sr{}class Md extends p{}class fd extends Md{}class gd extends p{}class Pd extends gd{forward_params=["input_ids","pixel_values","images_seq_mask","images_emb_mask","attention_mask","position_ids","past_key_values"];constructor(...r){super(...r),this._generation_mode="text"}async forward(r){let E=this._generation_mode??"text",H;if(E==="text"||!r.past_key_values){let Ae=this.sessions.prepare_inputs_embeds,Ue=(0,f.pick)(r,Ae.inputNames);H=await R(Ae,Ue)}else{let Ae=this.sessions.gen_img_embeds,Ue=(0,f.pick)({image_ids:r.input_ids},Ae.inputNames);H=await R(Ae,Ue)}let re={...r,...H},oe=await ce(this,re),Me=this.sessions[E==="text"?"lm_head":"gen_head"];if(!Me)throw new Error(`Unable to find "${Me}" generation head`);let Ee=await R(Me,(0,f.pick)(oe,Me.inputNames));return{...H,...oe,...Ee}}async generate(r){return this._generation_mode="text",super.generate(r)}async generate_images(r){this._generation_mode="image";let E=(r.inputs??r[this.main_input_name]).dims[1],re=(await super.generate(r)).slice(null,[E,null]),oe=this.sessions.image_decode,{decoded_image:Me}=await R(oe,{generated_tokens:re}),Ee=Me.add_(1).mul_(255/2).clamp_(0,255).to("uint8"),Ae=[];for(let Ue of Ee){let et=x.RawImage.fromTensor(Ue);Ae.push(et)}return Ae}}class Td extends q{constructor({char_logits:r,bpe_logits:E,wp_logits:H}){super(),this.char_logits=r,this.bpe_logits=E,this.wp_logits=H}get logits(){return[this.char_logits,this.bpe_logits,this.wp_logits]}}class wd extends p{}class bd extends wd{async _call(r){return new Td(await super._call(r))}}class Ca extends p{}class xd extends Ca{}class vd extends Ca{}class ka extends p{}class Ed 
extends ka{}class Fd extends ka{}class Cd extends p{forward_params=["input_ids","attention_mask","position_ids","audio_values","past_key_values"]}class ya extends Cd{_merge_input_ids_with_audio_features(r){let E=r.audio_features.dims.at(-1),H=r.audio_features.view(-1,E);return X({audio_token_id:this.config.ignore_index??this.config.audio_token_id,...r,audio_features:H})}}class kd extends ya{}class Ar extends p{main_input_name="input_values";forward_params=["input_values"]}class yd extends q{constructor({audio_codes:r}){super(),this.audio_codes=r}}class Sd extends q{constructor({audio_values:r}){super(),this.audio_values=r}}class Ad extends Ar{async encode(r){return new yd(await R(this.sessions.encoder_model,r))}async decode(r){return new Sd(await R(this.sessions.decoder_model,r))}}class Ld extends Ar{static async from_pretrained(r,E={}){return super.from_pretrained(r,{...E,model_file_name:E.model_file_name??"encoder_model"})}}class Dd extends Ar{static async from_pretrained(r,E={}){return super.from_pretrained(r,{...E,model_file_name:E.model_file_name??"decoder_model"})}}class Lr extends p{main_input_name="input_values";forward_params=["input_values"]}class Id extends q{constructor({audio_codes:r}){super(),this.audio_codes=r}}class Od extends q{constructor({audio_values:r}){super(),this.audio_values=r}}class Bd extends Lr{async encode(r){return new Id(await R(this.sessions.encoder_model,r))}async decode(r){return new Od(await R(this.sessions.decoder_model,r))}}class jd extends Lr{static async from_pretrained(r,E={}){return super.from_pretrained(r,{...E,model_file_name:E.model_file_name??"encoder_model"})}}class Nd extends Lr{static async from_pretrained(r,E={}){return super.from_pretrained(r,{...E,model_file_name:E.model_file_name??"decoder_model"})}}class Dr extends p{main_input_name="input_values";forward_params=["input_values"]}class Rd extends Dr{async encode(r){return await R(this.sessions.encoder_model,r)}async decode(r){return await 
R(this.sessions.decoder_model,r)}}class Vd extends Dr{static async from_pretrained(r,E={}){return super.from_pretrained(r,{...E,model_file_name:E.model_file_name??"encoder_model"})}}class zd extends Dr{static async from_pretrained(r,E={}){return super.from_pretrained(r,{...E,model_file_name:E.model_file_name??"decoder_model"})}}class ht{static MODEL_CLASS_MAPPINGS=null;static BASE_IF_FAIL=!1;static async from_pretrained(r,{progress_callback:E=null,config:H=null,cache_dir:re=null,local_files_only:oe=!1,revision:Me="main",model_file_name:Ee=null,subfolder:Ae="onnx",device:Ue=null,dtype:et=null,use_external_data_format:tt=null,session_options:at={}}={}){let He={progress_callback:E,config:H,cache_dir:re,local_files_only:oe,revision:Me,model_file_name:Ee,subfolder:Ae,device:Ue,dtype:et,use_external_data_format:tt,session_options:at};if(He.config=await i.AutoConfig.from_pretrained(r,He),!this.MODEL_CLASS_MAPPINGS)throw new Error("`MODEL_CLASS_MAPPINGS` not implemented for this type of `AutoClass`: "+this.name);let pt=He.config.model_type;for(let Ye of this.MODEL_CLASS_MAPPINGS){let Xe=Ye.get(pt);if(!Xe){for(let dt of Ye.values())if(dt[0]===pt){Xe=dt;break}if(!Xe)continue}return await Xe[1].from_pretrained(r,He)}if(this.BASE_IF_FAIL)return pu.has(pt)||console.warn(`Unknown model class "${pt}", attempting to construct from base class.`),await p.from_pretrained(r,He);throw Error(`Unsupported model type: ${pt}`)}}let ip=new 
Map([["bert",["BertModel",Te]],["neobert",["NeoBertModel",De]],["modernbert",["ModernBertModel",Re]],["nomic_bert",["NomicBertModel",ft]],["roformer",["RoFormerModel",Hs]],["electra",["ElectraModel",lt]],["esm",["EsmModel",Ns]],["convbert",["ConvBertModel",qs]],["camembert",["CamembertModel",z]],["deberta",["DebertaModel",st]],["deberta-v2",["DebertaV2Model",ss]],["mpnet",["MPNetModel",Rs]],["albert",["AlbertModel",Ne]],["distilbert",["DistilBertModel",Bs]],["roberta",["RobertaModel",en]],["xlm",["XLMModel",an]],["xlm-roberta",["XLMRobertaModel",dn]],["clap",["ClapModel",X_]],["clip",["CLIPModel",An]],["clipseg",["CLIPSegModel",Gn]],["chinese_clip",["ChineseCLIPModel",Nn]],["siglip",["SiglipModel",In]],["jina_clip",["JinaCLIPModel",Rn]],["mobilebert",["MobileBertModel",rs]],["squeezebert",["SqueezeBertModel",A]],["wav2vec2",["Wav2Vec2Model",e_]],["wav2vec2-bert",["Wav2Vec2BertModel",f_]],["unispeech",["UniSpeechModel",__]],["unispeech-sat",["UniSpeechSatModel",p_]],["hubert",["HubertModel",T_]],["wavlm",["WavLMModel",x_]],["audio-spectrogram-transformer",["ASTModel",Mn]],["vits",["VitsModel",ba]],["pyannote",["PyAnnoteModel",n_]],["wespeaker-resnet",["WeSpeakerResNetModel",c_]],["detr",["DetrModel",Il]],["rt_detr",["RTDetrModel",jl]],["rt_detr_v2",["RTDetrV2Model",Rl]],["rf_detr",["RFDetrModel",Gl]],["d_fine",["DFineModel",$l]],["table-transformer",["TableTransformerModel",Ql]],["vit",["ViTModel",nl]],["ijepa",["IJepaModel",ll]],["pvt",["PvtModel",ul]],["vit_msn",["ViTMSNModel",Ml]],["vit_mae",["ViTMAEModel",hl]],["groupvit",["GroupViTModel",Pl]],["fastvit",["FastViTModel",Tl]],["mobilevit",["MobileViTModel",vl]],["mobilevitv2",["MobileViTV2Model",Fl]],["owlvit",["OwlViTModel",kl]],["owlv2",["Owlv2Model",Sl]],["beit",["BeitModel",Ll]],["deit",["DeiTModel",Jl]],["hiera",["HieraModel",ql]],["convnext",["ConvNextModel",Fc]],["convnextv2",["ConvNextV2Model",kc]],["dinov2",["Dinov2Model",Sc]],["dinov2_with_registers",["Dinov2WithRegistersModel",Lc]],["dinov3_vit",["DINOv
3ViTModel",Oc]],["dinov3_convnext",["DINOv3ConvNextModel",jc]],["resnet",["ResNetModel",ec]],["swin",["SwinModel",sc]],["swin2sr",["Swin2SRModel",ac]],["donut-swin",["DonutSwinModel",Ec]],["yolos",["YolosModel",Vc]],["dpt",["DPTModel",ic]],["glpn",["GLPNModel",bc]],["hifigan",["SpeechT5HifiGan",L_]],["efficientnet",["EfficientNetModel",sd]],["decision_transformer",["DecisionTransformerModel",fd]],["patchtst",["PatchTSTForPrediction",xd]],["patchtsmixer",["PatchTSMixerForPrediction",Ed]],["mobilenet_v1",["MobileNetV1Model",od]],["mobilenet_v2",["MobileNetV2Model",id]],["mobilenet_v3",["MobileNetV3Model",_d]],["mobilenet_v4",["MobileNetV4Model",pd]],["maskformer",["MaskFormerModel",Tc]],["mgp-str",["MgpstrForSceneTextRecognition",bd]],["style_text_to_speech_2",["StyleTextToSpeech2Model",y_]]]),lp=new Map([["t5",["T5Model",ot]],["longt5",["LongT5Model",yt]],["mt5",["MT5Model",cs]],["bart",["BartModel",Cs]],["mbart",["MBartModel",Ms]],["marian",["MarianModel",Jc]],["whisper",["WhisperModel",gn]],["m2m_100",["M2M100Model",qc]],["blenderbot",["BlenderbotModel",At]],["blenderbot-small",["BlenderbotSmallModel",as]]]),cp=new Map([["mimi",["MimiModel",Ad]],["dac",["DacModel",Bd]],["snac",["SnacModel",Rd]]]),_p=new 
Map([["bloom",["BloomModel",el]],["jais",["JAISModel",Kn]],["gpt2",["GPT2Model",Un]],["gptj",["GPTJModel",qn]],["gpt_bigcode",["GPTBigCodeModel",ei]],["gpt_neo",["GPTNeoModel",Xn]],["gpt_neox",["GPTNeoXModel",Jn]],["codegen",["CodeGenModel",si]],["llama",["LlamaModel",oi]],["nanochat",["NanoChatModel",li]],["arcee",["ArceeModel",_i]],["lfm2",["Lfm2Model",ui]],["smollm3",["SmolLM3Model",mi]],["exaone",["ExaoneModel",Ti]],["olmo",["OlmoModel",vi]],["olmo2",["Olmo2Model",Fi]],["mobilellm",["MobileLLMModel",bi]],["granite",["GraniteModel",ki]],["granitemoehybrid",["GraniteMoeHybridModel",Si]],["cohere",["CohereModel",Li]],["gemma",["GemmaModel",Ii]],["gemma2",["Gemma2Model",Bi]],["vaultgemma",["VaultGemmaModel",Ni]],["gemma3_text",["Gemma3Model",Vi]],["helium",["HeliumModel",Mi]],["glm",["GlmModel",gi]],["openelm",["OpenELMModel",Gi]],["qwen2",["Qwen2Model",Ui]],["qwen3",["Qwen3Model",Ki]],["phi",["PhiModel",Ji]],["phi3",["Phi3Model",qi]],["mpt",["MptModel",sl]],["opt",["OPTModel",ol]],["mistral",["MistralModel",B_]],["ministral",["MinistralModel",N_]],["ministral3",["Ministral3Model",V_]],["ernie4_5",["Ernie4_5Model",G_]],["starcoder2",["Starcoder2Model",U_]],["falcon",["FalconModel",K_]],["stablelm",["StableLmModel",ed]],["modernbert-decoder",["ModernBertDecoderModel",ut]]]),Sa=new Map([["speecht5",["SpeechT5ForSpeechToText",S_]],["whisper",["WhisperForConditionalGeneration",Qr]],["lite-whisper",["LiteWhisperForConditionalGeneration",Pn]],["moonshine",["MoonshineForConditionalGeneration",Tn]]]),Gd=new Map([["speecht5",["SpeechT5ForTextToSpeech",A_]]]),Wd=new Map([["vits",["VitsModel",ba]],["musicgen",["MusicgenForConditionalGeneration",Fa]],["supertonic",["SupertonicForConditionalGeneration",ha]]]),Ud=new 
Map([["bert",["BertForSequenceClassification",ne]],["neobert",["NeoBertForSequenceClassification",ye]],["modernbert",["ModernBertForSequenceClassification",qe]],["roformer",["RoFormerForSequenceClassification",Ys]],["electra",["ElectraForSequenceClassification",n]],["esm",["EsmForSequenceClassification",vs]],["convbert",["ConvBertForSequenceClassification",Ls]],["camembert",["CamembertForSequenceClassification",ue]],["deberta",["DebertaForSequenceClassification",it]],["deberta-v2",["DebertaV2ForSequenceClassification",Ps]],["mpnet",["MPNetForSequenceClassification",Vs]],["albert",["AlbertForSequenceClassification",Ve]],["distilbert",["DistilBertForSequenceClassification",bs]],["roberta",["RobertaForSequenceClassification",sn]],["xlm",["XLMForSequenceClassification",ln]],["xlm-roberta",["XLMRobertaForSequenceClassification",pn]],["bart",["BartForSequenceClassification",Ut]],["mbart",["MBartForSequenceClassification",es]],["mobilebert",["MobileBertForSequenceClassification",Se]],["squeezebert",["SqueezeBertForSequenceClassification",$]]]),$d=new Map([["bert",["BertForTokenClassification",fe]],["neobert",["NeoBertForTokenClassification",Ce]],["modernbert",["ModernBertForTokenClassification",je]],["roformer",["RoFormerForTokenClassification",kt]],["electra",["ElectraForTokenClassification",j]],["esm",["EsmForTokenClassification",Es]],["convbert",["ConvBertForTokenClassification",Ds]],["camembert",["CamembertForTokenClassification",Ge]],["deberta",["DebertaForTokenClassification",gt]],["deberta-v2",["DebertaV2ForTokenClassification",Ts]],["mpnet",["MPNetForTokenClassification",mr]],["distilbert",["DistilBertForTokenClassification",js]],["roberta",["RobertaForTokenClassification",rn]],["xlm",["XLMForTokenClassification",cn]],["xlm-roberta",["XLMRobertaForTokenClassification",mn]]]),Aa=new 
Map([["t5",["T5ForConditionalGeneration",Ft]],["longt5",["LongT5ForConditionalGeneration",Zt]],["mt5",["MT5ForConditionalGeneration",zs]],["bart",["BartForConditionalGeneration",vt]],["mbart",["MBartForConditionalGeneration",gs]],["marian",["MarianMTModel",Yc]],["m2m_100",["M2M100ForConditionalGeneration",Zc]],["blenderbot",["BlenderbotForConditionalGeneration",Dt]],["blenderbot-small",["BlenderbotSmallForConditionalGeneration",Zs]]]),La=new Map([["bloom",["BloomForCausalLM",tl]],["gpt2",["GPT2LMHeadModel",$n]],["jais",["JAISLMHeadModel",Qn]],["gptj",["GPTJForCausalLM",Zn]],["gpt_bigcode",["GPTBigCodeForCausalLM",ti]],["gpt_neo",["GPTNeoForCausalLM",Hn]],["gpt_neox",["GPTNeoXForCausalLM",Yn]],["codegen",["CodeGenForCausalLM",ri]],["llama",["LlamaForCausalLM",ai]],["nanochat",["NanoChatForCausalLM",ci]],["llama4_text",["Llama4ForCausalLM",ii]],["arcee",["ArceeForCausalLM",di]],["lfm2",["Lfm2ForCausalLM",pi]],["smollm3",["SmolLM3ForCausalLM",hi]],["exaone",["ExaoneForCausalLM",wi]],["olmo",["OlmoForCausalLM",Ei]],["olmo2",["Olmo2ForCausalLM",Ci]],["mobilellm",["MobileLLMForCausalLM",xi]],["granite",["GraniteForCausalLM",yi]],["granitemoehybrid",["GraniteMoeHybridForCausalLM",Ai]],["cohere",["CohereForCausalLM",Di]],["gemma",["GemmaForCausalLM",Oi]],["gemma2",["Gemma2ForCausalLM",ji]],["vaultgemma",["VaultGemmaForCausalLM",Ri]],["gemma3_text",["Gemma3ForCausalLM",zi]],["helium",["HeliumForCausalLM",fi]],["glm",["GlmForCausalLM",Pi]],["openelm",["OpenELMForCausalLM",Wi]],["qwen2",["Qwen2ForCausalLM",$i]],["qwen3",["Qwen3ForCausalLM",Qi]],["phi",["PhiForCausalLM",Yi]],["phi3",["Phi3ForCausalLM",Zi]],["mpt",["MptForCausalLM",rl]],["opt",["OPTForCausalLM",al]],["mbart",["MBartForCausalLM",fs]],["mistral",["MistralForCausalLM",j_]],["ministral",["MinistralForCausalLM",R_]],["ministral3",["Ministral3ForCausalLM",z_]],["ernie4_5",["Ernie4_5ForCausalLM",W_]],["starcoder2",["Starcoder2ForCausalLM",$_]],["falcon",["FalconForCausalLM",Q_]],["trocr",["TrOCRForCausalLM",O_]],["stab
lelm",["StableLmForCausalLM",td]],["modernbert-decoder",["ModernBertDecoderForCausalLM",Pt]],["phi3_v",["Phi3VForCausalLM",eo]]]),dp=new Map([["multi_modality",["MultiModalityCausalLM",Pd]]]),Kd=new Map([["bert",["BertForMaskedLM",me]],["neobert",["NeoBertForMaskedLM",ve]],["modernbert",["ModernBertForMaskedLM",ke]],["roformer",["RoFormerForMaskedLM",Js]],["electra",["ElectraForMaskedLM",Os]],["esm",["EsmForMaskedLM",xs]],["convbert",["ConvBertForMaskedLM",Ze]],["camembert",["CamembertForMaskedLM",Z]],["deberta",["DebertaForMaskedLM",We]],["deberta-v2",["DebertaV2ForMaskedLM",Qt]],["mpnet",["MPNetForMaskedLM",Fs]],["albert",["AlbertForMaskedLM",Ie]],["distilbert",["DistilBertForMaskedLM",ps]],["roberta",["RobertaForMaskedLM",tn]],["xlm",["XLMWithLMHeadModel",nn]],["xlm-roberta",["XLMRobertaForMaskedLM",un]],["mobilebert",["MobileBertForMaskedLM",Fe]],["squeezebert",["SqueezeBertForMaskedLM",U]]]),Qd=new Map([["bert",["BertForQuestionAnswering",le]],["neobert",["NeoBertForQuestionAnswering",Qe]],["roformer",["RoFormerForQuestionAnswering",qt]],["electra",["ElectraForQuestionAnswering",v]],["convbert",["ConvBertForQuestionAnswering",Is]],["camembert",["CamembertForQuestionAnswering",Je]],["deberta",["DebertaForQuestionAnswering",Kt]],["deberta-v2",["DebertaV2ForQuestionAnswering",ws]],["mpnet",["MPNetForQuestionAnswering",ee]],["albert",["AlbertForQuestionAnswering",ze]],["distilbert",["DistilBertForQuestionAnswering",ls]],["roberta",["RobertaForQuestionAnswering",on]],["xlm",["XLMForQuestionAnswering",_n]],["xlm-roberta",["XLMRobertaForQuestionAnswering",hn]],["mobilebert",["MobileBertForQuestionAnswering",Ke]],["squeezebert",["SqueezeBertForQuestionAnswering",ie]]]),Da=new Map([["vision-encoder-decoder",["VisionEncoderDecoderModel",Hr]],["idefics3",["Idefics3ForConditionalGeneration",Mr]],["smolvlm",["SmolVLMForConditionalGeneration",Zr]]]),Xd=new 
Map([["llava",["LlavaForConditionalGeneration",hr]],["llava_onevision",["LlavaOnevisionForConditionalGeneration",wn]],["moondream1",["Moondream1ForConditionalGeneration",bn]],["florence2",["Florence2ForConditionalGeneration",vn]],["qwen2-vl",["Qwen2VLForConditionalGeneration",Hi]],["idefics3",["Idefics3ForConditionalGeneration",Mr]],["smolvlm",["SmolVLMForConditionalGeneration",Zr]],["paligemma",["PaliGemmaForConditionalGeneration",Fn]],["llava_qwen2",["LlavaQwen2ForCausalLM",Yr]],["gemma3n",["Gemma3nForConditionalGeneration",qr]],["mistral3",["Mistral3ForConditionalGeneration",Cn]]]),Hd=new Map([["ultravox",["UltravoxModel",ya]],["voxtral",["VoxtralForConditionalGeneration",kd]]]),up=new Map([["vision-encoder-decoder",["VisionEncoderDecoderModel",Hr]]]),Jd=new Map([["vit",["ViTForImageClassification",il]],["ijepa",["IJepaForImageClassification",cl]],["pvt",["PvtForImageClassification",pl]],["vit_msn",["ViTMSNForImageClassification",fl]],["fastvit",["FastViTForImageClassification",wl]],["mobilevit",["MobileViTForImageClassification",El]],["mobilevitv2",["MobileViTV2ForImageClassification",Cl]],["beit",["BeitForImageClassification",Dl]],["deit",["DeiTForImageClassification",Yl]],["hiera",["HieraForImageClassification",Zl]],["convnext",["ConvNextForImageClassification",Cc]],["convnextv2",["ConvNextV2ForImageClassification",yc]],["dinov2",["Dinov2ForImageClassification",Ac]],["dinov2_with_registers",["Dinov2WithRegistersForImageClassification",Dc]],["resnet",["ResNetForImageClassification",tc]],["swin",["SwinForImageClassification",rc]],["segformer",["SegformerForImageClassification",q_]],["efficientnet",["EfficientNetForImageClassification",rd]],["mobilenet_v1",["MobileNetV1ForImageClassification",ad]],["mobilenet_v2",["MobileNetV2ForImageClassification",ld]],["mobilenet_v3",["MobileNetV3ForImageClassification",dd]],["mobilenet_v4",["MobileNetV4ForImageClassification",md]]]),Yd=new 
Map([["detr",["DetrForObjectDetection",Ol]],["rt_detr",["RTDetrForObjectDetection",Nl]],["rt_detr_v2",["RTDetrV2ForObjectDetection",Vl]],["rf_detr",["RFDetrForObjectDetection",Wl]],["d_fine",["DFineForObjectDetection",Kl]],["table-transformer",["TableTransformerForObjectDetection",Xl]],["yolos",["YolosForObjectDetection",zc]]]),qd=new Map([["owlvit",["OwlViTForObjectDetection",yl]],["owlv2",["Owlv2ForObjectDetection",Al]],["grounding-dino",["GroundingDinoForObjectDetection",Rc]]]),rr=new Map([["detr",["DetrForSegmentation",Qo]],["clipseg",["CLIPSegForImageSegmentation",Wn]]]),Zd=new Map([["segformer",["SegformerForSemanticSegmentation",Z_]],["sapiens",["SapiensForSemanticSegmentation",dc]],["swin",["SwinForSemanticSegmentation",oc]],["mobilenet_v1",["MobileNetV1ForSemanticSegmentation",nd]],["mobilenet_v2",["MobileNetV2ForSemanticSegmentation",cd]],["mobilenet_v3",["MobileNetV3ForSemanticSegmentation",ud]],["mobilenet_v4",["MobileNetV4ForSemanticSegmentation",hd]]]),eu=new Map([["detr",["DetrForSegmentation",Qo]],["maskformer",["MaskFormerForInstanceSegmentation",wc]]]),tu=new Map([["sam",["SamModel",Uc]],["sam2",["Sam2Model",wr]],["edgetam",["EdgeTamModel",Xc]],["sam3_tracker",["Sam3TrackerModel",Hc]]]),su=new Map([["wav2vec2",["Wav2Vec2ForCTC",t_]],["wav2vec2-bert",["Wav2Vec2BertForCTC",g_]],["unispeech",["UniSpeechForCTC",d_]],["unispeech-sat",["UniSpeechSatForCTC",m_]],["wavlm",["WavLMForCTC",v_]],["hubert",["HubertForCTC",w_]],["parakeet_ctc",["ParakeetForCTC",a_]]]),ru=new Map([["wav2vec2",["Wav2Vec2ForSequenceClassification",s_]],["wav2vec2-bert",["Wav2Vec2BertForSequenceClassification",P_]],["unispeech",["UniSpeechForSequenceClassification",u_]],["unispeech-sat",["UniSpeechSatForSequenceClassification",h_]],["wavlm",["WavLMForSequenceClassification",E_]],["hubert",["HubertForSequenceClassification",b_]],["audio-spectrogram-transformer",["ASTForAudioClassification",fn]]]),ou=new Map([["wavlm",["WavLMForXVector",F_]]]),au=new 
Map([["unispeech-sat",["UniSpeechSatForAudioFrameClassification",M_]],["wavlm",["WavLMForAudioFrameClassification",C_]],["wav2vec2",["Wav2Vec2ForAudioFrameClassification",r_]],["pyannote",["PyAnnoteForAudioFrameClassification",i_]]]),nu=new Map([["vitmatte",["VitMatteForImageMatting",xl]]]),pp=new Map([["patchtst",["PatchTSTForPrediction",vd]],["patchtsmixer",["PatchTSMixerForPrediction",Fd]]]),iu=new Map([["swin2sr",["Swin2SRForImageSuperResolution",nc]]]),lu=new Map([["dpt",["DPTForDepthEstimation",lc]],["depth_anything",["DepthAnythingForDepthEstimation",_c]],["glpn",["GLPNForDepthEstimation",xc]],["sapiens",["SapiensForDepthEstimation",uc]],["depth_pro",["DepthProForDepthEstimation",hc]],["metric3d",["Metric3DForDepthEstimation",fc]],["metric3dv2",["Metric3Dv2ForDepthEstimation",Pc]]]),cu=new Map([["sapiens",["SapiensForNormalEstimation",pc]]]),_u=new Map([["vitpose",["VitPoseForPoseEstimation",dl]]]),du=new Map([["clip",["CLIPVisionModelWithProjection",Dn]],["siglip",["SiglipVisionModel",Bn]],["jina_clip",["JinaCLIPVisionModel",zn]]]),uu=[[ip,P.EncoderOnly],[lp,P.EncoderDecoder],[_p,P.DecoderOnly],[cp,P.AutoEncoder],[Ud,P.EncoderOnly],[$d,P.EncoderOnly],[Aa,P.Seq2Seq],[Sa,P.Seq2Seq],[La,P.DecoderOnly],[dp,P.MultiModality],[Kd,P.EncoderOnly],[Qd,P.EncoderOnly],[Da,P.Vision2Seq],[Xd,P.ImageTextToText],[Hd,P.AudioTextToText],[Jd,P.EncoderOnly],[rr,P.EncoderOnly],[eu,P.EncoderOnly],[Zd,P.EncoderOnly],[nu,P.EncoderOnly],[pp,P.EncoderOnly],[iu,P.EncoderOnly],[lu,P.EncoderOnly],[cu,P.EncoderOnly],[_u,P.EncoderOnly],[Yd,P.EncoderOnly],[qd,P.EncoderOnly],[tu,P.MaskGeneration],[su,P.EncoderOnly],[ru,P.EncoderOnly],[Gd,P.Seq2Seq],[Wd,P.EncoderOnly],[ou,P.EncoderOnly],[au,P.EncoderOnly],[du,P.EncoderOnly]];for(let[s,r]of uu)for(let[E,H]of s.values())M.set(E,r),l.set(H,E),y.set(E,H);let 
mp=[["MusicgenForConditionalGeneration",Fa,P.Musicgen],["Phi3VForCausalLM",eo,P.Phi3V],["CLIPTextModelWithProjection",Ln,P.EncoderOnly],["SiglipTextModel",On,P.EncoderOnly],["JinaCLIPTextModel",Vn,P.EncoderOnly],["ClapTextModelWithProjection",H_,P.EncoderOnly],["ClapAudioModelWithProjection",J_,P.EncoderOnly],["DacEncoderModel",jd,P.EncoderOnly],["DacDecoderModel",Nd,P.EncoderOnly],["MimiEncoderModel",Ld,P.EncoderOnly],["MimiDecoderModel",Dd,P.EncoderOnly],["SnacEncoderModel",Vd,P.EncoderOnly],["SnacDecoderModel",zd,P.EncoderOnly],["Gemma3nForConditionalGeneration",qr,P.ImageAudioTextToText],["SupertonicForConditionalGeneration",ha,P.Supertonic]];for(let[s,r,E]of mp)M.set(s,E),l.set(r,s),y.set(s,r);let pu=new Map([["modnet",rr],["birefnet",rr],["isnet",rr],["ben",rr]]);for(let[s,r]of pu.entries())r.set(s,["PreTrainedModel",p]),M.set(s,P.EncoderOnly),l.set(p,s),y.set(s,p);class hp extends ht{static MODEL_CLASS_MAPPINGS=uu.map(r=>r[0]);static BASE_IF_FAIL=!0}class Mp extends ht{static MODEL_CLASS_MAPPINGS=[Ud]}class fp extends ht{static MODEL_CLASS_MAPPINGS=[$d]}class gp extends ht{static MODEL_CLASS_MAPPINGS=[Aa]}class Pp extends ht{static MODEL_CLASS_MAPPINGS=[Sa]}class Tp extends ht{static MODEL_CLASS_MAPPINGS=[Gd]}class wp extends ht{static MODEL_CLASS_MAPPINGS=[Wd]}class bp extends ht{static MODEL_CLASS_MAPPINGS=[La]}class xp extends ht{static MODEL_CLASS_MAPPINGS=[Kd]}class vp extends ht{static MODEL_CLASS_MAPPINGS=[Qd]}class Ep extends ht{static MODEL_CLASS_MAPPINGS=[Da]}class Fp extends ht{static MODEL_CLASS_MAPPINGS=[Jd]}class Cp extends ht{static MODEL_CLASS_MAPPINGS=[rr]}class kp extends ht{static MODEL_CLASS_MAPPINGS=[Zd]}class yp extends ht{static MODEL_CLASS_MAPPINGS=[eu]}class Sp extends ht{static MODEL_CLASS_MAPPINGS=[Yd]}class Ap extends ht{static MODEL_CLASS_MAPPINGS=[qd]}class Lp extends ht{static MODEL_CLASS_MAPPINGS=[tu]}class Dp extends ht{static MODEL_CLASS_MAPPINGS=[su]}class Ip extends ht{static MODEL_CLASS_MAPPINGS=[ru]}class Op extends 
ht{static MODEL_CLASS_MAPPINGS=[ou]}class Bp extends ht{static MODEL_CLASS_MAPPINGS=[au]}class jp extends ht{static MODEL_CLASS_MAPPINGS=[up]}class Np extends ht{static MODEL_CLASS_MAPPINGS=[nu]}class Rp extends ht{static MODEL_CLASS_MAPPINGS=[iu]}class Vp extends ht{static MODEL_CLASS_MAPPINGS=[lu]}class zp extends ht{static MODEL_CLASS_MAPPINGS=[cu]}class Gp extends ht{static MODEL_CLASS_MAPPINGS=[_u]}class Wp extends ht{static MODEL_CLASS_MAPPINGS=[du]}class Up extends ht{static MODEL_CLASS_MAPPINGS=[Xd]}class $p extends ht{static MODEL_CLASS_MAPPINGS=[Hd]}class Kp extends q{constructor({logits:r,past_key_values:E,encoder_outputs:H,decoder_attentions:re=null,cross_attentions:oe=null}){super(),this.logits=r,this.past_key_values=E,this.encoder_outputs=H,this.decoder_attentions=re,this.cross_attentions=oe}}class rt extends q{constructor({logits:r,...E}){super(),this.logits=r;let H=Object.values(E);H.length>0&&(this.attentions=H)}}class mu extends q{constructor({logits:r,embeddings:E}){super(),this.logits=r,this.embeddings=E}}class It extends q{constructor({logits:r}){super(),this.logits=r}}class Gt extends q{constructor({logits:r}){super(),this.logits=r}}class Jt extends q{constructor({start_logits:r,end_logits:E}){super(),this.start_logits=r,this.end_logits=E}}class Ss extends q{constructor({logits:r}){super(),this.logits=r}}class Qp extends q{constructor({logits:r,past_key_values:E}){super(),this.logits=r,this.past_key_values=E}}class hu extends q{constructor({alphas:r}){super(),this.alphas=r}}class Mu extends q{constructor({waveform:r,spectrogram:E}){super(),this.waveform=r,this.spectrogram=E}}}),"./src/models/audio_spectrogram_transformer/feature_extraction_audio_spectrogram_transformer.js":((D,a,e)=>{e.r(a),e.d(a,{ASTFeatureExtractor:()=>I});var i=e("./src/base/feature_extraction_utils.js"),d=e("./src/utils/tensor.js"),g=e("./src/utils/audio.js");class I extends i.FeatureExtractor{constructor(u){super(u);let 
m=this.config.sampling_rate,T=(0,g.mel_filter_bank)(257,this.config.num_mel_bins,20,Math.floor(m/2),m,null,"kaldi",!0);this.mel_filters=T,this.window=(0,g.window_function)(400,"hann",{periodic:!1}),this.mean=this.config.mean,this.std=this.config.std}async _extract_fbank_features(u,m){return(0,g.spectrogram)(u,this.window,400,160,{fft_length:512,power:2,center:!1,preemphasis:.97,mel_filters:this.mel_filters,log_mel:"log",mel_floor:1192092955078125e-22,remove_dc_offset:!0,max_num_frames:m,transpose:!0})}async _call(u){(0,i.validate_audio_inputs)(u,"ASTFeatureExtractor");let m=await this._extract_fbank_features(u,this.config.max_length);if(this.config.do_normalize){let T=this.std*2,_=m.data;for(let o=0;o<_.length;++o)_[o]=(_[o]-this.mean)/T}return{input_values:m.unsqueeze_(0)}}}}),"./src/models/auto/feature_extraction_auto.js":((D,a,e)=>{e.r(a),e.d(a,{AutoFeatureExtractor:()=>f});var i=e("./src/utils/constants.js"),d=e("./src/utils/hub.js"),g=e("./src/base/feature_extraction_utils.js"),I=e("./src/models/feature_extractors.js");class f{static async from_pretrained(m,T={}){let _=await(0,d.getModelJSON)(m,i.FEATURE_EXTRACTOR_NAME,!0,T),o=_.feature_extractor_type,x=I[o];if(!x)throw new Error(`Unknown feature_extractor_type: '${o}'. Please report this at ${i.GITHUB_ISSUE_URL}.`);return new x(_)}}}),"./src/models/auto/image_processing_auto.js":((D,a,e)=>{e.r(a),e.d(a,{AutoImageProcessor:()=>f});var i=e("./src/utils/constants.js"),d=e("./src/utils/hub.js"),g=e("./src/base/image_processors_utils.js"),I=e("./src/models/image_processors.js");class f{static async from_pretrained(m,T={}){let _=await(0,d.getModelJSON)(m,i.IMAGE_PROCESSOR_NAME,!0,T),o=_.image_processor_type??_.feature_extractor_type,x=I[o?.replace(/Fast$/,"")];return x||(o!==void 0&&console.warn(`Image processor type '${o}' not found, assuming base ImageProcessor. 
Please report this at ${i.GITHUB_ISSUE_URL}.`),x=g.ImageProcessor),new x(_)}}}),"./src/models/auto/processing_auto.js":((D,a,e)=>{e.r(a),e.d(a,{AutoProcessor:()=>m});var i=e("./src/utils/constants.js"),d=e("./src/utils/hub.js"),g=e("./src/base/processing_utils.js"),I=e("./src/models/processors.js"),f=e("./src/models/image_processors.js"),u=e("./src/models/feature_extractors.js");class m{static async from_pretrained(_,o={}){let x=await(0,d.getModelJSON)(_,i.IMAGE_PROCESSOR_NAME,!0,o),{image_processor_type:w,feature_extractor_type:k,processor_class:G}=x;if(G&&I[G])return I[G].from_pretrained(_,o);if(!w&&!k)throw new Error("No `image_processor_type` or `feature_extractor_type` found in the config.");let b={};if(w){let B=f[w.replace(/Fast$/,"")];if(!B)throw new Error(`Unknown image_processor_type: '${w}'.`);b.image_processor=new B(x)}if(k){let B=f[k];if(B)b.image_processor=new B(x);else{let P=u[k];if(!P)throw new Error(`Unknown feature_extractor_type: '${k}'.`);b.feature_extractor=new P(x)}}let C={};return new g.Processor(C,b,null)}}}),"./src/models/beit/image_processing_beit.js":((D,a,e)=>{e.r(a),e.d(a,{BeitFeatureExtractor:()=>d});var i=e("./src/base/image_processors_utils.js");class d extends i.ImageProcessor{}}),"./src/models/bit/image_processing_bit.js":((D,a,e)=>{e.r(a),e.d(a,{BitImageProcessor:()=>d});var i=e("./src/base/image_processors_utils.js");class d extends i.ImageProcessor{}}),"./src/models/chinese_clip/image_processing_chinese_clip.js":((D,a,e)=>{e.r(a),e.d(a,{ChineseCLIPFeatureExtractor:()=>d});var i=e("./src/base/image_processors_utils.js");class d extends i.ImageProcessor{}}),"./src/models/clap/feature_extraction_clap.js":((D,a,e)=>{e.r(a),e.d(a,{ClapFeatureExtractor:()=>I});var i=e("./src/base/feature_extraction_utils.js"),d=e("./src/utils/tensor.js"),g=e("./src/utils/audio.js");class I extends 
i.FeatureExtractor{constructor(u){super(u),this.mel_filters=(0,g.mel_filter_bank)(this.config.nb_frequency_bins,this.config.feature_size,this.config.frequency_min,this.config.frequency_max,this.config.sampling_rate,null,"htk"),this.mel_filters_slaney=(0,g.mel_filter_bank)(this.config.nb_frequency_bins,this.config.feature_size,this.config.frequency_min,this.config.frequency_max,this.config.sampling_rate,"slaney","slaney"),this.window=(0,g.window_function)(this.config.fft_window_size,"hann")}async _get_input_mel(u,m,T,_){let o,x=!1,w=u.length-m;if(w>0)if(T==="rand_trunc"){x=!0;let k=Math.floor(Math.random()*(w+1));u=u.subarray(k,k+m),o=await this._extract_fbank_features(u,this.mel_filters_slaney,this.config.nb_max_samples)}else throw new Error(`Truncation strategy "${T}" not implemented`);else{if(w<0){let k=new Float64Array(m);if(k.set(u),_==="repeat")for(let G=u.length;G<m;G+=u.length)k.set(u.subarray(0,Math.min(u.length,m-G)),G);else if(_==="repeatpad")for(let G=u.length;G<-w;G+=u.length)k.set(u,G);u=k}if(T==="fusion")throw new Error(`Truncation strategy "${T}" not implemented`);o=await this._extract_fbank_features(u,this.mel_filters_slaney,this.config.nb_max_samples)}return o.unsqueeze_(0)}async _extract_fbank_features(u,m,T=null){return(0,g.spectrogram)(u,this.window,this.config.fft_window_size,this.config.hop_length,{power:2,mel_filters:m,log_mel:"dB",max_num_frames:T,do_pad:!1,transpose:!0})}async _call(u,{max_length:m=null}={}){return(0,i.validate_audio_inputs)(u,"ClapFeatureExtractor"),{input_features:(await this._get_input_mel(u,m??this.config.nb_max_samples,this.config.truncation,this.config.padding)).unsqueeze_(0)}}}}),"./src/models/clip/image_processing_clip.js":((D,a,e)=>{e.r(a),e.d(a,{CLIPFeatureExtractor:()=>g,CLIPImageProcessor:()=>d});var i=e("./src/base/image_processors_utils.js");class d extends i.ImageProcessor{}class g extends 
d{}}),"./src/models/convnext/image_processing_convnext.js":((D,a,e)=>{e.r(a),e.d(a,{ConvNextFeatureExtractor:()=>g,ConvNextImageProcessor:()=>d});var i=e("./src/base/image_processors_utils.js");class d extends i.ImageProcessor{constructor(f){super(f),this.crop_pct=this.config.crop_pct??224/256}async resize(f){let u=this.size?.shortest_edge;if(u===void 0)throw new Error("Size dictionary must contain 'shortest_edge' key.");if(u<384){let m=Math.floor(u/this.crop_pct),[T,_]=this.get_resize_output_image_size(f,{shortest_edge:m});f=await f.resize(T,_,{resample:this.resample}),f=await f.center_crop(u,u)}else f=await f.resize(u,u,{resample:this.resample});return f}}class g extends d{}}),"./src/models/dac/feature_extraction_dac.js":((D,a,e)=>{e.r(a),e.d(a,{DacFeatureExtractor:()=>d});var i=e("./src/models/encodec/feature_extraction_encodec.js");class d extends i.EncodecFeatureExtractor{}}),"./src/models/deit/image_processing_deit.js":((D,a,e)=>{e.r(a),e.d(a,{DeiTFeatureExtractor:()=>g,DeiTImageProcessor:()=>d});var i=e("./src/base/image_processors_utils.js");class d extends i.ImageProcessor{}class g extends d{}}),"./src/models/detr/image_processing_detr.js":((D,a,e)=>{e.r(a),e.d(a,{DetrFeatureExtractor:()=>I,DetrImageProcessor:()=>g});var i=e("./src/base/image_processors_utils.js"),d=e("./src/utils/tensor.js");class g extends i.ImageProcessor{async _call(u){let m=await super._call(u),T=[m.pixel_values.dims[0],64,64],_=(0,d.full)(T,1n);return{...m,pixel_mask:_}}post_process_object_detection(...u){return(0,i.post_process_object_detection)(...u)}post_process_panoptic_segmentation(...u){return(0,i.post_process_panoptic_segmentation)(...u)}post_process_instance_segmentation(...u){return(0,i.post_process_instance_segmentation)(...u)}}class I extends g{}}),"./src/models/dinov3_vit/image_processing_dinov3_vit.js":((D,a,e)=>{e.r(a),e.d(a,{DINOv3ViTImageProcessor:()=>d});var i=e("./src/base/image_processors_utils.js");class d extends 
i.ImageProcessor{}}),"./src/models/donut/image_processing_donut.js":((D,a,e)=>{e.r(a),e.d(a,{DonutFeatureExtractor:()=>g,DonutImageProcessor:()=>d});var i=e("./src/base/image_processors_utils.js");class d extends i.ImageProcessor{pad_image(f,u,m,T={}){let[_,o,x]=u,w=this.image_mean;Array.isArray(this.image_mean)||(w=new Array(x).fill(w));let k=this.image_std;Array.isArray(k)||(k=new Array(x).fill(w));let G=w.map((b,C)=>-b/k[C]);return super.pad_image(f,u,m,{center:!0,constant_values:G,...T})}}class g extends d{}}),"./src/models/dpt/image_processing_dpt.js":((D,a,e)=>{e.r(a),e.d(a,{DPTFeatureExtractor:()=>g,DPTImageProcessor:()=>d});var i=e("./src/base/image_processors_utils.js");class d extends i.ImageProcessor{}class g extends d{}}),"./src/models/efficientnet/image_processing_efficientnet.js":((D,a,e)=>{e.r(a),e.d(a,{EfficientNetImageProcessor:()=>d});var i=e("./src/base/image_processors_utils.js");class d extends i.ImageProcessor{constructor(I){super(I),this.include_top=this.config.include_top??!0,this.include_top&&(this.image_std=this.image_std.map(f=>f*f))}}}),"./src/models/encodec/feature_extraction_encodec.js":((D,a,e)=>{e.r(a),e.d(a,{EncodecFeatureExtractor:()=>g});var i=e("./src/base/feature_extraction_utils.js"),d=e("./src/utils/tensor.js");class g extends i.FeatureExtractor{async _call(f){(0,i.validate_audio_inputs)(f,"EncodecFeatureExtractor"),f instanceof Float64Array&&(f=new Float32Array(f));let u=this.config.feature_size;if(f.length%u!==0)throw new Error(`The length of the audio data must be a multiple of the number of channels (${u}).`);let m=[1,u,f.length/u];return{input_values:new 
d.Tensor("float32",f,m)}}}}),"./src/models/feature_extractors.js":((D,a,e)=>{e.r(a),e.d(a,{ASTFeatureExtractor:()=>i.ASTFeatureExtractor,ClapFeatureExtractor:()=>g.ClapFeatureExtractor,DacFeatureExtractor:()=>I.DacFeatureExtractor,EncodecFeatureExtractor:()=>d.EncodecFeatureExtractor,Gemma3nAudioFeatureExtractor:()=>f.Gemma3nAudioFeatureExtractor,ImageFeatureExtractor:()=>b.ImageProcessor,MoonshineFeatureExtractor:()=>u.MoonshineFeatureExtractor,ParakeetFeatureExtractor:()=>m.ParakeetFeatureExtractor,PyAnnoteFeatureExtractor:()=>T.PyAnnoteFeatureExtractor,SeamlessM4TFeatureExtractor:()=>_.SeamlessM4TFeatureExtractor,SnacFeatureExtractor:()=>o.SnacFeatureExtractor,SpeechT5FeatureExtractor:()=>x.SpeechT5FeatureExtractor,Wav2Vec2FeatureExtractor:()=>w.Wav2Vec2FeatureExtractor,WeSpeakerFeatureExtractor:()=>k.WeSpeakerFeatureExtractor,WhisperFeatureExtractor:()=>G.WhisperFeatureExtractor});var i=e("./src/models/audio_spectrogram_transformer/feature_extraction_audio_spectrogram_transformer.js"),d=e("./src/models/encodec/feature_extraction_encodec.js"),g=e("./src/models/clap/feature_extraction_clap.js"),I=e("./src/models/dac/feature_extraction_dac.js"),f=e("./src/models/gemma3n/feature_extraction_gemma3n.js"),u=e("./src/models/moonshine/feature_extraction_moonshine.js"),m=e("./src/models/parakeet/feature_extraction_parakeet.js"),T=e("./src/models/pyannote/feature_extraction_pyannote.js"),_=e("./src/models/seamless_m4t/feature_extraction_seamless_m4t.js"),o=e("./src/models/snac/feature_extraction_snac.js"),x=e("./src/models/speecht5/feature_extraction_speecht5.js"),w=e("./src/models/wav2vec2/feature_extraction_wav2vec2.js"),k=e("./src/models/wespeaker/feature_extraction_wespeaker.js"),G=e("./src/models/whisper/feature_extraction_whisper.js"),b=e("./src/base/image_processors_utils.js")}),"./src/models/florence2/processing_florence2.js":((D,a,e)=>{e.r(a),e.d(a,{Florence2Processor:()=>I});var 
i=e("./src/base/processing_utils.js"),d=e("./src/models/auto/image_processing_auto.js"),g=e("./src/tokenizers.js");class I extends i.Processor{static tokenizer_class=g.AutoTokenizer;static image_processor_class=d.AutoImageProcessor;constructor(u,m,T){super(u,m,T);let{tasks_answer_post_processing_type:_,task_prompts_without_inputs:o,task_prompts_with_input:x}=this.image_processor.config;this.tasks_answer_post_processing_type=new Map(Object.entries(_??{})),this.task_prompts_without_inputs=new Map(Object.entries(o??{})),this.task_prompts_with_input=new Map(Object.entries(x??{})),this.regexes={quad_boxes:/(.+?)<loc_(\d+)><loc_(\d+)><loc_(\d+)><loc_(\d+)><loc_(\d+)><loc_(\d+)><loc_(\d+)><loc_(\d+)>/gm,bboxes:/([^<]+)?<loc_(\d+)><loc_(\d+)><loc_(\d+)><loc_(\d+)>/gm},this.size_per_bin=1e3}construct_prompts(u){typeof u=="string"&&(u=[u]);let m=[];for(let T of u)if(this.task_prompts_without_inputs.has(T))m.push(this.task_prompts_without_inputs.get(T));else{for(let[_,o]of this.task_prompts_with_input)if(T.includes(_)){m.push(o.replaceAll("{input}",T).replaceAll(_,""));break}m.length!==u.length&&m.push(T)}return m}post_process_generation(u,m,T){let _=this.tasks_answer_post_processing_type.get(m)??"pure_text";u=u.replaceAll("<s>","").replaceAll("</s>","");let o;switch(_){case"pure_text":o=u;break;case"description_with_bboxes":case"bboxes":case"phrase_grounding":case"ocr":let x=_==="ocr"?"quad_boxes":"bboxes",w=u.matchAll(this.regexes[x]),k=[],G=[];for(let[b,C,...B]of w)k.push(C?C.trim():k.at(-1)??""),G.push(B.map((P,M)=>(Number(P)+.5)/this.size_per_bin*T[M%2]));o={labels:k,[x]:G};break;default:throw new Error(`Task "${m}" (of type "${_}") not yet implemented.`)}return{[m]:o}}async _call(u,m=null,T={}){if(!u&&!m)throw new Error("Either text or images must be provided");let _=await 
this.image_processor(u,T),o=m?this.tokenizer(this.construct_prompts(m),T):{};return{..._,...o}}}}),"./src/models/gemma3n/feature_extraction_gemma3n.js":((D,a,e)=>{e.r(a),e.d(a,{Gemma3nAudioFeatureExtractor:()=>I});var i=e("./src/base/feature_extraction_utils.js"),d=e("./src/utils/tensor.js"),g=e("./src/utils/audio.js");class I extends i.FeatureExtractor{constructor(u){super(u);let{fft_length:m,feature_size:T,min_frequency:_,max_frequency:o,sampling_rate:x,frame_length:w}=this.config,k=(0,g.mel_filter_bank)(Math.floor(1+m/2),T,_,o,x,null,"htk",!1);this.mel_filters=k,this.window=(0,g.window_function)(w,"hann")}async _extract_fbank_features(u,m){return(0,g.spectrogram)(u,this.window,this.config.frame_length,this.config.hop_length,{fft_length:this.config.fft_length,center:!1,onesided:!0,preemphasis:this.config.preemphasis,preemphasis_htk_flavor:this.config.preemphasis_htk_flavor,mel_filters:this.mel_filters,log_mel:"log",mel_floor:this.config.mel_floor,remove_dc_offset:!1,transpose:!0})}async _call(u,{max_length:m=48e4,truncation:T=!0,padding:_=!0,pad_to_multiple_of:o=128}={}){if((0,i.validate_audio_inputs)(u,"Gemma3nAudioFeatureExtractor"),T&&u.length>m&&(u=u.slice(0,m)),_&&u.length%o!==0){let k=o-u.length%o,G=new Float64Array(u.length+k);G.set(u),this.config.padding_value!==0&&G.fill(this.config.padding_value,u.length),u=G}let x=await this._extract_fbank_features(u,this.config.max_length),w=(0,d.full)([1,x.dims[0]],!0);return{input_features:x.unsqueeze_(0),input_features_mask:w}}}}),"./src/models/gemma3n/processing_gemma3n.js":((D,a,e)=>{e.r(a),e.d(a,{Gemma3nProcessor:()=>m});var i=e("./src/base/processing_utils.js"),d=e("./src/models/auto/image_processing_auto.js"),g=e("./src/models/auto/feature_extraction_auto.js"),I=e("./src/tokenizers.js"),f=e("./src/utils/image.js"),u=e("./src/utils/audio.js");class m extends i.Processor{static image_processor_class=d.AutoImageProcessor;static feature_extractor_class=g.AutoFeatureExtractor;static 
tokenizer_class=I.AutoTokenizer;static uses_processor_config=!0;static uses_chat_template_file=!0;constructor(_,o,x){super(_,o,x),this.audio_seq_length=this.config.audio_seq_length,this.image_seq_length=this.config.image_seq_length;let{audio_token_id:w,boa_token:k,audio_token:G,eoa_token:b,image_token_id:C,boi_token:B,image_token:P,eoi_token:M}=this.tokenizer.config;this.audio_token_id=w,this.boa_token=k,this.audio_token=G;let y=G.repeat(this.audio_seq_length);this.full_audio_sequence=`
|
|
12
|
+
|
|
13
|
+
${k}${y}${b}
|
|
14
|
+
|
|
15
|
+
`,this.image_token_id=C,this.boi_token=B,this.image_token=P;let l=P.repeat(this.image_seq_length);this.full_image_sequence=`
|
|
16
|
+
|
|
17
|
+
${B}${l}${M}
|
|
18
|
+
|
|
19
|
+
`}async _call(_,o=null,x=null,w={}){typeof _=="string"&&(_=[_]);let k;x&&(k=await this.feature_extractor(x,w),_=_.map(C=>C.replaceAll(this.audio_token,this.full_audio_sequence)));let G;return o&&(G=await this.image_processor(o,w),_=_.map(C=>C.replaceAll(this.image_token,this.full_image_sequence))),{...this.tokenizer(_,w),...G,...k}}}}),"./src/models/glpn/image_processing_glpn.js":((D,a,e)=>{e.r(a),e.d(a,{GLPNFeatureExtractor:()=>d});var i=e("./src/base/image_processors_utils.js");class d extends i.ImageProcessor{}}),"./src/models/grounding_dino/image_processing_grounding_dino.js":((D,a,e)=>{e.r(a),e.d(a,{GroundingDinoImageProcessor:()=>g});var i=e("./src/base/image_processors_utils.js"),d=e("./src/utils/tensor.js");class g extends i.ImageProcessor{async _call(f){let u=await super._call(f),m=u.pixel_values.dims,T=(0,d.ones)([m[0],m[2],m[3]]);return{...u,pixel_mask:T}}}}),"./src/models/grounding_dino/processing_grounding_dino.js":((D,a,e)=>{e.r(a),e.d(a,{GroundingDinoProcessor:()=>u});var i=e("./src/base/processing_utils.js"),d=e("./src/models/auto/image_processing_auto.js"),g=e("./src/tokenizers.js"),I=e("./src/base/image_processors_utils.js");function f(m,T){let o=m.dims.at(-1)-1,x=m.tolist();x.fill(!1,0,1),x.fill(!1,o);let w=T.tolist();return x.map((k,G)=>k?G:null).filter(k=>k!==null).map(k=>w[k])}class u extends i.Processor{static tokenizer_class=g.AutoTokenizer;static image_processor_class=d.AutoImageProcessor;async _call(T,_,o={}){let x=T?await this.image_processor(T,o):{};return{..._?this.tokenizer(_,o):{},...x}}post_process_grounded_object_detection(T,_,{box_threshold:o=.25,text_threshold:x=.25,target_sizes:w=null}={}){let{logits:k,pred_boxes:G}=T,b=k.dims[0];if(w!==null&&w.length!==b)throw Error("Make sure that you pass in as many target sizes as the batch dimension of the logits");let C=k.dims.at(1),B=k.sigmoid(),P=B.max(-1).tolist(),M=G.tolist().map(l=>l.map(h=>(0,I.center_to_corners_format)(h))),y=[];for(let l=0;l<b;++l){let 
h=w!==null?w[l]:null;h!==null&&(M[l]=M[l].map(N=>N.map((Q,K)=>Q*h[(K+1)%2])));let F=P[l],S=[],V=[],R=[];for(let N=0;N<C;++N){let Q=F[N];if(Q<=o)continue;let K=M[l][N],J=B[l][N];S.push(Q),R.push(K);let te=f(J.gt(x),_[l]);V.push(te)}y.push({scores:S,boxes:R,labels:this.batch_decode(V)})}return y}}}),"./src/models/idefics3/image_processing_idefics3.js":((D,a,e)=>{e.r(a),e.d(a,{Idefics3ImageProcessor:()=>g});var i=e("./src/base/image_processors_utils.js"),d=e("./src/utils/tensor.js");class g extends i.ImageProcessor{constructor(f){super(f),this.do_image_splitting=f.do_image_splitting??!0,this.max_image_size=f.max_image_size}get_resize_for_vision_encoder(f,u){let[m,T]=f.dims.slice(-2),_=T/m;return T>=m?(T=Math.ceil(T/u)*u,m=Math.floor(T/_),m=Math.ceil(m/u)*u):(m=Math.ceil(m/u)*u,T=Math.floor(m*_),T=Math.ceil(T/u)*u),{height:m,width:T}}async _call(f,{do_image_splitting:u=null,return_row_col_info:m=!1}={}){let T;if(!Array.isArray(f))T=[[f]];else{if(f.length===0||!f[0])throw new Error("No images provided.");Array.isArray(f[0])?T=f:T=[f]}let _=[],o=[],x=[],w=[],k=[];for(let l of T){let h=await Promise.all(l.map(V=>this.preprocess(V)));w.push(...h.map(V=>V.original_size)),k.push(...h.map(V=>V.reshaped_input_size)),h.forEach(V=>V.pixel_values.unsqueeze_(0));let{longest_edge:F}=this.max_image_size,S;if(u??this.do_image_splitting){let V=new Array(h.length),R=new Array(h.length);S=await Promise.all(h.map(async(N,Q)=>{let K=this.get_resize_for_vision_encoder(N.pixel_values,F),J=await(0,d.interpolate_4d)(N.pixel_values,{size:[K.height,K.width]}),{frames:te,num_splits_h:se,num_splits_w:ce}=await this.split_image(J,this.max_image_size);return V[Q]=se,R[Q]=ce,(0,d.cat)(te,0)})),o.push(V),x.push(R)}else{let V=[F,F];S=await Promise.all(h.map(R=>(0,d.interpolate_4d)(R.pixel_values,{size:V}))),o.push(new Array(h.length).fill(0)),x.push(new Array(h.length).fill(0))}_.push((0,d.cat)(S,0))}let 
G=_.length,[b,C,B,P]=_[0].dims,M,y;if(G===1)M=_[0].unsqueeze_(0),y=(0,d.full)([G,b,B,P],!0);else{let l=Math.max(..._.map(S=>S.dims.at(0)));y=(0,d.full)([G,l,B,P],!0);let h=y.data,F=l*B*P;for(let S=0;S<G;++S){let V=_[S].dims[0];if(V<l){_[S]=(0,d.cat)([_[S],(0,d.full)([l-V,C,B,P],0)],0);let R=S*F+V*B*P,N=(S+1)*F;h.fill(!1,R,N)}}M=(0,d.stack)(_,0)}return{pixel_values:M,pixel_attention_mask:y,original_sizes:w,reshaped_input_sizes:k,...m?{rows:o,cols:x}:{}}}async split_image(f,{longest_edge:u}){let m=u,T=u,_=[],[o,x]=f.dims.slice(-2),w=0,k=0;if(o>m||x>T){w=Math.ceil(o/m),k=Math.ceil(x/T);let G=Math.ceil(o/w),b=Math.ceil(x/k);for(let P=0;P<w;++P)for(let M=0;M<k;++M){let y,l,h,F;P===w-1?(l=o-G,F=o):(l=P*G,F=(P+1)*G),M===k-1?(y=x-b,h=x):(y=M*b,h=(M+1)*b);let S=[l,y],V=[F,h],R=await(0,d.slice)(f,S,V,[2,3]);_.push(R)}let C=m,B=T;(o!==C||x!==B)&&(f=await(0,d.interpolate_4d)(f,{size:[C,B]}))}return _.push(f),{frames:_,num_splits_h:w,num_splits_w:k}}}}),"./src/models/idefics3/processing_idefics3.js":((D,a,e)=>{e.r(a),e.d(a,{Idefics3Processor:()=>_});var i=e("./src/base/processing_utils.js"),d=e("./src/models/auto/image_processing_auto.js"),g=e("./src/tokenizers.js"),I=e("./src/utils/image.js"),f=e("./src/utils/core.js");function u(o,x,w,k,G,b){let C="";for(let B=0;B<x;++B){for(let P=0;P<w;++P)C+=k+`<row_${B+1}_col_${P+1}>`+G.repeat(o);C+=`
|
|
20
|
+
`}return C+=`
|
|
21
|
+
${k}${b}`+G.repeat(o)+`${k}`,C}function m(o,x,w,k){return`${x}${k}`+w.repeat(o)+`${x}`}function T(o,x,w,k,G,b){return o===0&&x===0?m(w,k,G,b):u(w,o,x,k,G,b)}class _ extends i.Processor{static image_processor_class=d.AutoImageProcessor;static tokenizer_class=g.AutoTokenizer;static uses_processor_config=!0;fake_image_token="<fake_token_around_image>";image_token="<image>";global_img_token="<global-img>";async _call(x,w=null,k={}){k.return_row_col_info??=!0;let G;w&&(G=await this.image_processor(w,k)),Array.isArray(x)||(x=[x]);let b=G.rows??[new Array(x.length).fill(0)],C=G.cols??[new Array(x.length).fill(0)],B=this.config.image_seq_len,P=[],M=[];for(let l=0;l<x.length;++l){let h=x[l],F=b[l],S=C[l];P.push((0,f.count)(h,this.image_token));let V=F.map((Q,K)=>T(Q,S[K],B,this.fake_image_token,this.image_token,this.global_img_token)),R=h.split(this.image_token);if(R.length===0)throw new Error("The image token should be present in the text.");let N=R[0];for(let Q=0;Q<V.length;++Q)N+=V[Q]+R[Q+1];M.push(N)}return{...this.tokenizer(M),...G}}}}),"./src/models/image_processors.js":((D,a,e)=>{e.r(a),e.d(a,{BeitFeatureExtractor:()=>i.BeitFeatureExtractor,BitImageProcessor:()=>d.BitImageProcessor,CLIPFeatureExtractor:()=>I.CLIPFeatureExtractor,CLIPImageProcessor:()=>I.CLIPImageProcessor,ChineseCLIPFeatureExtractor:()=>g.ChineseCLIPFeatureExtractor,ConvNextFeatureExtractor:()=>f.ConvNextFeatureExtractor,ConvNextImageProcessor:()=>f.ConvNextImageProcessor,DINOv3ViTImageProcessor:()=>T.DINOv3ViTImageProcessor,DPTFeatureExtractor:()=>o.DPTFeatureExtractor,DPTImageProcessor:()=>o.DPTImageProcessor,DeiTFeatureExtractor:()=>u.DeiTFeatureExtractor,DeiTImageProcessor:()=>u.DeiTImageProcessor,DetrFeatureExtractor:()=>m.DetrFeatureExtractor,DetrImageProcessor:()=>m.DetrImageProcessor,DonutFeatureExtractor:()=>_.DonutFeatureExtractor,DonutImageProcessor:()=>_.DonutImageProcessor,EfficientNetImageProcessor:()=>x.EfficientNetImageProcessor,GLPNFeatureExtractor:()=>w.GLPNFeatureExtractor,Grounding
DinoImageProcessor:()=>k.GroundingDinoImageProcessor,Idefics3ImageProcessor:()=>G.Idefics3ImageProcessor,JinaCLIPImageProcessor:()=>C.JinaCLIPImageProcessor,LlavaOnevisionImageProcessor:()=>B.LlavaOnevisionImageProcessor,Mask2FormerImageProcessor:()=>P.Mask2FormerImageProcessor,MaskFormerFeatureExtractor:()=>M.MaskFormerFeatureExtractor,MaskFormerImageProcessor:()=>M.MaskFormerImageProcessor,MobileNetV1FeatureExtractor:()=>y.MobileNetV1FeatureExtractor,MobileNetV1ImageProcessor:()=>y.MobileNetV1ImageProcessor,MobileNetV2FeatureExtractor:()=>l.MobileNetV2FeatureExtractor,MobileNetV2ImageProcessor:()=>l.MobileNetV2ImageProcessor,MobileNetV3FeatureExtractor:()=>h.MobileNetV3FeatureExtractor,MobileNetV3ImageProcessor:()=>h.MobileNetV3ImageProcessor,MobileNetV4FeatureExtractor:()=>F.MobileNetV4FeatureExtractor,MobileNetV4ImageProcessor:()=>F.MobileNetV4ImageProcessor,MobileViTFeatureExtractor:()=>S.MobileViTFeatureExtractor,MobileViTImageProcessor:()=>S.MobileViTImageProcessor,NougatImageProcessor:()=>V.NougatImageProcessor,OwlViTFeatureExtractor:()=>N.OwlViTFeatureExtractor,OwlViTImageProcessor:()=>N.OwlViTImageProcessor,Owlv2ImageProcessor:()=>R.Owlv2ImageProcessor,Phi3VImageProcessor:()=>Q.Phi3VImageProcessor,PixtralImageProcessor:()=>K.PixtralImageProcessor,PvtImageProcessor:()=>J.PvtImageProcessor,Qwen2VLImageProcessor:()=>te.Qwen2VLImageProcessor,RTDetrImageProcessor:()=>se.RTDetrImageProcessor,Sam2ImageProcessor:()=>we.Sam2ImageProcessor,Sam3ImageProcessor:()=>_e.Sam3ImageProcessor,SamImageProcessor:()=>ce.SamImageProcessor,SegformerFeatureExtractor:()=>X.SegformerFeatureExtractor,SegformerImageProcessor:()=>X.SegformerImageProcessor,SiglipImageProcessor:()=>L.SiglipImageProcessor,SmolVLMImageProcessor:()=>W.SmolVLMImageProcessor,Swin2SRImageProcessor:()=>Y.Swin2SRImageProcessor,VLMImageProcessor:()=>b.VLMImageProcessor,ViTFeatureExtractor:()=>ae.ViTFeatureExtractor,ViTImageProcessor:()=>ae.ViTImageProcessor,VitMatteImageProcessor:()=>be.VitMatteImageProcessor,Vit
PoseImageProcessor:()=>xe.VitPoseImageProcessor,YolosFeatureExtractor:()=>Le.YolosFeatureExtractor,YolosImageProcessor:()=>Le.YolosImageProcessor});var i=e("./src/models/beit/image_processing_beit.js"),d=e("./src/models/bit/image_processing_bit.js"),g=e("./src/models/chinese_clip/image_processing_chinese_clip.js"),I=e("./src/models/clip/image_processing_clip.js"),f=e("./src/models/convnext/image_processing_convnext.js"),u=e("./src/models/deit/image_processing_deit.js"),m=e("./src/models/detr/image_processing_detr.js"),T=e("./src/models/dinov3_vit/image_processing_dinov3_vit.js"),_=e("./src/models/donut/image_processing_donut.js"),o=e("./src/models/dpt/image_processing_dpt.js"),x=e("./src/models/efficientnet/image_processing_efficientnet.js"),w=e("./src/models/glpn/image_processing_glpn.js"),k=e("./src/models/grounding_dino/image_processing_grounding_dino.js"),G=e("./src/models/idefics3/image_processing_idefics3.js"),b=e("./src/models/janus/image_processing_janus.js"),C=e("./src/models/jina_clip/image_processing_jina_clip.js"),B=e("./src/models/llava_onevision/image_processing_llava_onevision.js"),P=e("./src/models/mask2former/image_processing_mask2former.js"),M=e("./src/models/maskformer/image_processing_maskformer.js"),y=e("./src/models/mobilenet_v1/image_processing_mobilenet_v1.js"),l=e("./src/models/mobilenet_v2/image_processing_mobilenet_v2.js"),h=e("./src/models/mobilenet_v3/image_processing_mobilenet_v3.js"),F=e("./src/models/mobilenet_v4/image_processing_mobilenet_v4.js"),S=e("./src/models/mobilevit/image_processing_mobilevit.js"),V=e("./src/models/nougat/image_processing_nougat.js"),R=e("./src/models/owlv2/image_processing_owlv2.js"),N=e("./src/models/owlvit/image_processing_owlvit.js"),Q=e("./src/models/phi3_v/image_processing_phi3_v.js"),K=e("./src/models/pixtral/image_processing_pixtral.js"),J=e("./src/models/pvt/image_processing_pvt.js"),te=e("./src/models/qwen2_vl/image_processing_qwen2_vl.js"),se=e("./src/models/rt_detr/image_processing_rt_detr.js"),ce
/**
 * Chat processor that tokenizes a conversation and splices image placeholder
 * tokens into the token stream wherever the configured image tag appears.
 */
class m extends i.Processor {
  static image_processor_class = d.AutoImageProcessor;
  static tokenizer_class = g.AutoTokenizer;
  static uses_processor_config = true;

  // The three constructor arguments are forwarded untouched to the base class.
  constructor(first, second, third) {
    super(first, second, third);
    const { image_tag, image_start_tag, image_end_tag, num_image_tokens } = this.config;
    this.image_tag = image_tag;
    this.image_start_tag = image_start_tag;
    this.image_end_tag = image_end_tag;
    this.num_image_tokens = num_image_tokens;
  }

  /**
   * @param conversation Messages passed to the tokenizer's chat template; when
   *   `images` is not given, each message's `images` entries are read instead.
   * @param options.images Image or array of images (optional).
   * @param options.chat_template Chat template name, "default" unless overridden.
   * @returns Object with `input_ids`, `attention_mask`, `images_seq_mask` and
   *   `images_emb_mask` tensors, merged with the image processor output when
   *   at least one image is present.
   * @throws {Error} If the image count differs from the number of image tags.
   */
  async _call(conversation, { images = null, chat_template = "default" } = {}) {
    if (!images) {
      // No explicit images: load every image referenced by the messages.
      images = await Promise.all(
        conversation
          .filter((message) => message.images)
          .flatMap((message) => message.images)
          .map((source) => u.RawImage.read(source)),
      );
    } else if (!Array.isArray(images)) {
      images = [images];
    }

    const tokenizer = this.tokenizer;
    const prompt = tokenizer.apply_chat_template(conversation, {
      tokenize: false,
      add_generation_prompt: true,
      chat_template,
    });
    const encode = (text) => tokenizer.encode(text, { add_special_tokens: false });

    // Splitting on the tag yields one more text segment than there are tags.
    const segments = prompt.split(this.image_tag);
    const tagCount = segments.length - 1;
    if (images.length !== tagCount) {
      throw new Error(`Number of images provided (${images.length}) does not match number of "${this.image_tag}" image tags (${tagCount})`);
    }

    const [imageId, startId, endId] = tokenizer.model.convert_tokens_to_ids([
      this.image_tag,
      this.image_start_tag,
      this.image_end_tag,
    ]);

    const { mergeArrays } = I;
    let inputIds = encode(segments[0]);
    let imageMask = new Array(inputIds.length).fill(false);

    for (const segment of segments.slice(1)) {
      const placeholders = new Array(this.num_image_tokens).fill(imageId);
      const segmentIds = encode(segment);
      inputIds = mergeArrays(inputIds, [startId], placeholders, [endId], segmentIds);

      // Only the placeholder positions are flagged; start/end tags and text are not.
      const flagged = new Array(this.num_image_tokens).fill(true);
      imageMask = mergeArrays(
        imageMask,
        [false],
        flagged,
        [false],
        new Array(segmentIds.length).fill(false),
      );
    }

    const dims = [1, inputIds.length];
    const textInputs = {
      input_ids: new f.Tensor("int64", inputIds, dims),
      attention_mask: new f.Tensor("int64", new Array(inputIds.length).fill(1), dims),
      images_seq_mask: new f.Tensor("bool", imageMask, dims),
      images_emb_mask: new f.Tensor(
        "bool",
        new Array(tagCount * this.num_image_tokens).fill(true),
        [1, tagCount, this.num_image_tokens],
      ),
    };

    if (images && images.length > 0) {
      const imageInputs = await this.image_processor(images);
      imageInputs.pixel_values.unsqueeze_(0);
      return { ...textInputs, ...imageInputs };
    }
    return textInputs;
  }
}
/**
 * Processor that runs the image processor and, when text is supplied, expands
 * each image token in the text to the number of patch tokens implied by the
 * processed image size before tokenizing.
 */
class I extends i.Processor {
  static tokenizer_class = g.AutoTokenizer;
  static image_processor_class = d.AutoImageProcessor;
  static uses_processor_config = true;

  /**
   * @param images Input forwarded to the image processor.
   * @param text Optional string or array of strings containing image tokens.
   * @param kwargs Options forwarded to both the image processor and tokenizer.
   * @returns Image processor output merged with tokenizer output (if any text).
   */
  async _call(images, text = null, kwargs = {}) {
    const imageInputs = await this.image_processor(images, kwargs);

    let prompts = text;
    if (prompts) {
      const [height, width] = imageInputs.pixel_values.dims.slice(-2);
      const { image_token, patch_size, num_additional_image_tokens } = this.config;
      const tokensPerImage =
        Math.floor(height / patch_size) * Math.floor(width / patch_size) +
        num_additional_image_tokens;
      const expandedToken = image_token.repeat(tokensPerImage);

      // Copy first so the caller's value is never mutated.
      prompts = structuredClone(prompts);
      if (!Array.isArray(prompts)) {
        prompts = [prompts];
      }
      // replaceAll (not replace): with a string pattern, replace() only expands
      // the FIRST image token, leaving later images in the same prompt with a
      // single placeholder.
      prompts = prompts.map((prompt) => prompt.replaceAll(image_token, expandedToken));
    }

    const textInputs = prompts ? this.tokenizer(prompts, kwargs) : {};
    return { ...imageInputs, ...textInputs };
  }
}
// Per-format decode settings: [name of the decode method, end-of-sequence token id].
let f = {
  char: ["char_decode", 1],
  bpe: ["bpe_decode", 2],
  wp: ["wp_decode", 102],
};

/**
 * Processor that decodes three parallel logit heads (character, BPE and
 * wordpiece) and keeps, per sample, the text from the most confident head.
 */
class u extends i.Processor {
  static tokenizer_class = g.AutoTokenizer;
  static image_processor_class = d.AutoImageProcessor;

  get char_tokenizer() {
    return this.components.char_tokenizer;
  }

  get bpe_tokenizer() {
    return this.components.bpe_tokenizer;
  }

  get wp_tokenizer() {
    return this.components.wp_tokenizer;
  }

  /**
   * Greedy-decodes one logits tensor.
   * @param pred_logits Tensor whose first two dims are read as batch and sequence length.
   * @param format One of "char", "bpe" or "wp".
   * @returns [decoded strings, per-sample confidence scores].
   * @throws {Error} If `format` is not supported.
   */
  _decode_helper(pred_logits, format) {
    if (!Object.hasOwn(f, format)) {
      throw new Error(`Format ${format} is not supported.`);
    }
    const [decoderName, eosTokenId] = f[format];
    const decode = this[decoderName].bind(this);
    const [batchSize, seqLength] = pred_logits.dims;
    const { max, softmax } = I;

    const scores = [];
    const tokenIds = [];
    const rows = pred_logits.tolist();

    for (let b = 0; b < batchSize; ++b) {
      const row = rows[b];
      const ids = [];
      const probs = [];
      // Position 0 is skipped; decoding stops at the end-of-sequence id,
      // whose probability is still counted towards the score.
      for (let t = 1; t < seqLength; ++t) {
        const [prob, id] = max(softmax(row[t]));
        probs.push(prob);
        if (id == eosTokenId) {
          break;
        }
        ids.push(id);
      }
      // Confidence is the product of the per-step maxima (0 when nothing was decoded).
      const score = probs.length > 0 ? probs.reduce((acc, p) => acc * p, 1) : 0;
      tokenIds.push(ids);
      scores.push(score);
    }

    return [decode(tokenIds), scores];
  }

  char_decode(sequences) {
    const decoded = this.char_tokenizer.batch_decode(sequences);
    return decoded.map((text) => text.replaceAll(" ", ""));
  }

  bpe_decode(sequences) {
    return this.bpe_tokenizer.batch_decode(sequences);
  }

  wp_decode(sequences) {
    const decoded = this.wp_tokenizer.batch_decode(sequences);
    return decoded.map((text) => text.replaceAll(" ", ""));
  }

  /**
   * @param logits Triple of [char, bpe, wp] logits tensors.
   * @returns Object with the chosen `generated_text` and `scores`, plus the
   *   raw `char_preds`, `bpe_preds` and `wp_preds`.
   */
  batch_decode([char_logits, bpe_logits, wp_logits]) {
    const [char_preds, charScores] = this._decode_helper(char_logits, "char");
    const [bpe_preds, bpeScores] = this._decode_helper(bpe_logits, "bpe");
    const [wp_preds, wpScores] = this._decode_helper(wp_logits, "wp");

    const generated_text = [];
    const scores = [];
    char_preds.forEach((charText, idx) => {
      const [best, which] = (0, I.max)([charScores[idx], bpeScores[idx], wpScores[idx]]);
      generated_text.push([charText, bpe_preds[idx], wp_preds[idx]][which]);
      scores.push(best);
    });

    return { generated_text, scores, char_preds, bpe_preds, wp_preds };
  }

  /**
   * Loads the base processor, then two additional tokenizers from fixed
   * repository ids, and exposes all of them through `components`.
   */
  static async from_pretrained(...args) {
    const processor = await super.from_pretrained(...args);
    const bpe_tokenizer = await g.AutoTokenizer.from_pretrained("Xenova/gpt2");
    const wp_tokenizer = await g.AutoTokenizer.from_pretrained("Xenova/bert-base-uncased");
    processor.components = {
      image_processor: processor.image_processor,
      char_tokenizer: processor.tokenizer,
      bpe_tokenizer,
      wp_tokenizer,
    };
    return processor;
  }

  /**
   * @param images Input forwarded to the image processor.
   * @param text Optional text; when given its `input_ids` are attached as `labels`.
   */
  async _call(images, text = null) {
    const result = await this.image_processor(images);
    if (text) {
      result.labels = this.tokenizer(text).input_ids;
    }
    return result;
  }
}
/**
 * Feature extractor that wraps raw audio samples in a float32 tensor with a
 * leading dimension of 1.
 */
class g extends i.FeatureExtractor {
  /**
   * @param audio Audio samples; validated by `validate_audio_inputs`.
   * @returns Object with an `input_values` tensor of dims [1, audio.length].
   */
  async _call(audio) {
    const { validate_audio_inputs } = i;
    validate_audio_inputs(audio, "MoonshineFeatureExtractor");

    // Float64 input is narrowed so the data matches the declared tensor type.
    const samples = audio instanceof Float64Array ? new Float32Array(audio) : audio;
    const dims = [1, samples.length];
    return { input_values: new d.Tensor("float32", samples, dims) };
  }
}
const IMAGE_TOKEN = "<image>";

/**
 * Builds a prompt of repeated image tokens, then the BOS token, then the text
 * prefix, terminated by a single newline.
 *
 * The newline was corrupted by diff-gutter residue in this listing; it is
 * restored here as an explicit "\n".
 */
function build_string_from_input(prompt, bos_token, image_seq_len, image_token, num_images) {
  return `${image_token.repeat(image_seq_len * num_images)}${bos_token}${prompt}\n`;
}

/**
 * Processor that prepares text prompts with expanded image tokens and
 * combines the tokenizer output with the image processor output.
 */
class u extends i.Processor {
  static tokenizer_class = g.AutoTokenizer;
  static image_processor_class = d.AutoImageProcessor;
  static uses_processor_config = false;

  /**
   * @param images Image or array of images.
   * @param text Optional prompt or array of prompts; defaults to an empty prompt.
   * @param kwargs Options forwarded to both the tokenizer and image processor.
   * @returns Image processor output merged with tokenizer output.
   */
  async _call(images, text = null, kwargs = {}) {
    if (!text) {
      console.warn("You are using PaliGemma without a text prefix. It will perform as a picture-captioning model.");
      text = "";
    }
    if (!Array.isArray(images)) {
      images = [images];
    }
    if (!Array.isArray(text)) {
      text = [text];
    }

    const bos_token = this.tokenizer.bos_token;
    const image_seq_length = this.image_processor.config.image_seq_length;

    let input_strings;
    if (text.some((prompt) => prompt.includes(IMAGE_TOKEN))) {
      input_strings = text.map((prompt) => {
        // Expand every image token, then insert BOS right after the last one.
        const expanded = prompt.replaceAll(IMAGE_TOKEN, IMAGE_TOKEN.repeat(image_seq_length));
        const lastImage = expanded.lastIndexOf(IMAGE_TOKEN);
        const splitAt = lastImage === -1 ? 0 : lastImage + IMAGE_TOKEN.length;
        return `${expanded.slice(0, splitAt)}${bos_token}${expanded.slice(splitAt)}\n`;
      });
    } else {
      console.warn("You are passing both `text` and `images` to `PaliGemmaProcessor`. The processor expects special image tokens in the text, as many tokens as there are images per each text. It is recommended to add `<image>` tokens in the very beginning of your text. For this call, we will infer how many images each text has and add special tokens.");
      input_strings = text.map((prompt) =>
        build_string_from_input(prompt, bos_token, image_seq_length, IMAGE_TOKEN, images.length),
      );
    }

    // The tokenizer runs before the image processor is awaited.
    const text_inputs = this.tokenizer(input_strings, kwargs);
    const image_inputs = await this.image_processor(images, kwargs);
    return { ...image_inputs, ...text_inputs };
  }
}
// Side length used for the global view, for every crop, and as the padding granularity.
const IMAGE_SIZE = 336;
// Axes passed to the tensor `slice` helper when cutting crops.
const SLICE_AXES = [2, 3];

/**
 * Image processor that emits one global view plus a square grid of local
 * crops per image, each resized to IMAGE_SIZE x IMAGE_SIZE.
 */
class T extends i.ImageProcessor {
  constructor(config) {
    super({
      ...config,
      do_normalize: true,
      do_pad: true,
      pad_size: "custom",
      do_convert_rgb: true,
      do_resize: true,
    });
    this._num_crops = config.num_crops;
  }

  /** Number of image tokens for a padded image of the given width and height. */
  calc_num_image_tokens_from_image_size(width, height) {
    const { num_img_tokens } = this.config;
    const rows = Math.floor(height / IMAGE_SIZE);
    const cols = Math.floor(width / IMAGE_SIZE);
    return Math.floor(
      (rows * cols + 1) * num_img_tokens + 1 + (rows + 1) * Math.sqrt(num_img_tokens),
    );
  }

  /**
   * Picks the largest scale whose tile count still fits in the crop budget.
   * The second argument is unused, as in the original implementation.
   * @returns [width, height] to resize to.
   */
  get_resize_output_image_size(image, size) {
    const budget = this._num_crops;
    const [width, height] = image.size;
    const ratio = width / height;

    let scale = 1;
    while (scale * Math.ceil(scale / ratio) <= budget) {
      scale += 1;
    }
    scale -= 1;

    // Uses the shared constant instead of a second literal 336.
    const newWidth = Math.floor(scale * IMAGE_SIZE);
    const newHeight = Math.floor(newWidth / ratio);
    return [newWidth, newHeight];
  }

  /** Pads height and width up to the next multiple of IMAGE_SIZE, centred. */
  pad_image(pixelData, imgDims, padSize, options = {}) {
    const [height, width] = imgDims;
    const paddedHeight = IMAGE_SIZE * Math.ceil(height / IMAGE_SIZE);
    const paddedWidth = IMAGE_SIZE * Math.ceil(width / IMAGE_SIZE);
    // Fill value is 1 per channel, expressed in normalized space.
    const constant_values = [1, 1, 1].map(
      (value, channel) => (value - this.image_mean[channel]) / this.image_std[channel],
    );
    return super.pad_image(
      pixelData,
      imgDims,
      { width: paddedWidth, height: paddedHeight },
      { center: true, constant_values, ...options },
    );
  }

  /**
   * @param images Image or array of images.
   * @param options.num_crops Crop budget; falls back to `config.num_crops`.
   * @returns Object with `pixel_values`, `original_sizes`,
   *   `reshaped_input_sizes`, `image_sizes` and `num_img_tokens`.
   * @throws {Error} If the crop budget is not a square number >= 4.
   */
  async _call(images, { num_crops = null } = {}) {
    num_crops ??= this.config.num_crops;
    // Stored on the instance because get_resize_output_image_size reads it.
    this._num_crops = num_crops;
    if (num_crops < 4 || Math.sqrt(num_crops) % 1 !== 0) {
      throw new Error("num_crops must be a square number >= 4");
    }
    if (!Array.isArray(images)) {
      images = [images];
    }

    const { interpolate_4d, slice, cat, stack, Tensor } = d;
    const numImages = images.length;
    const processed = await Promise.all(images.map((image) => this.preprocess(image)));
    const original_sizes = processed.map((item) => item.original_size);
    const reshaped_input_sizes = processed.map((item) => item.reshaped_input_size);

    // Validation above guarantees num_crops >= 4, so the crop path always
    // runs; the former "no crops" fallback branch was unreachable and is gone.
    const gridSize = Math.sqrt(num_crops);
    const views = [];
    for (const { pixel_values } of processed) {
      pixel_values.unsqueeze_(0);
      const [height, width] = pixel_values.dims.slice(-2);

      const globalView = await interpolate_4d(pixel_values, {
        size: [IMAGE_SIZE, IMAGE_SIZE],
        mode: "bicubic",
      });

      const cropWidth = Math.floor(width / gridSize);
      const cropHeight = Math.floor(height / gridSize);
      const crops = [];
      for (let row = 0; row < gridSize; ++row) {
        for (let col = 0; col < gridSize; ++col) {
          // The last row/column is anchored to the far edge, so rounding
          // never drops trailing pixels.
          const isLastRow = row === gridSize - 1;
          const isLastCol = col === gridSize - 1;
          const top = isLastRow ? height - cropHeight : row * cropHeight;
          const bottom = isLastRow ? height : (row + 1) * cropHeight;
          const left = isLastCol ? width - cropWidth : col * cropWidth;
          const right = isLastCol ? width : (col + 1) * cropWidth;

          const crop = await slice(pixel_values, [top, left], [bottom, right], SLICE_AXES);
          crops.push(crop);
        }
      }

      const localViews = await interpolate_4d(cat(crops, 0), {
        size: [IMAGE_SIZE, IMAGE_SIZE],
        mode: "bicubic",
      });
      views.push(cat([globalView, localViews], 0));
    }

    const pixel_values = stack(views, 0);
    const paddedSizes = reshaped_input_sizes.map((dims) =>
      dims.map((value) => IMAGE_SIZE * Math.ceil(value / IMAGE_SIZE)),
    );
    const image_sizes = new Tensor("int64", paddedSizes.flat(), [numImages, 2]);
    const num_img_tokens = paddedSizes.map(([height, width]) =>
      this.calc_num_image_tokens_from_image_size(width, height),
    );

    return { pixel_values, original_sizes, reshaped_input_sizes, image_sizes, num_img_tokens };
  }
}
this.image_processor(u,T);if(m){let[x,w]=_.pixel_values.dims.slice(-2),{image_token:k,image_break_token:G,image_end_token:b,patch_size:C,spatial_merge_size:B}=this.config,P=C*B,M=Math.floor(x/P),y=Math.floor(w/P);m=structuredClone(m),Array.isArray(m)||(m=[m]);for(let l=0;l<m.length;++l){let h=k.repeat(y),F=h+G,S=h+b,V=F.repeat(M-1)+S;m[l]=m[l].replace(k,V)}}let o=m?this.tokenizer(m,T):{};return{..._,...o}}}}),"./src/models/processors.js":((D,a,e)=>{e.r(a),e.d(a,{Florence2Processor:()=>i.Florence2Processor,Gemma3nProcessor:()=>d.Gemma3nProcessor,GroundingDinoProcessor:()=>g.GroundingDinoProcessor,Idefics3Processor:()=>I.Idefics3Processor,JinaCLIPProcessor:()=>u.JinaCLIPProcessor,LlavaProcessor:()=>m.LlavaProcessor,MgpstrProcessor:()=>T.MgpstrProcessor,MoonshineProcessor:()=>_.MoonshineProcessor,OwlViTProcessor:()=>o.OwlViTProcessor,PaliGemmaProcessor:()=>x.PaliGemmaProcessor,Phi3VProcessor:()=>w.Phi3VProcessor,PixtralProcessor:()=>k.PixtralProcessor,PyAnnoteProcessor:()=>G.PyAnnoteProcessor,Qwen2VLProcessor:()=>b.Qwen2VLProcessor,Sam2Processor:()=>B.Sam2Processor,Sam2VideoProcessor:()=>B.Sam2VideoProcessor,SamProcessor:()=>C.SamProcessor,SmolVLMProcessor:()=>P.SmolVLMProcessor,SpeechT5Processor:()=>M.SpeechT5Processor,UltravoxProcessor:()=>y.UltravoxProcessor,VLChatProcessor:()=>f.VLChatProcessor,VoxtralProcessor:()=>l.VoxtralProcessor,Wav2Vec2Processor:()=>h.Wav2Vec2Processor,Wav2Vec2ProcessorWithLM:()=>F.Wav2Vec2ProcessorWithLM,WhisperProcessor:()=>S.WhisperProcessor});var 
/**
 * Feature extractor for speaker diarization: wraps raw audio in a tensor and
 * turns per-frame logits into timed speaker segments.
 */
class I extends i.FeatureExtractor {
  /**
   * @param audio Audio samples; validated by `validate_audio_inputs`.
   * @returns Object with an `input_values` tensor of dims [1, 1, audio.length].
   */
  async _call(audio) {
    const { validate_audio_inputs } = i;
    validate_audio_inputs(audio, "PyAnnoteFeatureExtractor");

    const samples = audio instanceof Float64Array ? new Float32Array(audio) : audio;
    return { input_values: new d.Tensor("float32", samples, [1, 1, samples.length]) };
  }

  /** Converts a sample count to a (possibly fractional) frame count. */
  samples_to_frames(samples) {
    const { offset, step } = this.config;
    return (samples - offset) / step;
  }

  /**
   * @param logits Tensor whose `tolist()` yields, per batch item, a list of
   *   per-frame class scores.
   * @param num_samples Number of audio samples the logits were computed from.
   * @returns For each batch item, a list of `{ id, start, end, confidence }`
   *   segments, where `confidence` is the mean winning probability of the run.
   */
  post_process_speaker_diarization(logits, num_samples) {
    // Time covered by one frame: samples per frame divided by sampling rate.
    const frameDuration =
      num_samples / this.samples_to_frames(num_samples) / this.config.sampling_rate;
    const { softmax, max } = g;

    const results = [];
    for (const frames of logits.tolist()) {
      const runs = [];
      let currentId = -1;

      frames.forEach((frameScores, frameIndex) => {
        const [score, id] = max(softmax(frameScores));
        if (id !== currentId) {
          // Winning class changed: open a new run.
          currentId = id;
          runs.push({ id, start: frameIndex, end: frameIndex + 1, score });
        } else {
          // Same class as the previous frame: extend the open run.
          runs.at(-1).end = frameIndex + 1;
          runs.at(-1).score += score;
        }
      });

      results.push(
        runs.map(({ id, start, end, score }) => ({
          id,
          start: start * frameDuration,
          end: end * frameDuration,
          confidence: score / (end - start),
        })),
      );
    }
    return results;
  }
}
/**
 * Image processor for segmentation prompts: rescales point/box prompts to the
 * resized image and maps predicted masks back to the original image size.
 */
class I extends i.ImageProcessor {
  /**
   * Rescales prompt coordinates from original-image space to resized-image space.
   * @param input_points Nested array of coordinates (3 or 4 levels deep).
   * @param original_sizes Per-image [height, width] before resizing.
   * @param reshaped_input_sizes Per-image [height, width] after resizing.
   * @param is_bounding_box When true, a 3-level input keeps its 3 dims.
   * @returns float32 tensor holding the scaled coordinates.
   * @throws {Error} If the input is neither 3- nor 4-dimensional.
   */
  reshape_input_points(input_points, original_sizes, reshaped_input_sizes, is_bounding_box = false) {
    // Deep copy: the scaling below is done in place.
    const points = structuredClone(input_points);
    let shape = (0, d.calculateDimensions)(points);

    let batched;
    if (shape.length === 3) {
      if (!is_bounding_box) {
        shape = [1, ...shape];
      }
      batched = [points];
    } else if (shape.length === 4) {
      batched = points;
    } else {
      throw Error("The input_points must be a 4D tensor of shape `batch_size`, `point_batch_size`, `nb_points_per_image`, `2`.");
    }

    for (let b = 0; b < batched.length; ++b) {
      const [originalHeight, originalWidth] = original_sizes[b];
      const [resizedHeight, resizedWidth] = reshaped_input_sizes[b];
      // Even positions are scaled by the width ratio, odd ones by the height ratio.
      const factors = [resizedWidth / originalWidth, resizedHeight / originalHeight];

      for (const group of batched[b]) {
        for (const point of group) {
          for (let c = 0; c < point.length; ++c) {
            point[c] *= factors[c % 2];
          }
        }
      }
    }

    return new g.Tensor("float32", Float32Array.from(batched.flat(Infinity)), shape);
  }

  /**
   * Converts point labels to an int64 tensor and checks them against the points.
   * @param input_labels Nested array of labels (2 or 3 levels deep).
   * @param input_points Tensor produced by `reshape_input_points`.
   * @throws {Error} If the labels have the wrong rank or disagree with the
   *   leading dimensions of `input_points`.
   */
  add_input_labels(input_labels, input_points) {
    let labels = input_labels;
    let shape = (0, d.calculateDimensions)(labels);

    if (shape.length === 2) {
      shape = [1, ...shape];
      labels = [labels];
    } else if (shape.length !== 3) {
      // The message previously described `input_points` (4D), which pointed
      // users at the wrong argument.
      throw Error("The input_labels must be a 3D tensor of shape `batch_size`, `point_batch_size`, `nb_points_per_image`.");
    }

    if (shape.some((dim, axis) => dim !== input_points.dims[axis])) {
      throw Error(`The first ${shape.length} dimensions of 'input_points' and 'input_labels' must be the same.`);
    }
    return new g.Tensor("int64", labels.flat(Infinity).map(BigInt), shape);
  }

  /**
   * @param images Input forwarded to the base image processor.
   * @param options.input_points Optional point prompts.
   * @param options.input_labels Optional labels; requires `input_points`.
   * @param options.input_boxes Optional box prompts.
   * @returns Base processor output plus any prompt tensors that were supplied.
   */
  async _call(images, { input_points = null, input_labels = null, input_boxes = null } = {}) {
    const processed = await super._call(images);

    if (input_points) {
      processed.input_points = this.reshape_input_points(
        input_points,
        processed.original_sizes,
        processed.reshaped_input_sizes,
      );
    }

    if (input_labels) {
      if (!processed.input_points) {
        throw Error("`input_points` must be provided if `input_labels` are provided.");
      }
      processed.input_labels = this.add_input_labels(input_labels, processed.input_points);
    }

    if (input_boxes) {
      processed.input_boxes = this.reshape_input_points(
        input_boxes,
        processed.original_sizes,
        processed.reshaped_input_sizes,
        true,
      );
    }

    return processed;
  }

  /**
   * Upscales masks to the padded size, crops away the padding, then resizes
   * each mask to its original image size.
   * @param masks Per-image mask tensors.
   * @param original_sizes Per-image target [height, width].
   * @param reshaped_input_sizes Per-image [height, width] before padding.
   * @param options.mask_threshold Values above this become 1 when binarizing.
   * @param options.binarize Whether to return boolean masks.
   * @param options.pad_size Padded size; falls back to `this.pad_size`, then `this.size`.
   * @returns Array with one mask tensor per image.
   */
  async post_process_masks(
    masks,
    original_sizes,
    reshaped_input_sizes,
    { mask_threshold = 0, binarize = true, pad_size = null } = {},
  ) {
    const { interpolate_4d, Tensor } = g;
    const target = pad_size ?? this.pad_size ?? this.size;
    const paddedSize = [target.height, target.width];

    const output = [];
    for (let idx = 0; idx < original_sizes.length; ++idx) {
      const originalSize = original_sizes[idx];
      const reshapedSize = reshaped_input_sizes[idx];

      let mask = await interpolate_4d(masks[idx], { mode: "bilinear", size: paddedSize });
      mask = mask.slice(null, null, [0, reshapedSize[0]], [0, reshapedSize[1]]);
      mask = await interpolate_4d(mask, { mode: "bilinear", size: originalSize });

      if (binarize) {
        const values = mask.data;
        const bits = new Uint8Array(values.length);
        for (let p = 0; p < values.length; ++p) {
          if (values[p] > mask_threshold) {
            bits[p] = 1;
          }
        }
        mask = new Tensor("bool", bits, mask.dims);
      }
      output.push(mask);
    }
    return output;
  }

  // NOTE(review): the body is empty in this build, so this always returns
  // undefined. Presumably an unimplemented placeholder; confirm before relying on it.
  generate_crop_boxes(
    image,
    target_size,
    {
      crop_n_layers = 0,
      overlap_ratio = 512 / 1500,
      points_per_crop = 32,
      crop_n_points_downscale_factor = 1,
    } = {},
  ) {}
}
/**
 * Feature extractor that computes log-mel filterbank features, optionally
 * normalizes each mel bin, pads the frame count, and stacks `stride`
 * consecutive frames into one feature vector.
 */
class I extends i.FeatureExtractor {
  constructor(config) {
    super(config);
    const sampling_rate = this.config.sampling_rate;
    this.mel_filters = (0, g.mel_filter_bank)(
      257,
      this.config.num_mel_bins,
      20,
      Math.floor(sampling_rate / 2),
      sampling_rate,
      null,
      "kaldi",
      true,
    );
    this.window = (0, g.window_function)(400, "povey", { periodic: false });
  }

  /**
   * @param waveform Audio samples; scaled by 32768 before the spectrogram.
   * @param max_length Passed to the spectrogram as `max_num_frames`.
   */
  async _extract_fbank_features(waveform, max_length) {
    const scaled = waveform.map((sample) => sample * 32768);
    return (0, g.spectrogram)(scaled, this.window, 400, 160, {
      fft_length: 512,
      power: 2,
      center: false,
      preemphasis: 0.97,
      mel_filters: this.mel_filters,
      log_mel: "log",
      mel_floor: 1.192092955078125e-7,
      remove_dc_offset: true,
      max_num_frames: max_length,
      transpose: true,
    });
  }

  /**
   * @param audio Audio samples; validated by `validate_audio_inputs`.
   * @param options.padding Whether to pad the frame count.
   * @param options.pad_to_multiple_of Frame count is padded up to a multiple of this.
   * @param options.do_normalize_per_mel_bins Whether to standardize each mel bin.
   * @param options.return_attention_mask Whether to return `attention_mask`.
   * @returns Object with `input_features` and, optionally, `attention_mask`.
   * @throws {Error} If the (padded) frame count is not a multiple of `config.stride`.
   */
  async _call(
    audio,
    {
      padding = true,
      pad_to_multiple_of = 2,
      do_normalize_per_mel_bins = true,
      return_attention_mask = true,
    } = {},
  ) {
    (0, i.validate_audio_inputs)(audio, "SeamlessM4TFeatureExtractor");
    let features = await this._extract_fbank_features(audio, this.config.max_length);

    if (do_normalize_per_mel_bins) {
      const [numFrames, numBins] = features.dims;
      const data = features.data;
      for (let bin = 0; bin < numBins; ++bin) {
        let sum = 0;
        for (let frame = 0; frame < numFrames; ++frame) {
          sum += data[frame * numBins + bin];
        }
        const mean = sum / numFrames;

        let variance = 0;
        for (let frame = 0; frame < numFrames; ++frame) {
          variance += (data[frame * numBins + bin] - mean) ** 2;
        }
        // Sample variance (n - 1 denominator).
        variance /= numFrames - 1;

        const std = Math.sqrt(variance + 1e-7);
        for (let frame = 0; frame < numFrames; ++frame) {
          const at = frame * numBins + bin;
          data[at] = (data[at] - mean) / std;
        }
      }
    }

    let paddedMask;
    if (padding) {
      const [numFrames, numBins] = features.dims;
      const data = features.data;
      const remainder = numFrames % pad_to_multiple_of;
      if (remainder > 0) {
        // Pad UP to the next multiple. Adding `remainder` frames (the old
        // behaviour) is only right when pad_to_multiple_of is 2; for example
        // 5 frames with a multiple of 4 became 6 instead of 8.
        const padFrames = pad_to_multiple_of - remainder;
        const totalFrames = numFrames + padFrames;

        const padded = new Float32Array(numBins * totalFrames);
        padded.set(data);
        padded.fill(this.config.padding_value, data.length);
        features = new d.Tensor(features.type, padded, [totalFrames, numBins]);

        if (return_attention_mask) {
          paddedMask = new d.Tensor("int64", new BigInt64Array(totalFrames), [1, totalFrames]);
          paddedMask.data.fill(1n, 0, numFrames);
        }
      }
    }

    const [numFrames, numBins] = features.dims;
    const stride = this.config.stride;
    if (numFrames % stride !== 0) {
      throw new Error(`The number of frames (${numFrames}) must be a multiple of the stride (${stride}).`);
    }

    // Stack `stride` consecutive frames into a single, wider feature vector.
    const input_features = features.view(1, Math.floor(numFrames / stride), numBins * stride);
    const result = { input_features };

    if (return_attention_mask) {
      const stackedFrames = input_features.dims[1];
      const mask = new BigInt64Array(stackedFrames);
      if (paddedMask) {
        // Sample the frame-level mask at offset 1 of every stride-sized group.
        const frameMask = paddedMask.data;
        for (let frame = 1, out = 0; frame < numFrames; frame += stride, ++out) {
          mask[out] = frameMask[frame];
        }
      } else {
        mask.fill(1n);
      }
      result.attention_mask = new d.Tensor("int64", mask, [1, stackedFrames]);
    }

    return result;
  }
}
/**
 * Processor that extracts audio features and expands the audio placeholder
 * in the text to the number of audio tokens before tokenizing.
 */
class I extends g.Processor {
  static tokenizer_class = d.AutoTokenizer;
  static feature_extractor_class = i.AutoFeatureExtractor;
  static uses_processor_config = true;

  /**
   * @param text A single prompt string (arrays are rejected).
   * @param audio Optional audio samples.
   * @param kwargs Options forwarded to the feature extractor and tokenizer.
   * @returns Tokenizer output, plus `audio_token_len` and `audio_values` when
   *   audio is given.
   * @throws {Error} If `text` is an array, or if audio is given but the text
   *   lacks the audio placeholder.
   */
  async _call(text, audio = null, kwargs = {}) {
    if (Array.isArray(text)) {
      throw new Error("Batched inputs are not supported yet.");
    }

    const audioInputs = {};
    let prompt = text;
    if (audio) {
      const numSamples = audio.length;
      const { input_features } = await this.feature_extractor(audio, {
        ...kwargs,
        max_length: numSamples,
      });

      const encoderFrames = Math.round(numSamples / this.config.encoder_ds_factor + 1e-4);
      const audioTokenLen = 1 + Math.ceil(encoderFrames / this.config.stack_factor);
      audioInputs.audio_token_len = [audioTokenLen];
      audioInputs.audio_values = input_features;

      const placeholder = this.config.audio_placeholder;
      if (!prompt.includes(placeholder)) {
        // The message used to say "image token", which is wrong for this
        // audio-only processor.
        throw new Error(`The input text does not contain the audio token ${placeholder}.`);
      }
      prompt = prompt.replaceAll(placeholder, placeholder.repeat(audioTokenLen));
    }

    const textInputs = this.tokenizer(prompt, { add_special_tokens: false, ...kwargs });
    return { ...textInputs, ...audioInputs };
  }
}
/**
 * Splits a typed array into consecutive chunks of at most `x` elements.
 * Chunks are `subarray` views that share the input's buffer; the last chunk
 * may be shorter.
 *
 * @param o Typed array to split.
 * @param x Maximum chunk length; must be greater than zero.
 * @returns Array of views in order (empty when the input is empty).
 * @throws {RangeError} If `x` is not greater than zero. Without this guard a
 *   zero or negative size would never advance the loop, and a missing size
 *   would silently yield one empty chunk.
 */
function T(o, x) {
  if (!(x > 0)) {
    throw new RangeError(`Chunk size must be a positive number, got ${x}.`);
  }
  const chunks = [];
  for (let start = 0; start < o.length; start += x) {
    chunks.push(o.subarray(start, Math.min(start + x, o.length)));
  }
  return chunks;
}
/**
 * Wav2Vec2 feature extractor: optionally normalises raw audio and wraps it,
 * together with an all-ones attention mask, into `[1, length]` tensors.
 */
class g extends i.FeatureExtractor {
  /**
   * Normalise the samples to zero mean and unit variance.
   * A small constant (1e-7) is added to the variance before the square root.
   *
   * @param {Float32Array} samples Input samples.
   * @returns {Float32Array} Result of `samples.map(...)` (same array type as the input).
   */
  _zero_mean_unit_var_norm(samples) {
    let total = 0;
    for (const sample of samples) {
      total += sample;
    }
    const mean = total / samples.length;

    let squaredDeviation = 0;
    for (const sample of samples) {
      squaredDeviation += (sample - mean) ** 2;
    }
    const variance = squaredDeviation / samples.length;

    // Loop-invariant, so computed once instead of per element.
    const scale = Math.sqrt(variance + 1e-7);
    return samples.map((sample) => (sample - mean) / scale);
  }

  /**
   * Validate the audio, down-convert Float64 input to Float32, optionally
   * normalise it (when `config.do_normalize` is truthy) and build the tensors.
   *
   * @param {Float32Array|Float64Array} audio Raw audio samples.
   * @returns {Promise<{input_values: Tensor, attention_mask: Tensor}>}
   */
  async _call(audio) {
    (0, i.validate_audio_inputs)(audio, "Wav2Vec2FeatureExtractor");

    let samples = audio instanceof Float64Array ? new Float32Array(audio) : audio;
    if (this.config.do_normalize) {
      samples = this._zero_mean_unit_var_norm(samples);
    }

    // Both tensors share the same dims array, as in the original.
    const dims = [1, samples.length];
    const input_values = new d.Tensor("float32", samples, dims);
    const ones = new BigInt64Array(samples.length).fill(1n);
    const attention_mask = new d.Tensor("int64", ones, dims);
    return { input_values, attention_mask };
  }
}
/**
 * WeSpeaker feature extractor: computes log-mel filter-bank features with
 * fixed framing parameters and optionally mean-centres them.
 */
class I extends i.FeatureExtractor {
  /**
   * Pre-computes the mel filter bank and the analysis window.
   * @param {Object} config Feature-extractor configuration (forwarded to the base class).
   */
  constructor(config) {
    super(config);

    const samplingRate = this.config.sampling_rate;
    this.mel_filters = (0, g.mel_filter_bank)(
      257,
      this.config.num_mel_bins,
      20,
      Math.floor(samplingRate / 2),
      samplingRate,
      null,
      "kaldi",
      true,
    );
    this.window = (0, g.window_function)(400, "hamming", { periodic: false });
    this.min_num_frames = this.config.min_num_frames;
  }

  /**
   * Scale the waveform by 32768 and compute its spectrogram features.
   * @param {Float32Array} waveform Audio samples.
   * @returns {Promise<Tensor>} Whatever `spectrogram` resolves to for these options.
   */
  async _extract_fbank_features(waveform) {
    const scaled = waveform.map((sample) => sample * 32768);
    const options = {
      fft_length: 512,
      power: 2,
      center: false,
      preemphasis: 0.97,
      mel_filters: this.mel_filters,
      log_mel: "log",
      mel_floor: 1.192092955078125e-7,
      remove_dc_offset: true,
      transpose: true,
      min_num_frames: this.min_num_frames,
    };
    return (0, g.spectrogram)(scaled, this.window, 400, 160, options);
  }

  /**
   * Extract features for one audio clip and add a leading batch axis.
   * When `config.fbank_centering_span` is exactly `null`, the mean over
   * axis 1 is subtracted in place from every position along that axis.
   *
   * @param {Float32Array|Float64Array} audio Raw audio samples.
   * @returns {Promise<{input_features: Tensor}>}
   */
  async _call(audio) {
    (0, i.validate_audio_inputs)(audio, "WeSpeakerFeatureExtractor");

    const fbank = await this._extract_fbank_features(audio);
    const features = fbank.unsqueeze_(0);

    if (this.config.fbank_centering_span === null) {
      // Means are taken before the in-place subtraction below.
      const means = features.mean(1).data;
      const values = features.data;
      // presumably (batch, frames, mel bins) — TODO confirm against `spectrogram`
      const [dim0, dim1, dim2] = features.dims;

      for (let outer = 0; outer < dim0; ++outer) {
        const meanOffset = outer * dim2;
        let cursor = outer * dim1 * dim2;
        for (let middle = 0; middle < dim1; ++middle) {
          for (let inner = 0; inner < dim2; ++inner, ++cursor) {
            values[cursor] -= means[meanOffset + inner];
          }
        }
      }
    }

    return { input_features: features };
  }
}
/**
 * Resolve a Whisper language identifier to its language code.
 *
 * Lookup order (after lower-casing the input):
 *   1. `g` — language names and aliases mapped to codes (e.g. "english" -> "en").
 *   2. Token form `<|code|>`, unwrapped to the bare code.
 *   3. `d` — the code -> name table; a key hit means the input already is a code.
 *
 * The token pattern accepts 2- or 3-letter codes: the table contains the
 * 3-letter code "haw", which a strict 2-letter pattern rejected.
 *
 * @param {string} language Language name, alias, code, or `<|code|>` token.
 * @returns {string} The language code.
 * @throws {Error} If the language is not supported; the message lists the
 *   supported codes (for 2-character inputs) or names (otherwise).
 */
function I(language) {
  let candidate = language.toLowerCase();

  const fromName = g.get(candidate);
  if (fromName !== undefined) {
    return fromName;
  }

  const tokenMatch = candidate.match(/^<\|([a-z]{2,3})\|>$/);
  if (tokenMatch) {
    candidate = tokenMatch[1];
  }

  if (d.has(candidate)) {
    return candidate;
  }

  // Two-character inputs look like codes, so suggest codes; otherwise names.
  const suggestions = candidate.length === 2 ? d.keys() : d.values();
  throw new Error(`Language "${candidate}" is not supported. Must be one of: ${JSON.stringify(Array.from(suggestions))}`);
}
/**
 * Create an inference session from serialized model bytes and return an async
 * runner for it.
 *
 * The runner maps every input to its `ort_tensor` (cloning the input first
 * when `isONNXProxy()` reports true), runs the session and wraps the requested
 * output(s) in `Tensor`.
 *
 * @param {number[]} modelBytes Serialized model, one byte per array element.
 * @param {Object} sessionOptions Options forwarded to `createInferenceSession`.
 * @param {string|string[]} outputNames Output name, or list of output names.
 * @returns {Promise<Function>} Runner taking `{name: tensor}` and resolving to
 *   one `Tensor` (string `outputNames`) or an array of them (array `outputNames`).
 */
const g = async (modelBytes, sessionOptions, outputNames) => {
  const session = await (0, i.createInferenceSession)(new Uint8Array(modelBytes), sessionOptions);

  return async (inputs) => {
    const viaProxy = (0, i.isONNXProxy)();
    const feedEntries = Object.entries(inputs).map(([name, tensor]) => {
      const source = viaProxy ? tensor.clone() : tensor;
      return [name, source.ort_tensor];
    });
    const results = await (0, i.runInferenceSession)(session, Object.fromEntries(feedEntries));

    if (Array.isArray(outputNames)) {
      return outputNames.map((name) => new d.Tensor(results[name]));
    }
    return new d.Tensor(results[outputNames]);
  };
};

/**
 * Lazily-built single-operator sessions. Each getter creates its session
 * promise on first access and caches it on the class under `_<name>`.
 * The embedded byte arrays spell out the operator names in ASCII (e.g.
 * "Resize", "MatMul", "STFT", "DFT", "TopK", "Slice"); they are presumably
 * serialized ONNX graphs — confirm against the backend.
 */
class I {
  static session_options = {};

  /** Resize operator, mode "nearest". Output: "y". */
  static get nearest_interpolate_4d() {
    if (!this._nearest_interpolate_4d) {
      this._nearest_interpolate_4d = g(
        [8,10,18,0,58,129,1,10,41,10,1,120,10,0,10,0,10,1,115,18,1,121,34,6,82,101,115,105,122,101,42,18,10,4,109,111,100,101,34,7,110,101,97,114,101,115,116,160,1,3,18,1,114,90,31,10,1,120,18,26,10,24,8,1,18,20,10,3,18,1,98,10,3,18,1,99,10,3,18,1,104,10,3,18,1,119,90,15,10,1,115,18,10,10,8,8,7,18,4,10,2,8,4,98,31,10,1,121,18,26,10,24,8,1,18,20,10,3,18,1,98,10,3,18,1,99,10,3,18,1,104,10,3,18,1,119,66,2,16,21],
        this.session_options,
        "y",
      );
    }
    return this._nearest_interpolate_4d;
  }

  /** Resize operator, mode "linear". Output: "y". */
  static get bilinear_interpolate_4d() {
    if (!this._bilinear_interpolate_4d) {
      this._bilinear_interpolate_4d = g(
        [8,9,18,0,58,128,1,10,40,10,1,120,10,0,10,0,10,1,115,18,1,121,34,6,82,101,115,105,122,101,42,17,10,4,109,111,100,101,34,6,108,105,110,101,97,114,160,1,3,18,1,114,90,31,10,1,120,18,26,10,24,8,1,18,20,10,3,18,1,98,10,3,18,1,99,10,3,18,1,104,10,3,18,1,119,90,15,10,1,115,18,10,10,8,8,7,18,4,10,2,8,4,98,31,10,1,121,18,26,10,24,8,1,18,20,10,3,18,1,98,10,3,18,1,99,10,3,18,1,104,10,3,18,1,119,66,2,16,20],
        this.session_options,
        "y",
      );
    }
    return this._bilinear_interpolate_4d;
  }

  /** Resize operator, mode "cubic". Output: "y". */
  static get bicubic_interpolate_4d() {
    if (!this._bicubic_interpolate_4d) {
      this._bicubic_interpolate_4d = g(
        [8,9,18,0,58,127,10,39,10,1,120,10,0,10,0,10,1,115,18,1,121,34,6,82,101,115,105,122,101,42,16,10,4,109,111,100,101,34,5,99,117,98,105,99,160,1,3,18,1,114,90,31,10,1,120,18,26,10,24,8,1,18,20,10,3,18,1,98,10,3,18,1,99,10,3,18,1,104,10,3,18,1,119,90,15,10,1,115,18,10,10,8,8,7,18,4,10,2,8,4,98,31,10,1,121,18,26,10,24,8,1,18,20,10,3,18,1,98,10,3,18,1,99,10,3,18,1,104,10,3,18,1,119,66,2,16,20],
        this.session_options,
        "y",
      );
    }
    return this._bicubic_interpolate_4d;
  }

  /** MatMul operator. Output: "c". */
  static get matmul() {
    if (!this._matmul) {
      this._matmul = g(
        [8,9,18,0,58,55,10,17,10,1,97,10,1,98,18,1,99,34,6,77,97,116,77,117,108,18,1,114,90,9,10,1,97,18,4,10,2,8,1,90,9,10,1,98,18,4,10,2,8,1,98,9,10,1,99,18,4,10,2,8,1,66,2,16,20],
        this.session_options,
        "c",
      );
    }
    return this._matmul;
  }

  /** STFT operator. Output: "o". */
  static get stft() {
    if (!this._stft) {
      this._stft = g(
        [8,7,18,0,58,148,1,10,38,10,1,115,10,1,106,10,1,119,10,1,108,18,1,111,34,4,83,84,70,84,42,15,10,8,111,110,101,115,105,100,101,100,24,1,160,1,2,18,1,115,90,26,10,1,115,18,21,10,19,8,1,18,15,10,3,18,1,98,10,3,18,1,115,10,3,18,1,99,90,11,10,1,106,18,6,10,4,8,7,18,0,90,16,10,1,119,18,11,10,9,8,1,18,5,10,3,18,1,119,90,11,10,1,108,18,6,10,4,8,7,18,0,98,31,10,1,111,18,26,10,24,8,1,18,20,10,3,18,1,98,10,3,18,1,102,10,3,18,1,100,10,3,18,1,99,66,2,16,17],
        this.session_options,
        "o",
      );
    }
    return this._stft;
  }

  /** DFT operator (attribute "onesided"). Output: "y". */
  static get rfft() {
    if (!this._rfft) {
      this._rfft = g(
        [8,9,18,0,58,97,10,33,10,1,120,10,0,10,1,97,18,1,121,34,3,68,70,84,42,15,10,8,111,110,101,115,105,100,101,100,24,1,160,1,2,18,1,100,90,21,10,1,120,18,16,10,14,8,1,18,10,10,3,18,1,115,10,3,18,1,99,90,11,10,1,97,18,6,10,4,8,7,18,0,98,21,10,1,121,18,16,10,14,8,1,18,10,10,3,18,1,115,10,3,18,1,99,66,2,16,20],
        this.session_options,
        "y",
      );
    }
    return this._rfft;
  }

  /** TopK operator. Outputs: ["v", "i"]. */
  static get top_k() {
    if (!this._top_k) {
      this._top_k = g(
        [8,10,18,0,58,73,10,18,10,1,120,10,1,107,18,1,118,18,1,105,34,4,84,111,112,75,18,1,116,90,9,10,1,120,18,4,10,2,8,1,90,15,10,1,107,18,10,10,8,8,7,18,4,10,2,8,1,98,9,10,1,118,18,4,10,2,8,1,98,9,10,1,105,18,4,10,2,8,7,66,2,16,21],
        this.session_options,
        ["v", "i"],
      );
    }
    return this._top_k;
  }

  /** Slice operator. Output: "y". */
  static get slice() {
    if (!this._slice) {
      this._slice = g(
        [8,7,18,0,58,96,10,25,10,1,120,10,1,115,10,1,101,10,1,97,10,1,116,18,1,121,34,5,83,108,105,99,101,18,1,114,90,9,10,1,120,18,4,10,2,8,1,90,9,10,1,115,18,4,10,2,8,7,90,9,10,1,101,18,4,10,2,8,7,90,9,10,1,97,18,4,10,2,8,7,90,9,10,1,116,18,4,10,2,8,7,98,9,10,1,121,18,4,10,2,8,1,66,2,16,13],
        this.session_options,
        "y",
      );
    }
    return this._slice;
  }
}
/**
 * Extractive question-answering pipeline: scores every (start, end) token
 * span after the first separator token and decodes the best ones.
 */
class B extends G {
  constructor(p) {
    super(p);
  }

  /**
   * @param {string|string[]} question First text passed to the tokenizer.
   * @param {string|string[]} context Second text (passed as `text_pair`);
   *   answer spans are only taken from positions after the first separator.
   * @param {Object} [options]
   * @param {number} [options.top_k=1] Maximum number of answers kept per input row.
   * @returns {Promise<Object|Object[]>} A single `{answer, score}` when
   *   `top_k === 1`, otherwise the list of collected answers.
   */
  async _call(question, context, { top_k = 1 } = {}) {
    const inputs = this.tokenizer(question, {
      text_pair: context,
      padding: true,
      truncation: true,
    });
    const { start_logits, end_logits } = await this.model(inputs);

    const inputIds = inputs.input_ids.tolist();
    const attentionMask = inputs.attention_mask.tolist();
    const specialIds = this.tokenizer.all_special_ids;

    const answers = [];
    for (let row = 0; row < start_logits.dims[0]; ++row) {
      const ids = inputIds[row];
      // Loose equality is kept throughout: the listed ids may be BigInt
      // (presumably int64 tensors) while tokenizer ids are numbers.
      const sepIndex = ids.findIndex((id) => id == this.tokenizer.sep_token_id);

      const startScores = start_logits[row].tolist();
      const endScores = end_logits[row].tolist();

      // Exclude positions that cannot be part of an answer. Position 0 is
      // left untouched here and zeroed after the softmax below.
      for (let pos = 1; pos < startScores.length; ++pos) {
        // Fix: test the mask at this position. The original compared the
        // whole row array with 0, which is false for any multi-token row.
        const isPadding = attentionMask[row][pos] == 0;
        const isBeforeContext = pos <= sepIndex;
        const isSpecial = specialIds.some((id) => id == ids[pos]);
        if (isPadding || isBeforeContext || isSpecial) {
          startScores[pos] = -Infinity;
          endScores[pos] = -Infinity;
        }
      }

      const startProbs = (0, m.softmax)(startScores).map((prob, index) => [prob, index]);
      const endProbs = (0, m.softmax)(endScores).map((prob, index) => [prob, index]);
      startProbs[0][0] = 0;
      endProbs[0][0] = 0;

      // All (start, end) pairs with start <= end, best joint probability first.
      const spans = (0, u.product)(startProbs, endProbs)
        .filter(([start, end]) => start[1] <= end[1])
        .map(([start, end]) => [start[1], end[1], start[0] * end[0]])
        .sort((left, right) => right[2] - left[2]);

      const keep = Math.min(spans.length, top_k);
      for (let rank = 0; rank < keep; ++rank) {
        const [startIndex, endIndex, score] = spans[rank];
        const answerIds = ids.slice(startIndex, endIndex + 1);
        const answer = this.tokenizer.decode(answerIds, { skip_special_tokens: true });
        answers.push({ answer, score });
      }
    }

    return top_k === 1 ? answers[0] : answers;
  }
}
/**
 * Check whether a value looks like a chat: an array whose every element has
 * both a `role` and a `content` property.
 *
 * Elements that cannot be the right-hand operand of `in` (primitives, `null`)
 * now make the check return `false` instead of throwing a TypeError, so the
 * caller can report its own "unsupported input" error.
 *
 * @param {*} value Candidate value.
 * @returns {boolean} `true` for an array of message-like objects (including
 *   the empty array), `false` otherwise.
 */
function h(value) {
  if (!Array.isArray(value)) {
    return false;
  }
  return value.every((message) => {
    const supportsIn =
      message !== null && (typeof message === "object" || typeof message === "function");
    return supportsIn && "role" in message && "content" in message;
  });
}
/**
 * Feature-extraction pipeline: runs the model on tokenized text and returns
 * its embeddings, optionally pooled, normalised and quantized.
 */
class V extends G {
  constructor(p) {
    super(p);
  }

  /**
   * @param {string|string[]} texts Text(s) to embed.
   * @param {Object} [options]
   * @param {string} [options.pooling="none"] One of "none", "mean",
   *   "first_token"/"cls", "last_token"/"eos".
   * @param {boolean} [options.normalize=false] Apply `normalize(2, -1)` to the result.
   * @param {boolean} [options.quantize=false] Apply `quantize_embeddings` to the result.
   * @param {string} [options.precision="binary"] Precision passed to `quantize_embeddings`.
   * @returns {Promise<Tensor>} The resulting embeddings.
   * @throws {Error} If `pooling` is not one of the supported values.
   */
  async _call(texts, { pooling = "none", normalize = false, quantize = false, precision = "binary" } = {}) {
    const encoded = this.tokenizer(texts, { padding: true, truncation: true });
    const output = await this.model(encoded);

    // First available of the known output heads.
    let embeddings = output.last_hidden_state ?? output.logits ?? output.token_embeddings;

    if (pooling === "none") {
      // keep the per-token output untouched
    } else if (pooling === "mean") {
      embeddings = (0, _.mean_pooling)(embeddings, encoded.attention_mask);
    } else if (pooling === "first_token" || pooling === "cls") {
      embeddings = embeddings.slice(null, 0);
    } else if (pooling === "last_token" || pooling === "eos") {
      embeddings = embeddings.slice(null, -1);
    } else {
      throw Error(`Pooling method '${pooling}' not supported.`);
    }

    if (normalize) {
      embeddings = embeddings.normalize(2, -1);
    }
    if (quantize) {
      embeddings = (0, _.quantize_embeddings)(embeddings, precision);
    }
    return embeddings;
  }
}
/**
 * Audio-classification pipeline: returns the `top_k` most probable labels for
 * each audio input.
 */
class N extends G {
  constructor(p) {
    super(p);
  }

  /**
   * @param {*} audio One audio input or an array of them (anything `w` accepts).
   * @param {Object} [options]
   * @param {number} [options.top_k=5] Number of labels to return per input.
   * @returns {Promise<Object[]|Object[][]>} `{label, score}` lists: one list
   *   per input when `audio` is an array, otherwise the single list.
   */
  async _call(audio, { top_k = 5 } = {}) {
    const samplingRate = this.processor.feature_extractor.config.sampling_rate;
    const waveforms = await w(audio, samplingRate);
    const id2label = this.model.config.id2label;

    const results = [];
    for (const waveform of waveforms) {
      const features = await this.processor(waveform);
      const output = await this.model(features);
      const logits = output.logits[0];

      const probabilities = new _.Tensor("float32", (0, m.softmax)(logits.data), logits.dims);
      const top = await (0, _.topk)(probabilities, top_k);
      const scores = top[0].tolist();
      const indices = top[1].tolist();

      const labelled = indices.map((classId, rank) => ({
        // Fall back to a generic label when the config has no id2label map.
        label: id2label ? id2label[classId] : `LABEL_${classId}`,
        score: scores[rank],
      }));
      results.push(labelled);
    }

    return Array.isArray(audio) ? results : results[0];
  }
}
pe=this.processor.feature_extractor.config.sampling_rate,Te=await w(p,pe),me=[];for(let ne of Te){let fe=await this.processor(ne),he=(await this.model(fe)).logits[0],De=[];for(let ye of he)De.push((0,m.max)(ye.data)[1]);let ve=this.tokenizer.decode(De,{skip_special_tokens:!0}).trim();me.push({text:ve})}return de?me[0]:me}async _call_whisper(p,q){let de=q.return_timestamps??!1,pe=q.chunk_length_s??0,Te=q.force_full_sequences??!1,me=q.stride_length_s??null,ne={...q};de==="word"&&(ne.return_token_timestamps=!0,ne.return_timestamps=!1);let fe=!Array.isArray(p);fe&&(p=[p]);let le=this.processor.feature_extractor.config.chunk_length/this.model.config.max_source_positions,he=this.processor.feature_extractor.config.hop_length,De=this.processor.feature_extractor.config.sampling_rate,ve=await w(p,De),ye=[];for(let Ce of ve){let Qe=[];if(pe>0){if(me===null)me=pe/6;else if(pe<=me)throw Error("`chunk_length_s` must be larger than `stride_length_s`.");let ke=De*pe,qe=De*me,je=ke-2*qe,nt=0;for(;;){let ut=nt+ke,Pt=Ce.subarray(nt,ut),jt=await this.processor(Pt),ft=nt===0,$t=ut>=Ce.length;if(Qe.push({stride:[Pt.length,ft?0:qe,$t?0:qe],input_features:jt.input_features,is_last:$t}),$t)break;nt+=je}}else Qe=[{stride:[Ce.length,0,0],input_features:(await this.processor(Ce)).input_features,is_last:!0}];for(let ke of Qe){ne.num_frames=Math.floor(ke.stride[0]/he);let qe=await this.model.generate({inputs:ke.input_features,...ne});de==="word"?(ke.tokens=qe.sequences.tolist()[0],ke.token_timestamps=qe.token_timestamps.tolist()[0].map(je=>(0,m.round)(je,2))):ke.tokens=qe[0].tolist(),ke.stride=ke.stride.map(je=>je/De)}let[Be,Re]=this.tokenizer._decode_asr(Qe,{time_precision:le,return_timestamps:de,force_full_sequences:Te});ye.push({text:Be,...Re})}return fe?ye[0]:ye}async _call_moonshine(p,q){let de=!Array.isArray(p);de&&(p=[p]);let pe=this.processor.feature_extractor.config.sampling_rate,Te=await w(p,pe),me=[];for(let ne of Te){let fe=await 
/**
 * Image-classification pipeline: returns the `top_k` most probable labels for
 * each image.
 */
class te extends G {
  constructor(p) {
    super(p);
  }

  /**
   * @param {*} images One image input or an array of them (anything `x` accepts).
   * @param {Object} [options]
   * @param {number} [options.top_k=5] Number of labels to return per image.
   * @returns {Promise<Object[]|Object[][]>} `{label, score}` lists: one list
   *   per image when `images` is an array, otherwise the single list.
   */
  async _call(images, { top_k = 5 } = {}) {
    const loaded = await x(images);
    const { pixel_values } = await this.processor(loaded);
    const output = await this.model({ pixel_values });
    const id2label = this.model.config.id2label;

    const results = [];
    for (const logits of output.logits) {
      const probabilities = new _.Tensor("float32", (0, m.softmax)(logits.data), logits.dims);
      const top = await (0, _.topk)(probabilities, top_k);
      const scores = top[0].tolist();
      const indices = top[1].tolist();

      results.push(
        indices.map((classId, rank) => ({
          // Fall back to a generic label when the config has no id2label map.
          label: id2label ? id2label[classId] : `LABEL_${classId}`,
          score: scores[rank],
        })),
      );
    }

    return Array.isArray(images) ? results : results[0];
  }
}
/**
 * Background-removal pipeline: runs the parent segmentation pipeline and
 * applies each resulting mask as the alpha channel of a copy of the input.
 */
class ce extends se {
  constructor(p) {
    super(p);
  }

  /**
   * @param {*} images One image input, or an array holding exactly one.
   * @param {Object} [options={}] Options forwarded to the parent `_call`.
   * @returns {Promise<RawImage[]>} Copies of the inputs with the mask set as alpha.
   * @throws {Error} If an array with a length other than 1 is passed.
   */
  async _call(images, options = {}) {
    const isBatch = Array.isArray(images);
    if (isBatch && images.length !== 1) {
      throw Error("Background removal pipeline currently only supports a batch size of 1.");
    }

    const loaded = await x(images);
    const segments = await super._call(images, options);

    const cutouts = [];
    for (let index = 0; index < loaded.length; ++index) {
      // Work on a clone so the loaded image itself is not modified.
      const cutout = loaded[index].clone();
      cutout.putAlpha(segments[index].mask);
      cutouts.push(cutout);
    }
    return cutouts;
  }
}
/**
 * Object-detection pipeline: runs the model and converts the post-processed
 * detections into `{score, label, box}` records.
 */
class _e extends G {
  constructor(p) {
    super(p);
  }

  /**
   * @param {*} images One image input, or an array holding exactly one.
   * @param {Object} [options]
   * @param {number} [options.threshold=0.9] Threshold passed to the post-processor.
   * @param {boolean} [options.percentage=false] When true, no target sizes are
   *   passed to the post-processor and box coordinates are not truncated to integers.
   * @returns {Promise<Object[]|Object[][]>} Detections; wrapped per image when
   *   `images` is an array.
   * @throws {Error} If an array with a length other than 1 is passed.
   */
  async _call(images, { threshold = 0.9, percentage = false } = {}) {
    const isBatch = Array.isArray(images);
    if (isBatch && images.length !== 1) {
      throw Error("Object detection pipeline currently only supports a batch size of 1.");
    }

    const loaded = await x(images);
    let targetSizes = null;
    if (!percentage) {
      targetSizes = loaded.map((image) => [image.height, image.width]);
    }

    const { pixel_values, pixel_mask } = await this.processor(loaded);
    const output = await this.model({ pixel_values, pixel_mask });
    const detections = this.processor.image_processor.post_process_object_detection(
      output,
      threshold,
      targetSizes,
    );

    const id2label = this.model.config.id2label;
    const results = detections.map((detection) =>
      detection.boxes.map((box, index) => ({
        score: detection.scores[index],
        label: id2label[detection.classes[index]],
        box: k(box, !percentage),
      })),
    );

    return isBatch ? results : results[0];
  }
}
/**
 * Text-to-audio pipeline (registered for the "text-to-audio" task).
 *
 * Dispatches to one of three synthesis paths depending on the loaded
 * components: spectrogram + vocoder when a processor is present, the
 * "supertonic" path when the model config says so, and a direct
 * text-to-waveform call otherwise.
 */
class W extends G {
  DEFAULT_VOCODER_ID = "Xenova/speecht5_hifigan";

  constructor(p) {
    super(p);
    this.vocoder = p.vocoder ?? null;
  }

  /**
   * Normalises speaker embeddings into a tensor.
   *
   * @param {string|URL|Float32Array|Object} p Location of a raw float32 file,
   *   the raw values, or an existing `_.Tensor`.
   * @returns {Promise<Object>} A `_.Tensor`.
   * @throws {Error} If the download does not succeed, or if `p` is none of the
   *   supported types.
   */
  async _prepare_speaker_embeddings(p) {
    let embeddings = p;

    if (typeof embeddings === "string" || embeddings instanceof URL) {
      const response = await fetch(embeddings);
      // Without this check the body of a 404/500 page would be reinterpreted
      // as float32 data and silently used as the speaker embedding.
      if (!response.ok) {
        throw new Error(
          `Failed to fetch speaker embeddings from "${embeddings}": ${response.status} ${response.statusText}`,
        );
      }
      embeddings = new Float32Array(await response.arrayBuffer());
    }

    if (embeddings instanceof Float32Array) {
      embeddings = new _.Tensor("float32", embeddings, [embeddings.length]);
    } else if (!(embeddings instanceof _.Tensor)) {
      throw new Error("Speaker embeddings must be a `Tensor`, `Float32Array`, `string`, or `URL`.");
    }
    return embeddings;
  }

  /**
   * @param {*} p Text input handed to the tokenizer.
   * @param {Object} [options]
   * @param {*} [options.speaker_embeddings=null]
   * @param {*} [options.num_inference_steps] Only forwarded on the supertonic path.
   * @param {*} [options.speed] Only forwarded on the supertonic path.
   * @returns {Promise<Object>} A `T.RawAudio` instance.
   */
  async _call(p, { speaker_embeddings = null, num_inference_steps, speed } = {}) {
    if (this.processor) {
      return this._call_text_to_spectrogram(p, { speaker_embeddings });
    }
    if (this.model.config.model_type === "supertonic") {
      return this._call_supertonic(p, { speaker_embeddings, num_inference_steps, speed });
    }
    return this._call_text_to_waveform(p);
  }

  /**
   * Synthesis path for models whose config has `model_type === "supertonic"`.
   * @throws {Error} If no speaker embeddings are supplied.
   */
  async _call_supertonic(p, { speaker_embeddings, num_inference_steps, speed }) {
    if (!speaker_embeddings) {
      throw new Error("Speaker embeddings must be provided for Supertonic models.");
    }
    const prepared = await this._prepare_speaker_embeddings(speaker_embeddings);

    const { sampling_rate, style_dim } = this.model.config;
    const style = prepared.view(1, -1, style_dim);

    const inputs = this.tokenizer(p, { padding: true, truncation: true });
    const { waveform } = await this.model.generate_speech({
      ...inputs,
      style,
      num_inference_steps,
      speed,
    });
    return new T.RawAudio(waveform.data, sampling_rate);
  }

  /** Synthesis path where the model itself returns a `waveform`. */
  async _call_text_to_waveform(p) {
    const inputs = this.tokenizer(p, { padding: true, truncation: true });
    const { waveform } = await this.model(inputs);
    const samplingRate = this.model.config.sampling_rate;
    return new T.RawAudio(waveform.data, samplingRate);
  }

  /**
   * Synthesis path used when a processor is present: the model's
   * `generate_speech` is given a vocoder, which is loaded lazily from
   * `DEFAULT_VOCODER_ID` the first time none was supplied.
   */
  async _call_text_to_spectrogram(p, { speaker_embeddings }) {
    if (!this.vocoder) {
      console.log("No vocoder specified, using default HifiGan vocoder.");
      this.vocoder = await d.AutoModel.from_pretrained(this.DEFAULT_VOCODER_ID, { dtype: "fp32" });
    }

    const { input_ids } = this.tokenizer(p, { padding: true, truncation: true });

    const prepared = await this._prepare_speaker_embeddings(speaker_embeddings);
    const speaker = prepared.view(1, -1);

    const { waveform } = await this.model.generate_speech(input_ids, speaker, {
      vocoder: this.vocoder,
    });
    const samplingRate = this.processor.feature_extractor.config.sampling_rate;
    return new T.RawAudio(waveform.data, samplingRate);
  }
}
be=Object.freeze({"text-classification":{tokenizer:i.AutoTokenizer,pipeline:b,model:d.AutoModelForSequenceClassification,default:{model:"Xenova/distilbert-base-uncased-finetuned-sst-2-english"},type:"text"},"token-classification":{tokenizer:i.AutoTokenizer,pipeline:C,model:d.AutoModelForTokenClassification,default:{model:"Xenova/bert-base-multilingual-cased-ner-hrl"},type:"text"},"question-answering":{tokenizer:i.AutoTokenizer,pipeline:B,model:d.AutoModelForQuestionAnswering,default:{model:"Xenova/distilbert-base-cased-distilled-squad"},type:"text"},"fill-mask":{tokenizer:i.AutoTokenizer,pipeline:P,model:d.AutoModelForMaskedLM,default:{model:"Xenova/bert-base-uncased"},type:"text"},summarization:{tokenizer:i.AutoTokenizer,pipeline:y,model:d.AutoModelForSeq2SeqLM,default:{model:"Xenova/distilbart-cnn-6-6"},type:"text"},translation:{tokenizer:i.AutoTokenizer,pipeline:l,model:d.AutoModelForSeq2SeqLM,default:{model:"Xenova/t5-small"},type:"text"},"text2text-generation":{tokenizer:i.AutoTokenizer,pipeline:M,model:d.AutoModelForSeq2SeqLM,default:{model:"Xenova/flan-t5-small"},type:"text"},"text-generation":{tokenizer:i.AutoTokenizer,pipeline:F,model:d.AutoModelForCausalLM,default:{model:"Xenova/gpt2"},type:"text"},"zero-shot-classification":{tokenizer:i.AutoTokenizer,pipeline:S,model:d.AutoModelForSequenceClassification,default:{model:"Xenova/distilbert-base-uncased-mnli"},type:"text"},"audio-classification":{pipeline:N,model:d.AutoModelForAudioClassification,processor:g.AutoProcessor,default:{model:"Xenova/wav2vec2-base-superb-ks"},type:"audio"},"zero-shot-audio-classification":{tokenizer:i.AutoTokenizer,pipeline:Q,model:d.AutoModel,processor:g.AutoProcessor,default:{model:"Xenova/clap-htsat-unfused"},type:"multimodal"},"automatic-speech-recognition":{tokenizer:i.AutoTokenizer,pipeline:K,model:[d.AutoModelForSpeechSeq2Seq,d.AutoModelForCTC],processor:g.AutoProcessor,default:{model:"Xenova/whisper-tiny.en"},type:"multimodal"},"text-to-audio":{tokenizer:i.AutoTokenizer,pip
eline:W,model:[d.AutoModelForTextToWaveform,d.AutoModelForTextToSpectrogram],processor:[g.AutoProcessor,null],default:{model:"Xenova/speecht5_tts"},type:"text"},"image-to-text":{tokenizer:i.AutoTokenizer,pipeline:J,model:d.AutoModelForVision2Seq,processor:g.AutoProcessor,default:{model:"Xenova/vit-gpt2-image-captioning"},type:"multimodal"},"image-classification":{pipeline:te,model:d.AutoModelForImageClassification,processor:g.AutoProcessor,default:{model:"Xenova/vit-base-patch16-224"},type:"multimodal"},"image-segmentation":{pipeline:se,model:[d.AutoModelForImageSegmentation,d.AutoModelForSemanticSegmentation,d.AutoModelForUniversalSegmentation],processor:g.AutoProcessor,default:{model:"Xenova/detr-resnet-50-panoptic"},type:"multimodal"},"background-removal":{pipeline:ce,model:[d.AutoModelForImageSegmentation,d.AutoModelForSemanticSegmentation,d.AutoModelForUniversalSegmentation],processor:g.AutoProcessor,default:{model:"Xenova/modnet"},type:"image"},"zero-shot-image-classification":{tokenizer:i.AutoTokenizer,pipeline:we,model:d.AutoModel,processor:g.AutoProcessor,default:{model:"Xenova/clip-vit-base-patch32"},type:"multimodal"},"object-detection":{pipeline:_e,model:d.AutoModelForObjectDetection,processor:g.AutoProcessor,default:{model:"Xenova/detr-resnet-50"},type:"multimodal"},"zero-shot-object-detection":{tokenizer:i.AutoTokenizer,pipeline:X,model:d.AutoModelForZeroShotObjectDetection,processor:g.AutoProcessor,default:{model:"Xenova/owlvit-base-patch32"},type:"multimodal"},"document-question-answering":{tokenizer:i.AutoTokenizer,pipeline:L,model:d.AutoModelForDocumentQuestionAnswering,processor:g.AutoProcessor,default:{model:"Xenova/donut-base-finetuned-docvqa"},type:"multimodal"},"image-to-image":{pipeline:Y,model:d.AutoModelForImageToImage,processor:g.AutoProcessor,default:{model:"Xenova/swin2SR-classical-sr-x2-64"},type:"image"},"depth-estimation":{pipeline:ae,model:d.AutoModelForDepthEstimation,processor:g.AutoProcessor,default:{model:"Xenova/dpt-large"},type
/**
 * Loads every pipeline component named in `ge` concurrently.
 *
 * @param {Map<string, Object|Array<Object|null>|undefined|null>} ge Maps a
 *   component name to a class exposing `from_pretrained`, or to an ordered
 *   list of such classes to try. A `null` entry inside a list means "this
 *   component is optional": reaching it resolves the component to `null`.
 *   Falsy map values are skipped entirely.
 * @param {*} p First argument forwarded to every `from_pretrained` call.
 * @param {*} q Second argument forwarded to every `from_pretrained` call.
 * @returns {Promise<Object>} Prototype-less object mapping each loaded
 *   component name to its resolved value.
 * @throws Whatever a loader rejects with. For a candidate list, errors whose
 *   message contains "Unsupported model type" or "Could not locate file" only
 *   cause the next candidate to be tried; the last such error is thrown when
 *   the list is exhausted.
 */
async function $e(ge, p, q) {
  // Plain async helper instead of `new Promise(async ...)`: anything thrown
  // here rejects the returned promise, whereas an exception escaping an async
  // executor is dropped and leaves the outer promise pending forever.
  const loadFirstSupported = async (candidates) => {
    let lastRecoverable;
    for (const candidate of candidates) {
      if (candidate === null) {
        return null;
      }
      try {
        return await candidate.from_pretrained(p, q);
      } catch (err) {
        const message = err?.message;
        const recoverable =
          Boolean(message?.includes?.("Unsupported model type")) ||
          Boolean(message?.includes?.("Could not locate file"));
        if (!recoverable) {
          throw err;
        }
        lastRecoverable = err;
      }
    }
    // An empty candidate list used to reject with `undefined`.
    throw lastRecoverable ?? new Error("No candidate classes were provided for this component.");
  };

  // Kick off every load before awaiting any of them so they run in parallel.
  const pending = Object.create(null);
  for (const [name, source] of ge.entries()) {
    if (!source) {
      continue;
    }
    pending[name] = Array.isArray(source)
      ? loadFirstSupported(source)
      : source.from_pretrained(p, q);
  }

  const names = Object.keys(pending);
  const values = await Promise.all(names.map((name) => pending[name]));

  const loaded = Object.create(null);
  names.forEach((name, index) => {
    loaded[name] = values[index];
  });
  return loaded;
}
/**
 * Collapses each run of consecutive unknown tokens into a single entry.
 *
 * A token counts as unknown when `c` has no id for it or its id equals `A`.
 * The first token of a run is kept; following unknown tokens are appended to
 * it, unless the kept entry itself maps to `A` in `c`, in which case the
 * followers are dropped.
 *
 * @param {string[]} ee Tokens to process (not modified).
 * @param {Map<string, number>} c Token-to-id lookup.
 * @param {number} A Id of the unknown token.
 * @returns {string[]} New array with unknown runs fused.
 */
function P(ee, c, A) {
  const isUnknown = (token) => (c.get(token) ?? A) === A;

  const fused = [];
  let index = 0;
  while (index < ee.length) {
    const current = ee[index];
    fused.push(current);
    index += 1;

    if (!isUnknown(current)) {
      continue;
    }

    // Absorb every directly following unknown token into the entry just pushed.
    for (; index < ee.length && isUnknown(ee[index]); index += 1) {
      if (c.get(fused.at(-1)) !== A) {
        fused[fused.length - 1] += ee[index];
      }
    }
  }
  return fused;
}
/**
 * Tokenizer model selected by `V.fromConfig` for `type: "WordPiece"`.
 *
 * Splits each input word greedily into the longest vocabulary pieces, with
 * every non-initial piece prefixed by `config.continuing_subword_prefix`.
 */
class R extends V {
  /**
   * @param {Object} c Model config; reads `vocab`, `unk_token` and the
   *   optional `max_input_chars_per_word` (default 100).
   */
  constructor(c) {
    super(c);
    this.tokens_to_ids = w(c.vocab);
    this.unk_token_id = this.tokens_to_ids.get(c.unk_token);
    this.unk_token = c.unk_token;
    this.max_input_chars_per_word = c.max_input_chars_per_word ?? 100;

    // Inverse lookup: id -> token.
    this.vocab = new Array(this.tokens_to_ids.size);
    this.tokens_to_ids.forEach((id, token) => {
      this.vocab[id] = token;
    });
  }

  /**
   * @param {string[]} c Words to split.
   * @returns {string[]} Sub-word pieces. A word that is longer than
   *   `max_input_chars_per_word` code points, or that cannot be fully covered
   *   by vocabulary pieces, contributes a single `unk_token`.
   */
  encode(c) {
    // Longest vocabulary piece starting at `start`, or null if there is none.
    const longestPieceAt = (chars, start) => {
      for (let end = chars.length; end > start; end -= 1) {
        let candidate = chars.slice(start, end).join("");
        if (start > 0) {
          candidate = this.config.continuing_subword_prefix + candidate;
        }
        if (this.tokens_to_ids.has(candidate)) {
          return { piece: candidate, end };
        }
      }
      return null;
    };

    const output = [];
    for (const word of c) {
      const chars = [...word];
      if (chars.length > this.max_input_chars_per_word) {
        output.push(this.unk_token);
        continue;
      }

      const pieces = [];
      let start = 0;
      let unmatched = false;
      while (start < chars.length) {
        const match = longestPieceAt(chars, start);
        if (match === null) {
          unmatched = true;
          break;
        }
        pieces.push(match.piece);
        start = match.end;
      }

      if (unmatched) {
        output.push(this.unk_token);
      } else {
        output.push(...pieces);
      }
    }
    return output;
  }
}
/**
 * Lookup table from every byte value (0-255) to a one-character string.
 *
 * Bytes in the ranges 33-126, 161-172 and 174-255 map to the character with
 * the same code. The remaining 68 bytes are assigned, in ascending byte
 * order, the characters with codes 256, 257, ...
 */
let Q = (() => {
  const identityRanges = [
    [33, 126],
    [161, 172],
    [174, 255],
  ];
  const keepsOwnCode = (byte) =>
    identityRanges.some(([low, high]) => byte >= low && byte <= high);

  const table = {};
  let shifted = 0;
  for (let byte = 0; byte < 256; byte += 1) {
    let code = byte;
    if (!keepsOwnCode(byte)) {
      code = 256 + shifted;
      shifted += 1;
    }
    table[byte] = String.fromCharCode(code);
  }
  return table;
})();
Map(this.merges.map((U,$)=>[JSON.stringify(U),$])),this.end_of_word_suffix=c.end_of_word_suffix,this.continuing_subword_suffix=c.continuing_subword_suffix??null,this.byte_fallback=this.config.byte_fallback??!1,this.byte_fallback&&(this.text_encoder=new TextEncoder),this.ignore_merges=this.config.ignore_merges??!1,this.max_length_to_cache=256,this.cache_capacity=1e4,this.cache=new u.LRUCache(this.cache_capacity)}clear_cache(){this.cache.clear()}bpe(c){if(c.length===0)return[];let A=this.cache.get(c);if(A!==void 0)return A;let U=Array.from(c);this.end_of_word_suffix&&(U[U.length-1]+=this.end_of_word_suffix);let $=[];if(U.length>1){let ie=new u.PriorityQueue((Ve,ze)=>Ve.score<ze.score),Pe={token:U[0],bias:0,prev:null,next:null},Ne=Pe;for(let Ve=1;Ve<U.length;++Ve){let ze={bias:Ve/U.length,token:U[Ve],prev:Ne,next:null};Ne.next=ze,this._add_node(ie,Ne),Ne=ze}for(;!ie.isEmpty();){let Ve=ie.pop();if(Ve.deleted||!Ve.next||Ve.next.deleted)continue;if(Ve.deleted=!0,Ve.next.deleted=!0,Ve.prev){let Ie={...Ve.prev};Ve.prev.deleted=!0,Ve.prev=Ie,Ie.prev?Ie.prev.next=Ie:Pe=Ie}let ze={token:Ve.token+Ve.next.token,bias:Ve.bias,prev:Ve.prev,next:Ve.next.next};ze.prev?(ze.prev.next=ze,this._add_node(ie,ze.prev)):Pe=ze,ze.next&&(ze.next.prev=ze,this._add_node(ie,ze))}for(let Ve=Pe;Ve!==null;Ve=Ve.next)$.push(Ve.token)}else $=U;if(this.continuing_subword_suffix)for(let ie=0;ie<$.length-1;++ie)$[ie]+=this.continuing_subword_suffix;return c.length<this.max_length_to_cache&&this.cache.put(c,$),$}_add_node(c,A){let U=this.bpe_ranks.get(JSON.stringify([A.token,A.next.token]));U!==void 0&&(A.score=U+A.bias,c.push(A))}encode(c){let A=[];for(let U of c){if(this.ignore_merges&&this.tokens_to_ids.has(U)){A.push(U);continue}let $=this.bpe(U);for(let ie of $)if(this.tokens_to_ids.has(ie))A.push(ie);else if(this.byte_fallback){let 
/**
 * Normalizer created by `se.fromConfig` for `type: "Strip"`.
 * Trims whitespace from the start and/or end of the text depending on
 * `config.strip_left` and `config.strip_right`.
 */
class Y extends se {
  /**
   * @param {string} c Text to normalize.
   * @returns {string} The trimmed text.
   */
  normalize(c) {
    const { strip_left: stripLeft, strip_right: stripRight } = this.config;

    if (stripLeft && stripRight) {
      return c.trim();
    }

    let text = c;
    if (stripLeft) {
      text = text.trimStart();
    }
    if (stripRight) {
      text = text.trimEnd();
    }
    return text;
  }
}
/**
 * Normalizer created by `se.fromConfig` for `type: "Sequence"`.
 * Applies a list of child normalizers one after another.
 */
class Le extends se {
  /**
   * @param {Object} c Config whose `normalizers` array holds one config per
   *   child normalizer; each is instantiated through `se.fromConfig`.
   */
  constructor(c) {
    super(c);
    this.normalizers = c.normalizers.map((childConfig) => se.fromConfig(childConfig));
  }

  /**
   * @param {string} c Text to normalize.
   * @returns {string} Result of feeding `c` through every child in order.
   */
  normalize(c) {
    let text = c;
    for (const step of this.normalizers) {
      text = step.normalize(text);
    }
    return text;
  }
}
|
|
24
|
+
/**
 * Base class of all pre-tokenizers and factory for the concrete ones.
 * Subclasses implement `pre_tokenize_text`; calling an instance forwards to
 * `pre_tokenize`.
 */
class ge extends i.Callable {
  /**
   * Instantiates the pre-tokenizer matching `c.type`.
   *
   * @param {Object|null} c Pre-tokenizer config.
   * @returns {ge|null} `null` when `c` is `null`.
   * @throws {Error} If `c.type` is not a known pre-tokenizer type.
   */
  static fromConfig(c) {
    if (c === null) {
      return null;
    }

    const implementations = new Map([
      ["BertPreTokenizer", p],
      ["Sequence", $t],
      ["Whitespace", Hs],
      ["WhitespaceSplit", Js],
      ["Metaspace", Pt],
      ["ByteLevel", q],
      ["Split", de],
      ["Punctuation", pe],
      ["Digits", Te],
      ["Replace", Ys],
      ["FixedLength", kt],
    ]);

    const Implementation = implementations.get(c.type);
    if (Implementation === undefined) {
      throw new Error(`Unknown PreTokenizer type: ${c.type}`);
    }
    return new Implementation(c);
  }

  /**
   * Splits one piece of text. Must be overridden.
   * @throws {Error} Always, in this base class.
   */
  pre_tokenize_text(c, A) {
    throw Error("pre_tokenize_text should be implemented in subclass.");
  }

  /**
   * @param {string|string[]} c One text, or several texts.
   * @param {*} A Options passed through to `pre_tokenize_text`.
   * @returns {string[]} The pieces, flattened by one level.
   */
  pre_tokenize(c, A) {
    if (Array.isArray(c)) {
      return c.map((piece) => this.pre_tokenize_text(piece, A)).flat();
    }
    return this.pre_tokenize_text(c, A).flat();
  }

  /** Entry point used when the instance is invoked as a function. */
  _call(c, A) {
    return this.pre_tokenize(c, A);
  }
}
/**
 * Post-processor created by `me.fromConfig` for `type: "BertProcessing"`.
 * Wraps the token sequence(s) with the configured `cls` / `sep` tokens and
 * produces matching token type ids (0 for the first segment, 1 for the pair).
 */
class ne extends me {
  /**
   * @param {Object} c Config; the first element of `c.cls` and of `c.sep` is
   *   used as the token to insert.
   */
  constructor(c) {
    super(c);
    this.cls = c.cls[0];
    this.sep = c.sep[0];
  }

  /**
   * @param {string[]} c Tokens of the first sequence.
   * @param {string[]|null} [A=null] Tokens of the optional second sequence.
   * @param {Object} [options]
   * @param {boolean} [options.add_special_tokens=true] Whether to insert
   *   the `cls` / `sep` tokens.
   * @returns {{tokens: string[], token_type_ids: number[]}}
   */
  post_process(c, A = null, { add_special_tokens = true } = {}) {
    // `mergeArrays` comes from the imported core utilities; it is used here to
    // concatenate its array arguments in order.
    const { mergeArrays } = d;

    let tokens = c;
    if (add_special_tokens) {
      tokens = mergeArrays([this.cls], tokens, [this.sep]);
    }
    let typeIds = new Array(tokens.length).fill(0);

    if (A !== null) {
      // The `fe` subclass inserts one extra separator between the two sequences.
      const between = add_special_tokens && this instanceof fe ? [this.sep] : [];
      const trailing = add_special_tokens ? [this.sep] : [];

      tokens = mergeArrays(tokens, between, A, trailing);
      typeIds = mergeArrays(
        typeIds,
        new Array(A.length + between.length + trailing.length).fill(1),
      );
    }

    return { tokens, token_type_ids: typeIds };
  }
}
/**
 * Decoder created by `ve.fromConfig` for `type: "ByteFallback"`.
 *
 * Tokens of the exact form `<0xHH>` (two hexadecimal digits) are treated as
 * raw bytes; each run of consecutive byte tokens is decoded as one string by
 * `TextDecoder`. All other tokens pass through unchanged.
 */
class Ce extends ve {
  constructor(c) {
    super(c);
    this.text_decoder = new TextDecoder();
  }

  /**
   * @param {string[]} c Tokens to decode.
   * @returns {string[]} Tokens with every run of byte tokens replaced by its
   *   decoded text.
   */
  decode_chain(c) {
    // Strict match: `parseInt(x, 16)` alone also accepts "1G", " 1" or "-1",
    // which would turn non-byte tokens such as "<0x1G>" into bytes.
    const byteToken = /^<0x([0-9A-Fa-f]{2})>$/;

    const decoded = [];
    let pendingBytes = [];
    const flushBytes = () => {
      if (pendingBytes.length > 0) {
        decoded.push(this.text_decoder.decode(Uint8Array.from(pendingBytes)));
        pendingBytes = [];
      }
    };

    for (const token of c) {
      const match = typeof token === "string" ? byteToken.exec(token) : null;
      if (match !== null) {
        pendingBytes.push(Number.parseInt(match[1], 16));
      } else {
        flushBytes();
        decoded.push(token);
      }
    }
    flushBytes();

    return decoded;
  }
}
/**
 * Decoder created by `ve.fromConfig` for `type: "Metaspace"`.
 * Turns the configured replacement character back into spaces.
 */
class jt extends ve {
  /**
   * @param {Object} c Config; `c.replacement` is the string to replace.
   */
  constructor(c) {
    super(c);
    this.replacement = c.replacement;
  }

  /**
   * @param {string[]} c Tokens to decode.
   * @returns {string[]} Tokens with every occurrence of the replacement
   *   string converted to a space; a single leading space is removed from the
   *   first token only.
   */
  decode_chain(c) {
    return Array.from(c, (token, position) => {
      const text = token.replaceAll(this.replacement, " ");
      const isFirst = position === 0;
      return isFirst && text.startsWith(" ") ? text.substring(1) : text;
    });
  }
}
/**
 * Truncates, in place, every array stored on `ee` to `c` elements by
 * assigning its `length`.
 *
 * @param {Object<string, Array>} ee Object whose own enumerable values are arrays.
 * @param {number} c New length for each array.
 * @returns {void}
 */
function qs(ee, c) {
  Object.values(ee).forEach((sequence) => {
    sequence.length = c;
  });
}
Map(this.added_tokens.map(U=>[U.content,U])),this.mask_token=this.getToken("mask_token"),this.mask_token_id=this.model.tokens_to_ids.get(this.mask_token),this.pad_token=this.getToken("pad_token","eos_token"),this.pad_token_id=this.model.tokens_to_ids.get(this.pad_token),this.sep_token=this.getToken("sep_token"),this.sep_token_id=this.model.tokens_to_ids.get(this.sep_token),this.unk_token=this.getToken("unk_token"),this.unk_token_id=this.model.tokens_to_ids.get(this.unk_token),this.bos_token=this.getToken("bos_token"),this.bos_token_id=this.model.tokens_to_ids.get(this.bos_token),this.eos_token=this.getToken("eos_token"),this.eos_token_id=this.model.tokens_to_ids.get(this.eos_token),this.model_max_length=A.model_max_length,this.remove_space=A.remove_space,this.clean_up_tokenization_spaces=A.clean_up_tokenization_spaces??!0,this.do_lowercase_and_remove_accent=A.do_lowercase_and_remove_accent??!1,A.padding_side&&(this.padding_side=A.padding_side),this.add_bos_token=A.add_bos_token,this.add_eos_token=A.add_eos_token,this.legacy=!1,this.chat_template=A.chat_template??null,Array.isArray(this.chat_template)){let U=Object.create(null);for(let{name:$,template:ie}of this.chat_template){if(typeof $!="string"||typeof ie!="string")throw new Error('Chat template must be a list of objects with "name" and "template" properties');U[$]=ie}this.chat_template=U}this._compiled_template_cache=new Map}getToken(...c){for(let A of c){let U=this.config[A];if(U)if(typeof U=="object"){if(U.__type==="AddedToken")return U.content;throw Error(`Unknown token: ${U}`)}else return U}return null}static async from_pretrained(c,{progress_callback:A=null,config:U=null,cache_dir:$=null,local_files_only:ie=!1,revision:Pe="main",legacy:Ne=null}={}){let Ve=await _(c,{progress_callback:A,config:U,cache_dir:$,local_files_only:ie,revision:Pe,legacy:Ne});return new 
this(...Ve)}_call(c,{text_pair:A=null,add_special_tokens:U=!0,padding:$=!1,truncation:ie=null,max_length:Pe=null,return_tensor:Ne=!0,return_token_type_ids:Ve=null}={}){let ze=Array.isArray(c),Ie;if(ze){if(c.length===0)throw Error("text array must be non-empty");if(A!==null){if(Array.isArray(A)){if(c.length!==A.length)throw Error("text and text_pair must have the same length")}else throw Error("text_pair must also be an array");Ie=c.map((ot,Ft)=>this._encode_plus(ot,{text_pair:A[Ft],add_special_tokens:U,return_token_type_ids:Ve}))}else Ie=c.map(ot=>this._encode_plus(ot,{add_special_tokens:U,return_token_type_ids:Ve}))}else{if(c==null)throw Error("text may not be null or undefined");if(Array.isArray(A))throw Error("When specifying `text_pair`, since `text` is a string, `text_pair` must also be a string (i.e., not an array).");Ie=[this._encode_plus(c,{text_pair:A,add_special_tokens:U,return_token_type_ids:Ve})]}if(Pe===null?Pe=this.model_max_length:ie===null&&($===!0?(console.warn("`max_length` is ignored when `padding: true` and there is no truncation strategy. 
To pad to max length, use `padding: 'max_length'`."),Pe=this.model_max_length):$===!1&&(console.warn("Truncation was not explicitly activated but `max_length` is provided a specific value, please use `truncation: true` to explicitly truncate examples to max length."),ie=!0)),$===!0&&(Pe=Math.min((0,I.max)(Ie.map(ot=>ot.input_ids.length))[0],Pe??1/0)),Pe=Math.min(Pe,this.model_max_length??1/0),$||ie)for(let ot=0;ot<Ie.length;++ot)Ie[ot].input_ids.length!==Pe&&(Ie[ot].input_ids.length>Pe?ie&&qs(Ie[ot],Pe):$&&us(Ie[ot],Pe,Ft=>Ft==="input_ids"?this.pad_token_id:0,this.padding_side));let _t={};if(Ne){if(!($&&ie)&&Ie.some(Ft=>{for(let Rt of Object.keys(Ft))if(Ft[Rt].length!==Ie[0][Rt]?.length)return!0;return!1}))throw Error("Unable to create tensor, you should probably activate truncation and/or padding with 'padding=true' and 'truncation=true' to have batched tensors with the same length.");let ot=[Ie.length,Ie[0].input_ids.length];for(let Ft of Object.keys(Ie[0]))_t[Ft]=new f.Tensor("int64",BigInt64Array.from(Ie.flatMap(Rt=>Rt[Ft]).map(BigInt)),ot)}else{for(let ot of Object.keys(Ie[0]))_t[ot]=Ie.map(Ft=>Ft[ot]);if(!ze)for(let ot of Object.keys(_t))_t[ot]=_t[ot][0]}return _t}_encode_text(c){if(c===null)return null;let A=this.added_tokens_splitter.split(c);for(let $=0;$<A.length;++$){let ie=this.added_tokens_map.get(A[$]);ie&&(ie.lstrip&&$>0&&(A[$-1]=A[$-1].trimEnd()),ie.rstrip&&$<A.length-1&&(A[$+1]=A[$+1].trimStart()))}return A.flatMap(($,ie)=>{if($.length===0)return[];if(this.added_tokens_map.has($))return[$];if(this.remove_space===!0&&($=$.trim().split(/\s+/).join(" ")),this.do_lowercase_and_remove_accent&&($=C($)),this.normalizer!==null&&($=this.normalizer($)),$.length===0)return[];let Pe=this.pre_tokenizer!==null?this.pre_tokenizer($,{section_index:ie}):[$];return 
this.model(Pe)})}_encode_plus(c,{text_pair:A=null,add_special_tokens:U=!0,return_token_type_ids:$=null}={}){let{tokens:ie,token_type_ids:Pe}=this._tokenize_helper(c,{pair:A,add_special_tokens:U}),Ne=this.model.convert_tokens_to_ids(ie),Ve={input_ids:Ne,attention_mask:new Array(Ne.length).fill(1)};return($??this.return_token_type_ids)&&Pe&&(Ve.token_type_ids=Pe),Ve}_tokenize_helper(c,{pair:A=null,add_special_tokens:U=!1}={}){let $=this._encode_text(c),ie=this._encode_text(A);return this.post_processor?this.post_processor($,ie,{add_special_tokens:U}):{tokens:(0,d.mergeArrays)($??[],ie??[])}}tokenize(c,{pair:A=null,add_special_tokens:U=!1}={}){return this._tokenize_helper(c,{pair:A,add_special_tokens:U}).tokens}encode(c,{text_pair:A=null,add_special_tokens:U=!0,return_token_type_ids:$=null}={}){return this._encode_plus(c,{text_pair:A,add_special_tokens:U,return_token_type_ids:$}).input_ids}batch_decode(c,A={}){return c instanceof f.Tensor&&(c=c.tolist()),c.map(U=>this.decode(U,A))}decode(c,A={}){if(c instanceof f.Tensor&&(c=k(c)),!Array.isArray(c)||c.length===0||!(0,d.isIntegralNumber)(c[0]))throw Error("token_ids must be a non-empty array of integers.");return this.decode_single(c,A)}decode_single(c,{skip_special_tokens:A=!1,clean_up_tokenization_spaces:U=null}){let $=this.model.convert_ids_to_tokens(c);A&&($=$.filter(Pe=>!this.special_tokens.includes(Pe)));let ie=this.decoder?this.decoder($):$.join(" ");return this.decoder&&this.decoder.end_of_word_suffix&&(ie=ie.replaceAll(this.decoder.end_of_word_suffix," "),A&&(ie=ie.trim())),(U??this.clean_up_tokenization_spaces)&&(ie=G(ie)),ie}get_chat_template({chat_template:c=null,tools:A=null}={}){if(this.chat_template&&typeof this.chat_template=="object"){let U=this.chat_template;if(c!==null&&Object.hasOwn(U,c))c=U[c];else if(c===null)if(A!==null&&"tool_use"in U)c=U.tool_use;else if("default"in U)c=U.default;else throw Error(`This model has multiple chat templates with no default specified! 
Please either pass a chat template or the name of the template you wish to use to the 'chat_template' argument. Available template names are ${Object.keys(U).sort()}.`)}else if(c===null)if(this.chat_template)c=this.chat_template;else throw Error("Cannot use apply_chat_template() because tokenizer.chat_template is not set and no template argument was passed! For information about writing templates and setting the tokenizer.chat_template attribute, please see the documentation at https://huggingface.co/docs/transformers/main/en/chat_templating");return c}apply_chat_template(c,{tools:A=null,documents:U=null,chat_template:$=null,add_generation_prompt:ie=!1,tokenize:Pe=!0,padding:Ne=!1,truncation:Ve=!1,max_length:ze=null,return_tensor:Ie=!0,return_dict:_t=!1,tokenizer_kwargs:ot={},...Ft}={}){if($=this.get_chat_template({chat_template:$,tools:A}),typeof $!="string")throw Error(`chat_template must be a string, but got ${typeof $}`);let Rt=this._compiled_template_cache.get($);Rt===void 0&&(Rt=new m.Template($),this._compiled_template_cache.set($,Rt));let yt=Object.create(null);for(let Vt of qt){let cs=this.getToken(Vt);cs&&(yt[Vt]=cs)}let Zt=Rt.render({messages:c,add_generation_prompt:ie,tools:A,documents:U,...yt,...Ft});if(Pe){let Vt=this._call(Zt,{add_special_tokens:!1,padding:Ne,truncation:Ve,max_length:ze,return_tensor:Ie,...ot});return _t?Vt:Vt.input_ids}return Zt}}class Ls extends Ze{return_token_type_ids=!0}class Ds extends Ze{return_token_type_ids=!0}class Is extends Ze{return_token_type_ids=!0}class is extends Ze{return_token_type_ids=!0}class lt extends Ze{return_token_type_ids=!0}class Os extends Ze{return_token_type_ids=!0}class n extends Ze{return_token_type_ids=!0}class j extends Ze{return_token_type_ids=!0}class v extends Ze{return_token_type_ids=!0}class O extends Ze{}class z extends Ze{}class Z extends Ze{return_token_type_ids=!0;constructor(c,A){super(c,A),console.warn('WARNING: `XLMTokenizer` is not yet supported by Hugging Face\'s "fast" tokenizers 
/**
 * Tokenizer that pads on the left and, in non-legacy mode, prefixes the text
 * with the `Kt` marker itself instead of relying on a normalizer.
 */
class Nt extends Ze {
    padding_side = "left";

    /**
     * @param {Object} c Tokenizer definition, forwarded to the base class.
     * @param {Object} A Tokenizer config; `A.legacy` defaults to `true`.
     */
    constructor(c, A) {
        super(c, A);
        this.legacy = A.legacy ?? true;
        if (!this.legacy) {
            // Non-legacy mode: no normalizer, and a `Pt` pre-tokenizer built with the marker.
            this.normalizer = null;
            this.pre_tokenizer = new Pt({ replacement: Kt, prepend_scheme: "first" });
        }
    }

    /**
     * @param {string|null} c Text to encode.
     * @returns {string[]|null} Tokens, or `null` for a `null` input.
     */
    _encode_text(c) {
        if (c === null) {
            return null;
        }
        if (this.legacy || c.length === 0) {
            return super._encode_text(c);
        }

        // Existing markers become plain spaces before the single leading marker is added.
        const prefixed = Kt + c.replaceAll(Kt, " ");
        let pieces = super._encode_text(prefixed);

        // Drop a lone leading marker when it is directly followed by a special token.
        const hasDanglingMarker =
            pieces.length > 1 && pieces[0] === Kt && this.special_tokens.includes(pieces[1]);
        if (hasDanglingMarker) {
            pieces = pieces.slice(1);
        }
        return pieces;
    }
}
/**
 * Tokenizer whose language tokens look like `__xx__` / `__xxx__`.
 * `language_codes` holds the bare codes (without the surrounding underscores).
 */
class ms extends Ze {
    /**
     * @param {Object} c Tokenizer definition, forwarded to the base class.
     * @param {Object} A Tokenizer config, forwarded to the base class.
     */
    constructor(c, A) {
        super(c, A);
        this.languageRegex = /^__[a-z]{2,3}__$/;

        const codes = [];
        for (const token of this.special_tokens) {
            if (this.languageRegex.test(token)) {
                // Strip the two leading and two trailing underscores.
                codes.push(token.slice(2, -2));
            }
        }
        this.language_codes = codes;

        this.lang_to_token = (code) => `__${code}__`;
    }

    /**
     * Delegates to the shared translation-input helper `ls`.
     *
     * @param {string|string[]} c Raw input text(s).
     * @param {Object} A Tokenizer options.
     * @param {Object} U Generation options (carrying the language selection).
     * @returns {any} Whatever `ls` returns.
     */
    _build_translation_inputs(c, A, U) {
        return ls(this, c, A, U);
    }
}
Dt=(At-ot)*$+_t,Lt=(0,I.round)(Dt,2);if(Ms!==null&&At>=Ms)Vt=!0;else if(Vt||yt.length>0&&At<gs)Vt=!1;else if(Ie.timestamp[0]===null)Ie.timestamp[0]=Lt;else if(Lt!==Ie.timestamp[0]){Ie.timestamp[1]=Lt,yt.push(es),Ne&&Zt.push(fs);let[as,Zs]=this.findLongestCommonSequence(yt,Zt),ks=this.decode(as);Ie.text=ks,Ne&&(Ie.words=this.collateWordTimestamps(as,Zs,Pe)),ze.push(Ie),yt=[],es=[],Zt=[],fs=[],Ie=Ve()}}else if(es.push(At),Ne){let Dt=(0,I.round)(Ht[zt]+_t,2),Lt;if(zt+1<Ht.length){Lt=(0,I.round)(Ht[zt+1]+_t,2);let as=this.decode([At]);l.test(as)&&(Lt=(0,I.round)(Math.min(Dt+$,Lt),2))}else Lt=null;fs.push([Dt,Lt])}}if("stride"in vt){let[zt,At,Dt]=vt.stride;_t+=zt-Dt}es.length>0?(yt.push(es),Ne&&Zt.push(fs)):yt.every(zt=>zt.length===0)&&(Ie=Ve(),yt=[],es=[],Zt=[],fs=[])}if(yt.length>0){if(ie&&A)throw new Error("Whisper did not predict an ending timestamp, which can happen if audio is cut off in the middle of a word. Also make sure WhisperTimeStampLogitsProcessor was used during generation.");let[vt,Ut]=this.findLongestCommonSequence(yt,Zt),Ht=this.decode(vt);Ie.text=Ht,Ne&&(Ie.words=this.collateWordTimestamps(vt,Ut,Pe)),ze.push(Ie)}let Xt=Object.create(null),Cs=ze.map(vt=>vt.text).join("");if(A||U){for(let vt=0;vt<ze.length;++vt){let Ut=ze[vt];A||delete Ut.timestamp,U||delete Ut.language}if(Ne){let vt=[];for(let Ut of ze)for(let Ht of Ut.words)vt.push(Ht);Xt={chunks:vt}}else Xt={chunks:ze}}return[Cs,Xt]}findLongestCommonSequence(c,A=null){let U=c[0],$=U.length,ie=[],Pe=Array.isArray(A)&&A.length>0,Ne=Pe?[]:null,Ve=Pe?A[0]:null;for(let ze=1;ze<c.length;++ze){let Ie=c[ze],_t=0,ot=[$,$,0,0],Ft=Ie.length;for(let Xt=1;Xt<$+Ft;++Xt){let Cs=Math.max(0,$-Xt),vt=Math.min($,$+Ft-Xt),Ut=U.slice(Cs,vt),Ht=Math.max(0,Xt-$),Ms=Math.min(Ft,Xt),gs=Ie.slice(Ht,Ms);if(Ut.length!==gs.length)throw new Error("There is a bug within whisper `decode_asr` function, please report it. 
Dropping to prevent bad inference.");let es;Pe?es=Ut.filter((At,Dt)=>At===gs[Dt]&&Ve[Cs+Dt]<=A[ze][Ht+Dt]).length:es=Ut.filter((At,Dt)=>At===gs[Dt]).length;let fs=Xt/1e4,zt=es/Xt+fs;es>1&&zt>_t&&(_t=zt,ot=[Cs,vt,Ht,Ms])}let[Rt,yt,Zt,Vt]=ot,cs=Math.floor((yt+Rt)/2),zs=Math.floor((Vt+Zt)/2);ie.push(...U.slice(0,cs)),U=Ie.slice(zs),$=U.length,Pe&&(Ne.push(...Ve.slice(0,cs)),Ve=A[ze].slice(zs))}return ie.push(...U),Pe?(Ne.push(...Ve),[ie,Ne]):[ie,[]]}collateWordTimestamps(c,A,U){let[$,ie,Pe]=this.combineTokensIntoWords(c,U),Ne=[];for(let Ve=0;Ve<$.length;++Ve){let ze=Pe[Ve];Ne.push({text:$[Ve],timestamp:[A[ze.at(0)][0],A[ze.at(-1)][1]]})}return Ne}combineTokensIntoWords(c,A,U=`"'\u201C\xA1\xBF([{-`,$=`"'.\u3002,\uFF0C!\uFF01?\uFF1F:\uFF1A\u201D)]}\u3001`){A=A??"english";let ie,Pe,Ne;return["chinese","japanese","thai","lao","myanmar"].includes(A)?[ie,Pe,Ne]=this.splitTokensOnUnicode(c):[ie,Pe,Ne]=this.splitTokensOnSpaces(c),this.mergePunctuations(ie,Pe,Ne,U,$)}decode(c,A){let U;return A?.decode_with_timestamps?(c instanceof f.Tensor&&(c=k(c)),U=this.decodeWithTimestamps(c,A)):U=super.decode(c,A),U}decodeWithTimestamps(c,A){let U=A?.time_precision??.02,$=Array.from(this.all_special_ids).at(-1)+1,ie=[[]];for(let Pe of c)if(Pe=Number(Pe),Pe>=$){let Ne=((Pe-$)*U).toFixed(2);ie.push(`<|${Ne}|>`),ie.push([])}else ie[ie.length-1].push(Pe);return ie=ie.map(Pe=>typeof Pe=="string"?Pe:super.decode(Pe,A)),ie.join("")}splitTokensOnUnicode(c){let A=this.decode(c,{decode_with_timestamps:!0}),U="\uFFFD",$=[],ie=[],Pe=[],Ne=[],Ve=[],ze=0;for(let Ie=0;Ie<c.length;++Ie){let _t=c[Ie];Ne.push(_t),Ve.push(Ie);let ot=this.decode(Ne,{decode_with_timestamps:!0});(!ot.includes(U)||A[ze+ot.indexOf(U)]===U)&&($.push(ot),ie.push(Ne),Pe.push(Ve),Ne=[],Ve=[],ze+=ot.length)}return[$,ie,Pe]}splitTokensOnSpaces(c){let[A,U,$]=this.splitTokensOnUnicode(c),ie=[],Pe=[],Ne=[],Ve=new RegExp(`^[${y}]$`,"gu");for(let ze=0;ze<A.length;++ze){let 
/**
 * Tokenizer that understands a leading `>>lang<<` language marker.
 *
 * `supported_language_codes` lists every vocabulary entry that starts with
 * such a marker.
 */
class hs extends Ze {
    /**
     * @param {Object} c Tokenizer definition, forwarded to the base class.
     * @param {Object} A Tokenizer config, forwarded to the base class.
     */
    constructor(c, A) {
        super(c, A);
        this.languageRegex = /^(>>\w+<<)\s*/g;

        // A global regex keeps `lastIndex` between `.test()` calls, so reusing
        // `languageRegex` inside `filter` skipped the entry after every match.
        // Test with a stateless (non-global) copy; the public property is unchanged.
        const languageTokenTest = new RegExp(
            this.languageRegex.source,
            this.languageRegex.flags.replace("g", ""),
        );
        this.supported_language_codes = this.model.vocab.filter((token) => languageTokenTest.test(token));

        console.warn('WARNING: `MarianTokenizer` is not yet supported by Hugging Face\'s "fast" tokenizers library. Therefore, you may experience slightly inaccurate results.');
    }

    /**
     * Encodes text, keeping a leading language marker as its own token.
     *
     * @param {string|null} c Text to encode.
     * @returns {string[]|null|undefined} Tokens; `null` for a `null` input.
     */
    _encode_text(c) {
        if (c === null) {
            return null;
        }

        // Splitting on a regex with one capture group yields
        // [before, marker, after] on a match and [text] otherwise.
        const [remainder, ...languageParts] = c.trim().split(this.languageRegex);

        if (languageParts.length === 0) {
            return super._encode_text(remainder);
        }

        if (languageParts.length === 2) {
            const [language, text] = languageParts;
            if (!this.supported_language_codes.includes(language)) {
                console.warn(`Unsupported language code "${language}" detected, which may lead to unexpected behavior. Should be one of: ${JSON.stringify(this.supported_language_codes)}`);
            }
            return (0, d.mergeArrays)([language], super._encode_text(text));
        }
    }
}
/**
 * Builds a cosine window of `N` samples: `w[n] = Q - (1 - Q) * cos(2πn / (N - 1))`.
 *
 * @param {number} N Number of samples.
 * @param {number} Q Constant coefficient of the window.
 * @returns {Float64Array} Empty for `N < 1`, `[1]` for `N === 1`, otherwise the window.
 */
function T(N, Q) {
    if (N < 1) {
        return new Float64Array();
    }
    if (N === 1) {
        return new Float64Array([1]);
    }

    const samples = new Float64Array(N);
    const angularStep = (2 * Math.PI) / (N - 1);
    const cosineWeight = 1 - Q;
    let index = 0;
    while (index < N) {
        samples[index] = Q - cosineWeight * Math.cos(index * angularStep);
        ++index;
    }
    return samples;
}

/**
 * Cosine window with coefficient 0.5.
 *
 * @param {number} N Number of samples.
 * @returns {Float64Array} The window.
 */
function _(N) {
    return T(N, 0.5);
}

/**
 * Cosine window with coefficient 0.54.
 *
 * @param {number} N Number of samples.
 * @returns {Float64Array} The window.
 */
function o(N) {
    return T(N, 0.54);
}
/**
 * Converts a spectrogram to decibels in place:
 * `factor * (log10(max(min_value, x)) - log10(reference))`, optionally clipped
 * so that no value lies more than `db_range` below the maximum.
 *
 * Fix: the log of the reference used to be subtracted *inside* the
 * `Math.log10(...)` argument, which gave wrong results for any reference
 * other than 1 (and NaN once the argument went non-positive). A `db_range`
 * of `undefined` is now treated like `null` instead of turning every value
 * into NaN.
 *
 * @param {Float32Array|Float64Array|number[]} N Spectrogram values; modified in place.
 * @param {number} Q Multiplicative factor (the callers in this module pass 20 or 10).
 * @param {number} K Reference value; must be > 0 and is raised to at least `J`.
 * @param {number} J Lower clamp applied to the values before the log; must be > 0.
 * @param {number|null} [te] Optional dynamic range in dB; must be > 0 when given.
 * @returns {Float32Array|Float64Array|number[]} The same array `N`.
 * @throws {Error} If `K`, `J` or a provided `te` is not greater than zero.
 */
function M(N, Q, K, J, te) {
    if (K <= 0) {
        throw new Error("reference must be greater than zero");
    }
    if (J <= 0) {
        throw new Error("min_value must be greater than zero");
    }

    const reference = Math.max(J, K);
    const logReference = Math.log10(reference);

    for (let idx = 0; idx < N.length; ++idx) {
        N[idx] = Q * (Math.log10(Math.max(J, N[idx])) - logReference);
    }

    if (te != null) {
        if (te <= 0) {
            throw new Error("db_range must be greater than zero");
        }
        // Clip everything that is more than `te` dB below the peak.
        const floor = (0, d.max)(N)[0] - te;
        for (let idx = 0; idx < N.length; ++idx) {
            N[idx] = Math.max(N[idx], floor);
        }
    }
    return N;
}
h(N,Q,K,J,{fft_length:te=null,power:se=1,center:ce=!0,pad_mode:we="reflect",onesided:_e=!0,preemphasis:X=null,preemphasis_htk_flavor:L=!0,mel_filters:W=null,mel_floor:Y=1e-10,log_mel:ae=null,reference:be=1,min_value:xe=1e-10,db_range:Le=null,remove_dc_offset:$e=null,min_num_frames:ge=null,max_num_frames:p=null,do_pad:q=!0,transpose:de=!1,mel_offset:pe=0}={}){let Te=Q.length;if(te===null&&(te=K),K>te)throw Error(`frame_length (${K}) may not be larger than fft_length (${te})`);if(Te!==K)throw new Error(`Length of the window (${Te}) must equal frame_length (${K})`);if(J<=0)throw new Error("hop_length must be greater than zero");if(se===null&&W!==null)throw new Error("You have provided `mel_filters` but `power` is `None`. Mel spectrogram computation is not yet supported for complex-valued spectrogram. Specify `power` to fix this issue.");if(!L)throw new Error("`preemphasis_htk_flavor=false` is not currently supported.");if(ce)switch(we){case"reflect":{let Re=Math.floor((te-1)/2)+1;N=P(N,Re,Re);break}case"constant":{let Re=Math.floor(te/2),ke=new N.constructor(N.length+2*Re);ke.set(N,Re),N=ke;break}default:throw new Error(`pad_mode="${we}" not implemented yet.`)}let me=Math.floor(1+Math.floor((N.length-K)/J));ge!==null&&me<ge&&(me=ge);let ne=_e?Math.floor(te/2)+1:te,fe=me,le=me;p!==null&&(p>me?q&&(le=p):le=fe=p);let he=new d.FFT(te),De=new Float64Array(te),ve=new Float64Array(he.outputBufferSize),ye=new Float32Array(ne*le);for(let Re=0;Re<fe;++Re){let ke=Re*J,qe=Math.min(N.length-ke,K);qe!==K&&De.fill(0,0,K);for(let je=0;je<qe;++je)De[je]=N[ke+je];if($e){let je=0;for(let ut=0;ut<qe;++ut)je+=De[ut];let nt=je/qe;for(let ut=0;ut<qe;++ut)De[ut]-=nt}if(X!==null){for(let je=qe-1;je>=1;--je)De[je]-=X*De[je-1];De[0]*=1-X}for(let je=0;je<Q.length;++je)De[je]*=Q[je];he.realTransform(ve,De);for(let je=0;je<ne;++je){let nt=je<<1;ye[je*le+Re]=ve[nt]**2+ve[nt+1]**2}}if(se!==null&&se!==2){let Re=se/2;for(let ke=0;ke<ye.length;++ke)ye[ke]**=Re}let Ce=W.length,Qe=await(0,f.matmul)(new 
/**
 * Creates a window of the requested type.
 *
 * Fix: `frame_length` and `center` were accepted but ignored, so a window
 * shorter than `frame_length` was returned unpadded. The window is now
 * zero-padded to `frame_length`, centred when `center` is true and
 * left-aligned otherwise.
 *
 * @param {number} N Window length in samples.
 * @param {string} Q One of "boxcar", "hann", "hann_window", "hamming", "povey".
 * @param {Object} [options]
 * @param {boolean} [options.periodic=true] Generate `N + 1` samples and drop the last one.
 * @param {number|null} [options.frame_length=null] When set, the result is zero-padded to this length.
 * @param {boolean} [options.center=true] Centre the window inside the padded frame.
 * @returns {Float64Array} The window (of length `frame_length` when that option is set).
 * @throws {Error} On an unknown window type, or when `N` exceeds `frame_length`.
 */
function F(N, Q, { periodic: K = true, frame_length: J = null, center: te = true } = {}) {
    const sampleCount = K ? N + 1 : N;

    let windowValues;
    switch (Q) {
        case "boxcar":
            windowValues = new Float64Array(sampleCount).fill(1);
            break;
        case "hann":
        case "hann_window":
            windowValues = _(sampleCount);
            break;
        case "hamming":
            windowValues = o(sampleCount);
            break;
        case "povey":
            windowValues = _(sampleCount).map((value) => Math.pow(value, 0.85));
            break;
        default:
            throw new Error(`Unknown window type ${Q}.`);
    }

    if (K) {
        windowValues = windowValues.subarray(0, N);
    }
    if (J === null) {
        return windowValues;
    }
    if (N > J) {
        throw new Error(`Length of the window (${N}) may not be larger than frame_length (${J})`);
    }
    if (N === J) {
        // Already frame-sized: nothing to pad.
        return windowValues;
    }

    const padded = new Float64Array(J);
    const offset = te ? Math.floor((J - N) / 2) : 0;
    padded.set(windowValues, offset);
    return padded;
}
/**
 * Copies the listed properties from `C` into a new object, skipping any
 * whose value is `undefined`.
 *
 * @param {Object} C Source object.
 * @param {string[]} B Property names to copy.
 * @returns {Object} A new object holding the selected properties.
 */
function k(C, B) {
    const picked = {};
    for (const key of B) {
        if (C[key] !== undefined) {
            picked[key] = C[key];
        }
    }
    return picked;
}
/**
 * Array-backed binary heap, optionally bounded in size.
 *
 * The element for which the comparator says "ranks above" every other one is
 * kept at the root. With the default comparator (`a > b`) this is a max-heap.
 */
class i {
    /**
     * @param {(a: any, b: any) => boolean} [comparator] Returns true when `a` ranks above `b`.
     * @param {number} [maxSize=Infinity] Maximum number of stored elements.
     */
    constructor(comparator = (a, b) => a > b, maxSize = Infinity) {
        this._heap = [];
        this._comparator = comparator;
        this._maxSize = maxSize;
    }

    /** Number of stored elements. */
    get size() {
        return this._heap.length;
    }

    /** @returns {boolean} True when nothing is stored. */
    isEmpty() {
        return this.size === 0;
    }

    /** @returns {any} The root element (undefined when empty). */
    peek() {
        return this._heap[0];
    }

    /**
     * Adds the given values.
     * @param {...any} values
     * @returns {number} The new size.
     */
    push(...values) {
        return this.extend(values);
    }

    /**
     * Adds every value of an iterable. Once the queue is full, a value only
     * gets in by replacing the element at the slot returned by `_smallest()`,
     * and only if the comparator ranks it above that element.
     *
     * @param {Iterable<any>} values
     * @returns {number} The new size.
     */
    extend(values) {
        for (const value of values) {
            if (this.size < this._maxSize) {
                this._heap.push(value);
                this._siftUp();
                continue;
            }
            const slot = this._smallest();
            if (this._comparator(value, this._heap[slot])) {
                this._heap[slot] = value;
                this._siftUpFrom(slot);
            }
        }
        return this.size;
    }

    /**
     * Removes and returns the root element.
     * @returns {any} The removed element (undefined when empty).
     */
    pop() {
        const top = this.peek();
        const lastIndex = this.size - 1;
        if (lastIndex > 0) {
            this._swap(0, lastIndex);
        }
        this._heap.pop();
        this._siftDown();
        return top;
    }

    /**
     * Replaces the root element and restores the heap order.
     * @param {any} value New element.
     * @returns {any} The previous root.
     */
    replace(value) {
        const previousTop = this.peek();
        this._heap[0] = value;
        this._siftDown();
        return previousTop;
    }

    _parent(index) {
        return ((index + 1) >>> 1) - 1;
    }

    _left(index) {
        return (index << 1) + 1;
    }

    _right(index) {
        return (index + 1) << 1;
    }

    /** True when the element at index `a` ranks above the one at index `b`. */
    _greater(a, b) {
        return this._comparator(this._heap[a], this._heap[b]);
    }

    _swap(a, b) {
        [this._heap[a], this._heap[b]] = [this._heap[b], this._heap[a]];
    }

    _siftUp() {
        this._siftUpFrom(this.size - 1);
    }

    /** Moves the element at `index` towards the root while it outranks its parent. */
    _siftUpFrom(index) {
        let node = index;
        while (node > 0) {
            const parent = this._parent(node);
            if (!this._greater(node, parent)) {
                break;
            }
            this._swap(node, parent);
            node = parent;
        }
    }

    /** Moves the root element down while one of its children outranks it. */
    _siftDown() {
        let node = 0;
        for (;;) {
            const left = this._left(node);
            const right = this._right(node);

            const leftOutranks = left < this.size && this._greater(left, node);
            const rightOutranks = !leftOutranks && right < this.size && this._greater(right, node);
            if (!leftOutranks && !rightOutranks) {
                break;
            }

            const child = right < this.size && this._greater(right, left) ? right : left;
            this._swap(node, child);
            node = child;
        }
    }

    /** Index of the first slot on the deepest level of the heap. */
    _smallest() {
        return 2 ** Math.floor(Math.log2(this.size)) - 1;
    }
}
/**
 * Splits text on a fixed dictionary of words using a trie, always preferring
 * the longest dictionary word that starts at the current position.
 */
class u {
    /**
     * @param {string[]} _ Dictionary words.
     */
    constructor(_) {
        this.trie = this._buildTrie(_);
    }

    /**
     * Builds a prototype-less nested-object trie keyed by single string units;
     * the node that completes a word stores that word under `end`.
     *
     * @param {string[]} _ Dictionary words.
     * @returns {Object} The trie root.
     */
    _buildTrie(_) {
        const root = Object.create(null);
        for (const word of _) {
            let node = root;
            for (let pos = 0; pos < word.length; ++pos) {
                const unit = word[pos];
                node[unit] ??= Object.create(null);
                node = node[unit];
            }
            node.end = word;
        }
        return root;
    }

    /**
     * Splits `_` into dictionary words and the text between them.
     *
     * @param {string} _ Text to split.
     * @returns {string[]} The pieces in order; empty in-between pieces are omitted.
     */
    split(_) {
        const pieces = [];
        const total = _.length;
        let pendingStart = 0; // start of text not yet emitted
        let cursor = 0;

        while (cursor < total) {
            // Walk the trie from `cursor`, remembering the longest complete word seen.
            let node = this.trie;
            let longest = null;
            for (let probe = cursor; probe < total; ++probe) {
                node = node[_[probe]];
                if (!node) {
                    break;
                }
                if (node.end) {
                    longest = node.end;
                }
            }

            if (!longest) {
                ++cursor;
                continue;
            }

            if (cursor > pendingStart) {
                pieces.push(_.slice(pendingStart, cursor));
            }
            pieces.push(longest);
            cursor += longest.length;
            pendingStart = cursor;
        }

        if (pendingStart < total) {
            pieces.push(_.slice(pendingStart));
        }
        return pieces;
    }
}
/**
 * Base class whose instances can be invoked like functions.
 *
 * The constructor returns a function object (instead of `this`) that forwards
 * every call to its own `_call` method and carries the prototype of the class
 * being constructed, so subclass methods and `instanceof` keep working.
 */
let i = class {
    constructor() {
        const callable = function (...args) {
            return callable._call(...args);
        };
        Object.setPrototypeOf(callable, new.target.prototype);
        return callable;
    }

    /**
     * Invoked when the instance is called; subclasses must override it.
     *
     * @param {...any} d Call arguments.
     * @throws {Error} Always, in this base implementation.
     */
    _call(...d) {
        throw Error("Must implement _call method in subclass");
    }
};
/**
 * Checks whether a value parses as a URL and, optionally, whether its protocol
 * and hostname are on the supplied allow-lists.
 * @param {string|URL} l Candidate URL.
 * @param {string[]|null} [h=null] Allowed protocols (for example "https:"); skipped when falsy.
 * @param {string[]|null} [F=null] Allowed hostnames; skipped when falsy.
 * @returns {boolean} `false` when parsing fails or a provided list rejects the URL, otherwise `true`.
 */
function T(l, h = null, F = null) {
  let parsed;
  try {
    parsed = new URL(l);
  } catch {
    // Not parseable as an absolute URL.
    return false;
  }

  if (h && !h.includes(parsed.protocol)) {
    return false;
  }
  if (F && !F.includes(parsed.hostname)) {
    return false;
  }
  return true;
}
/**
 * File-system backed cache exposing the `match` / `put` subset of the Web Cache API.
 * Entries are stored as files underneath a root directory.
 */
class G {
  /**
   * @param {string} h Root directory under which entries are stored.
   */
  constructor(h) {
    this.path = h;
  }

  /**
   * Looks up an entry.
   * @param {string} h Entry key, joined onto the cache root.
   * @returns {Promise<object|undefined>} A file-backed response object when the
   *   file exists, otherwise `undefined`.
   */
  async match(h) {
    const filePath = d.default.join(this.path, h);
    const file = new m(filePath);
    if (file.exists) {
      return file;
    }
    return undefined;
  }

  /**
   * Streams a response body into the cache.
   * @param {string} h Entry key, joined onto the cache root.
   * @param {{headers: {get: Function}, body: {getReader: Function}}} F Response to store.
   * @param {(info: {progress: number, loaded: number, total: number}) => void} [S]
   *   Optional callback invoked after every chunk is written.
   * @returns {Promise<void>} Resolves once the file has been written and closed.
   * @throws Rethrows any read or write failure after removing the partial file.
   */
  async put(h, F, S = undefined) {
    const outputPath = d.default.join(this.path, h);
    let fileStream;
    try {
      const contentLength = F.headers.get("Content-Length");
      const parsedLength = Number.parseInt(contentLength ?? "0", 10);
      // A missing or malformed header means "total unknown"; report it as 0, not NaN.
      const total = Number.isFinite(parsedLength) ? parsedLength : 0;
      let loaded = 0;

      await i.default.promises.mkdir(d.default.dirname(outputPath), { recursive: true });
      fileStream = i.default.createWriteStream(outputPath);

      // Without a listener, a stream failure (for example the open failing) is
      // raised as an unhandled 'error' event instead of rejecting this call.
      let streamError = null;
      fileStream.on("error", (error) => {
        streamError ??= error;
      });

      const reader = F.body.getReader();
      while (true) {
        const { done, value } = await reader.read();
        if (done) {
          break;
        }
        await new Promise((resolve, reject) => {
          fileStream.write(value, (error) => (error ? reject(error) : resolve()));
        });
        loaded += value.length;
        const progress = total ? (loaded / total) * 100 : 0;
        S?.({ progress, loaded, total });
      }

      // Wait for the stream to close so the entry is complete when we resolve.
      await new Promise((resolve) => {
        fileStream.close(() => resolve());
      });
      if (streamError) {
        throw streamError;
      }
    } catch (error) {
      // Release the stream before removing the partial file.
      fileStream?.destroy();
      try {
        await i.default.promises.unlink(outputPath);
      } catch {
        // Best-effort cleanup: the file may never have been created.
      }
      throw error;
    }
  }
}
Fix by setting `env.allowLocalModels` or `env.allowRemoteModels` to `true`.")}(0,I.dispatchCallback)(S.progress_callback,{status:"initiate",name:l,file:h});let R;if(!R&&g.env.useCustomCache){if(!g.env.customCache)throw Error("`env.useCustomCache=true`, but `env.customCache` is not defined.");if(!g.env.customCache.match||!g.env.customCache.put)throw new Error("`env.customCache` must be an object which implements the `match` and `put` functions of the Web Cache API. For more information, see https://developer.mozilla.org/en-US/docs/Web/API/Cache");R=g.env.customCache}if(!R&&g.env.useBrowserCache){if(typeof caches>"u")throw Error("Browser cache is not available in this environment.");try{R=await caches.open("transformers-cache")}catch(Y){console.warn("An error occurred while opening the browser cache:",Y)}}if(!R&&g.env.useFSCache){if(!g.apis.IS_FS_AVAILABLE)throw Error("File System Cache is not available in this environment.");R=new G(S.cache_dir??g.env.cacheDir)}let N=S.revision??"main",Q=y(l,h),K=o(l),J=K?y(g.env.localModelPath,Q):Q,te=y(g.env.remoteHost,g.env.remotePathTemplate.replaceAll("{model}",l).replaceAll("{revision}",encodeURIComponent(N)),h),se,ce=R instanceof G?N==="main"?Q:y(l,N,h):te,we=!1,_e;R&&(_e=await b(R,J,ce));let X=_e!==void 0;if(_e===void 0){if(g.env.allowLocalModels)if(T(Q,["http:","https:"])){if(S.local_files_only)throw new Error(`\`local_files_only=true\`, but attempted to load a remote file from: ${Q}.`);if(!g.env.allowRemoteModels)throw new Error(`\`env.allowRemoteModels=false\`, but attempted to load a remote file from: ${Q}.`)}else try{_e=await x(J),se=J}catch(ae){console.warn(`Unable to load from local path "${J}": "${ae}"`)}if(_e===void 0||_e.status===404){if(S.local_files_only||!g.env.allowRemoteModels){if(F)throw Error(`\`local_files_only=true\` or \`env.allowRemoteModels=false\` and file was not found locally at "${J}".`);return null}if(!K)throw Error(`Local file missing at "${J}" and download aborted due to invalid model ID 
"${l}".`);if(_e=await x(te),_e.status!==200)return k(_e.status,te,F);se=ce}we=R&&typeof Response<"u"&&_e instanceof Response&&_e.status===200}(0,I.dispatchCallback)(S.progress_callback,{status:"download",name:l,file:h});let L;if(!(g.apis.IS_NODE_ENV&&V)){let Y;S.progress_callback?X&&typeof navigator<"u"&&/firefox/i.test(navigator.userAgent)?(Y=new Uint8Array(await _e.arrayBuffer()),(0,I.dispatchCallback)(S.progress_callback,{status:"progress",name:l,file:h,progress:100,loaded:Y.length,total:Y.length})):Y=await M(_e,ae=>{(0,I.dispatchCallback)(S.progress_callback,{status:"progress",name:l,file:h,...ae})}):Y=new Uint8Array(await _e.arrayBuffer()),L=Y}if(we&&se&&await R.match(se)===void 0)if(L)await R.put(se,new Response(L,{headers:_e.headers})).catch(Y=>{console.warn(`Unable to add response to browser cache: ${Y}.`)});else{let Y=S.progress_callback?ae=>(0,I.dispatchCallback)(S.progress_callback,{status:"progress",name:l,file:h,...ae}):void 0;await R.put(se,_e,Y)}if((0,I.dispatchCallback)(S.progress_callback,{status:"done",name:l,file:h}),L){if(!g.apis.IS_NODE_ENV&&V)throw new Error("Cannot return path in a browser environment.");return L}if(_e instanceof m)return _e.filePath;let W=await R?.match(se);if(W instanceof m)return W.filePath;if(W instanceof Response)return new Uint8Array(await W.arrayBuffer());if(typeof W=="string")return W;throw new Error("Unable to get model file path or buffer.")}async function B(l,h,F=!0,S={}){let V=await C(l,h,F,S,!1);return V===null?null:new TextDecoder("utf-8").decode(V)}async function P(l,h,F=!0,S={}){let V=await B(l,h,F,S);return V===null?{}:JSON.parse(V)}async function M(l,h){let F=l.headers.get("Content-Length");F===null&&console.warn("Unable to determine content-length from response headers. 
/**
 * Joins path segments with "/".
 * One leading slash is removed from every segment except the first, and one
 * trailing slash from every segment except the last.
 * @param {...string} l Path segments.
 * @returns {string} The joined path.
 */
function y(...l) {
  const lastIndex = l.length - 1;
  const cleaned = [];
  for (let idx = 0; idx < l.length; ++idx) {
    let part = l[idx];
    if (idx !== 0) {
      part = part.replace(/^\//, "");
    }
    if (idx !== lastIndex) {
      part = part.replace(/\/$/, "");
    }
    cleaned.push(part);
  }
  return cleaned.join("/");
}
browser environments.");let B=b.getContext("2d").getImageData(0,0,b.width,b.height).data;return new w(B,b.width,b.height,4)}static async fromURL(b){let C=await(0,d.getFile)(b);if(C.status!==200)throw new Error(`Unable to read image from "${b}" (${C.status} ${C.statusText})`);let B=await C.blob();return this.fromBlob(B)}static async fromBlob(b){if(_){let C=await T(b),B=u(C.width,C.height).getContext("2d");return B.drawImage(C,0,0),new this(B.getImageData(0,0,C.width,C.height).data,C.width,C.height,4)}else{let C=(0,f.default)(await b.arrayBuffer());return await T(C)}}static fromTensor(b,C="CHW"){if(b.dims.length!==3)throw new Error(`Tensor should have 3 dimensions, but has ${b.dims.length} dimensions.`);if(C==="CHW")b=b.transpose(1,2,0);else if(C!=="HWC")throw new Error(`Unsupported channel format: ${C}`);if(!(b.data instanceof Uint8ClampedArray||b.data instanceof Uint8Array))throw new Error(`Unsupported tensor type: ${b.type}`);switch(b.dims[2]){case 1:case 2:case 3:case 4:return new w(b.data,b.dims[1],b.dims[0],b.dims[2]);default:throw new Error(`Unsupported number of channels: ${b.dims[2]}`)}}grayscale(){if(this.channels===1)return this;let b=new Uint8ClampedArray(this.width*this.height*1);switch(this.channels){case 3:case 4:for(let C=0,B=0;C<this.data.length;C+=this.channels){let P=this.data[C],M=this.data[C+1],y=this.data[C+2];b[B++]=Math.round(.2989*P+.587*M+.114*y)}break;default:throw new Error(`Conversion failed due to unsupported number of channels: ${this.channels}`)}return this._update(b,this.width,this.height,1)}rgb(){if(this.channels===3)return this;let b=new Uint8ClampedArray(this.width*this.height*3);switch(this.channels){case 1:for(let C=0,B=0;C<this.data.length;++C)b[B++]=this.data[C],b[B++]=this.data[C],b[B++]=this.data[C];break;case 4:for(let C=0,B=0;C<this.data.length;C+=4)b[B++]=this.data[C],b[B++]=this.data[C+1],b[B++]=this.data[C+2];break;default:throw new Error(`Conversion failed due to unsupported number of channels: ${this.channels}`)}return 
this._update(b,this.width,this.height,3)}rgba(){if(this.channels===4)return this;let b=new Uint8ClampedArray(this.width*this.height*4);switch(this.channels){case 1:for(let C=0,B=0;C<this.data.length;++C)b[B++]=this.data[C],b[B++]=this.data[C],b[B++]=this.data[C],b[B++]=255;break;case 3:for(let C=0,B=0;C<this.data.length;C+=3)b[B++]=this.data[C],b[B++]=this.data[C+1],b[B++]=this.data[C+2],b[B++]=255;break;default:throw new Error(`Conversion failed due to unsupported number of channels: ${this.channels}`)}return this._update(b,this.width,this.height,4)}putAlpha(b){if(b.width!==this.width||b.height!==this.height)throw new Error(`Expected mask size to be ${this.width}x${this.height}, but got ${b.width}x${b.height}`);if(b.channels!==1)throw new Error(`Expected mask to have 1 channel, but got ${b.channels}`);let C=this.data,B=b.data,P=this.width*this.height;if(this.channels===3){let M=new Uint8ClampedArray(P*4);for(let y=0,l=0,h=0;y<P;++y)M[h++]=C[l++],M[h++]=C[l++],M[h++]=C[l++],M[h++]=B[y];return this._update(M,this.width,this.height,4)}else if(this.channels===4){for(let M=0;M<P;++M)C[4*M+3]=B[M];return this}throw new Error(`Expected image to have 3 or 4 channels, but got ${this.channels}`)}async resize(b,C,{resample:B=2}={}){if(this.width===b&&this.height===C)return this;let P=o[B]??B,M=(0,i.isNullishDimension)(b),y=(0,i.isNullishDimension)(C);if(M&&y)return this;if(M?b=C/this.height*this.width:y&&(C=b/this.width*this.height),_){let l=this.channels,h=this.toCanvas(),F=u(b,C).getContext("2d");return F.drawImage(h,0,0,b,C),new w(F.getImageData(0,0,b,C).data,b,C,4).convert(l)}else{let l=this.toSharp();switch(P){case"box":case"hamming":(P==="box"||P==="hamming")&&(console.warn(`Resampling method ${P} is not yet supported. 
Using bilinear instead.`),P="bilinear");case"nearest":case"bilinear":case"bicubic":l=l.affine([b/this.width,0,0,C/this.height],{interpolator:P});break;case"lanczos":l=l.resize({width:b,height:C,fit:"fill",kernel:"lanczos3"});break;default:throw new Error(`Resampling method ${P} is not supported.`)}return await T(l)}}async pad([b,C,B,P]){if(b=Math.max(b,0),C=Math.max(C,0),B=Math.max(B,0),P=Math.max(P,0),b===0&&C===0&&B===0&&P===0)return this;if(_){let M=this.channels,y=this.toCanvas(),l=this.width+b+C,h=this.height+B+P,F=u(l,h).getContext("2d");return F.drawImage(y,0,0,this.width,this.height,b,B,this.width,this.height),new w(F.getImageData(0,0,l,h).data,l,h,4).convert(M)}else{let M=this.toSharp().extend({left:b,right:C,top:B,bottom:P});return await T(M)}}async crop([b,C,B,P]){if(b=Math.max(b,0),C=Math.max(C,0),B=Math.min(B,this.width-1),P=Math.min(P,this.height-1),b===0&&C===0&&B===this.width-1&&P===this.height-1)return this;let M=B-b+1,y=P-C+1;if(_){let l=this.channels,h=this.toCanvas(),F=u(M,y).getContext("2d");return F.drawImage(h,b,C,M,y,0,0,M,y),new w(F.getImageData(0,0,M,y).data,M,y,4).convert(l)}else{let l=this.toSharp().extract({left:b,top:C,width:M,height:y});return await T(l)}}async center_crop(b,C){if(this.width===b&&this.height===C)return this;let B=(this.width-b)/2,P=(this.height-C)/2;if(_){let M=this.channels,y=this.toCanvas(),l=u(b,C).getContext("2d"),h=0,F=0,S=0,V=0;return B>=0?h=B:S=-B,P>=0?F=P:V=-P,l.drawImage(y,h,F,b,C,S,V,b,C),new w(l.getImageData(0,0,b,C).data,b,C,4).convert(M)}else{let M=this.toSharp();if(B>=0&&P>=0)M=M.extract({left:Math.floor(B),top:Math.floor(P),width:b,height:C});else if(B<=0&&P<=0){let y=Math.floor(-P),l=Math.floor(-B);M=M.extend({top:y,left:l,right:b-this.width-l,bottom:C-this.height-y})}else{let y=[0,0],l=0;P<0?(y[0]=Math.floor(-P),y[1]=C-this.height-y[0]):l=Math.floor(P);let 
h=[0,0],F=0;B<0?(h[0]=Math.floor(-B),h[1]=b-this.width-h[0]):F=Math.floor(B),M=M.extend({top:y[0],bottom:y[1],left:h[0],right:h[1]}).extract({left:F,top:l,width:b,height:C})}return await T(M)}}async toBlob(b="image/png",C=1){if(!_)throw new Error("toBlob() is only supported in browser environments.");return await this.toCanvas().convertToBlob({type:b,quality:C})}toTensor(b="CHW"){let C=new I.Tensor("uint8",new Uint8Array(this.data),[this.height,this.width,this.channels]);if(b!=="HWC")if(b==="CHW")C=C.permute(2,0,1);else throw new Error(`Unsupported channel format: ${b}`);return C}toCanvas(){if(!_)throw new Error("toCanvas() is only supported in browser environments.");let b=this.clone().rgba(),C=u(b.width,b.height),B=new m(b.data,b.width,b.height);return C.getContext("2d").putImageData(B,0,0),C}split(){let{data:b,width:C,height:B,channels:P}=this,M=b.constructor,y=b.length/P,l=Array.from({length:P},()=>new M(y));for(let h=0;h<y;++h){let F=P*h;for(let S=0;S<P;++S)l[S][h]=b[F+S]}return l.map(h=>new w(h,C,B,1))}_update(b,C,B,P=null){return this.data=b,this.width=C,this.height=B,P!==null&&(this.channels=P),this}clone(){return new w(this.data.slice(),this.width,this.height,this.channels)}convert(b){if(this.channels===b)return this;switch(b){case 1:this.grayscale();break;case 3:this.rgb();break;case 4:this.rgba();break;default:throw new Error(`Conversion failed due to unsupported number of channels: ${this.channels}`)}return this}async save(b){if(_){if(g.apis.IS_WEBWORKER_ENV)throw new Error("Unable to save an image from a Web Worker.");let C=b.split(".").pop().toLowerCase(),B=x.get(C)??"image/png",P=await this.toBlob(B);(0,i.saveBlob)(b,P)}else{if(g.apis.IS_FS_AVAILABLE)return await this.toSharp().toFile(b);throw new Error("Unable to save the image because filesystem is disabled in this environment.")}}toSharp(){if(_)throw new Error("toSharp() is only supported in server-side 
/**
 * Reorders the axes of a flat, row-major array.
 * @param {Array|TypedArray} P Flat input data; the result is built with the same constructor.
 * @param {number[]} M Shape of the input.
 * @param {number[]} y For every output axis, the index of the input axis it is taken from.
 * @returns {[Array|TypedArray, number[]]} The permuted flat data and its new shape.
 */
function d(P, M, y) {
  const rank = y.length;
  const shape = new Array(rank);
  const outStrides = new Array(rank);

  // Walk the axes from innermost to outermost to build the output shape and
  // its row-major strides.
  let running = 1;
  for (let axis = rank - 1; axis >= 0; --axis) {
    outStrides[axis] = running;
    shape[axis] = M[y[axis]];
    running *= shape[axis];
  }

  // Output stride that each *input* axis contributes to.
  const srcStrides = y.map((_, srcAxis) => outStrides[y.indexOf(srcAxis)]);

  const permuted = new P.constructor(P.length);
  for (let flat = 0; flat < P.length; ++flat) {
    // Decompose the flat input index into coordinates and re-project them.
    let target = 0;
    let rest = flat;
    let axis = M.length - 1;
    while (axis >= 0) {
      const extent = M[axis];
      target += (rest % extent) * srcStrides[axis];
      rest = Math.floor(rest / extent);
      --axis;
    }
    permuted[target] = P[flat];
  }

  return [permuted, shape];
}
x{constructor(M){if(this.size=M|0,this.size<=1||!o(this.size))throw new Error("FFT size must be a power of two larger than 1");this._csize=M<<1,this.table=new Float64Array(this.size*2);for(let l=0;l<this.table.length;l+=2){let h=Math.PI*l/this.size;this.table[l]=Math.cos(h),this.table[l+1]=-Math.sin(h)}let y=0;for(let l=1;this.size>l;l<<=1)++y;this._width=y%2===0?y-1:y,this._bitrev=new Int32Array(1<<this._width);for(let l=0;l<this._bitrev.length;++l){this._bitrev[l]=0;for(let h=0;h<this._width;h+=2){let F=this._width-h-2;this._bitrev[l]|=(l>>>h&3)<<F}}}createComplexArray(){return new Float64Array(this._csize)}fromComplexArray(M,y){let l=y||new Array(M.length>>>1);for(let h=0;h<M.length;h+=2)l[h>>>1]=M[h];return l}toComplexArray(M,y){let l=y||this.createComplexArray();for(let h=0;h<l.length;h+=2)l[h]=M[h>>>1],l[h+1]=0;return l}transform(M,y){if(M===y)throw new Error("Input and output buffers must be different");this._transform4(M,y,1)}realTransform(M,y){if(M===y)throw new Error("Input and output buffers must be different");this._realTransform4(M,y,1)}inverseTransform(M,y){if(M===y)throw new Error("Input and output buffers must be different");this._transform4(M,y,-1);for(let l=0;l<M.length;++l)M[l]/=this.size}_transform4(M,y,l){let h=this._csize,S=1<<this._width,V=h/S<<1,R,N,Q=this._bitrev;if(V===4)for(R=0,N=0;R<h;R+=V,++N){let J=Q[N];this._singleTransform2(y,M,R,J,S)}else for(R=0,N=0;R<h;R+=V,++N){let J=Q[N];this._singleTransform4(y,M,R,J,S,l)}let K=this.table;for(S>>=2;S>=2;S>>=2){V=h/S<<1;let J=V>>>2;for(R=0;R<h;R+=V){let te=R+J-1;for(let se=R,ce=0;se<te;se+=2,ce+=S){let 
we=se,_e=we+J,X=_e+J,L=X+J,W=M[we],Y=M[we+1],ae=M[_e],be=M[_e+1],xe=M[X],Le=M[X+1],$e=M[L],ge=M[L+1],p=K[ce],q=l*K[ce+1],de=ae*p-be*q,pe=ae*q+be*p,Te=K[2*ce],me=l*K[2*ce+1],ne=xe*Te-Le*me,fe=xe*me+Le*Te,le=K[3*ce],he=l*K[3*ce+1],De=$e*le-ge*he,ve=$e*he+ge*le,ye=W+ne,Ce=Y+fe,Qe=W-ne,Be=Y-fe,Re=de+De,ke=pe+ve,qe=l*(de-De),je=l*(pe-ve);M[we]=ye+Re,M[we+1]=Ce+ke,M[_e]=Qe+je,M[_e+1]=Be-qe,M[X]=ye-Re,M[X+1]=Ce-ke,M[L]=Qe-je,M[L+1]=Be+qe}}}}_singleTransform2(M,y,l,h,F){let S=M[h],V=M[h+1],R=M[h+F],N=M[h+F+1];y[l]=S+R,y[l+1]=V+N,y[l+2]=S-R,y[l+3]=V-N}_singleTransform4(M,y,l,h,F,S){let V=F*2,R=F*3,N=M[h],Q=M[h+1],K=M[h+F],J=M[h+F+1],te=M[h+V],se=M[h+V+1],ce=M[h+R],we=M[h+R+1],_e=N+te,X=Q+se,L=N-te,W=Q-se,Y=K+ce,ae=J+we,be=S*(K-ce),xe=S*(J-we);y[l]=_e+Y,y[l+1]=X+ae,y[l+2]=L+xe,y[l+3]=W-be,y[l+4]=_e-Y,y[l+5]=X-ae,y[l+6]=L-xe,y[l+7]=W+be}_realTransform4(M,y,l){let h=this._csize,S=1<<this._width,V=h/S<<1,R,N,Q=this._bitrev;if(V===4)for(R=0,N=0;R<h;R+=V,++N){let te=Q[N];this._singleRealTransform2(y,M,R,te>>>1,S>>>1)}else for(R=0,N=0;R<h;R+=V,++N){let te=Q[N];this._singleRealTransform4(y,M,R,te>>>1,S>>>1,l)}let K=this.table;for(S>>=2;S>=2;S>>=2){V=h/S<<1;let te=V>>>1,se=te>>>1,ce=se>>>1;for(R=0;R<h;R+=V)for(let we=0,_e=0;we<=ce;we+=2,_e+=S){let X=R+we,L=X+se,W=L+se,Y=W+se,ae=M[X],be=M[X+1],xe=M[L],Le=M[L+1],$e=M[W],ge=M[W+1],p=M[Y],q=M[Y+1],de=ae,pe=be,Te=K[_e],me=l*K[_e+1],ne=xe*Te-Le*me,fe=xe*me+Le*Te,le=K[2*_e],he=l*K[2*_e+1],De=$e*le-ge*he,ve=$e*he+ge*le,ye=K[3*_e],Ce=l*K[3*_e+1],Qe=p*ye-q*Ce,Be=p*Ce+q*ye,Re=de+De,ke=pe+ve,qe=de-De,je=pe-ve,nt=ne+Qe,ut=fe+Be,Pt=l*(ne-Qe),jt=l*(fe-Be);if(M[X]=Re+nt,M[X+1]=ke+ut,M[L]=qe+jt,M[L+1]=je-Pt,we===0){M[W]=Re-nt,M[W+1]=ke-ut;continue}if(we===ce)continue;let ft=R+se-we,$t=R+te-we;M[ft]=qe-l*jt,M[ft+1]=-je-l*Pt,M[$t]=Re-l*nt,M[$t+1]=-ke+l*ut}}let J=h>>>1;for(let te=2;te<J;te+=2)M[h-te]=M[te],M[h-te+1]=-M[te+1]}_singleRealTransform2(M,y,l,h,F){let S=M[h],V=M[h+F];y[l]=S+V,y[l+1]=0,y[l+2]=S-V,y[l+3]=0}_singleRealTransform4(M,y,l,h,F,S){let 
/**
 * Applies a 1-D median filter, reflecting indices at both ends of the data.
 * @param {Array<number>|TypedArray} P Input samples; the output uses the same constructor.
 * @param {number} M Window size; must be a positive odd number.
 * @returns {Array<number>|TypedArray} Filtered data with the same length as the input.
 * @throws {Error} If the window size is even or not positive.
 */
function G(P, M) {
  if (M % 2 === 0 || M <= 0) {
    throw new Error("Window size must be a positive odd number");
  }

  const output = new P.constructor(P.length);
  const window = new P.constructor(M);
  const half = Math.floor(M / 2);

  // Typed arrays sort numerically by default. Plain arrays sort as strings,
  // which gives wrong medians (for example 100 before 9), so they need an
  // explicit numeric comparator.
  const sortWindow = ArrayBuffer.isView(window)
    ? () => window.sort()
    : () => window.sort((a, b) => a - b);

  for (let center = 0; center < P.length; ++center) {
    let filled = 0;
    for (let offset = -half; offset <= half; ++offset) {
      let index = center + offset;
      if (index < 0) {
        // Reflect around the first sample.
        index = Math.abs(index);
      } else if (index >= P.length) {
        // Reflect around the last sample.
        index = 2 * (P.length - 1) - index;
      }
      window[filled++] = P[index];
    }
    sortWindow();
    output[center] = window[half];
  }

  return output;
}
location(){return this.ort_tensor.location}ort_tensor;constructor(...L){return(0,d.isONNXTensor)(L[0])?this.ort_tensor=L[0]:this.ort_tensor=new d.Tensor(L[0],L[1],L[2]),new Proxy(this,{get:(W,Y)=>{if(typeof Y=="string"){let ae=Number(Y);if(Number.isInteger(ae))return W._getitem(ae)}return W[Y]},set:(W,Y,ae)=>W[Y]=ae})}dispose(){this.ort_tensor.dispose()}*[Symbol.iterator](){let[L,...W]=this.dims;if(W.length>0){let Y=W.reduce((ae,be)=>ae*be);for(let ae=0;ae<L;++ae)yield this._subarray(ae,Y,W)}else yield*this.data}_getitem(L){let[W,...Y]=this.dims;if(L=M(L,W),Y.length>0){let ae=Y.reduce((be,xe)=>be*xe);return this._subarray(L,ae,Y)}else return new f(this.type,[this.data[L]],Y)}indexOf(L){let W=this.data;for(let Y=0;Y<W.length;++Y)if(W[Y]==L)return Y;return-1}_subarray(L,W,Y){let ae=L*W,be=(L+1)*W,xe="subarray"in this.data?this.data.subarray(ae,be):this.data.slice(ae,be);return new f(this.type,xe,Y)}item(){let L=this.data;if(L.length!==1)throw new Error(`a Tensor with ${L.length} elements cannot be converted to Scalar`);return L[0]}tolist(){return u(this.data,this.dims)}sigmoid(){return this.clone().sigmoid_()}sigmoid_(){let L=this.data;for(let W=0;W<L.length;++W)L[W]=1/(1+Math.exp(-L[W]));return this}map(L){return this.clone().map_(L)}map_(L){let W=this.data;for(let Y=0;Y<W.length;++Y)W[Y]=L(W[Y],Y,W);return this}mul(L){return this.clone().mul_(L)}mul_(L){let W=this.data;for(let Y=0;Y<W.length;++Y)W[Y]*=L;return this}div(L){return this.clone().div_(L)}div_(L){let W=this.data;for(let Y=0;Y<W.length;++Y)W[Y]/=L;return this}add(L){return this.clone().add_(L)}add_(L){let W=this.data;for(let Y=0;Y<W.length;++Y)W[Y]+=L;return this}sub(L){return this.clone().sub_(L)}sub_(L){let W=this.data;for(let Y=0;Y<W.length;++Y)W[Y]-=L;return this}clone(){return new f(this.type,this.data.slice(),this.dims.slice())}slice(...L){let W=[],Y=[];for(let p=0;p<this.dims.length;++p){let q=L[p];if(q==null)Y.push([0,this.dims[p]]),W.push(this.dims[p]);else if(typeof 
q=="number")q=M(q,this.dims[p],p),Y.push([q,q+1]);else if(Array.isArray(q)&&q.length===2){let[de,pe]=q;if(de=de===null?0:M(de,this.dims[p],p,!1),pe=pe===null?this.dims[p]:M(pe,this.dims[p],p,!1),de>pe)throw new Error(`Invalid slice: ${q}`);let Te=[Math.max(de,0),Math.min(pe,this.dims[p])];Y.push(Te),W.push(Te[1]-Te[0])}else throw new Error(`Invalid slice: ${q}`)}let ae=Y.map(([p,q])=>q-p),be=ae.reduce((p,q)=>p*q),xe=this.data,Le=new xe.constructor(be),$e=this.stride(),ge=!0;for(let p=1;p<ae.length;++p)if(Y[p][0]!==0||Y[p][1]!==this.dims[p]){ge=!1;break}if(ge){let p=Y[0][0]*$e[0],q=Y[0][1]*$e[0];if(ArrayBuffer.isView(xe))Le.set(xe.subarray(p,q));else if(Array.isArray(xe)){let de=xe.slice(p,q);for(let pe=0;pe<de.length;++pe)Le[pe]=de[pe]}else throw new Error("Unsupported data type for slicing")}else for(let p=0;p<be;++p){let q=0;for(let de=ae.length-1,pe=p;de>=0;--de){let Te=ae[de];q+=(pe%Te+Y[de][0])*$e[de],pe=Math.floor(pe/Te)}Le[p]=xe[q]}return new f(this.type,Le,W)}permute(...L){return m(this,L)}transpose(...L){return this.permute(...L)}sum(L=null,W=!1){return this.norm(1,L,W)}norm(L="fro",W=null,Y=!1){if(L==="fro")L=2;else if(typeof L=="string")throw Error(`Unsupported norm: ${L}`);let ae=this.data,be=(ge,p)=>ge+p**L;if(W===null){let ge=ae.reduce(be,0)**(1/L);return new f(this.type,[ge],[])}let[xe,Le,$e]=h(be,this,W,Y);if(L!==1)for(let ge=0;ge<Le.length;++ge)Le[ge]=Le[ge]**(1/L);return new f(xe,Le,$e)}normalize_(L=2,W=1){W=M(W,this.dims.length);let Y=this.norm(L,W,!0),ae=this.data,be=Y.data;for(let xe=0;xe<ae.length;++xe){let Le=0;for(let $e=this.dims.length-1,ge=xe,p=1;$e>=0;--$e){let q=this.dims[$e];if($e!==W){let de=ge%q;Le+=de*p,p*=this.dims[$e]}ge=Math.floor(ge/q)}ae[xe]/=be[Le]}return this}normalize(L=2,W=1){return this.clone().normalize_(L,W)}stride(){return V(this.dims)}squeeze(L=null){return new f(this.type,this.data,B(this.dims,L))}squeeze_(L=null){return this.dims=B(this.dims,L),this}unsqueeze(L=null){return new 
f(this.type,this.data,P(this.dims,L))}unsqueeze_(L=null){return this.dims=P(this.dims,L),this}flatten_(L=0,W=-1){W=(W+this.dims.length)%this.dims.length;let Y=this.dims.slice(0,L),ae=this.dims.slice(L,W+1),be=this.dims.slice(W+1);return this.dims=[...Y,ae.reduce((xe,Le)=>xe*Le,1),...be],this}flatten(L=0,W=-1){return this.clone().flatten_(L,W)}view(...L){let W=-1;for(let ae=0;ae<L.length;++ae)if(L[ae]===-1){if(W!==-1)throw new Error("Only one dimension can be inferred");W=ae}let Y=this.data;if(W!==-1){let ae=L.reduce((be,xe,Le)=>Le!==W?be*xe:be,1);L[W]=Y.length/ae}return new f(this.type,Y,L)}neg_(){let L=this.data;for(let W=0;W<L.length;++W)L[W]=-L[W];return this}neg(){return this.clone().neg_()}gt(L){let W=new Uint8Array(this.data.length),Y=this.data;for(let ae=0;ae<Y.length;++ae)W[ae]=Y[ae]>L?1:0;return new f("bool",W,this.dims)}lt(L){let W=new Uint8Array(this.data.length),Y=this.data;for(let ae=0;ae<Y.length;++ae)W[ae]=Y[ae]<L?1:0;return new f("bool",W,this.dims)}clamp_(L,W){let Y=this.data;for(let ae=0;ae<Y.length;++ae)Y[ae]=Math.min(Math.max(Y[ae],L),W);return this}clamp(L,W){return this.clone().clamp_(L,W)}round_(){let L=this.data;for(let W=0;W<L.length;++W)L[W]=Math.round(L[W]);return this}round(){return this.clone().round_()}mean(L=null,W=!1){return S(this,L,W)}min(L=null,W=!1){if(L===null){let xe=(0,i.min)(this.data)[0];return new f(this.type,[xe],[])}let[Y,ae,be]=h((xe,Le)=>Math.min(xe,Le),this,L,W,1/0);return new f(Y,ae,be)}max(L=null,W=!1){if(L===null){let xe=(0,i.max)(this.data)[0];return new f(this.type,[xe],[])}let[Y,ae,be]=h((xe,Le)=>Math.max(xe,Le),this,L,W,-1/0);return new f(Y,ae,be)}argmin(L=null,W=!1){if(L!==null)throw new Error("`dim !== null` not yet implemented.");let Y=(0,i.min)(this.data)[1];return new f("int64",[BigInt(Y)],[])}argmax(L=null,W=!1){if(L!==null)throw new Error("`dim !== null` not yet implemented.");let Y=(0,i.max)(this.data)[1];return new f("int64",[BigInt(Y)],[])}to(L){if(this.type===L)return 
this;if(!I.hasOwnProperty(L))throw new Error(`Unsupported type: ${L}`);/* W is the optional per-element mapper handed to I[L].from: Number when leaving int64/uint64, BigInt when entering them (after Math.floor when the source type is float16/float32/float64), otherwise left undefined. */let W,Y=["int64","uint64"].includes(this.type),ae=["int64","uint64"].includes(L);return Y&&!ae?W=Number:!Y&&ae&&(["float16","float32","float64"].includes(this.type)?W=be=>BigInt(Math.floor(be)):W=BigInt),new f(L,I[L].from(this.data,W),this.dims)}}/* u(X, L): rebuilds the flat array X as nested arrays of shape L, grouping from the last dimension outward; throws when X.length differs from the product of L. */function u(X,L){let W=X.length,Y=L.reduce((be,xe)=>be*xe);if(W!==Y)throw Error(`cannot reshape array of size ${W} into shape (${L})`);let ae=X;for(let be=L.length-1;be>=0;be--)ae=ae.reduce((xe,Le)=>{let $e=xe[xe.length-1];return $e.length<L[be]?$e.push(Le):xe.push([Le]),xe},[[]]);return ae[0]}/* m(X, L): calls i.permute_data with the tensor data, dims and axes L, and wraps the returned [data, dims] pair in a new f of the same type. */function m(X,L){let[W,Y]=(0,i.permute_data)(X.data,X.dims,L);return new f(X.type,W,Y)}/* T(X, [L, W], Y, ae): reads the last three dims of X (the third-from-last defaults to 1 when absent), calls i.interpolate_data with target size [L, W], mode Y and flag ae, and returns a new f with dims [be, L, W]. */function T(X,[L,W],Y="bilinear",ae=!1){let be=X.dims.at(-3)??1,xe=X.dims.at(-2),Le=X.dims.at(-1),$e=(0,i.interpolate_data)(X.data,[be,xe,Le],[L,W],Y,ae);return new f(X.type,$e,[be,L,W])}/* _(X, {size, mode}): requires a 4-dim X and a size. A size of length 2 keeps the first two dims of X, length 3 keeps only the first, length 4 is used as-is. mode selects the nearest/bilinear/bicubic op from g.TensorOpRegistry; the target dims are passed as an int64 f under key s. */async function _(X,{size:L=null,mode:W="bilinear"}={}){if(X.dims.length!==4)throw new Error("`interpolate_4d` currently only supports 4D input.");if(!L)throw new Error("`interpolate_4d` requires a `size` argument.");let Y;if(L.length===2)Y=[...X.dims.slice(0,2),...L];else if(L.length===3)Y=[X.dims[0],...L];else if(L.length===4)Y=L;else throw new Error("`size` must be of length 2, 3, or 4.");let ae;if(W==="nearest")ae=await g.TensorOpRegistry.nearest_interpolate_4d;else if(W==="bilinear")ae=await g.TensorOpRegistry.bilinear_interpolate_4d;else if(W==="bicubic")ae=await g.TensorOpRegistry.bicubic_interpolate_4d;else throw new Error(`Unsupported mode: ${W}`);let be=new f("int64",new BigInt64Array(Y.map(BigInt)),[Y.length]);return await ae({x:X,s:be})}/* o(X, L): awaits g.TensorOpRegistry.matmul and calls it with {a: X, b: L}. */async function o(X,L){return await(await g.TensorOpRegistry.matmul)({a:X,b:L})}/* x(X, L): awaits g.TensorOpRegistry.rfft and calls it with {x: X, a: L}. */async function x(X,L){return await(await g.TensorOpRegistry.rfft)({x:X,a:L})}/* w(X, L): awaits g.TensorOpRegistry.top_k; L defaults to the size of the last dim when null/undefined and is otherwise capped at that size, then passed as a one-element int64 f under key k. */async function w(X,L){let W=await g.TensorOpRegistry.top_k;return L==null?L=X.dims.at(-1):L=Math.min(L,X.dims.at(-1)),await W({x:X,k:new f("int64",[BigInt(L)],[1])})}/* k: arrow helper whose body (a constructor call) continues past this physical line. */let k=X=>new 
f("int64",X,[X.length]);async function G(X,L,W,Y,ae){return await(await g.TensorOpRegistry.slice)({x:X,s:k(L),e:k(W),a:k(Y),t:k(ae??new Array(Y.length).fill(1))})}function b(X,L){let W=X.data,Y=L.data,ae=[X.dims[0],X.dims[2]],be=new W.constructor(ae[0]*ae[1]),[xe,Le,$e]=X.dims,ge=0;for(let p=0;p<xe;++p){let q=p*$e*Le;for(let de=0;de<$e;++de){let pe=0,Te=0,me=p*Le,ne=q+de;for(let le=0;le<Le;++le){let he=Number(Y[me+le]);Te+=he,pe+=W[ne+le*$e]*he}let fe=pe/Te;be[ge++]=fe}}return new f(X.type,be,ae)}function C(X,L,{eps:W=1e-5}={}){if(X.dims.length!==2)throw new Error("`layer_norm` currently only supports 2D input.");let[Y,ae]=X.dims;if(L.length!==1&&L[0]!==ae)throw new Error("`normalized_shape` must be a 1D array with shape `[input.dims[1]]`.");let[be,xe]=F(X,1,0,!0),Le=be.data,$e=xe.data,ge=X.data,p=new ge.constructor(ge.length);for(let q=0;q<Y;++q){let de=q*ae;for(let pe=0;pe<ae;++pe){let Te=de+pe;p[Te]=(ge[Te]-$e[q])/(Le[q]+W)}}return new f(X.type,p,X.dims)}function B(X,L){return X=X.slice(),L===null?X=X.filter(W=>W!==1):typeof L=="number"?X[L]===1&&X.splice(L,1):Array.isArray(L)&&(X=X.filter((W,Y)=>W!==1||!L.includes(Y))),X}function P(X,L){return L=M(L,X.length+1),X=X.slice(),X.splice(L,0,1),X}function M(X,L,W=null,Y=!0){if(X<-L||X>=L){if(Y)throw new Error(`IndexError: index ${X} is out of bounds for dimension${W===null?"":" "+W} with size ${L}`);return X<-L?0:L}return X<0&&(X=(X%L+L)%L),X}function y(X,L=0){L=M(L,X[0].dims.length);let W=X[0].dims.slice();W[L]=X.reduce((xe,Le)=>xe+Le.dims[L],0);let Y=W.reduce((xe,Le)=>xe*Le,1),ae=new X[0].data.constructor(Y),be=X[0].type;if(L===0){let xe=0;for(let Le of X){let $e=Le.data;ae.set($e,xe),xe+=$e.length}}else{let xe=0;for(let Le=0;Le<X.length;++Le){let{data:$e,dims:ge}=X[Le];for(let p=0;p<$e.length;++p){let q=0;for(let de=ge.length-1,pe=p,Te=1;de>=0;--de){let me=ge[de],ne=pe%me;de===L&&(ne+=xe),q+=ne*Te,Te*=W[de],pe=Math.floor(pe/me)}ae[q]=$e[p]}xe+=ge[L]}}return new f(be,ae,W)}function l(X,L=0){return 
y(X.map(W=>W.unsqueeze(L)),L)}/* h(X, L, W, Y, ae): reduction helper. Calls X(accumulator, value, flatIndex, outIndex) for every element of L.data, accumulating into the slot addressed by the element index with the W coordinate dropped. ae, when not null, pre-fills the output. Unless Y is truthy the reduced dim is removed from the returned dims. Returns [type, data, dims]. */function h(X,L,W=null,Y=!1,ae=null){let be=L.data,xe=L.dims;W=M(W,xe.length);let Le=xe.slice();Le[W]=1;let $e=new be.constructor(be.length/xe[W]);ae!==null&&$e.fill(ae);for(let ge=0;ge<be.length;++ge){let p=0;for(let q=xe.length-1,de=ge,pe=1;q>=0;--q){let Te=xe[q];if(q!==W){let me=de%Te;p+=me*pe,pe*=Le[q]}de=Math.floor(de/Te)}$e[p]=X($e[p],be[ge],ge,p)}return Y||Le.splice(W,1),[L.type,$e,Le]}/* F(X, L, W, Y): returns [std, mean] as two f instances. W is subtracted from the element count in the variance denominator. With L === null both are computed over all data (dims []); otherwise the mean comes from S and the squared deviations are summed along L through h. */function F(X,L=null,W=1,Y=!1){let ae=X.data,be=X.dims;if(L===null){let pe=ae.reduce((fe,le)=>fe+le,0)/ae.length,Te=Math.sqrt(ae.reduce((fe,le)=>fe+(le-pe)**2,0)/(ae.length-W)),me=new f(X.type,[pe],[]);return[new f(X.type,[Te],[]),me]}L=M(L,be.length);let xe=S(X,L,Y),Le=xe.data,[$e,ge,p]=h((de,pe,Te,me)=>de+(pe-Le[me])**2,X,L,Y);for(let de=0;de<ge.length;++de)ge[de]=Math.sqrt(ge[de]/(be[L]-W));return[new f($e,ge,p),xe]}/* S(X, L, W): mean. With L === null averages all data into a tensor with dims []; otherwise sums along L through h and divides by the size of that dim (the division is skipped when that size is 1). */function S(X,L=null,W=!1){let Y=X.dims,ae=X.data;if(L===null){let $e=ae.reduce((ge,p)=>ge+p,0);return new f(X.type,[$e/ae.length],[])}L=M(L,Y.length);let[be,xe,Le]=h(($e,ge)=>$e+ge,X,L,W);if(Y[L]!==1)for(let $e=0;$e<xe.length;++$e)xe[$e]/=Y[L];return new f(be,xe,Le)}/* V(X): strides for dims X; the last stride is 1 and each earlier one is the product of the sizes after it. */function V(X){let L=new Array(X.length);for(let W=X.length-1,Y=1;W>=0;--W)L[W]=Y,Y*=X[W];return L}/* R(X, L, W, Y): new f of type W with dims X, backed by a new Y(product of X) filled with L. */function R(X,L,W,Y){let ae=X.reduce((be,xe)=>be*xe,1);return new f(W,new Y(ae).fill(L),X)}/* N(X, L): picks type and array class from typeof L (number: float32/Float32Array, bigint: int64/BigInt64Array, boolean: bool/Uint8Array; anything else throws) and delegates to R. */function N(X,L){let W,Y;if(typeof L=="number")W="float32",Y=Float32Array;else if(typeof L=="bigint")W="int64",Y=BigInt64Array;else if(typeof L=="boolean")W="bool",Y=Uint8Array;else throw new Error(`Unsupported data type: ${typeof L}`);return R(X,L,W,Y)}/* Q(X, L): N applied to X.dims. */function Q(X,L){return N(X.dims,L)}/* K(X): int64 tensor with dims X filled with 1n. */function K(X){return R(X,1n,"int64",BigInt64Array)}/* J(X): K applied to X.dims. */function J(X){return K(X.dims)}/* te(X): int64 tensor with dims X filled with 0n. */function te(X){return R(X,0n,"int64",BigInt64Array)}/* se(X): te applied to X.dims. */function se(X){return te(X.dims)}/* ce(X): float32 tensor with dims X whose elements each come from Math.random(). */function ce(X){let L=X.reduce((W,Y)=>W*Y,1);return new f("float32",Float32Array.from({length:L},()=>Math.random()),X)}/* we(X): float32 tensor with dims X filled from the inner sampler W, which draws two values as 1 - Math.random(); its return expression continues past this physical line. */function we(X){let L=X.reduce((Y,ae)=>Y*ae,1);function W(){let Y=1-Math.random(),ae=1-Math.random();return 
Math.sqrt(-2*Math.log(Y))*Math.cos(2*Math.PI*ae)}return new f("float32",Float32Array.from({length:L},()=>W()),X)}/* _e(X, L): packs the sign of each element into bits. Requires a 2-dim X whose last dim is a multiple of 8 and L equal to "binary" or "ubinary". An element > 0 sets a bit, eight elements per byte with the first element in the highest bit. For "binary" the output is an Int8Array and 128 is subtracted from each byte while its first bit is processed; for "ubinary" it is a Uint8Array. Output dims are [dims[0], dims[1] / 8]. */function _e(X,L){if(X.dims.length!==2)throw new Error("The tensor must have 2 dimensions");if(X.dims.at(-1)%8!==0)throw new Error("The last dimension of the tensor must be a multiple of 8");if(!["binary","ubinary"].includes(L))throw new Error("The precision must be either 'binary' or 'ubinary'");let W=L==="binary",Y=W?"int8":"uint8",ae=W?Int8Array:Uint8Array,be=X.data,xe=new ae(be.length/8);for(let Le=0;Le<be.length;++Le){let $e=be[Le]>0?1:0,ge=Math.floor(Le/8),p=Le%8;xe[ge]|=$e<<7-p,W&&p===0&&(xe[ge]-=128)}return new f(Y,xe,[X.dims[0],X.dims[1]/8])}}),"./src/utils/video.js":((D,a,e)=>{e.r(a),e.d(a,{RawVideo:()=>I,RawVideoFrame:()=>g,load_video:()=>f});var i=e("./src/utils/image.js"),d=e("./src/env.js");/* g (exported as RawVideoFrame): stores an image and its timestamp. */class g{constructor(m,T){this.image=m,this.timestamp=T}}/* I (exported as RawVideo): holds frames and a duration. When the first entry of m is an i.RawImage, every entry is wrapped in g with timestamp (index + 1) / (count + 1) * duration. width and height are read from the first frame; fps is frames.length / duration. */class I{constructor(m,T){m.length>0&&m[0]instanceof i.RawImage&&(m=m.map((_,o)=>new g(_,(o+1)/(m.length+1)*T))),this.frames=m,this.duration=T}get width(){return this.frames[0].image.width}get height(){return this.frames[0].image.height}get fps(){return this.frames.length/this.duration}}/* f (exported as load_video): throws unless d.apis.IS_BROWSER_ENV is set and unless num_frames or fps is given. Accepts a string URL, a Blob or an HTMLVideoElement, waits for onloadedmetadata, and when the seekable range is empty re-fetches the source as a blob and reloads it. With num_frames the step is duration / (num_frames - 1) (0 for a single frame); with fps the step is 1 / fps and the count is floor(duration / step). NOTE(review): the object URLs created here are not revoked in the visible code, and the metadata promises have no rejection path, so a failed load would leave the await pending - confirm whether that is intended. */async function f(u,{num_frames:m=null,fps:T=null}={}){if(!d.apis.IS_BROWSER_ENV)throw new Error("`load_video` is currently only supported in browser environments.");if(m==null&&T==null)throw new Error("Either num_frames or fps must be provided.");let _=[],o=document.createElement("video");if(o.crossOrigin="anonymous",o.muted=!0,typeof u=="string")o.src=u;else if(u instanceof Blob)o.src=URL.createObjectURL(u);else if(u instanceof HTMLVideoElement)o.src=u.src;else throw new Error("Invalid URL or video element provided.");if(await new Promise(B=>o.onloadedmetadata=B),o.seekable.start(0)===o.seekable.end(0)){let P=await(await fetch(o.src)).blob();o.src=URL.createObjectURL(P),await new Promise(M=>o.onloadedmetadata=M)}let x=o.duration,w,k;m!=null?(w=m,k=m===1?0:x/(m-1)):(k=1/T,w=Math.floor(x/k));let G=[];for(let 
B=0;B<w;++B)G.push(m===1?x/2:B*k);/* G now holds the timestamps to sample (the midpoint when exactly one frame was requested). Each one is sought in turn, drawn onto a canvas sized to the video, read back as 4-channel image data and stored as a g frame; the video element is removed before the I result is returned. */let b=document.createElement("canvas");b.width=o.videoWidth,b.height=o.videoHeight;let C=b.getContext("2d",{willReadFrequently:!0});for(let B of G){o.currentTime=B,await new Promise(l=>{o.onseeked=l}),C.drawImage(o,0,0,b.width,b.height);let P=C.getImageData(0,0,b.width,b.height),M=new i.RawImage(P.data,b.width,b.height,4),y=new g(M,B);_.push(y)}return o.remove(),new I(_,x)}})},Ju={};/* mt.t(e, i): bundler runtime helper driven by the bit flags in i. Bit 1 replaces e with this(e). e is returned unchanged when bit 8 is set, or when it is an object and either bit 4 is set with e.__esModule or bit 16 is set with a function e.then. Otherwise a null-prototype object is built, marked via mt.r, and given getters for the own property names of e (and, when bit 2 is set, of its prototype chain up to the cached base prototypes) plus a default getter returning e. */(()=>{var D=Object.getPrototypeOf?e=>Object.getPrototypeOf(e):e=>e.__proto__,a;mt.t=function(e,i){if(i&1&&(e=this(e)),i&8||typeof e=="object"&&e&&(i&4&&e.__esModule||i&16&&typeof e.then=="function"))return e;var d=Object.create(null);mt.r(d);var g={};a=a||[null,D({}),D([]),D(D)];for(var I=i&2&&e;typeof I=="object"&&!~a.indexOf(I);I=D(I))Object.getOwnPropertyNames(I).forEach(f=>g[f]=()=>e[f]);return g.default=()=>e,mt.d(d,g),d}})();/* mt.d(D, a): for every own key of a that D does not already own, defines an enumerable getter on D using the function stored in a. */mt.d=(D,a)=>{for(var e in a)mt.o(a,e)&&!mt.o(D,e)&&Object.defineProperty(D,e,{enumerable:!0,get:a[e]})};/* mt.o(D, a): own-property check through Object.prototype.hasOwnProperty.call. */mt.o=(D,a)=>Object.prototype.hasOwnProperty.call(D,a);/* mt.r(D): its body begins with a typeof test that continues past this physical line. */mt.r=D=>{typeof 
Symbol<"u"&&Symbol.toStringTag&&Object.defineProperty(D,Symbol.toStringTag,{value:"Module"}),Object.defineProperty(D,"__esModule",{value:!0})};t={};(()=>{mt.r(t),mt.d(t,{ASTFeatureExtractor:()=>_.ASTFeatureExtractor,ASTForAudioClassification:()=>e.ASTForAudioClassification,ASTModel:()=>e.ASTModel,ASTPreTrainedModel:()=>e.ASTPreTrainedModel,AlbertForMaskedLM:()=>e.AlbertForMaskedLM,AlbertForQuestionAnswering:()=>e.AlbertForQuestionAnswering,AlbertForSequenceClassification:()=>e.AlbertForSequenceClassification,AlbertModel:()=>e.AlbertModel,AlbertPreTrainedModel:()=>e.AlbertPreTrainedModel,AlbertTokenizer:()=>i.AlbertTokenizer,ArceeForCausalLM:()=>e.ArceeForCausalLM,ArceeModel:()=>e.ArceeModel,ArceePreTrainedModel:()=>e.ArceePreTrainedModel,AudioClassificationPipeline:()=>a.AudioClassificationPipeline,AutoConfig:()=>d.AutoConfig,AutoFeatureExtractor:()=>o.AutoFeatureExtractor,AutoImageProcessor:()=>k.AutoImageProcessor,AutoModel:()=>e.AutoModel,AutoModelForAudioClassification:()=>e.AutoModelForAudioClassification,AutoModelForAudioFrameClassification:()=>e.AutoModelForAudioFrameClassification,AutoModelForAudioTextToText:()=>e.AutoModelForAudioTextToText,AutoModelForCTC:()=>e.AutoModelForCTC,AutoModelForCausalLM:()=>e.AutoModelForCausalLM,AutoModelForDepthEstimation:()=>e.AutoModelForDepthEstimation,AutoModelForDocumentQuestionAnswering:()=>e.AutoModelForDocumentQuestionAnswering,AutoModelForImageClassification:()=>e.AutoModelForImageClassification,AutoModelForImageFeatureExtraction:()=>e.AutoModelForImageFeatureExtraction,AutoModelForImageMatting:()=>e.AutoModelForImageMatting,AutoModelForImageSegmentation:()=>e.AutoModelForImageSegmentation,AutoModelForImageTextToText:()=>e.AutoModelForImageTextToText,AutoModelForImageToImage:()=>e.AutoModelForImageToImage,AutoModelForMaskGeneration:()=>e.AutoModelForMaskGeneration,AutoModelForMaskedLM:()=>e.AutoModelForMaskedLM,AutoModelForNormalEstimation:()=>e.AutoModelForNormalEstimation,AutoModelForObjectDetection:()=>e.AutoModelF
orObjectDetection,AutoModelForPoseEstimation:()=>e.AutoModelForPoseEstimation,AutoModelForQuestionAnswering:()=>e.AutoModelForQuestionAnswering,AutoModelForSemanticSegmentation:()=>e.AutoModelForSemanticSegmentation,AutoModelForSeq2SeqLM:()=>e.AutoModelForSeq2SeqLM,AutoModelForSequenceClassification:()=>e.AutoModelForSequenceClassification,AutoModelForSpeechSeq2Seq:()=>e.AutoModelForSpeechSeq2Seq,AutoModelForTextToSpectrogram:()=>e.AutoModelForTextToSpectrogram,AutoModelForTextToWaveform:()=>e.AutoModelForTextToWaveform,AutoModelForTokenClassification:()=>e.AutoModelForTokenClassification,AutoModelForUniversalSegmentation:()=>e.AutoModelForUniversalSegmentation,AutoModelForVision2Seq:()=>e.AutoModelForVision2Seq,AutoModelForXVector:()=>e.AutoModelForXVector,AutoModelForZeroShotObjectDetection:()=>e.AutoModelForZeroShotObjectDetection,AutoProcessor:()=>C.AutoProcessor,AutoTokenizer:()=>i.AutoTokenizer,AutomaticSpeechRecognitionPipeline:()=>a.AutomaticSpeechRecognitionPipeline,BackgroundRemovalPipeline:()=>a.BackgroundRemovalPipeline,BartForConditionalGeneration:()=>e.BartForConditionalGeneration,BartForSequenceClassification:()=>e.BartForSequenceClassification,BartModel:()=>e.BartModel,BartPretrainedModel:()=>e.BartPretrainedModel,BartTokenizer:()=>i.BartTokenizer,BaseModelOutput:()=>e.BaseModelOutput,BaseStreamer:()=>B.BaseStreamer,BeitFeatureExtractor:()=>w.BeitFeatureExtractor,BeitForImageClassification:()=>e.BeitForImageClassification,BeitModel:()=>e.BeitModel,BeitPreTrainedModel:()=>e.BeitPreTrainedModel,BertForMaskedLM:()=>e.BertForMaskedLM,BertForQuestionAnswering:()=>e.BertForQuestionAnswering,BertForSequenceClassification:()=>e.BertForSequenceClassification,BertForTokenClassification:()=>e.BertForTokenClassification,BertModel:()=>e.BertModel,BertPreTrainedModel:()=>e.BertPreTrainedModel,BertTokenizer:()=>i.BertTokenizer,BitImageProcessor:()=>w.BitImageProcessor,BlenderbotForConditionalGeneration:()=>e.BlenderbotForConditionalGeneration,BlenderbotModel:()=>e.
BlenderbotModel,BlenderbotPreTrainedModel:()=>e.BlenderbotPreTrainedModel,BlenderbotSmallForConditionalGeneration:()=>e.BlenderbotSmallForConditionalGeneration,BlenderbotSmallModel:()=>e.BlenderbotSmallModel,BlenderbotSmallPreTrainedModel:()=>e.BlenderbotSmallPreTrainedModel,BlenderbotSmallTokenizer:()=>i.BlenderbotSmallTokenizer,BlenderbotTokenizer:()=>i.BlenderbotTokenizer,BloomForCausalLM:()=>e.BloomForCausalLM,BloomModel:()=>e.BloomModel,BloomPreTrainedModel:()=>e.BloomPreTrainedModel,BloomTokenizer:()=>i.BloomTokenizer,CLIPFeatureExtractor:()=>w.CLIPFeatureExtractor,CLIPImageProcessor:()=>w.CLIPImageProcessor,CLIPModel:()=>e.CLIPModel,CLIPPreTrainedModel:()=>e.CLIPPreTrainedModel,CLIPSegForImageSegmentation:()=>e.CLIPSegForImageSegmentation,CLIPSegModel:()=>e.CLIPSegModel,CLIPSegPreTrainedModel:()=>e.CLIPSegPreTrainedModel,CLIPTextModel:()=>e.CLIPTextModel,CLIPTextModelWithProjection:()=>e.CLIPTextModelWithProjection,CLIPTokenizer:()=>i.CLIPTokenizer,CLIPVisionModel:()=>e.CLIPVisionModel,CLIPVisionModelWithProjection:()=>e.CLIPVisionModelWithProjection,CamembertForMaskedLM:()=>e.CamembertForMaskedLM,CamembertForQuestionAnswering:()=>e.CamembertForQuestionAnswering,CamembertForSequenceClassification:()=>e.CamembertForSequenceClassification,CamembertForTokenClassification:()=>e.CamembertForTokenClassification,CamembertModel:()=>e.CamembertModel,CamembertPreTrainedModel:()=>e.CamembertPreTrainedModel,CamembertTokenizer:()=>i.CamembertTokenizer,CausalLMOutput:()=>e.CausalLMOutput,CausalLMOutputWithPast:()=>e.CausalLMOutputWithPast,ChineseCLIPFeatureExtractor:()=>w.ChineseCLIPFeatureExtractor,ChineseCLIPModel:()=>e.ChineseCLIPModel,ChineseCLIPPreTrainedModel:()=>e.ChineseCLIPPreTrainedModel,ClapAudioModelWithProjection:()=>e.ClapAudioModelWithProjection,ClapFeatureExtractor:()=>_.ClapFeatureExtractor,ClapModel:()=>e.ClapModel,ClapPreTrainedModel:()=>e.ClapPreTrainedModel,ClapTextModelWithProjection:()=>e.ClapTextModelWithProjection,ClassifierFreeGuidanceLogitsProces
sor:()=>M.ClassifierFreeGuidanceLogitsProcessor,CodeGenForCausalLM:()=>e.CodeGenForCausalLM,CodeGenModel:()=>e.CodeGenModel,CodeGenPreTrainedModel:()=>e.CodeGenPreTrainedModel,CodeGenTokenizer:()=>i.CodeGenTokenizer,CodeLlamaTokenizer:()=>i.CodeLlamaTokenizer,CohereForCausalLM:()=>e.CohereForCausalLM,CohereModel:()=>e.CohereModel,CoherePreTrainedModel:()=>e.CoherePreTrainedModel,CohereTokenizer:()=>i.CohereTokenizer,ConvBertForMaskedLM:()=>e.ConvBertForMaskedLM,ConvBertForQuestionAnswering:()=>e.ConvBertForQuestionAnswering,ConvBertForSequenceClassification:()=>e.ConvBertForSequenceClassification,ConvBertForTokenClassification:()=>e.ConvBertForTokenClassification,ConvBertModel:()=>e.ConvBertModel,ConvBertPreTrainedModel:()=>e.ConvBertPreTrainedModel,ConvBertTokenizer:()=>i.ConvBertTokenizer,ConvNextFeatureExtractor:()=>w.ConvNextFeatureExtractor,ConvNextForImageClassification:()=>e.ConvNextForImageClassification,ConvNextImageProcessor:()=>w.ConvNextImageProcessor,ConvNextModel:()=>e.ConvNextModel,ConvNextPreTrainedModel:()=>e.ConvNextPreTrainedModel,ConvNextV2ForImageClassification:()=>e.ConvNextV2ForImageClassification,ConvNextV2Model:()=>e.ConvNextV2Model,ConvNextV2PreTrainedModel:()=>e.ConvNextV2PreTrainedModel,DFineForObjectDetection:()=>e.DFineForObjectDetection,DFineModel:()=>e.DFineModel,DFinePreTrainedModel:()=>e.DFinePreTrainedModel,DINOv3ConvNextModel:()=>e.DINOv3ConvNextModel,DINOv3ConvNextPreTrainedModel:()=>e.DINOv3ConvNextPreTrainedModel,DINOv3ViTImageProcessor:()=>w.DINOv3ViTImageProcessor,DINOv3ViTModel:()=>e.DINOv3ViTModel,DINOv3ViTPreTrainedModel:()=>e.DINOv3ViTPreTrainedModel,DPTFeatureExtractor:()=>w.DPTFeatureExtractor,DPTForDepthEstimation:()=>e.DPTForDepthEstimation,DPTImageProcessor:()=>w.DPTImageProcessor,DPTModel:()=>e.DPTModel,DPTPreTrainedModel:()=>e.DPTPreTrainedModel,DacDecoderModel:()=>e.DacDecoderModel,DacDecoderOutput:()=>e.DacDecoderOutput,DacEncoderModel:()=>e.DacEncoderModel,DacEncoderOutput:()=>e.DacEncoderOutput,DacFeatureExtrac
tor:()=>_.DacFeatureExtractor,DacModel:()=>e.DacModel,DacPreTrainedModel:()=>e.DacPreTrainedModel,DataTypeMap:()=>u.DataTypeMap,DebertaForMaskedLM:()=>e.DebertaForMaskedLM,DebertaForQuestionAnswering:()=>e.DebertaForQuestionAnswering,DebertaForSequenceClassification:()=>e.DebertaForSequenceClassification,DebertaForTokenClassification:()=>e.DebertaForTokenClassification,DebertaModel:()=>e.DebertaModel,DebertaPreTrainedModel:()=>e.DebertaPreTrainedModel,DebertaTokenizer:()=>i.DebertaTokenizer,DebertaV2ForMaskedLM:()=>e.DebertaV2ForMaskedLM,DebertaV2ForQuestionAnswering:()=>e.DebertaV2ForQuestionAnswering,DebertaV2ForSequenceClassification:()=>e.DebertaV2ForSequenceClassification,DebertaV2ForTokenClassification:()=>e.DebertaV2ForTokenClassification,DebertaV2Model:()=>e.DebertaV2Model,DebertaV2PreTrainedModel:()=>e.DebertaV2PreTrainedModel,DebertaV2Tokenizer:()=>i.DebertaV2Tokenizer,DecisionTransformerModel:()=>e.DecisionTransformerModel,DecisionTransformerPreTrainedModel:()=>e.DecisionTransformerPreTrainedModel,DeiTFeatureExtractor:()=>w.DeiTFeatureExtractor,DeiTForImageClassification:()=>e.DeiTForImageClassification,DeiTImageProcessor:()=>w.DeiTImageProcessor,DeiTModel:()=>e.DeiTModel,DeiTPreTrainedModel:()=>e.DeiTPreTrainedModel,DepthAnythingForDepthEstimation:()=>e.DepthAnythingForDepthEstimation,DepthAnythingPreTrainedModel:()=>e.DepthAnythingPreTrainedModel,DepthEstimationPipeline:()=>a.DepthEstimationPipeline,DepthProForDepthEstimation:()=>e.DepthProForDepthEstimation,DepthProPreTrainedModel:()=>e.DepthProPreTrainedModel,DetrFeatureExtractor:()=>w.DetrFeatureExtractor,DetrForObjectDetection:()=>e.DetrForObjectDetection,DetrForSegmentation:()=>e.DetrForSegmentation,DetrImageProcessor:()=>w.DetrImageProcessor,DetrModel:()=>e.DetrModel,DetrObjectDetectionOutput:()=>e.DetrObjectDetectionOutput,DetrPreTrainedModel:()=>e.DetrPreTrainedModel,DetrSegmentationOutput:()=>e.DetrSegmentationOutput,Dinov2ForImageClassification:()=>e.Dinov2ForImageClassification,Dinov2Model:()
=>e.Dinov2Model,Dinov2PreTrainedModel:()=>e.Dinov2PreTrainedModel,Dinov2WithRegistersForImageClassification:()=>e.Dinov2WithRegistersForImageClassification,Dinov2WithRegistersModel:()=>e.Dinov2WithRegistersModel,Dinov2WithRegistersPreTrainedModel:()=>e.Dinov2WithRegistersPreTrainedModel,DistilBertForMaskedLM:()=>e.DistilBertForMaskedLM,DistilBertForQuestionAnswering:()=>e.DistilBertForQuestionAnswering,DistilBertForSequenceClassification:()=>e.DistilBertForSequenceClassification,DistilBertForTokenClassification:()=>e.DistilBertForTokenClassification,DistilBertModel:()=>e.DistilBertModel,DistilBertPreTrainedModel:()=>e.DistilBertPreTrainedModel,DistilBertTokenizer:()=>i.DistilBertTokenizer,DocumentQuestionAnsweringPipeline:()=>a.DocumentQuestionAnsweringPipeline,DonutFeatureExtractor:()=>w.DonutFeatureExtractor,DonutImageProcessor:()=>w.DonutImageProcessor,DonutSwinModel:()=>e.DonutSwinModel,DonutSwinPreTrainedModel:()=>e.DonutSwinPreTrainedModel,EdgeTamModel:()=>e.EdgeTamModel,EfficientNetForImageClassification:()=>e.EfficientNetForImageClassification,EfficientNetImageProcessor:()=>w.EfficientNetImageProcessor,EfficientNetModel:()=>e.EfficientNetModel,EfficientNetPreTrainedModel:()=>e.EfficientNetPreTrainedModel,ElectraForMaskedLM:()=>e.ElectraForMaskedLM,ElectraForQuestionAnswering:()=>e.ElectraForQuestionAnswering,ElectraForSequenceClassification:()=>e.ElectraForSequenceClassification,ElectraForTokenClassification:()=>e.ElectraForTokenClassification,ElectraModel:()=>e.ElectraModel,ElectraPreTrainedModel:()=>e.ElectraPreTrainedModel,ElectraTokenizer:()=>i.ElectraTokenizer,EncodecFeatureExtractor:()=>_.EncodecFeatureExtractor,EosTokenCriteria:()=>P.EosTokenCriteria,Ernie4_5ForCausalLM:()=>e.Ernie4_5ForCausalLM,Ernie4_5Model:()=>e.Ernie4_5Model,Ernie4_5PreTrainedModel:()=>e.Ernie4_5PreTrainedModel,EsmForMaskedLM:()=>e.EsmForMaskedLM,EsmForSequenceClassification:()=>e.EsmForSequenceClassification,EsmForTokenClassification:()=>e.EsmForTokenClassification,EsmModel:()=>e
.EsmModel,EsmPreTrainedModel:()=>e.EsmPreTrainedModel,EsmTokenizer:()=>i.EsmTokenizer,ExaoneForCausalLM:()=>e.ExaoneForCausalLM,ExaoneModel:()=>e.ExaoneModel,ExaonePreTrainedModel:()=>e.ExaonePreTrainedModel,FFT:()=>m.FFT,FalconForCausalLM:()=>e.FalconForCausalLM,FalconModel:()=>e.FalconModel,FalconPreTrainedModel:()=>e.FalconPreTrainedModel,FalconTokenizer:()=>i.FalconTokenizer,FastViTForImageClassification:()=>e.FastViTForImageClassification,FastViTModel:()=>e.FastViTModel,FastViTPreTrainedModel:()=>e.FastViTPreTrainedModel,FeatureExtractionPipeline:()=>a.FeatureExtractionPipeline,FeatureExtractor:()=>T.FeatureExtractor,FillMaskPipeline:()=>a.FillMaskPipeline,Florence2ForConditionalGeneration:()=>e.Florence2ForConditionalGeneration,Florence2PreTrainedModel:()=>e.Florence2PreTrainedModel,Florence2Processor:()=>b.Florence2Processor,ForcedBOSTokenLogitsProcessor:()=>M.ForcedBOSTokenLogitsProcessor,ForcedEOSTokenLogitsProcessor:()=>M.ForcedEOSTokenLogitsProcessor,GLPNFeatureExtractor:()=>w.GLPNFeatureExtractor,GLPNForDepthEstimation:()=>e.GLPNForDepthEstimation,GLPNModel:()=>e.GLPNModel,GLPNPreTrainedModel:()=>e.GLPNPreTrainedModel,GPT2LMHeadModel:()=>e.GPT2LMHeadModel,GPT2Model:()=>e.GPT2Model,GPT2PreTrainedModel:()=>e.GPT2PreTrainedModel,GPT2Tokenizer:()=>i.GPT2Tokenizer,GPTBigCodeForCausalLM:()=>e.GPTBigCodeForCausalLM,GPTBigCodeModel:()=>e.GPTBigCodeModel,GPTBigCodePreTrainedModel:()=>e.GPTBigCodePreTrainedModel,GPTJForCausalLM:()=>e.GPTJForCausalLM,GPTJModel:()=>e.GPTJModel,GPTJPreTrainedModel:()=>e.GPTJPreTrainedModel,GPTNeoForCausalLM:()=>e.GPTNeoForCausalLM,GPTNeoModel:()=>e.GPTNeoModel,GPTNeoPreTrainedModel:()=>e.GPTNeoPreTrainedModel,GPTNeoXForCausalLM:()=>e.GPTNeoXForCausalLM,GPTNeoXModel:()=>e.GPTNeoXModel,GPTNeoXPreTrainedModel:()=>e.GPTNeoXPreTrainedModel,GPTNeoXTokenizer:()=>i.GPTNeoXTokenizer,Gemma2ForCausalLM:()=>e.Gemma2ForCausalLM,Gemma2Model:()=>e.Gemma2Model,Gemma2PreTrainedModel:()=>e.Gemma2PreTrainedModel,Gemma3ForCausalLM:()=>e.Gemma3ForCausalL
M,Gemma3Model:()=>e.Gemma3Model,Gemma3PreTrainedModel:()=>e.Gemma3PreTrainedModel,Gemma3nAudioFeatureExtractor:()=>_.Gemma3nAudioFeatureExtractor,Gemma3nForConditionalGeneration:()=>e.Gemma3nForConditionalGeneration,Gemma3nPreTrainedModel:()=>e.Gemma3nPreTrainedModel,Gemma3nProcessor:()=>b.Gemma3nProcessor,GemmaForCausalLM:()=>e.GemmaForCausalLM,GemmaModel:()=>e.GemmaModel,GemmaPreTrainedModel:()=>e.GemmaPreTrainedModel,GemmaTokenizer:()=>i.GemmaTokenizer,GlmForCausalLM:()=>e.GlmForCausalLM,GlmModel:()=>e.GlmModel,GlmPreTrainedModel:()=>e.GlmPreTrainedModel,GraniteForCausalLM:()=>e.GraniteForCausalLM,GraniteModel:()=>e.GraniteModel,GraniteMoeHybridForCausalLM:()=>e.GraniteMoeHybridForCausalLM,GraniteMoeHybridModel:()=>e.GraniteMoeHybridModel,GraniteMoeHybridPreTrainedModel:()=>e.GraniteMoeHybridPreTrainedModel,GranitePreTrainedModel:()=>e.GranitePreTrainedModel,Grok1Tokenizer:()=>i.Grok1Tokenizer,GroundingDinoForObjectDetection:()=>e.GroundingDinoForObjectDetection,GroundingDinoImageProcessor:()=>w.GroundingDinoImageProcessor,GroundingDinoPreTrainedModel:()=>e.GroundingDinoPreTrainedModel,GroundingDinoProcessor:()=>b.GroundingDinoProcessor,GroupViTModel:()=>e.GroupViTModel,GroupViTPreTrainedModel:()=>e.GroupViTPreTrainedModel,HeliumForCausalLM:()=>e.HeliumForCausalLM,HeliumModel:()=>e.HeliumModel,HeliumPreTrainedModel:()=>e.HeliumPreTrainedModel,HerbertTokenizer:()=>i.HerbertTokenizer,HieraForImageClassification:()=>e.HieraForImageClassification,HieraModel:()=>e.HieraModel,HieraPreTrainedModel:()=>e.HieraPreTrainedModel,HubertForCTC:()=>e.HubertForCTC,HubertForSequenceClassification:()=>e.HubertForSequenceClassification,HubertModel:()=>e.HubertModel,HubertPreTrainedModel:()=>e.HubertPreTrainedModel,IJepaForImageClassification:()=>e.IJepaForImageClassification,IJepaModel:()=>e.IJepaModel,IJepaPreTrainedModel:()=>e.IJepaPreTrainedModel,Idefics3ForConditionalGeneration:()=>e.Idefics3ForConditionalGeneration,Idefics3ImageProcessor:()=>w.Idefics3ImageProcessor,Idefics3Pr
eTrainedModel:()=>e.Idefics3PreTrainedModel,Idefics3Processor:()=>b.Idefics3Processor,ImageClassificationPipeline:()=>a.ImageClassificationPipeline,ImageFeatureExtractionPipeline:()=>a.ImageFeatureExtractionPipeline,ImageFeatureExtractor:()=>_.ImageFeatureExtractor,ImageMattingOutput:()=>e.ImageMattingOutput,ImageProcessor:()=>x.ImageProcessor,ImageSegmentationPipeline:()=>a.ImageSegmentationPipeline,ImageToImagePipeline:()=>a.ImageToImagePipeline,ImageToTextPipeline:()=>a.ImageToTextPipeline,InterruptableStoppingCriteria:()=>P.InterruptableStoppingCriteria,JAISLMHeadModel:()=>e.JAISLMHeadModel,JAISModel:()=>e.JAISModel,JAISPreTrainedModel:()=>e.JAISPreTrainedModel,JinaCLIPImageProcessor:()=>w.JinaCLIPImageProcessor,JinaCLIPModel:()=>e.JinaCLIPModel,JinaCLIPPreTrainedModel:()=>e.JinaCLIPPreTrainedModel,JinaCLIPProcessor:()=>b.JinaCLIPProcessor,JinaCLIPTextModel:()=>e.JinaCLIPTextModel,JinaCLIPVisionModel:()=>e.JinaCLIPVisionModel,Lfm2ForCausalLM:()=>e.Lfm2ForCausalLM,Lfm2Model:()=>e.Lfm2Model,Lfm2PreTrainedModel:()=>e.Lfm2PreTrainedModel,LiteWhisperForConditionalGeneration:()=>e.LiteWhisperForConditionalGeneration,Llama4ForCausalLM:()=>e.Llama4ForCausalLM,Llama4PreTrainedModel:()=>e.Llama4PreTrainedModel,LlamaForCausalLM:()=>e.LlamaForCausalLM,LlamaModel:()=>e.LlamaModel,LlamaPreTrainedModel:()=>e.LlamaPreTrainedModel,LlamaTokenizer:()=>i.LlamaTokenizer,LlavaForConditionalGeneration:()=>e.LlavaForConditionalGeneration,LlavaOnevisionForConditionalGeneration:()=>e.LlavaOnevisionForConditionalGeneration,LlavaOnevisionImageProcessor:()=>w.LlavaOnevisionImageProcessor,LlavaPreTrainedModel:()=>e.LlavaPreTrainedModel,LlavaProcessor:()=>b.LlavaProcessor,LlavaQwen2ForCausalLM:()=>e.LlavaQwen2ForCausalLM,LogitsProcessor:()=>M.LogitsProcessor,LogitsProcessorList:()=>M.LogitsProcessorList,LogitsWarper:()=>M.LogitsWarper,LongT5ForConditionalGeneration:()=>e.LongT5ForConditionalGeneration,LongT5Model:()=>e.LongT5Model,LongT5PreTrainedModel:()=>e.LongT5PreTrainedModel,M2M100ForCon
ditionalGeneration:()=>e.M2M100ForConditionalGeneration,M2M100Model:()=>e.M2M100Model,M2M100PreTrainedModel:()=>e.M2M100PreTrainedModel,M2M100Tokenizer:()=>i.M2M100Tokenizer,MBart50Tokenizer:()=>i.MBart50Tokenizer,MBartForCausalLM:()=>e.MBartForCausalLM,MBartForConditionalGeneration:()=>e.MBartForConditionalGeneration,MBartForSequenceClassification:()=>e.MBartForSequenceClassification,MBartModel:()=>e.MBartModel,MBartPreTrainedModel:()=>e.MBartPreTrainedModel,MBartTokenizer:()=>i.MBartTokenizer,MPNetForMaskedLM:()=>e.MPNetForMaskedLM,MPNetForQuestionAnswering:()=>e.MPNetForQuestionAnswering,MPNetForSequenceClassification:()=>e.MPNetForSequenceClassification,MPNetForTokenClassification:()=>e.MPNetForTokenClassification,MPNetModel:()=>e.MPNetModel,MPNetPreTrainedModel:()=>e.MPNetPreTrainedModel,MPNetTokenizer:()=>i.MPNetTokenizer,MT5ForConditionalGeneration:()=>e.MT5ForConditionalGeneration,MT5Model:()=>e.MT5Model,MT5PreTrainedModel:()=>e.MT5PreTrainedModel,MarianMTModel:()=>e.MarianMTModel,MarianModel:()=>e.MarianModel,MarianPreTrainedModel:()=>e.MarianPreTrainedModel,MarianTokenizer:()=>i.MarianTokenizer,Mask2FormerImageProcessor:()=>w.Mask2FormerImageProcessor,MaskFormerFeatureExtractor:()=>w.MaskFormerFeatureExtractor,MaskFormerForInstanceSegmentation:()=>e.MaskFormerForInstanceSegmentation,MaskFormerImageProcessor:()=>w.MaskFormerImageProcessor,MaskFormerModel:()=>e.MaskFormerModel,MaskFormerPreTrainedModel:()=>e.MaskFormerPreTrainedModel,MaskedLMOutput:()=>e.MaskedLMOutput,MaxLengthCriteria:()=>P.MaxLengthCriteria,Metric3DForDepthEstimation:()=>e.Metric3DForDepthEstimation,Metric3DPreTrainedModel:()=>e.Metric3DPreTrainedModel,Metric3Dv2ForDepthEstimation:()=>e.Metric3Dv2ForDepthEstimation,Metric3Dv2PreTrainedModel:()=>e.Metric3Dv2PreTrainedModel,MgpstrForSceneTextRecognition:()=>e.MgpstrForSceneTextRecognition,MgpstrModelOutput:()=>e.MgpstrModelOutput,MgpstrPreTrainedModel:()=>e.MgpstrPreTrainedModel,MgpstrProcessor:()=>b.MgpstrProcessor,MgpstrTokenizer:()=>i.Mg
pstrTokenizer,MimiDecoderModel:()=>e.MimiDecoderModel,MimiDecoderOutput:()=>e.MimiDecoderOutput,MimiEncoderModel:()=>e.MimiEncoderModel,MimiEncoderOutput:()=>e.MimiEncoderOutput,MimiModel:()=>e.MimiModel,MimiPreTrainedModel:()=>e.MimiPreTrainedModel,MinLengthLogitsProcessor:()=>M.MinLengthLogitsProcessor,MinNewTokensLengthLogitsProcessor:()=>M.MinNewTokensLengthLogitsProcessor,Ministral3ForCausalLM:()=>e.Ministral3ForCausalLM,Ministral3Model:()=>e.Ministral3Model,Ministral3PreTrainedModel:()=>e.Ministral3PreTrainedModel,MinistralForCausalLM:()=>e.MinistralForCausalLM,MinistralModel:()=>e.MinistralModel,MinistralPreTrainedModel:()=>e.MinistralPreTrainedModel,Mistral3ForConditionalGeneration:()=>e.Mistral3ForConditionalGeneration,MistralForCausalLM:()=>e.MistralForCausalLM,MistralModel:()=>e.MistralModel,MistralPreTrainedModel:()=>e.MistralPreTrainedModel,MobileBertForMaskedLM:()=>e.MobileBertForMaskedLM,MobileBertForQuestionAnswering:()=>e.MobileBertForQuestionAnswering,MobileBertForSequenceClassification:()=>e.MobileBertForSequenceClassification,MobileBertModel:()=>e.MobileBertModel,MobileBertPreTrainedModel:()=>e.MobileBertPreTrainedModel,MobileBertTokenizer:()=>i.MobileBertTokenizer,MobileLLMForCausalLM:()=>e.MobileLLMForCausalLM,MobileLLMModel:()=>e.MobileLLMModel,MobileLLMPreTrainedModel:()=>e.MobileLLMPreTrainedModel,MobileNetV1FeatureExtractor:()=>w.MobileNetV1FeatureExtractor,MobileNetV1ForImageClassification:()=>e.MobileNetV1ForImageClassification,MobileNetV1ForSemanticSegmentation:()=>e.MobileNetV1ForSemanticSegmentation,MobileNetV1ImageProcessor:()=>w.MobileNetV1ImageProcessor,MobileNetV1Model:()=>e.MobileNetV1Model,MobileNetV1PreTrainedModel:()=>e.MobileNetV1PreTrainedModel,MobileNetV2FeatureExtractor:()=>w.MobileNetV2FeatureExtractor,MobileNetV2ForImageClassification:()=>e.MobileNetV2ForImageClassification,MobileNetV2ForSemanticSegmentation:()=>e.MobileNetV2ForSemanticSegmentation,MobileNetV2ImageProcessor:()=>w.MobileNetV2ImageProcessor,MobileNetV2Model
:()=>e.MobileNetV2Model,MobileNetV2PreTrainedModel:()=>e.MobileNetV2PreTrainedModel,MobileNetV3FeatureExtractor:()=>w.MobileNetV3FeatureExtractor,MobileNetV3ForImageClassification:()=>e.MobileNetV3ForImageClassification,MobileNetV3ForSemanticSegmentation:()=>e.MobileNetV3ForSemanticSegmentation,MobileNetV3ImageProcessor:()=>w.MobileNetV3ImageProcessor,MobileNetV3Model:()=>e.MobileNetV3Model,MobileNetV3PreTrainedModel:()=>e.MobileNetV3PreTrainedModel,MobileNetV4FeatureExtractor:()=>w.MobileNetV4FeatureExtractor,MobileNetV4ForImageClassification:()=>e.MobileNetV4ForImageClassification,MobileNetV4ForSemanticSegmentation:()=>e.MobileNetV4ForSemanticSegmentation,MobileNetV4ImageProcessor:()=>w.MobileNetV4ImageProcessor,MobileNetV4Model:()=>e.MobileNetV4Model,MobileNetV4PreTrainedModel:()=>e.MobileNetV4PreTrainedModel,MobileViTFeatureExtractor:()=>w.MobileViTFeatureExtractor,MobileViTForImageClassification:()=>e.MobileViTForImageClassification,MobileViTImageProcessor:()=>w.MobileViTImageProcessor,MobileViTModel:()=>e.MobileViTModel,MobileViTPreTrainedModel:()=>e.MobileViTPreTrainedModel,MobileViTV2ForImageClassification:()=>e.MobileViTV2ForImageClassification,MobileViTV2Model:()=>e.MobileViTV2Model,MobileViTV2PreTrainedModel:()=>e.MobileViTV2PreTrainedModel,ModelOutput:()=>e.ModelOutput,ModernBertDecoderForCausalLM:()=>e.ModernBertDecoderForCausalLM,ModernBertDecoderModel:()=>e.ModernBertDecoderModel,ModernBertDecoderPreTrainedModel:()=>e.ModernBertDecoderPreTrainedModel,ModernBertForMaskedLM:()=>e.ModernBertForMaskedLM,ModernBertForSequenceClassification:()=>e.ModernBertForSequenceClassification,ModernBertForTokenClassification:()=>e.ModernBertForTokenClassification,ModernBertModel:()=>e.ModernBertModel,ModernBertPreTrainedModel:()=>e.ModernBertPreTrainedModel,Moondream1ForConditionalGeneration:()=>e.Moondream1ForConditionalGeneration,MoonshineFeatureExtractor:()=>_.MoonshineFeatureExtractor,MoonshineForConditionalGeneration:()=>e.MoonshineForConditionalGeneration,Moonsh
ineModel:()=>e.MoonshineModel,MoonshinePreTrainedModel:()=>e.MoonshinePreTrainedModel,MoonshineProcessor:()=>b.MoonshineProcessor,MptForCausalLM:()=>e.MptForCausalLM,MptModel:()=>e.MptModel,MptPreTrainedModel:()=>e.MptPreTrainedModel,MultiModalityCausalLM:()=>e.MultiModalityCausalLM,MultiModalityPreTrainedModel:()=>e.MultiModalityPreTrainedModel,MusicgenForCausalLM:()=>e.MusicgenForCausalLM,MusicgenForConditionalGeneration:()=>e.MusicgenForConditionalGeneration,MusicgenModel:()=>e.MusicgenModel,MusicgenPreTrainedModel:()=>e.MusicgenPreTrainedModel,NanoChatForCausalLM:()=>e.NanoChatForCausalLM,NanoChatModel:()=>e.NanoChatModel,NanoChatPreTrainedModel:()=>e.NanoChatPreTrainedModel,NeoBertForMaskedLM:()=>e.NeoBertForMaskedLM,NeoBertForQuestionAnswering:()=>e.NeoBertForQuestionAnswering,NeoBertForSequenceClassification:()=>e.NeoBertForSequenceClassification,NeoBertForTokenClassification:()=>e.NeoBertForTokenClassification,NeoBertModel:()=>e.NeoBertModel,NeoBertPreTrainedModel:()=>e.NeoBertPreTrainedModel,NllbTokenizer:()=>i.NllbTokenizer,NoBadWordsLogitsProcessor:()=>M.NoBadWordsLogitsProcessor,NoRepeatNGramLogitsProcessor:()=>M.NoRepeatNGramLogitsProcessor,NomicBertModel:()=>e.NomicBertModel,NomicBertPreTrainedModel:()=>e.NomicBertPreTrainedModel,NougatImageProcessor:()=>w.NougatImageProcessor,NougatTokenizer:()=>i.NougatTokenizer,OPTForCausalLM:()=>e.OPTForCausalLM,OPTModel:()=>e.OPTModel,OPTPreTrainedModel:()=>e.OPTPreTrainedModel,ObjectDetectionPipeline:()=>a.ObjectDetectionPipeline,Olmo2ForCausalLM:()=>e.Olmo2ForCausalLM,Olmo2Model:()=>e.Olmo2Model,Olmo2PreTrainedModel:()=>e.Olmo2PreTrainedModel,OlmoForCausalLM:()=>e.OlmoForCausalLM,OlmoModel:()=>e.OlmoModel,OlmoPreTrainedModel:()=>e.OlmoPreTrainedModel,OpenELMForCausalLM:()=>e.OpenELMForCausalLM,OpenELMModel:()=>e.OpenELMModel,OpenELMPreTrainedModel:()=>e.OpenELMPreTrainedModel,OwlViTFeatureExtractor:()=>w.OwlViTFeatureExtractor,OwlViTForObjectDetection:()=>e.OwlViTForObjectDetection,OwlViTImageProcessor:()=>w.Owl
ViTImageProcessor,OwlViTModel:()=>e.OwlViTModel,OwlViTPreTrainedModel:()=>e.OwlViTPreTrainedModel,OwlViTProcessor:()=>b.OwlViTProcessor,Owlv2ForObjectDetection:()=>e.Owlv2ForObjectDetection,Owlv2ImageProcessor:()=>w.Owlv2ImageProcessor,Owlv2Model:()=>e.Owlv2Model,Owlv2PreTrainedModel:()=>e.Owlv2PreTrainedModel,PaliGemmaForConditionalGeneration:()=>e.PaliGemmaForConditionalGeneration,PaliGemmaPreTrainedModel:()=>e.PaliGemmaPreTrainedModel,PaliGemmaProcessor:()=>b.PaliGemmaProcessor,ParakeetFeatureExtractor:()=>_.ParakeetFeatureExtractor,ParakeetForCTC:()=>e.ParakeetForCTC,ParakeetPreTrainedModel:()=>e.ParakeetPreTrainedModel,PatchTSMixerForPrediction:()=>e.PatchTSMixerForPrediction,PatchTSMixerModel:()=>e.PatchTSMixerModel,PatchTSMixerPreTrainedModel:()=>e.PatchTSMixerPreTrainedModel,PatchTSTForPrediction:()=>e.PatchTSTForPrediction,PatchTSTModel:()=>e.PatchTSTModel,PatchTSTPreTrainedModel:()=>e.PatchTSTPreTrainedModel,Phi3ForCausalLM:()=>e.Phi3ForCausalLM,Phi3Model:()=>e.Phi3Model,Phi3PreTrainedModel:()=>e.Phi3PreTrainedModel,Phi3VForCausalLM:()=>e.Phi3VForCausalLM,Phi3VImageProcessor:()=>w.Phi3VImageProcessor,Phi3VPreTrainedModel:()=>e.Phi3VPreTrainedModel,Phi3VProcessor:()=>b.Phi3VProcessor,PhiForCausalLM:()=>e.PhiForCausalLM,PhiModel:()=>e.PhiModel,PhiPreTrainedModel:()=>e.PhiPreTrainedModel,Pipeline:()=>a.Pipeline,PixtralImageProcessor:()=>w.PixtralImageProcessor,PixtralProcessor:()=>b.PixtralProcessor,PreTrainedModel:()=>e.PreTrainedModel,PreTrainedTokenizer:()=>i.PreTrainedTokenizer,PretrainedConfig:()=>d.PretrainedConfig,PretrainedMixin:()=>e.PretrainedMixin,Processor:()=>G.Processor,PvtForImageClassification:()=>e.PvtForImageClassification,PvtImageProcessor:()=>w.PvtImageProcessor,PvtModel:()=>e.PvtModel,PvtPreTrainedModel:()=>e.PvtPreTrainedModel,PyAnnoteFeatureExtractor:()=>_.PyAnnoteFeatureExtractor,PyAnnoteForAudioFrameClassification:()=>e.PyAnnoteForAudioFrameClassification,PyAnnoteModel:()=>e.PyAnnoteModel,PyAnnotePreTrainedModel:()=>e.PyAnnotePreTrain
edModel,PyAnnoteProcessor:()=>b.PyAnnoteProcessor,QuestionAnsweringModelOutput:()=>e.QuestionAnsweringModelOutput,QuestionAnsweringPipeline:()=>a.QuestionAnsweringPipeline,Qwen2ForCausalLM:()=>e.Qwen2ForCausalLM,Qwen2Model:()=>e.Qwen2Model,Qwen2PreTrainedModel:()=>e.Qwen2PreTrainedModel,Qwen2Tokenizer:()=>i.Qwen2Tokenizer,Qwen2VLForConditionalGeneration:()=>e.Qwen2VLForConditionalGeneration,Qwen2VLImageProcessor:()=>w.Qwen2VLImageProcessor,Qwen2VLPreTrainedModel:()=>e.Qwen2VLPreTrainedModel,Qwen2VLProcessor:()=>b.Qwen2VLProcessor,Qwen3ForCausalLM:()=>e.Qwen3ForCausalLM,Qwen3Model:()=>e.Qwen3Model,Qwen3PreTrainedModel:()=>e.Qwen3PreTrainedModel,RFDetrForObjectDetection:()=>e.RFDetrForObjectDetection,RFDetrModel:()=>e.RFDetrModel,RFDetrObjectDetectionOutput:()=>e.RFDetrObjectDetectionOutput,RFDetrPreTrainedModel:()=>e.RFDetrPreTrainedModel,RTDetrForObjectDetection:()=>e.RTDetrForObjectDetection,RTDetrImageProcessor:()=>w.RTDetrImageProcessor,RTDetrModel:()=>e.RTDetrModel,RTDetrObjectDetectionOutput:()=>e.RTDetrObjectDetectionOutput,RTDetrPreTrainedModel:()=>e.RTDetrPreTrainedModel,RTDetrV2ForObjectDetection:()=>e.RTDetrV2ForObjectDetection,RTDetrV2Model:()=>e.RTDetrV2Model,RTDetrV2ObjectDetectionOutput:()=>e.RTDetrV2ObjectDetectionOutput,RTDetrV2PreTrainedModel:()=>e.RTDetrV2PreTrainedModel,RawAudio:()=>g.RawAudio,RawImage:()=>I.RawImage,RawVideo:()=>f.RawVideo,RawVideoFrame:()=>f.RawVideoFrame,RepetitionPenaltyLogitsProcessor:()=>M.RepetitionPenaltyLogitsProcessor,ResNetForImageClassification:()=>e.ResNetForImageClassification,ResNetModel:()=>e.ResNetModel,ResNetPreTrainedModel:()=>e.ResNetPreTrainedModel,RoFormerForMaskedLM:()=>e.RoFormerForMaskedLM,RoFormerForQuestionAnswering:()=>e.RoFormerForQuestionAnswering,RoFormerForSequenceClassification:()=>e.RoFormerForSequenceClassification,RoFormerForTokenClassification:()=>e.RoFormerForTokenClassification,RoFormerModel:()=>e.RoFormerModel,RoFormerPreTrainedModel:()=>e.RoFormerPreTrainedModel,RoFormerTokenizer:()=>i.RoFo
rmerTokenizer,RobertaForMaskedLM:()=>e.RobertaForMaskedLM,RobertaForQuestionAnswering:()=>e.RobertaForQuestionAnswering,RobertaForSequenceClassification:()=>e.RobertaForSequenceClassification,RobertaForTokenClassification:()=>e.RobertaForTokenClassification,RobertaModel:()=>e.RobertaModel,RobertaPreTrainedModel:()=>e.RobertaPreTrainedModel,RobertaTokenizer:()=>i.RobertaTokenizer,Sam2ImageProcessor:()=>w.Sam2ImageProcessor,Sam2ImageSegmentationOutput:()=>e.Sam2ImageSegmentationOutput,Sam2Model:()=>e.Sam2Model,Sam2PreTrainedModel:()=>e.Sam2PreTrainedModel,Sam2Processor:()=>b.Sam2Processor,Sam2VideoProcessor:()=>b.Sam2VideoProcessor,Sam3ImageProcessor:()=>w.Sam3ImageProcessor,Sam3TrackerModel:()=>e.Sam3TrackerModel,SamImageProcessor:()=>w.SamImageProcessor,SamImageSegmentationOutput:()=>e.SamImageSegmentationOutput,SamModel:()=>e.SamModel,SamPreTrainedModel:()=>e.SamPreTrainedModel,SamProcessor:()=>b.SamProcessor,SapiensForDepthEstimation:()=>e.SapiensForDepthEstimation,SapiensForNormalEstimation:()=>e.SapiensForNormalEstimation,SapiensForSemanticSegmentation:()=>e.SapiensForSemanticSegmentation,SapiensPreTrainedModel:()=>e.SapiensPreTrainedModel,SeamlessM4TFeatureExtractor:()=>_.SeamlessM4TFeatureExtractor,SegformerFeatureExtractor:()=>w.SegformerFeatureExtractor,SegformerForImageClassification:()=>e.SegformerForImageClassification,SegformerForSemanticSegmentation:()=>e.SegformerForSemanticSegmentation,SegformerImageProcessor:()=>w.SegformerImageProcessor,SegformerModel:()=>e.SegformerModel,SegformerPreTrainedModel:()=>e.SegformerPreTrainedModel,Seq2SeqLMOutput:()=>e.Seq2SeqLMOutput,SequenceClassifierOutput:()=>e.SequenceClassifierOutput,SiglipImageProcessor:()=>w.SiglipImageProcessor,SiglipModel:()=>e.SiglipModel,SiglipPreTrainedModel:()=>e.SiglipPreTrainedModel,SiglipTextModel:()=>e.SiglipTextModel,SiglipTokenizer:()=>i.SiglipTokenizer,SiglipVisionModel:()=>e.SiglipVisionModel,SmolLM3ForCausalLM:()=>e.SmolLM3ForCausalLM,SmolLM3Model:()=>e.SmolLM3Model,SmolLM3PreTrai
nedModel:()=>e.SmolLM3PreTrainedModel,SmolVLMForConditionalGeneration:()=>e.SmolVLMForConditionalGeneration,SmolVLMImageProcessor:()=>w.SmolVLMImageProcessor,SmolVLMProcessor:()=>b.SmolVLMProcessor,SnacDecoderModel:()=>e.SnacDecoderModel,SnacEncoderModel:()=>e.SnacEncoderModel,SnacFeatureExtractor:()=>_.SnacFeatureExtractor,SnacModel:()=>e.SnacModel,SnacPreTrainedModel:()=>e.SnacPreTrainedModel,SpeechT5FeatureExtractor:()=>_.SpeechT5FeatureExtractor,SpeechT5ForSpeechToText:()=>e.SpeechT5ForSpeechToText,SpeechT5ForTextToSpeech:()=>e.SpeechT5ForTextToSpeech,SpeechT5HifiGan:()=>e.SpeechT5HifiGan,SpeechT5Model:()=>e.SpeechT5Model,SpeechT5PreTrainedModel:()=>e.SpeechT5PreTrainedModel,SpeechT5Processor:()=>b.SpeechT5Processor,SpeechT5Tokenizer:()=>i.SpeechT5Tokenizer,SqueezeBertForMaskedLM:()=>e.SqueezeBertForMaskedLM,SqueezeBertForQuestionAnswering:()=>e.SqueezeBertForQuestionAnswering,SqueezeBertForSequenceClassification:()=>e.SqueezeBertForSequenceClassification,SqueezeBertModel:()=>e.SqueezeBertModel,SqueezeBertPreTrainedModel:()=>e.SqueezeBertPreTrainedModel,SqueezeBertTokenizer:()=>i.SqueezeBertTokenizer,StableLmForCausalLM:()=>e.StableLmForCausalLM,StableLmModel:()=>e.StableLmModel,StableLmPreTrainedModel:()=>e.StableLmPreTrainedModel,Starcoder2ForCausalLM:()=>e.Starcoder2ForCausalLM,Starcoder2Model:()=>e.Starcoder2Model,Starcoder2PreTrainedModel:()=>e.Starcoder2PreTrainedModel,StoppingCriteria:()=>P.StoppingCriteria,StoppingCriteriaList:()=>P.StoppingCriteriaList,StyleTextToSpeech2Model:()=>e.StyleTextToSpeech2Model,StyleTextToSpeech2PreTrainedModel:()=>e.StyleTextToSpeech2PreTrainedModel,SummarizationPipeline:()=>a.SummarizationPipeline,SupertonicForConditionalGeneration:()=>e.SupertonicForConditionalGeneration,SupertonicPreTrainedModel:()=>e.SupertonicPreTrainedModel,SuppressTokensAtBeginLogitsProcessor:()=>M.SuppressTokensAtBeginLogitsProcessor,Swin2SRForImageSuperResolution:()=>e.Swin2SRForImageSuperResolution,Swin2SRImageProcessor:()=>w.Swin2SRImageProcessor,
Swin2SRModel:()=>e.Swin2SRModel,Swin2SRPreTrainedModel:()=>e.Swin2SRPreTrainedModel,SwinForImageClassification:()=>e.SwinForImageClassification,SwinForSemanticSegmentation:()=>e.SwinForSemanticSegmentation,SwinModel:()=>e.SwinModel,SwinPreTrainedModel:()=>e.SwinPreTrainedModel,T5ForConditionalGeneration:()=>e.T5ForConditionalGeneration,T5Model:()=>e.T5Model,T5PreTrainedModel:()=>e.T5PreTrainedModel,T5Tokenizer:()=>i.T5Tokenizer,TableTransformerForObjectDetection:()=>e.TableTransformerForObjectDetection,TableTransformerModel:()=>e.TableTransformerModel,TableTransformerObjectDetectionOutput:()=>e.TableTransformerObjectDetectionOutput,TableTransformerPreTrainedModel:()=>e.TableTransformerPreTrainedModel,TemperatureLogitsWarper:()=>M.TemperatureLogitsWarper,Tensor:()=>u.Tensor,Text2TextGenerationPipeline:()=>a.Text2TextGenerationPipeline,TextClassificationPipeline:()=>a.TextClassificationPipeline,TextGenerationPipeline:()=>a.TextGenerationPipeline,TextStreamer:()=>B.TextStreamer,TextToAudioPipeline:()=>a.TextToAudioPipeline,TokenClassificationPipeline:()=>a.TokenClassificationPipeline,TokenClassifierOutput:()=>e.TokenClassifierOutput,TokenizerModel:()=>i.TokenizerModel,TopKLogitsWarper:()=>M.TopKLogitsWarper,TopPLogitsWarper:()=>M.TopPLogitsWarper,TrOCRForCausalLM:()=>e.TrOCRForCausalLM,TrOCRPreTrainedModel:()=>e.TrOCRPreTrainedModel,TranslationPipeline:()=>a.TranslationPipeline,UltravoxModel:()=>e.UltravoxModel,UltravoxPreTrainedModel:()=>e.UltravoxPreTrainedModel,UltravoxProcessor:()=>b.UltravoxProcessor,UniSpeechForCTC:()=>e.UniSpeechForCTC,UniSpeechForSequenceClassification:()=>e.UniSpeechForSequenceClassification,UniSpeechModel:()=>e.UniSpeechModel,UniSpeechPreTrainedModel:()=>e.UniSpeechPreTrainedModel,UniSpeechSatForAudioFrameClassification:()=>e.UniSpeechSatForAudioFrameClassification,UniSpeechSatForCTC:()=>e.UniSpeechSatForCTC,UniSpeechSatForSequenceClassification:()=>e.UniSpeechSatForSequenceClassification,UniSpeechSatModel:()=>e.UniSpeechSatModel,UniSpeechSat
PreTrainedModel:()=>e.UniSpeechSatPreTrainedModel,VLChatProcessor:()=>b.VLChatProcessor,VLMImageProcessor:()=>w.VLMImageProcessor,VaultGemmaForCausalLM:()=>e.VaultGemmaForCausalLM,VaultGemmaModel:()=>e.VaultGemmaModel,VaultGemmaPreTrainedModel:()=>e.VaultGemmaPreTrainedModel,ViTFeatureExtractor:()=>w.ViTFeatureExtractor,ViTForImageClassification:()=>e.ViTForImageClassification,ViTImageProcessor:()=>w.ViTImageProcessor,ViTMAEModel:()=>e.ViTMAEModel,ViTMAEPreTrainedModel:()=>e.ViTMAEPreTrainedModel,ViTMSNForImageClassification:()=>e.ViTMSNForImageClassification,ViTMSNModel:()=>e.ViTMSNModel,ViTMSNPreTrainedModel:()=>e.ViTMSNPreTrainedModel,ViTModel:()=>e.ViTModel,ViTPreTrainedModel:()=>e.ViTPreTrainedModel,VisionEncoderDecoderModel:()=>e.VisionEncoderDecoderModel,VitMatteForImageMatting:()=>e.VitMatteForImageMatting,VitMatteImageProcessor:()=>w.VitMatteImageProcessor,VitMattePreTrainedModel:()=>e.VitMattePreTrainedModel,VitPoseForPoseEstimation:()=>e.VitPoseForPoseEstimation,VitPoseImageProcessor:()=>w.VitPoseImageProcessor,VitPosePreTrainedModel:()=>e.VitPosePreTrainedModel,VitsModel:()=>e.VitsModel,VitsModelOutput:()=>e.VitsModelOutput,VitsPreTrainedModel:()=>e.VitsPreTrainedModel,VitsTokenizer:()=>i.VitsTokenizer,VoxtralForConditionalGeneration:()=>e.VoxtralForConditionalGeneration,VoxtralProcessor:()=>b.VoxtralProcessor,Wav2Vec2BertForCTC:()=>e.Wav2Vec2BertForCTC,Wav2Vec2BertForSequenceClassification:()=>e.Wav2Vec2BertForSequenceClassification,Wav2Vec2BertModel:()=>e.Wav2Vec2BertModel,Wav2Vec2BertPreTrainedModel:()=>e.Wav2Vec2BertPreTrainedModel,Wav2Vec2CTCTokenizer:()=>i.Wav2Vec2CTCTokenizer,Wav2Vec2FeatureExtractor:()=>_.Wav2Vec2FeatureExtractor,Wav2Vec2ForAudioFrameClassification:()=>e.Wav2Vec2ForAudioFrameClassification,Wav2Vec2ForCTC:()=>e.Wav2Vec2ForCTC,Wav2Vec2ForSequenceClassification:()=>e.Wav2Vec2ForSequenceClassification,Wav2Vec2Model:()=>e.Wav2Vec2Model,Wav2Vec2PreTrainedModel:()=>e.Wav2Vec2PreTrainedModel,Wav2Vec2Processor:()=>b.Wav2Vec2Processor,Wav2
Vec2ProcessorWithLM:()=>b.Wav2Vec2ProcessorWithLM,WavLMForAudioFrameClassification:()=>e.WavLMForAudioFrameClassification,WavLMForCTC:()=>e.WavLMForCTC,WavLMForSequenceClassification:()=>e.WavLMForSequenceClassification,WavLMForXVector:()=>e.WavLMForXVector,WavLMModel:()=>e.WavLMModel,WavLMPreTrainedModel:()=>e.WavLMPreTrainedModel,WeSpeakerFeatureExtractor:()=>_.WeSpeakerFeatureExtractor,WeSpeakerResNetModel:()=>e.WeSpeakerResNetModel,WeSpeakerResNetPreTrainedModel:()=>e.WeSpeakerResNetPreTrainedModel,WhisperFeatureExtractor:()=>_.WhisperFeatureExtractor,WhisperForConditionalGeneration:()=>e.WhisperForConditionalGeneration,WhisperModel:()=>e.WhisperModel,WhisperPreTrainedModel:()=>e.WhisperPreTrainedModel,WhisperProcessor:()=>b.WhisperProcessor,WhisperTextStreamer:()=>B.WhisperTextStreamer,WhisperTimeStampLogitsProcessor:()=>M.WhisperTimeStampLogitsProcessor,WhisperTokenizer:()=>i.WhisperTokenizer,XLMForQuestionAnswering:()=>e.XLMForQuestionAnswering,XLMForSequenceClassification:()=>e.XLMForSequenceClassification,XLMForTokenClassification:()=>e.XLMForTokenClassification,XLMModel:()=>e.XLMModel,XLMPreTrainedModel:()=>e.XLMPreTrainedModel,XLMRobertaForMaskedLM:()=>e.XLMRobertaForMaskedLM,XLMRobertaForQuestionAnswering:()=>e.XLMRobertaForQuestionAnswering,XLMRobertaForSequenceClassification:()=>e.XLMRobertaForSequenceClassification,XLMRobertaForTokenClassification:()=>e.XLMRobertaForTokenClassification,XLMRobertaModel:()=>e.XLMRobertaModel,XLMRobertaPreTrainedModel:()=>e.XLMRobertaPreTrainedModel,XLMRobertaTokenizer:()=>i.XLMRobertaTokenizer,XLMTokenizer:()=>i.XLMTokenizer,XLMWithLMHeadModel:()=>e.XLMWithLMHeadModel,XVectorOutput:()=>e.XVectorOutput,YolosFeatureExtractor:()=>w.YolosFeatureExtractor,YolosForObjectDetection:()=>e.YolosForObjectDetection,YolosImageProcessor:()=>w.YolosImageProcessor,YolosModel:()=>e.YolosModel,YolosObjectDetectionOutput:()=>e.YolosObjectDetectionOutput,YolosPreTrainedModel:()=>e.YolosPreTrainedModel,ZeroShotAudioClassificationPipeline:()
=>a.ZeroShotAudioClassificationPipeline,ZeroShotClassificationPipeline:()=>a.ZeroShotClassificationPipeline,ZeroShotImageClassificationPipeline:()=>a.ZeroShotImageClassificationPipeline,ZeroShotObjectDetectionPipeline:()=>a.ZeroShotObjectDetectionPipeline,bankers_round:()=>m.bankers_round,cat:()=>u.cat,cos_sim:()=>m.cos_sim,dot:()=>m.dot,dynamic_time_warping:()=>m.dynamic_time_warping,env:()=>D.env,full:()=>u.full,full_like:()=>u.full_like,getCacheShapes:()=>d.getCacheShapes,hamming:()=>g.hamming,hanning:()=>g.hanning,interpolate:()=>u.interpolate,interpolate_4d:()=>u.interpolate_4d,interpolate_data:()=>m.interpolate_data,is_chinese_char:()=>i.is_chinese_char,layer_norm:()=>u.layer_norm,load_image:()=>I.load_image,load_video:()=>f.load_video,log_softmax:()=>m.log_softmax,magnitude:()=>m.magnitude,matmul:()=>u.matmul,max:()=>m.max,mean:()=>u.mean,mean_pooling:()=>u.mean_pooling,medianFilter:()=>m.medianFilter,mel_filter_bank:()=>g.mel_filter_bank,min:()=>m.min,ones:()=>u.ones,ones_like:()=>u.ones_like,permute:()=>u.permute,permute_data:()=>m.permute_data,pipeline:()=>a.pipeline,quantize_embeddings:()=>u.quantize_embeddings,rand:()=>u.rand,randn:()=>u.randn,read_audio:()=>g.read_audio,rfft:()=>u.rfft,round:()=>m.round,slice:()=>u.slice,softmax:()=>m.softmax,spectrogram:()=>g.spectrogram,stack:()=>u.stack,std_mean:()=>u.std_mean,topk:()=>u.topk,window_function:()=>g.window_function,zeros:()=>u.zeros,zeros_like:()=>u.zeros_like});var 
D=mt("./src/env.js"),a=mt("./src/pipelines.js"),e=mt("./src/models.js"),i=mt("./src/tokenizers.js"),d=mt("./src/configs.js"),g=mt("./src/utils/audio.js"),I=mt("./src/utils/image.js"),f=mt("./src/utils/video.js"),u=mt("./src/utils/tensor.js"),m=mt("./src/utils/maths.js"),T=mt("./src/base/feature_extraction_utils.js"),_=mt("./src/models/feature_extractors.js"),o=mt("./src/models/auto/feature_extraction_auto.js"),x=mt("./src/base/image_processors_utils.js"),w=mt("./src/models/image_processors.js"),k=mt("./src/models/auto/image_processing_auto.js"),G=mt("./src/base/processing_utils.js"),b=mt("./src/models/processors.js"),C=mt("./src/models/auto/processing_auto.js"),B=mt("./src/generation/streamers.js"),P=mt("./src/generation/stopping_criteria.js"),M=mt("./src/generation/logits_process.js")})();mm=t.ASTFeatureExtractor,hm=t.ASTForAudioClassification,Mm=t.ASTModel,fm=t.ASTPreTrainedModel,gm=t.AlbertForMaskedLM,Pm=t.AlbertForQuestionAnswering,Tm=t.AlbertForSequenceClassification,wm=t.AlbertModel,bm=t.AlbertPreTrainedModel,xm=t.AlbertTokenizer,vm=t.ArceeForCausalLM,Em=t.ArceeModel,Fm=t.ArceePreTrainedModel,Cm=t.AudioClassificationPipeline,km=t.AutoConfig,ym=t.AutoFeatureExtractor,Sm=t.AutoImageProcessor,Am=t.AutoModel,Lm=t.AutoModelForAudioClassification,Dm=t.AutoModelForAudioFrameClassification,Im=t.AutoModelForAudioTextToText,Om=t.AutoModelForCTC,Bm=t.AutoModelForCausalLM,jm=t.AutoModelForDepthEstimation,Nm=t.AutoModelForDocumentQuestionAnswering,Rm=t.AutoModelForImageClassification,Vm=t.AutoModelForImageFeatureExtraction,zm=t.AutoModelForImageMatting,Gm=t.AutoModelForImageSegmentation,Wm=t.AutoModelForImageTextToText,Um=t.AutoModelForImageToImage,$m=t.AutoModelForMaskGeneration,Km=t.AutoModelForMaskedLM,Qm=t.AutoModelForNormalEstimation,Xm=t.AutoModelForObjectDetection,Hm=t.AutoModelForPoseEstimation,Jm=t.AutoModelForQuestionAnswering,Ym=t.AutoModelForSemanticSegmentation,qm=t.AutoModelForSeq2SeqLM,Zm=t.AutoModelForSequenceClassification,eh=t.AutoModelForSpeechSeq2Seq,th
=t.AutoModelForTextToSpectrogram,sh=t.AutoModelForTextToWaveform,rh=t.AutoModelForTokenClassification,oh=t.AutoModelForUniversalSegmentation,ah=t.AutoModelForVision2Seq,nh=t.AutoModelForXVector,ih=t.AutoModelForZeroShotObjectDetection,lh=t.AutoProcessor,ch=t.AutoTokenizer,_h=t.AutomaticSpeechRecognitionPipeline,dh=t.BackgroundRemovalPipeline,uh=t.BartForConditionalGeneration,ph=t.BartForSequenceClassification,mh=t.BartModel,hh=t.BartPretrainedModel,Mh=t.BartTokenizer,fh=t.BaseModelOutput,gh=t.BaseStreamer,Ph=t.BeitFeatureExtractor,Th=t.BeitForImageClassification,wh=t.BeitModel,bh=t.BeitPreTrainedModel,xh=t.BertForMaskedLM,vh=t.BertForQuestionAnswering,Eh=t.BertForSequenceClassification,Fh=t.BertForTokenClassification,Ch=t.BertModel,kh=t.BertPreTrainedModel,yh=t.BertTokenizer,Sh=t.BitImageProcessor,Ah=t.BlenderbotForConditionalGeneration,Lh=t.BlenderbotModel,Dh=t.BlenderbotPreTrainedModel,Ih=t.BlenderbotSmallForConditionalGeneration,Oh=t.BlenderbotSmallModel,Bh=t.BlenderbotSmallPreTrainedModel,jh=t.BlenderbotSmallTokenizer,Nh=t.BlenderbotTokenizer,Rh=t.BloomForCausalLM,Vh=t.BloomModel,zh=t.BloomPreTrainedModel,Gh=t.BloomTokenizer,Wh=t.CLIPFeatureExtractor,Uh=t.CLIPImageProcessor,$h=t.CLIPModel,Kh=t.CLIPPreTrainedModel,Qh=t.CLIPSegForImageSegmentation,Xh=t.CLIPSegModel,Hh=t.CLIPSegPreTrainedModel,Jh=t.CLIPTextModel,Yh=t.CLIPTextModelWithProjection,qh=t.CLIPTokenizer,Zh=t.CLIPVisionModel,eM=t.CLIPVisionModelWithProjection,tM=t.CamembertForMaskedLM,sM=t.CamembertForQuestionAnswering,rM=t.CamembertForSequenceClassification,oM=t.CamembertForTokenClassification,aM=t.CamembertModel,nM=t.CamembertPreTrainedModel,iM=t.CamembertTokenizer,lM=t.CausalLMOutput,cM=t.CausalLMOutputWithPast,_M=t.ChineseCLIPFeatureExtractor,dM=t.ChineseCLIPModel,uM=t.ChineseCLIPPreTrainedModel,pM=t.ClapAudioModelWithProjection,mM=t.ClapFeatureExtractor,hM=t.ClapModel,MM=t.ClapPreTrainedModel,fM=t.ClapTextModelWithProjection,gM=t.ClassifierFreeGuidanceLogitsProcessor,PM=t.CodeGenForCausalLM,TM=t.CodeG
enModel,wM=t.CodeGenPreTrainedModel,bM=t.CodeGenTokenizer,xM=t.CodeLlamaTokenizer,vM=t.CohereForCausalLM,EM=t.CohereModel,FM=t.CoherePreTrainedModel,CM=t.CohereTokenizer,kM=t.ConvBertForMaskedLM,yM=t.ConvBertForQuestionAnswering,SM=t.ConvBertForSequenceClassification,AM=t.ConvBertForTokenClassification,LM=t.ConvBertModel,DM=t.ConvBertPreTrainedModel,IM=t.ConvBertTokenizer,OM=t.ConvNextFeatureExtractor,BM=t.ConvNextForImageClassification,jM=t.ConvNextImageProcessor,NM=t.ConvNextModel,RM=t.ConvNextPreTrainedModel,VM=t.ConvNextV2ForImageClassification,zM=t.ConvNextV2Model,GM=t.ConvNextV2PreTrainedModel,WM=t.DFineForObjectDetection,UM=t.DFineModel,$M=t.DFinePreTrainedModel,KM=t.DINOv3ConvNextModel,QM=t.DINOv3ConvNextPreTrainedModel,XM=t.DINOv3ViTImageProcessor,HM=t.DINOv3ViTModel,JM=t.DINOv3ViTPreTrainedModel,YM=t.DPTFeatureExtractor,qM=t.DPTForDepthEstimation,ZM=t.DPTImageProcessor,ef=t.DPTModel,tf=t.DPTPreTrainedModel,sf=t.DacDecoderModel,rf=t.DacDecoderOutput,of=t.DacEncoderModel,af=t.DacEncoderOutput,nf=t.DacFeatureExtractor,lf=t.DacModel,cf=t.DacPreTrainedModel,_f=t.DataTypeMap,df=t.DebertaForMaskedLM,uf=t.DebertaForQuestionAnswering,pf=t.DebertaForSequenceClassification,mf=t.DebertaForTokenClassification,hf=t.DebertaModel,Mf=t.DebertaPreTrainedModel,ff=t.DebertaTokenizer,gf=t.DebertaV2ForMaskedLM,Pf=t.DebertaV2ForQuestionAnswering,Tf=t.DebertaV2ForSequenceClassification,wf=t.DebertaV2ForTokenClassification,bf=t.DebertaV2Model,xf=t.DebertaV2PreTrainedModel,vf=t.DebertaV2Tokenizer,Ef=t.DecisionTransformerModel,Ff=t.DecisionTransformerPreTrainedModel,Cf=t.DeiTFeatureExtractor,kf=t.DeiTForImageClassification,yf=t.DeiTImageProcessor,Sf=t.DeiTModel,Af=t.DeiTPreTrainedModel,Lf=t.DepthAnythingForDepthEstimation,Df=t.DepthAnythingPreTrainedModel,If=t.DepthEstimationPipeline,Of=t.DepthProForDepthEstimation,Bf=t.DepthProPreTrainedModel,jf=t.DetrFeatureExtractor,Nf=t.DetrForObjectDetection,Rf=t.DetrForSegmentation,Vf=t.DetrImageProcessor,zf=t.DetrModel,Gf=t.DetrObjectDetectio
nOutput,Wf=t.DetrPreTrainedModel,Uf=t.DetrSegmentationOutput,$f=t.Dinov2ForImageClassification,Kf=t.Dinov2Model,Qf=t.Dinov2PreTrainedModel,Xf=t.Dinov2WithRegistersForImageClassification,Hf=t.Dinov2WithRegistersModel,Jf=t.Dinov2WithRegistersPreTrainedModel,Yf=t.DistilBertForMaskedLM,qf=t.DistilBertForQuestionAnswering,Zf=t.DistilBertForSequenceClassification,eg=t.DistilBertForTokenClassification,tg=t.DistilBertModel,sg=t.DistilBertPreTrainedModel,rg=t.DistilBertTokenizer,og=t.DocumentQuestionAnsweringPipeline,ag=t.DonutFeatureExtractor,ng=t.DonutImageProcessor,ig=t.DonutSwinModel,lg=t.DonutSwinPreTrainedModel,cg=t.EdgeTamModel,_g=t.EfficientNetForImageClassification,dg=t.EfficientNetImageProcessor,ug=t.EfficientNetModel,pg=t.EfficientNetPreTrainedModel,mg=t.ElectraForMaskedLM,hg=t.ElectraForQuestionAnswering,Mg=t.ElectraForSequenceClassification,fg=t.ElectraForTokenClassification,gg=t.ElectraModel,Pg=t.ElectraPreTrainedModel,Tg=t.ElectraTokenizer,wg=t.EncodecFeatureExtractor,bg=t.EosTokenCriteria,xg=t.Ernie4_5ForCausalLM,vg=t.Ernie4_5Model,Eg=t.Ernie4_5PreTrainedModel,Fg=t.EsmForMaskedLM,Cg=t.EsmForSequenceClassification,kg=t.EsmForTokenClassification,yg=t.EsmModel,Sg=t.EsmPreTrainedModel,Ag=t.EsmTokenizer,Lg=t.ExaoneForCausalLM,Dg=t.ExaoneModel,Ig=t.ExaonePreTrainedModel,Og=t.FFT,Bg=t.FalconForCausalLM,jg=t.FalconModel,Ng=t.FalconPreTrainedModel,Rg=t.FalconTokenizer,Vg=t.FastViTForImageClassification,zg=t.FastViTModel,Gg=t.FastViTPreTrainedModel,Wg=t.FeatureExtractionPipeline,Ug=t.FeatureExtractor,$g=t.FillMaskPipeline,Kg=t.Florence2ForConditionalGeneration,Qg=t.Florence2PreTrainedModel,Xg=t.Florence2Processor,Hg=t.ForcedBOSTokenLogitsProcessor,Jg=t.ForcedEOSTokenLogitsProcessor,Yg=t.GLPNFeatureExtractor,qg=t.GLPNForDepthEstimation,Zg=t.GLPNModel,eP=t.GLPNPreTrainedModel,tP=t.GPT2LMHeadModel,sP=t.GPT2Model,rP=t.GPT2PreTrainedModel,oP=t.GPT2Tokenizer,aP=t.GPTBigCodeForCausalLM,nP=t.GPTBigCodeModel,iP=t.GPTBigCodePreTrainedModel,lP=t.GPTJForCausalLM,cP=t.GPTJModel,_P=
t.GPTJPreTrainedModel,dP=t.GPTNeoForCausalLM,uP=t.GPTNeoModel,pP=t.GPTNeoPreTrainedModel,mP=t.GPTNeoXForCausalLM,hP=t.GPTNeoXModel,MP=t.GPTNeoXPreTrainedModel,fP=t.GPTNeoXTokenizer,gP=t.Gemma2ForCausalLM,PP=t.Gemma2Model,TP=t.Gemma2PreTrainedModel,wP=t.Gemma3ForCausalLM,bP=t.Gemma3Model,xP=t.Gemma3PreTrainedModel,vP=t.Gemma3nAudioFeatureExtractor,EP=t.Gemma3nForConditionalGeneration,FP=t.Gemma3nPreTrainedModel,CP=t.Gemma3nProcessor,kP=t.GemmaForCausalLM,yP=t.GemmaModel,SP=t.GemmaPreTrainedModel,AP=t.GemmaTokenizer,LP=t.GlmForCausalLM,DP=t.GlmModel,IP=t.GlmPreTrainedModel,OP=t.GraniteForCausalLM,BP=t.GraniteModel,jP=t.GraniteMoeHybridForCausalLM,NP=t.GraniteMoeHybridModel,RP=t.GraniteMoeHybridPreTrainedModel,VP=t.GranitePreTrainedModel,zP=t.Grok1Tokenizer,GP=t.GroundingDinoForObjectDetection,WP=t.GroundingDinoImageProcessor,UP=t.GroundingDinoPreTrainedModel,$P=t.GroundingDinoProcessor,KP=t.GroupViTModel,QP=t.GroupViTPreTrainedModel,XP=t.HeliumForCausalLM,HP=t.HeliumModel,JP=t.HeliumPreTrainedModel,YP=t.HerbertTokenizer,qP=t.HieraForImageClassification,ZP=t.HieraModel,eT=t.HieraPreTrainedModel,tT=t.HubertForCTC,sT=t.HubertForSequenceClassification,rT=t.HubertModel,oT=t.HubertPreTrainedModel,aT=t.IJepaForImageClassification,nT=t.IJepaModel,iT=t.IJepaPreTrainedModel,lT=t.Idefics3ForConditionalGeneration,cT=t.Idefics3ImageProcessor,_T=t.Idefics3PreTrainedModel,dT=t.Idefics3Processor,uT=t.ImageClassificationPipeline,pT=t.ImageFeatureExtractionPipeline,mT=t.ImageFeatureExtractor,hT=t.ImageMattingOutput,MT=t.ImageProcessor,fT=t.ImageSegmentationPipeline,gT=t.ImageToImagePipeline,PT=t.ImageToTextPipeline,TT=t.InterruptableStoppingCriteria,wT=t.JAISLMHeadModel,bT=t.JAISModel,xT=t.JAISPreTrainedModel,vT=t.JinaCLIPImageProcessor,ET=t.JinaCLIPModel,FT=t.JinaCLIPPreTrainedModel,CT=t.JinaCLIPProcessor,kT=t.JinaCLIPTextModel,yT=t.JinaCLIPVisionModel,ST=t.Lfm2ForCausalLM,AT=t.Lfm2Model,LT=t.Lfm2PreTrainedModel,DT=t.LiteWhisperForConditionalGeneration,IT=t.Llama4ForCausalLM,OT=t.Llam
a4PreTrainedModel,BT=t.LlamaForCausalLM,jT=t.LlamaModel,NT=t.LlamaPreTrainedModel,RT=t.LlamaTokenizer,VT=t.LlavaForConditionalGeneration,zT=t.LlavaOnevisionForConditionalGeneration,GT=t.LlavaOnevisionImageProcessor,WT=t.LlavaPreTrainedModel,UT=t.LlavaProcessor,$T=t.LlavaQwen2ForCausalLM,KT=t.LogitsProcessor,QT=t.LogitsProcessorList,XT=t.LogitsWarper,HT=t.LongT5ForConditionalGeneration,JT=t.LongT5Model,YT=t.LongT5PreTrainedModel,qT=t.M2M100ForConditionalGeneration,ZT=t.M2M100Model,ew=t.M2M100PreTrainedModel,tw=t.M2M100Tokenizer,sw=t.MBart50Tokenizer,rw=t.MBartForCausalLM,ow=t.MBartForConditionalGeneration,aw=t.MBartForSequenceClassification,nw=t.MBartModel,iw=t.MBartPreTrainedModel,lw=t.MBartTokenizer,cw=t.MPNetForMaskedLM,_w=t.MPNetForQuestionAnswering,dw=t.MPNetForSequenceClassification,uw=t.MPNetForTokenClassification,pw=t.MPNetModel,mw=t.MPNetPreTrainedModel,hw=t.MPNetTokenizer,Mw=t.MT5ForConditionalGeneration,fw=t.MT5Model,gw=t.MT5PreTrainedModel,Pw=t.MarianMTModel,Tw=t.MarianModel,ww=t.MarianPreTrainedModel,bw=t.MarianTokenizer,xw=t.Mask2FormerImageProcessor,vw=t.MaskFormerFeatureExtractor,Ew=t.MaskFormerForInstanceSegmentation,Fw=t.MaskFormerImageProcessor,Cw=t.MaskFormerModel,kw=t.MaskFormerPreTrainedModel,yw=t.MaskedLMOutput,Sw=t.MaxLengthCriteria,Aw=t.Metric3DForDepthEstimation,Lw=t.Metric3DPreTrainedModel,Dw=t.Metric3Dv2ForDepthEstimation,Iw=t.Metric3Dv2PreTrainedModel,Ow=t.MgpstrForSceneTextRecognition,Bw=t.MgpstrModelOutput,jw=t.MgpstrPreTrainedModel,Nw=t.MgpstrProcessor,Rw=t.MgpstrTokenizer,Vw=t.MimiDecoderModel,zw=t.MimiDecoderOutput,Gw=t.MimiEncoderModel,Ww=t.MimiEncoderOutput,Uw=t.MimiModel,$w=t.MimiPreTrainedModel,Kw=t.MinLengthLogitsProcessor,Qw=t.MinNewTokensLengthLogitsProcessor,Xw=t.Ministral3ForCausalLM,Hw=t.Ministral3Model,Jw=t.Ministral3PreTrainedModel,Yw=t.MinistralForCausalLM,qw=t.MinistralModel,Zw=t.MinistralPreTrainedModel,eb=t.Mistral3ForConditionalGeneration,tb=t.MistralForCausalLM,sb=t.MistralModel,rb=t.MistralPreTrainedModel,ob=t.Mobi
leBertForMaskedLM,ab=t.MobileBertForQuestionAnswering,nb=t.MobileBertForSequenceClassification,ib=t.MobileBertModel,lb=t.MobileBertPreTrainedModel,cb=t.MobileBertTokenizer,_b=t.MobileLLMForCausalLM,db=t.MobileLLMModel,ub=t.MobileLLMPreTrainedModel,pb=t.MobileNetV1FeatureExtractor,mb=t.MobileNetV1ForImageClassification,hb=t.MobileNetV1ForSemanticSegmentation,Mb=t.MobileNetV1ImageProcessor,fb=t.MobileNetV1Model,gb=t.MobileNetV1PreTrainedModel,Pb=t.MobileNetV2FeatureExtractor,Tb=t.MobileNetV2ForImageClassification,wb=t.MobileNetV2ForSemanticSegmentation,bb=t.MobileNetV2ImageProcessor,xb=t.MobileNetV2Model,vb=t.MobileNetV2PreTrainedModel,Eb=t.MobileNetV3FeatureExtractor,Fb=t.MobileNetV3ForImageClassification,Cb=t.MobileNetV3ForSemanticSegmentation,kb=t.MobileNetV3ImageProcessor,yb=t.MobileNetV3Model,Sb=t.MobileNetV3PreTrainedModel,Ab=t.MobileNetV4FeatureExtractor,Lb=t.MobileNetV4ForImageClassification,Db=t.MobileNetV4ForSemanticSegmentation,Ib=t.MobileNetV4ImageProcessor,Ob=t.MobileNetV4Model,Bb=t.MobileNetV4PreTrainedModel,jb=t.MobileViTFeatureExtractor,Nb=t.MobileViTForImageClassification,Rb=t.MobileViTImageProcessor,Vb=t.MobileViTModel,zb=t.MobileViTPreTrainedModel,Gb=t.MobileViTV2ForImageClassification,Wb=t.MobileViTV2Model,Ub=t.MobileViTV2PreTrainedModel,$b=t.ModelOutput,Kb=t.ModernBertDecoderForCausalLM,Qb=t.ModernBertDecoderModel,Xb=t.ModernBertDecoderPreTrainedModel,Hb=t.ModernBertForMaskedLM,Jb=t.ModernBertForSequenceClassification,Yb=t.ModernBertForTokenClassification,qb=t.ModernBertModel,Zb=t.ModernBertPreTrainedModel,ex=t.Moondream1ForConditionalGeneration,tx=t.MoonshineFeatureExtractor,sx=t.MoonshineForConditionalGeneration,rx=t.MoonshineModel,ox=t.MoonshinePreTrainedModel,ax=t.MoonshineProcessor,nx=t.MptForCausalLM,ix=t.MptModel,lx=t.MptPreTrainedModel,cx=t.MultiModalityCausalLM,_x=t.MultiModalityPreTrainedModel,dx=t.MusicgenForCausalLM,ux=t.MusicgenForConditionalGeneration,px=t.MusicgenModel,mx=t.MusicgenPreTrainedModel,hx=t.NanoChatForCausalLM,Mx=t.NanoC
hatModel,fx=t.NanoChatPreTrainedModel,gx=t.NeoBertForMaskedLM,Px=t.NeoBertForQuestionAnswering,Tx=t.NeoBertForSequenceClassification,wx=t.NeoBertForTokenClassification,bx=t.NeoBertModel,xx=t.NeoBertPreTrainedModel,vx=t.NllbTokenizer,Ex=t.NoBadWordsLogitsProcessor,Fx=t.NoRepeatNGramLogitsProcessor,Cx=t.NomicBertModel,kx=t.NomicBertPreTrainedModel,yx=t.NougatImageProcessor,Sx=t.NougatTokenizer,Ax=t.OPTForCausalLM,Lx=t.OPTModel,Dx=t.OPTPreTrainedModel,Ix=t.ObjectDetectionPipeline,Ox=t.Olmo2ForCausalLM,Bx=t.Olmo2Model,jx=t.Olmo2PreTrainedModel,Nx=t.OlmoForCausalLM,Rx=t.OlmoModel,Vx=t.OlmoPreTrainedModel,zx=t.OpenELMForCausalLM,Gx=t.OpenELMModel,Wx=t.OpenELMPreTrainedModel,Ux=t.OwlViTFeatureExtractor,$x=t.OwlViTForObjectDetection,Kx=t.OwlViTImageProcessor,Qx=t.OwlViTModel,Xx=t.OwlViTPreTrainedModel,Hx=t.OwlViTProcessor,Jx=t.Owlv2ForObjectDetection,Yx=t.Owlv2ImageProcessor,qx=t.Owlv2Model,Zx=t.Owlv2PreTrainedModel,ev=t.PaliGemmaForConditionalGeneration,tv=t.PaliGemmaPreTrainedModel,sv=t.PaliGemmaProcessor,rv=t.ParakeetFeatureExtractor,ov=t.ParakeetForCTC,av=t.ParakeetPreTrainedModel,nv=t.PatchTSMixerForPrediction,iv=t.PatchTSMixerModel,lv=t.PatchTSMixerPreTrainedModel,cv=t.PatchTSTForPrediction,_v=t.PatchTSTModel,dv=t.PatchTSTPreTrainedModel,uv=t.Phi3ForCausalLM,pv=t.Phi3Model,mv=t.Phi3PreTrainedModel,hv=t.Phi3VForCausalLM,Mv=t.Phi3VImageProcessor,fv=t.Phi3VPreTrainedModel,gv=t.Phi3VProcessor,Pv=t.PhiForCausalLM,Tv=t.PhiModel,wv=t.PhiPreTrainedModel,bv=t.Pipeline,xv=t.PixtralImageProcessor,vv=t.PixtralProcessor,Ev=t.PreTrainedModel,Fv=t.PreTrainedTokenizer,Cv=t.PretrainedConfig,kv=t.PretrainedMixin,yv=t.Processor,Sv=t.PvtForImageClassification,Av=t.PvtImageProcessor,Lv=t.PvtModel,Dv=t.PvtPreTrainedModel,Iv=t.PyAnnoteFeatureExtractor,Ov=t.PyAnnoteForAudioFrameClassification,Bv=t.PyAnnoteModel,jv=t.PyAnnotePreTrainedModel,Nv=t.PyAnnoteProcessor,Rv=t.QuestionAnsweringModelOutput,Vv=t.QuestionAnsweringPipeline,zv=t.Qwen2ForCausalLM,Gv=t.Qwen2Model,Wv=t.Qwen2PreTrainedModel,Uv
=t.Qwen2Tokenizer,$v=t.Qwen2VLForConditionalGeneration,Kv=t.Qwen2VLImageProcessor,Qv=t.Qwen2VLPreTrainedModel,Xv=t.Qwen2VLProcessor,Hv=t.Qwen3ForCausalLM,Jv=t.Qwen3Model,Yv=t.Qwen3PreTrainedModel,qv=t.RFDetrForObjectDetection,Zv=t.RFDetrModel,eE=t.RFDetrObjectDetectionOutput,tE=t.RFDetrPreTrainedModel,sE=t.RTDetrForObjectDetection,rE=t.RTDetrImageProcessor,oE=t.RTDetrModel,aE=t.RTDetrObjectDetectionOutput,nE=t.RTDetrPreTrainedModel,iE=t.RTDetrV2ForObjectDetection,lE=t.RTDetrV2Model,cE=t.RTDetrV2ObjectDetectionOutput,_E=t.RTDetrV2PreTrainedModel,dE=t.RawAudio,uE=t.RawImage,pE=t.RawVideo,mE=t.RawVideoFrame,hE=t.RepetitionPenaltyLogitsProcessor,ME=t.ResNetForImageClassification,fE=t.ResNetModel,gE=t.ResNetPreTrainedModel,PE=t.RoFormerForMaskedLM,TE=t.RoFormerForQuestionAnswering,wE=t.RoFormerForSequenceClassification,bE=t.RoFormerForTokenClassification,xE=t.RoFormerModel,vE=t.RoFormerPreTrainedModel,EE=t.RoFormerTokenizer,FE=t.RobertaForMaskedLM,CE=t.RobertaForQuestionAnswering,kE=t.RobertaForSequenceClassification,yE=t.RobertaForTokenClassification,SE=t.RobertaModel,AE=t.RobertaPreTrainedModel,LE=t.RobertaTokenizer,DE=t.Sam2ImageProcessor,IE=t.Sam2ImageSegmentationOutput,OE=t.Sam2Model,BE=t.Sam2PreTrainedModel,jE=t.Sam2Processor,NE=t.Sam2VideoProcessor,RE=t.Sam3ImageProcessor,VE=t.Sam3TrackerModel,zE=t.SamImageProcessor,GE=t.SamImageSegmentationOutput,WE=t.SamModel,UE=t.SamPreTrainedModel,$E=t.SamProcessor,KE=t.SapiensForDepthEstimation,QE=t.SapiensForNormalEstimation,XE=t.SapiensForSemanticSegmentation,HE=t.SapiensPreTrainedModel,JE=t.SeamlessM4TFeatureExtractor,YE=t.SegformerFeatureExtractor,qE=t.SegformerForImageClassification,ZE=t.SegformerForSemanticSegmentation,eF=t.SegformerImageProcessor,tF=t.SegformerModel,sF=t.SegformerPreTrainedModel,rF=t.Seq2SeqLMOutput,oF=t.SequenceClassifierOutput,aF=t.SiglipImageProcessor,nF=t.SiglipModel,iF=t.SiglipPreTrainedModel,lF=t.SiglipTextModel,cF=t.SiglipTokenizer,_F=t.SiglipVisionModel,dF=t.SmolLM3ForCausalLM,uF=t.SmolLM3Model
,pF=t.SmolLM3PreTrainedModel,mF=t.SmolVLMForConditionalGeneration,hF=t.SmolVLMImageProcessor,MF=t.SmolVLMProcessor,fF=t.SnacDecoderModel,gF=t.SnacEncoderModel,PF=t.SnacFeatureExtractor,TF=t.SnacModel,wF=t.SnacPreTrainedModel,bF=t.SpeechT5FeatureExtractor,xF=t.SpeechT5ForSpeechToText,vF=t.SpeechT5ForTextToSpeech,EF=t.SpeechT5HifiGan,FF=t.SpeechT5Model,CF=t.SpeechT5PreTrainedModel,kF=t.SpeechT5Processor,yF=t.SpeechT5Tokenizer,SF=t.SqueezeBertForMaskedLM,AF=t.SqueezeBertForQuestionAnswering,LF=t.SqueezeBertForSequenceClassification,DF=t.SqueezeBertModel,IF=t.SqueezeBertPreTrainedModel,OF=t.SqueezeBertTokenizer,BF=t.StableLmForCausalLM,jF=t.StableLmModel,NF=t.StableLmPreTrainedModel,RF=t.Starcoder2ForCausalLM,VF=t.Starcoder2Model,zF=t.Starcoder2PreTrainedModel,GF=t.StoppingCriteria,WF=t.StoppingCriteriaList,UF=t.StyleTextToSpeech2Model,$F=t.StyleTextToSpeech2PreTrainedModel,KF=t.SummarizationPipeline,QF=t.SupertonicForConditionalGeneration,XF=t.SupertonicPreTrainedModel,HF=t.SuppressTokensAtBeginLogitsProcessor,JF=t.Swin2SRForImageSuperResolution,YF=t.Swin2SRImageProcessor,qF=t.Swin2SRModel,ZF=t.Swin2SRPreTrainedModel,eC=t.SwinForImageClassification,tC=t.SwinForSemanticSegmentation,sC=t.SwinModel,rC=t.SwinPreTrainedModel,oC=t.T5ForConditionalGeneration,aC=t.T5Model,nC=t.T5PreTrainedModel,iC=t.T5Tokenizer,lC=t.TableTransformerForObjectDetection,cC=t.TableTransformerModel,_C=t.TableTransformerObjectDetectionOutput,dC=t.TableTransformerPreTrainedModel,uC=t.TemperatureLogitsWarper,pC=t.Tensor,mC=t.Text2TextGenerationPipeline,hC=t.TextClassificationPipeline,MC=t.TextGenerationPipeline,fC=t.TextStreamer,gC=t.TextToAudioPipeline,PC=t.TokenClassificationPipeline,TC=t.TokenClassifierOutput,wC=t.TokenizerModel,bC=t.TopKLogitsWarper,xC=t.TopPLogitsWarper,vC=t.TrOCRForCausalLM,EC=t.TrOCRPreTrainedModel,FC=t.TranslationPipeline,CC=t.UltravoxModel,kC=t.UltravoxPreTrainedModel,yC=t.UltravoxProcessor,SC=t.UniSpeechForCTC,AC=t.UniSpeechForSequenceClassification,LC=t.UniSpeechModel,DC=t.
UniSpeechPreTrainedModel,IC=t.UniSpeechSatForAudioFrameClassification,OC=t.UniSpeechSatForCTC,BC=t.UniSpeechSatForSequenceClassification,jC=t.UniSpeechSatModel,NC=t.UniSpeechSatPreTrainedModel,RC=t.VLChatProcessor,VC=t.VLMImageProcessor,zC=t.VaultGemmaForCausalLM,GC=t.VaultGemmaModel,WC=t.VaultGemmaPreTrainedModel,UC=t.ViTFeatureExtractor,$C=t.ViTForImageClassification,KC=t.ViTImageProcessor,QC=t.ViTMAEModel,XC=t.ViTMAEPreTrainedModel,HC=t.ViTMSNForImageClassification,JC=t.ViTMSNModel,YC=t.ViTMSNPreTrainedModel,qC=t.ViTModel,ZC=t.ViTPreTrainedModel,ek=t.VisionEncoderDecoderModel,tk=t.VitMatteForImageMatting,sk=t.VitMatteImageProcessor,rk=t.VitMattePreTrainedModel,ok=t.VitPoseForPoseEstimation,ak=t.VitPoseImageProcessor,nk=t.VitPosePreTrainedModel,ik=t.VitsModel,lk=t.VitsModelOutput,ck=t.VitsPreTrainedModel,_k=t.VitsTokenizer,dk=t.VoxtralForConditionalGeneration,uk=t.VoxtralProcessor,pk=t.Wav2Vec2BertForCTC,mk=t.Wav2Vec2BertForSequenceClassification,hk=t.Wav2Vec2BertModel,Mk=t.Wav2Vec2BertPreTrainedModel,fk=t.Wav2Vec2CTCTokenizer,gk=t.Wav2Vec2FeatureExtractor,Pk=t.Wav2Vec2ForAudioFrameClassification,Tk=t.Wav2Vec2ForCTC,wk=t.Wav2Vec2ForSequenceClassification,bk=t.Wav2Vec2Model,xk=t.Wav2Vec2PreTrainedModel,vk=t.Wav2Vec2Processor,Ek=t.Wav2Vec2ProcessorWithLM,Fk=t.WavLMForAudioFrameClassification,Ck=t.WavLMForCTC,kk=t.WavLMForSequenceClassification,yk=t.WavLMForXVector,Sk=t.WavLMModel,Ak=t.WavLMPreTrainedModel,Lk=t.WeSpeakerFeatureExtractor,Dk=t.WeSpeakerResNetModel,Ik=t.WeSpeakerResNetPreTrainedModel,Ok=t.WhisperFeatureExtractor,Bk=t.WhisperForConditionalGeneration,jk=t.WhisperModel,Nk=t.WhisperPreTrainedModel,Rk=t.WhisperProcessor,Vk=t.WhisperTextStreamer,zk=t.WhisperTimeStampLogitsProcessor,Gk=t.WhisperTokenizer,Wk=t.XLMForQuestionAnswering,Uk=t.XLMForSequenceClassification,$k=t.XLMForTokenClassification,Kk=t.XLMModel,Qk=t.XLMPreTrainedModel,Xk=t.XLMRobertaForMaskedLM,Hk=t.XLMRobertaForQuestionAnswering,Jk=t.XLMRobertaForSequenceClassification,Yk=t.XLMRobertaForTokenC
lassification,qk=t.XLMRobertaModel,Zk=t.XLMRobertaPreTrainedModel,ey=t.XLMRobertaTokenizer,ty=t.XLMTokenizer,sy=t.XLMWithLMHeadModel,ry=t.XVectorOutput,oy=t.YolosFeatureExtractor,ay=t.YolosForObjectDetection,ny=t.YolosImageProcessor,iy=t.YolosModel,ly=t.YolosObjectDetectionOutput,cy=t.YolosPreTrainedModel,_y=t.ZeroShotAudioClassificationPipeline,dy=t.ZeroShotClassificationPipeline,uy=t.ZeroShotImageClassificationPipeline,py=t.ZeroShotObjectDetectionPipeline,my=t.bankers_round,hy=t.cat,My=t.cos_sim,fy=t.dot,gy=t.dynamic_time_warping,Py=t.env,Ty=t.full,wy=t.full_like,by=t.getCacheShapes,xy=t.hamming,vy=t.hanning,Ey=t.interpolate,Fy=t.interpolate_4d,Cy=t.interpolate_data,ky=t.is_chinese_char,yy=t.layer_norm,Sy=t.load_image,Ay=t.load_video,Ly=t.log_softmax,Dy=t.magnitude,Iy=t.matmul,Oy=t.max,By=t.mean,jy=t.mean_pooling,Ny=t.medianFilter,Ry=t.mel_filter_bank,Vy=t.min,zy=t.ones,Gy=t.ones_like,Wy=t.permute,Uy=t.permute_data,$y=t.pipeline,Ky=t.quantize_embeddings,Qy=t.rand,Xy=t.randn,Hy=t.read_audio,Jy=t.rfft,Yy=t.round,qy=t.slice,Zy=t.softmax,eS=t.spectrogram,tS=t.stack,sS=t.std_mean,rS=t.topk,oS=t.window_function,aS=t.zeros,nS=t.zeros_like});var pr=require("node:worker_threads"),{modelId:lS,dimensions:Qa,vendorModel:Xa}=pr.workerData,Ur=null,Ya=null,Wr=null,qa=!1,Ha=null;async function cS(){if(!Ur){if(qa)throw new Error(Ha??"pipeline init previously failed");if(Wr||(Wr=(async()=>{let D=await Promise.resolve().then(()=>(qu(),Yu)),{pipeline:a,env:e,layer_norm:i}=D;e.allowRemoteModels=!Xa,e.allowLocalModels=!0,Xa&&(e.localModelPath=Xa.localModelPath,e.allowRemoteModels=!1),Ur=await a("feature-extraction",lS,{dtype:"q8",device:"cpu"}),Ya=i})().catch(D=>{throw qa=!0,Ha=D instanceof Error?D.message:String(D),Wr=null,Za({type:"init-error",error:Ha}),D})),await Wr,!Ur)throw new Error("pipeline init completed but pipe is null")}}var ir=[],Ja=!1;function _S(D){if(D.priority==="high"){let a=0;for(;a<ir.length&&ir[a].priority==="high";)a++;ir.splice(a,0,D)}else ir.push(D);dS()}async 
function dS(){if(!Ja){for(Ja=!0;ir.length>0;){let D=ir.shift();await pS(D)}Ja=!1}}function uS(D){return!!(/^\d{6,}$/.test(D)||/out.of.memory|alloc.*fail|oom/i.test(D))}async function pS(D){try{await cS();let a=await Ur(D.texts,{pooling:"mean",truncation:!0}),e=a.dims[a.dims.length-1],i=Qa<e,d;i?d=Ya(a,[e]).slice(null,[0,Qa]).normalize(2,-1):d=Ya(a,[e]).normalize(2,-1);let g=D.texts.length,I=[],f=i?Qa:e;for(let u=0;u<g;u++){let m=u*f,T=new Float32Array(f);T.set(d.data.subarray(m,m+f)),I.push(T)}Za({type:"result",id:D.id,vectors:I})}catch(a){if(!qa){let e=a instanceof Error?a.message:String(a),i=uS(e)?`ONNX runtime out of memory (batch=${D.texts.length}, longest\u2248${Math.max(...D.texts.map(d=>d.length))} chars). Try reducing batch size. Raw: ${e}`:e;Za({type:"error",id:D.id,error:i})}}}function Za(D){pr.parentPort.postMessage(D)}pr.parentPort.on("message",D=>{switch(D.type){case"embed":_S(D);break;case"shutdown":process.exit(0);break}});
|