@omnimedia/omnitool 1.1.0-95 → 1.1.0-96
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/package.json +1 -1
- package/s/features/bg-remover/bg-remover.ts +26 -0
- package/s/features/bg-remover/default-spec.ts +11 -0
- package/s/features/bg-remover/types.ts +27 -0
- package/s/features/bg-remover/worker.bundle.ts +51 -0
- package/s/features/{speech/transcribe/parts → parts}/load-pipe.ts +3 -5
- package/s/features/parts/types.ts +19 -0
- package/s/features/speech/transcribe/default-spec.ts +2 -2
- package/s/features/speech/transcribe/types.ts +6 -16
- package/s/features/speech/transcribe/worker.bundle.ts +4 -3
- package/s/index.html.ts +2 -2
- package/s/timeline/parts/item.ts +15 -3
- package/s/timeline/parts/media.ts +11 -0
- package/s/timeline/renderers/parts/handy.ts +16 -0
- package/s/timeline/renderers/parts/samplers/visual/parts/defaults.ts +7 -1
- package/s/timeline/renderers/parts/samplers/visual/parts/image-sink.ts +51 -0
- package/s/timeline/renderers/parts/samplers/visual/parts/sample.ts +7 -0
- package/s/timeline/renderers/parts/samplers/visual/parts/types.ts +2 -1
- package/s/timeline/renderers/parts/samplers/visual/sampler.ts +8 -5
- package/s/timeline/sugar/helpers.ts +9 -0
- package/s/timeline/sugar/o.ts +19 -0
- package/x/demo/demo.bundle.min.js +100 -100
- package/x/demo/demo.bundle.min.js.map +4 -4
- package/x/features/bg-remover/bg-remover.d.ts +5 -0
- package/x/features/bg-remover/bg-remover.js +18 -0
- package/x/features/bg-remover/bg-remover.js.map +1 -0
- package/x/features/bg-remover/default-spec.d.ts +2 -0
- package/x/features/bg-remover/default-spec.js +6 -0
- package/x/features/bg-remover/default-spec.js.map +1 -0
- package/x/features/bg-remover/types.d.ts +20 -0
- package/x/features/bg-remover/types.js +2 -0
- package/x/features/bg-remover/types.js.map +1 -0
- package/x/features/bg-remover/worker.bundle.d.ts +1 -0
- package/x/features/bg-remover/worker.bundle.js +38 -0
- package/x/features/bg-remover/worker.bundle.js.map +1 -0
- package/x/features/bg-remover/worker.bundle.min.js +2916 -0
- package/x/features/bg-remover/worker.bundle.min.js.map +7 -0
- package/x/features/parts/load-pipe.d.ts +2 -0
- package/x/features/{speech/transcribe/parts → parts}/load-pipe.js +1 -1
- package/x/features/parts/load-pipe.js.map +1 -0
- package/x/features/parts/types.d.ts +15 -0
- package/x/features/parts/types.js +2 -0
- package/x/features/parts/types.js.map +1 -0
- package/x/features/speech/transcribe/default-spec.js +2 -2
- package/x/features/speech/transcribe/default-spec.js.map +1 -1
- package/x/features/speech/transcribe/types.d.ts +5 -14
- package/x/features/speech/transcribe/worker.bundle.js +3 -2
- package/x/features/speech/transcribe/worker.bundle.js.map +1 -1
- package/x/features/speech/transcribe/worker.bundle.min.js +1 -1
- package/x/features/speech/transcribe/worker.bundle.min.js.map +3 -3
- package/x/index.html +4 -4
- package/x/index.html.js +2 -2
- package/x/tests.bundle.min.js +103 -103
- package/x/tests.bundle.min.js.map +4 -4
- package/x/tests.html +1 -1
- package/x/timeline/parts/item.d.ts +14 -4
- package/x/timeline/parts/item.js +1 -0
- package/x/timeline/parts/item.js.map +1 -1
- package/x/timeline/parts/media.d.ts +1 -0
- package/x/timeline/parts/media.js +8 -0
- package/x/timeline/parts/media.js.map +1 -1
- package/x/timeline/renderers/parts/handy.d.ts +1 -0
- package/x/timeline/renderers/parts/handy.js +11 -0
- package/x/timeline/renderers/parts/handy.js.map +1 -1
- package/x/timeline/renderers/parts/samplers/visual/parts/defaults.d.ts +4 -1
- package/x/timeline/renderers/parts/samplers/visual/parts/defaults.js +3 -0
- package/x/timeline/renderers/parts/samplers/visual/parts/defaults.js.map +1 -1
- package/x/timeline/renderers/parts/samplers/visual/parts/image-sink.d.ts +11 -0
- package/x/timeline/renderers/parts/samplers/visual/parts/image-sink.js +36 -0
- package/x/timeline/renderers/parts/samplers/visual/parts/image-sink.js.map +1 -0
- package/x/timeline/renderers/parts/samplers/visual/parts/sample.js +6 -0
- package/x/timeline/renderers/parts/samplers/visual/parts/sample.js.map +1 -1
- package/x/timeline/renderers/parts/samplers/visual/parts/types.d.ts +2 -1
- package/x/timeline/renderers/parts/samplers/visual/parts/{sink.js → video-sink.js} +1 -1
- package/x/timeline/renderers/parts/samplers/visual/parts/video-sink.js.map +1 -0
- package/x/timeline/renderers/parts/samplers/visual/sampler.js +8 -5
- package/x/timeline/renderers/parts/samplers/visual/sampler.js.map +1 -1
- package/x/timeline/sugar/helpers.d.ts +3 -0
- package/x/timeline/sugar/helpers.js +3 -0
- package/x/timeline/sugar/helpers.js.map +1 -1
- package/x/timeline/sugar/o.d.ts +3 -0
- package/x/timeline/sugar/o.js +12 -0
- package/x/timeline/sugar/o.js.map +1 -1
- package/x/features/speech/transcribe/parts/load-pipe.d.ts +0 -2
- package/x/features/speech/transcribe/parts/load-pipe.js.map +0 -1
- package/x/timeline/renderers/parts/samplers/visual/parts/sink.js.map +0 -1
- /package/s/timeline/renderers/parts/samplers/visual/parts/{sink.ts → video-sink.ts} +0 -0
- /package/x/timeline/renderers/parts/samplers/visual/parts/{sink.d.ts → video-sink.d.ts} +0 -0
|
@@ -2848,7 +2848,7 @@ ${C}${f}${P}
|
|
|
2848
2848
|
${x}${v}`+F.repeat(d)+`${x}`,b}function c(d,g,h,x){return`${g}${x}`+h.repeat(d)+`${g}`}function _(d,g,h,x,F,v){return d===0&&g===0?c(h,x,F,v):l(h,d,g,x,F,v)}class u extends s.Processor{static image_processor_class=o.AutoImageProcessor;static tokenizer_class=a.AutoTokenizer;static uses_processor_config=!0;fake_image_token="<fake_token_around_image>";image_token="<image>";global_img_token="<global-img>";async _call(g,h=null,x={}){x.return_row_col_info??=!0;let F;h&&(F=await this.image_processor(h,x)),Array.isArray(g)||(g=[g]);let v=F.rows??[new Array(g.length).fill(0)],b=F.cols??[new Array(g.length).fill(0)],C=this.config.image_seq_len,y=[],P=[];for(let f=0;f<g.length;++f){let E=g[f],D=v[f],O=b[f];y.push((0,i.count)(E,this.image_token));let U=D.map((X,J)=>_(X,O[J],C,this.fake_image_token,this.image_token,this.global_img_token)),W=E.split(this.image_token);if(W.length===0)throw new Error("The image token should be present in the text.");let z=W[0];for(let X=0;X<U.length;++X)z+=U[X]+W[X+1];P.push(z)}return{...this.tokenizer(P),...F}}}}),"./src/models/image_processors.js":((e,r,t)=>{t.r(r),t.d(r,{BeitFeatureExtractor:()=>s.BeitFeatureExtractor,BitImageProcessor:()=>o.BitImageProcessor,CLIPFeatureExtractor:()=>n.CLIPFeatureExtractor,CLIPImageProcessor:()=>n.CLIPImageProcessor,ChineseCLIPFeatureExtractor:()=>a.ChineseCLIPFeatureExtractor,ConvNextFeatureExtractor:()=>i.ConvNextFeatureExtractor,ConvNextImageProcessor:()=>i.ConvNextImageProcessor,DINOv3ViTImageProcessor:()=>_.DINOv3ViTImageProcessor,DPTFeatureExtractor:()=>d.DPTFeatureExtractor,DPTImageProcessor:()=>d.DPTImageProcessor,DeiTFeatureExtractor:()=>l.DeiTFeatureExtractor,DeiTImageProcessor:()=>l.DeiTImageProcessor,DetrFeatureExtractor:()=>c.DetrFeatureExtractor,DetrImageProcessor:()=>c.DetrImageProcessor,DonutFeatureExtractor:()=>u.DonutFeatureExtractor,DonutImageProcessor:()=>u.DonutImageProcessor,EfficientNetImageProcessor:()=>g.EfficientNetImageProcessor,GLPNFeatureExtractor:()=>h.GLPNFeatureExtractor,Grounding
DinoImageProcessor:()=>x.GroundingDinoImageProcessor,Idefics3ImageProcessor:()=>F.Idefics3ImageProcessor,JinaCLIPImageProcessor:()=>b.JinaCLIPImageProcessor,LlavaOnevisionImageProcessor:()=>C.LlavaOnevisionImageProcessor,Mask2FormerImageProcessor:()=>y.Mask2FormerImageProcessor,MaskFormerFeatureExtractor:()=>P.MaskFormerFeatureExtractor,MaskFormerImageProcessor:()=>P.MaskFormerImageProcessor,MobileNetV1FeatureExtractor:()=>I.MobileNetV1FeatureExtractor,MobileNetV1ImageProcessor:()=>I.MobileNetV1ImageProcessor,MobileNetV2FeatureExtractor:()=>f.MobileNetV2FeatureExtractor,MobileNetV2ImageProcessor:()=>f.MobileNetV2ImageProcessor,MobileNetV3FeatureExtractor:()=>E.MobileNetV3FeatureExtractor,MobileNetV3ImageProcessor:()=>E.MobileNetV3ImageProcessor,MobileNetV4FeatureExtractor:()=>D.MobileNetV4FeatureExtractor,MobileNetV4ImageProcessor:()=>D.MobileNetV4ImageProcessor,MobileViTFeatureExtractor:()=>O.MobileViTFeatureExtractor,MobileViTImageProcessor:()=>O.MobileViTImageProcessor,NougatImageProcessor:()=>U.NougatImageProcessor,OwlViTFeatureExtractor:()=>z.OwlViTFeatureExtractor,OwlViTImageProcessor:()=>z.OwlViTImageProcessor,Owlv2ImageProcessor:()=>W.Owlv2ImageProcessor,Phi3VImageProcessor:()=>X.Phi3VImageProcessor,PixtralImageProcessor:()=>J.PixtralImageProcessor,PvtImageProcessor:()=>q.PvtImageProcessor,Qwen2VLImageProcessor:()=>re.Qwen2VLImageProcessor,RTDetrImageProcessor:()=>oe.RTDetrImageProcessor,Sam2ImageProcessor:()=>ye.Sam2ImageProcessor,Sam3ImageProcessor:()=>Y.Sam3ImageProcessor,SamImageProcessor:()=>ne.SamImageProcessor,SegformerFeatureExtractor:()=>H.SegformerFeatureExtractor,SegformerImageProcessor:()=>H.SegformerImageProcessor,SiglipImageProcessor:()=>R.SiglipImageProcessor,SmolVLMImageProcessor:()=>L.SmolVLMImageProcessor,Swin2SRImageProcessor:()=>ee.Swin2SRImageProcessor,VLMImageProcessor:()=>v.VLMImageProcessor,ViTFeatureExtractor:()=>ue.ViTFeatureExtractor,ViTImageProcessor:()=>ue.ViTImageProcessor,VitMatteImageProcessor:()=>ke.VitMatteImageProcessor,Vit
PoseImageProcessor:()=>Ie.VitPoseImageProcessor,YolosFeatureExtractor:()=>Le.YolosFeatureExtractor,YolosImageProcessor:()=>Le.YolosImageProcessor});var s=t("./src/models/beit/image_processing_beit.js"),o=t("./src/models/bit/image_processing_bit.js"),a=t("./src/models/chinese_clip/image_processing_chinese_clip.js"),n=t("./src/models/clip/image_processing_clip.js"),i=t("./src/models/convnext/image_processing_convnext.js"),l=t("./src/models/deit/image_processing_deit.js"),c=t("./src/models/detr/image_processing_detr.js"),_=t("./src/models/dinov3_vit/image_processing_dinov3_vit.js"),u=t("./src/models/donut/image_processing_donut.js"),d=t("./src/models/dpt/image_processing_dpt.js"),g=t("./src/models/efficientnet/image_processing_efficientnet.js"),h=t("./src/models/glpn/image_processing_glpn.js"),x=t("./src/models/grounding_dino/image_processing_grounding_dino.js"),F=t("./src/models/idefics3/image_processing_idefics3.js"),v=t("./src/models/janus/image_processing_janus.js"),b=t("./src/models/jina_clip/image_processing_jina_clip.js"),C=t("./src/models/llava_onevision/image_processing_llava_onevision.js"),y=t("./src/models/mask2former/image_processing_mask2former.js"),P=t("./src/models/maskformer/image_processing_maskformer.js"),I=t("./src/models/mobilenet_v1/image_processing_mobilenet_v1.js"),f=t("./src/models/mobilenet_v2/image_processing_mobilenet_v2.js"),E=t("./src/models/mobilenet_v3/image_processing_mobilenet_v3.js"),D=t("./src/models/mobilenet_v4/image_processing_mobilenet_v4.js"),O=t("./src/models/mobilevit/image_processing_mobilevit.js"),U=t("./src/models/nougat/image_processing_nougat.js"),W=t("./src/models/owlv2/image_processing_owlv2.js"),z=t("./src/models/owlvit/image_processing_owlvit.js"),X=t("./src/models/phi3_v/image_processing_phi3_v.js"),J=t("./src/models/pixtral/image_processing_pixtral.js"),q=t("./src/models/pvt/image_processing_pvt.js"),re=t("./src/models/qwen2_vl/image_processing_qwen2_vl.js"),oe=t("./src/models/rt_detr/image_processing_rt_detr.js"),ne
=t("./src/models/sam/image_processing_sam.js"),ye=t("./src/models/sam2/image_processing_sam2.js"),Y=t("./src/models/sam3/image_processing_sam3.js"),H=t("./src/models/segformer/image_processing_segformer.js"),R=t("./src/models/siglip/image_processing_siglip.js"),L=t("./src/models/smolvlm/image_processing_smolvlm.js"),ee=t("./src/models/swin2sr/image_processing_swin2sr.js"),ue=t("./src/models/vit/image_processing_vit.js"),ke=t("./src/models/vitmatte/image_processing_vitmatte.js"),Ie=t("./src/models/vitpose/image_processing_vitpose.js"),Le=t("./src/models/yolos/image_processing_yolos.js")}),"./src/models/janus/image_processing_janus.js":((e,r,t)=>{t.r(r),t.d(r,{VLMImageProcessor:()=>o});var s=t("./src/base/image_processors_utils.js");class o extends s.ImageProcessor{constructor(n){super({do_pad:!0,pad_size:{width:n.image_size,height:n.image_size},...n}),this.constant_values=this.config.background_color.map(i=>i*this.rescale_factor)}pad_image(n,i,l,c){return super.pad_image(n,i,l,{constant_values:this.constant_values,center:!0,...c})}}}),"./src/models/janus/processing_janus.js":((e,r,t)=>{t.r(r),t.d(r,{VLChatProcessor:()=>c});var s=t("./src/base/processing_utils.js"),o=t("./src/models/auto/image_processing_auto.js"),a=t("./src/tokenizers.js"),n=t("./src/utils/core.js"),i=t("./src/utils/tensor.js"),l=t("./src/utils/image.js");class c extends s.Processor{static image_processor_class=o.AutoImageProcessor;static tokenizer_class=a.AutoTokenizer;static uses_processor_config=!0;constructor(u,d,g){super(u,d,g),this.image_tag=this.config.image_tag,this.image_start_tag=this.config.image_start_tag,this.image_end_tag=this.config.image_end_tag,this.num_image_tokens=this.config.num_image_tokens}async _call(u,{images:d=null,chat_template:g="default"}={}){d?Array.isArray(d)||(d=[d]):d=await Promise.all(u.filter(O=>O.images).flatMap(O=>O.images).map(O=>l.RawImage.read(O)));let 
h=this.tokenizer,x=h.apply_chat_template(u,{tokenize:!1,add_generation_prompt:!0,chat_template:g}),F=O=>h.encode(O,{add_special_tokens:!1}),v=x.split(this.image_tag),b=v.length-1;if(d.length!==b)throw new Error(`Number of images provided (${d.length}) does not match number of "${this.image_tag}" image tags (${b})`);let[C,y,P]=h.model.convert_tokens_to_ids([this.image_tag,this.image_start_tag,this.image_end_tag]),I=F(v[0]),f=new Array(I.length).fill(!1);for(let O=1;O<v.length;++O){let U=new Array(this.num_image_tokens).fill(C),W=F(v[O]);I=(0,n.mergeArrays)(I,[y],U,[P],W);let z=new Array(this.num_image_tokens).fill(!0);f=(0,n.mergeArrays)(f,[!1],z,[!1],new Array(W.length).fill(!1))}let E=[1,I.length],D={input_ids:new i.Tensor("int64",I,E),attention_mask:new i.Tensor("int64",new Array(I.length).fill(1),E),images_seq_mask:new i.Tensor("bool",f,E),images_emb_mask:new i.Tensor("bool",new Array(b*this.num_image_tokens).fill(!0),[1,b,this.num_image_tokens])};if(d&&d.length>0){let O=await this.image_processor(d);return O.pixel_values.unsqueeze_(0),{...D,...O}}return D}}}),"./src/models/jina_clip/image_processing_jina_clip.js":((e,r,t)=>{t.r(r),t.d(r,{JinaCLIPImageProcessor:()=>o});var s=t("./src/base/image_processors_utils.js");class o extends s.ImageProcessor{constructor(n){let{resize_mode:i,fill_color:l,interpolation:c,size:_,...u}=n,d=i==="squash"?{width:_,height:_}:i==="shortest"?{shortest_edge:_}:{longest_edge:_},g=c==="bicubic"?3:2;super({...u,size:d,resample:g,do_center_crop:!0,crop_size:_,do_normalize:!0})}}}),"./src/models/jina_clip/processing_jina_clip.js":((e,r,t)=>{t.r(r),t.d(r,{JinaCLIPProcessor:()=>n});var s=t("./src/base/processing_utils.js"),o=t("./src/models/auto/image_processing_auto.js"),a=t("./src/tokenizers.js");class n extends s.Processor{static tokenizer_class=a.AutoTokenizer;static image_processor_class=o.AutoImageProcessor;async _call(l=null,c=null,_={}){if(!l&&!c)throw new Error("Either text or images must be provided");let 
u=l?this.tokenizer(l,_):{},d=c?await this.image_processor(c,_):{};return{...u,...d}}}}),"./src/models/llava/processing_llava.js":((e,r,t)=>{t.r(r),t.d(r,{LlavaProcessor:()=>n});var s=t("./src/base/processing_utils.js"),o=t("./src/models/auto/image_processing_auto.js"),a=t("./src/tokenizers.js");class n extends s.Processor{static tokenizer_class=a.AutoTokenizer;static image_processor_class=o.AutoImageProcessor;static uses_processor_config=!0;async _call(l,c=null,_={}){let u=await this.image_processor(l,_);if(c){let[g,h]=u.pixel_values.dims.slice(-2),{image_token:x,patch_size:F,num_additional_image_tokens:v}=this.config,b=Math.floor(g/F)*Math.floor(h/F)+v;c=structuredClone(c),Array.isArray(c)||(c=[c]);for(let C=0;C<c.length;++C)c[C]=c[C].replace(x,x.repeat(b))}let d=c?this.tokenizer(c,_):{};return{...u,...d}}}}),"./src/models/llava_onevision/image_processing_llava_onevision.js":((e,r,t)=>{t.r(r),t.d(r,{LlavaOnevisionImageProcessor:()=>o});var s=t("./src/base/image_processors_utils.js");class o extends s.ImageProcessor{}}),"./src/models/mask2former/image_processing_mask2former.js":((e,r,t)=>{t.r(r),t.d(r,{Mask2FormerImageProcessor:()=>o});var s=t("./src/models/maskformer/image_processing_maskformer.js");class o extends s.MaskFormerImageProcessor{}}),"./src/models/maskformer/image_processing_maskformer.js":((e,r,t)=>{t.r(r),t.d(r,{MaskFormerFeatureExtractor:()=>a,MaskFormerImageProcessor:()=>o});var s=t("./src/base/image_processors_utils.js");class o extends s.ImageProcessor{post_process_panoptic_segmentation(...i){return(0,s.post_process_panoptic_segmentation)(...i)}post_process_instance_segmentation(...i){return(0,s.post_process_instance_segmentation)(...i)}}class a extends o{}}),"./src/models/mgp_str/processing_mgp_str.js":((e,r,t)=>{t.r(r),t.d(r,{MgpstrProcessor:()=>l});var s=t("./src/base/processing_utils.js"),o=t("./src/models/auto/image_processing_auto.js"),a=t("./src/tokenizers.js"),n=t("./src/utils/maths.js");let 
i={char:["char_decode",1],bpe:["bpe_decode",2],wp:["wp_decode",102]};class l extends s.Processor{static tokenizer_class=a.AutoTokenizer;static image_processor_class=o.AutoImageProcessor;get char_tokenizer(){return this.components.char_tokenizer}get bpe_tokenizer(){return this.components.bpe_tokenizer}get wp_tokenizer(){return this.components.wp_tokenizer}_decode_helper(_,u){if(!i.hasOwnProperty(u))throw new Error(`Format ${u} is not supported.`);let[d,g]=i[u],h=this[d].bind(this),[x,F]=_.dims,v=[],b=[],C=_.tolist();for(let P=0;P<x;++P){let I=C[P],f=[],E=[];for(let O=1;O<F;++O){let[U,W]=(0,n.max)((0,n.softmax)(I[O]));if(E.push(U),W==g)break;f.push(W)}let D=E.length>0?E.reduce((O,U)=>O*U,1):0;b.push(f),v.push(D)}return[h(b),v]}char_decode(_){return this.char_tokenizer.batch_decode(_).map(u=>u.replaceAll(" ",""))}bpe_decode(_){return this.bpe_tokenizer.batch_decode(_)}wp_decode(_){return this.wp_tokenizer.batch_decode(_).map(u=>u.replaceAll(" ",""))}batch_decode([_,u,d]){let[g,h]=this._decode_helper(_,"char"),[x,F]=this._decode_helper(u,"bpe"),[v,b]=this._decode_helper(d,"wp"),C=[],y=[];for(let P=0;P<g.length;++P){let[I,f]=(0,n.max)([h[P],F[P],b[P]]);C.push([g[P],x[P],v[P]][f]),y.push(I)}return{generated_text:C,scores:y,char_preds:g,bpe_preds:x,wp_preds:v}}static async from_pretrained(..._){let u=await super.from_pretrained(..._),d=await a.AutoTokenizer.from_pretrained("Xenova/gpt2"),g=await a.AutoTokenizer.from_pretrained("Xenova/bert-base-uncased");return u.components={image_processor:u.image_processor,char_tokenizer:u.tokenizer,bpe_tokenizer:d,wp_tokenizer:g},u}async _call(_,u=null){let d=await this.image_processor(_);return u&&(d.labels=this.tokenizer(u).input_ids),d}}}),"./src/models/mobilenet_v1/image_processing_mobilenet_v1.js":((e,r,t)=>{t.r(r),t.d(r,{MobileNetV1FeatureExtractor:()=>a,MobileNetV1ImageProcessor:()=>o});var s=t("./src/base/image_processors_utils.js");class o extends s.ImageProcessor{}class a extends 
o{}}),"./src/models/mobilenet_v2/image_processing_mobilenet_v2.js":((e,r,t)=>{t.r(r),t.d(r,{MobileNetV2FeatureExtractor:()=>a,MobileNetV2ImageProcessor:()=>o});var s=t("./src/base/image_processors_utils.js");class o extends s.ImageProcessor{}class a extends o{}}),"./src/models/mobilenet_v3/image_processing_mobilenet_v3.js":((e,r,t)=>{t.r(r),t.d(r,{MobileNetV3FeatureExtractor:()=>a,MobileNetV3ImageProcessor:()=>o});var s=t("./src/base/image_processors_utils.js");class o extends s.ImageProcessor{}class a extends o{}}),"./src/models/mobilenet_v4/image_processing_mobilenet_v4.js":((e,r,t)=>{t.r(r),t.d(r,{MobileNetV4FeatureExtractor:()=>a,MobileNetV4ImageProcessor:()=>o});var s=t("./src/base/image_processors_utils.js");class o extends s.ImageProcessor{}class a extends o{}}),"./src/models/mobilevit/image_processing_mobilevit.js":((e,r,t)=>{t.r(r),t.d(r,{MobileViTFeatureExtractor:()=>a,MobileViTImageProcessor:()=>o});var s=t("./src/base/image_processors_utils.js");class o extends s.ImageProcessor{}class a extends o{}}),"./src/models/moonshine/feature_extraction_moonshine.js":((e,r,t)=>{t.r(r),t.d(r,{MoonshineFeatureExtractor:()=>a});var s=t("./src/base/feature_extraction_utils.js"),o=t("./src/utils/tensor.js");class a extends s.FeatureExtractor{async _call(i){(0,s.validate_audio_inputs)(i,"MoonshineFeatureExtractor"),i instanceof Float64Array&&(i=new Float32Array(i));let l=[1,i.length];return{input_values:new o.Tensor("float32",i,l)}}}}),"./src/models/moonshine/processing_moonshine.js":((e,r,t)=>{t.r(r),t.d(r,{MoonshineProcessor:()=>n});var s=t("./src/models/auto/feature_extraction_auto.js"),o=t("./src/tokenizers.js"),a=t("./src/base/processing_utils.js");class n extends a.Processor{static tokenizer_class=o.AutoTokenizer;static feature_extractor_class=s.AutoFeatureExtractor;async _call(l){return await this.feature_extractor(l)}}}),"./src/models/nougat/image_processing_nougat.js":((e,r,t)=>{t.r(r),t.d(r,{NougatImageProcessor:()=>o});var 
s=t("./src/models/donut/image_processing_donut.js");class o extends s.DonutImageProcessor{}}),"./src/models/owlv2/image_processing_owlv2.js":((e,r,t)=>{t.r(r),t.d(r,{Owlv2ImageProcessor:()=>o});var s=t("./src/models/owlvit/image_processing_owlvit.js");class o extends s.OwlViTImageProcessor{}}),"./src/models/owlvit/image_processing_owlvit.js":((e,r,t)=>{t.r(r),t.d(r,{OwlViTFeatureExtractor:()=>a,OwlViTImageProcessor:()=>o});var s=t("./src/base/image_processors_utils.js");class o extends s.ImageProcessor{post_process_object_detection(...i){return(0,s.post_process_object_detection)(...i)}}class a extends o{}}),"./src/models/owlvit/processing_owlvit.js":((e,r,t)=>{t.r(r),t.d(r,{OwlViTProcessor:()=>n});var s=t("./src/base/processing_utils.js"),o=t("./src/models/auto/image_processing_auto.js"),a=t("./src/tokenizers.js");class n extends s.Processor{static tokenizer_class=a.AutoTokenizer;static image_processor_class=o.AutoImageProcessor}}),"./src/models/paligemma/processing_paligemma.js":((e,r,t)=>{t.r(r),t.d(r,{PaliGemmaProcessor:()=>l});var s=t("./src/base/processing_utils.js"),o=t("./src/models/auto/image_processing_auto.js"),a=t("./src/tokenizers.js");let n="<image>";function i(c,_,u,d,g){return`${d.repeat(u*g)}${_}${c}
|
|
2849
2849
|
`}class l extends s.Processor{static tokenizer_class=a.AutoTokenizer;static image_processor_class=o.AutoImageProcessor;static uses_processor_config=!1;async _call(_,u=null,d={}){u||(console.warn("You are using PaliGemma without a text prefix. It will perform as a picture-captioning model."),u=""),Array.isArray(_)||(_=[_]),Array.isArray(u)||(u=[u]);let g=this.tokenizer.bos_token,h=this.image_processor.config.image_seq_length,x;u.some(b=>b.includes(n))?x=u.map(b=>{let C=b.replaceAll(n,n.repeat(h)),y=C.lastIndexOf(n),P=y===-1?0:y+n.length;return C.slice(0,P)+g+C.slice(P)+`
|
|
2850
2850
|
`}):(console.warn("You are passing both `text` and `images` to `PaliGemmaProcessor`. The processor expects special image tokens in the text, as many tokens as there are images per each text. It is recommended to add `<image>` tokens in the very beginning of your text. For this call, we will infer how many images each text has and add special tokens."),x=u.map(b=>i(b,g,h,n,_.length)));let F=this.tokenizer(x,d);return{...await this.image_processor(_,d),...F}}}}),"./src/models/parakeet/feature_extraction_parakeet.js":((e,r,t)=>{t.r(r),t.d(r,{ParakeetFeatureExtractor:()=>i});var s=t("./src/base/feature_extraction_utils.js"),o=t("./src/utils/tensor.js"),a=t("./src/utils/audio.js");let n=1e-5;class i extends s.FeatureExtractor{constructor(c){super(c),this.config.mel_filters??=(0,a.mel_filter_bank)(Math.floor(1+this.config.n_fft/2),this.config.feature_size,0,this.config.sampling_rate/2,this.config.sampling_rate,"slaney","slaney");let _=(0,a.window_function)(this.config.win_length,"hann",{periodic:!1});this.window=new Float64Array(this.config.n_fft);let u=Math.floor((this.config.n_fft-this.config.win_length)/2);this.window.set(_,u)}async _extract_fbank_features(c){let _=this.config.preemphasis;c=new Float64Array(c);for(let d=c.length-1;d>=1;--d)c[d]-=_*c[d-1];return await(0,a.spectrogram)(c,this.window,this.window.length,this.config.hop_length,{fft_length:this.config.n_fft,power:2,mel_filters:this.config.mel_filters,log_mel:"log",mel_floor:-1/0,pad_mode:"constant",center:!0,transpose:!0,mel_offset:2**-24})}async _call(c){(0,s.validate_audio_inputs)(c,"ParakeetFeatureExtractor");let _=await this._extract_fbank_features(c),u=Math.floor((c.length+Math.floor(this.config.n_fft/2)*2-this.config.n_fft)/this.config.hop_length),d=_.data;d.fill(0,u*_.dims[1]);let[g,h]=_.dims,x=new Float64Array(h),F=new Float64Array(h);for(let C=0;C<u;++C){let y=C*h;for(let P=0;P<h;++P){let I=d[y+P];x[P]+=I,F[P]+=I*I}}let v=u>1?u-1:1;for(let C=0;C<h;++C){let 
y=x[C]/u,P=(F[C]-u*y*y)/v,f=1/(Math.sqrt(P)+n);for(let E=0;E<u;++E){let D=E*h+C;d[D]=(d[D]-y)*f}}let b=new BigInt64Array(g);return b.fill(1n,0,u),{input_features:_.unsqueeze_(0),attention_mask:new o.Tensor("int64",b,[1,g])}}}}),"./src/models/phi3_v/image_processing_phi3_v.js":((e,r,t)=>{t.r(r),t.d(r,{Phi3VImageProcessor:()=>_});var s=t("./src/base/image_processors_utils.js"),o=t("./src/utils/tensor.js");let a=336,n=[2,3],{ceil:i,floor:l,sqrt:c}=Math;class _ extends s.ImageProcessor{constructor(d){super({...d,do_normalize:!0,do_pad:!0,pad_size:"custom",do_convert_rgb:!0,do_resize:!0}),this._num_crops=d.num_crops}calc_num_image_tokens_from_image_size(d,g){let{num_img_tokens:h}=this.config;return l((l(g/a)*l(d/a)+1)*h+1+(l(g/a)+1)*c(h))}get_resize_output_image_size(d,g){let h=this._num_crops,[x,F]=d.size,v=x/F,b=1;for(;b*Math.ceil(b/v)<=h;)b+=1;b-=1;let C=Math.floor(b*336),y=Math.floor(C/v);return[C,y]}pad_image(d,g,h,x={}){let[F,v]=g,b=a*i(F/a),C=a*i(v/a),y=[1,1,1].map((P,I)=>(P-this.image_mean[I])/this.image_std[I]);return super.pad_image(d,g,{width:C,height:b},{center:!0,constant_values:y,...x})}async _call(d,{num_crops:g=null}={}){if(this._num_crops=g??=this.config.num_crops,g<4||c(g)%1!==0)throw new Error("num_crops must be a square number >= 4");Array.isArray(d)||(d=[d]);let h=d.length,x=await Promise.all(d.map(f=>this.preprocess(f))),F=x.map(f=>f.original_size),v=x.map(f=>f.reshaped_input_size),b=[];for(let{pixel_values:f}of x){f.unsqueeze_(0);let[E,D]=f.dims.slice(-2),O=await(0,o.interpolate_4d)(f,{size:[a,a],mode:"bicubic"});if(g>0){let U=[],W=c(g),z=l(D/W),X=l(E/W);for(let q=0;q<W;++q)for(let re=0;re<W;++re){let oe,ne,ye,Y;q===W-1?(ne=E-X,Y=E):(ne=q*X,Y=(q+1)*X),re===W-1?(oe=D-z,ye=D):(oe=re*z,ye=(re+1)*z);let H=[ne,oe],R=[Y,ye],L=await(0,o.slice)(f,H,R,n);U.push(L)}let J=await(0,o.interpolate_4d)((0,o.cat)(U,0),{size:[a,a],mode:"bicubic"});b.push((0,o.cat)([O,J],0))}else b.push(O)}let C=(0,o.stack)(b,0),y=v.map(f=>f.map(E=>a*i(E/a))),P=new 
o.Tensor("int64",y.flat(),[h,2]),I=y.map(([f,E])=>this.calc_num_image_tokens_from_image_size(E,f));return{pixel_values:C,original_sizes:F,reshaped_input_sizes:v,image_sizes:P,num_img_tokens:I}}}}),"./src/models/phi3_v/processing_phi3_v.js":((e,r,t)=>{t.r(r),t.d(r,{Phi3VProcessor:()=>c});var s=t("./src/base/processing_utils.js"),o=t("./src/models/auto/image_processing_auto.js"),a=t("./src/tokenizers.js"),n=t("./src/utils/image.js");let i="<|image|>",l=/<\|image_\d+\|>/g;class c extends s.Processor{static image_processor_class=o.AutoImageProcessor;static tokenizer_class=a.AutoTokenizer;async _call(u,d=null,{padding:g=!0,truncation:h=!0,num_crops:x=null}={}){Array.isArray(u)||(u=[u]);let F,v;if(d){v=await this.image_processor(d,{num_crops:x});let{num_img_tokens:b}=v,C=u.map((P,I)=>P.split(l).join(i.repeat(b[I])));F=this.tokenizer(C,{padding:g,truncation:h});let y=this.tokenizer.model.convert_tokens_to_ids([i])[0];F.input_ids.map_(P=>P==y?-P:P)}else F=this.tokenizer(u);return{...F,...v}}}}),"./src/models/pixtral/image_processing_pixtral.js":((e,r,t)=>{t.r(r),t.d(r,{PixtralImageProcessor:()=>o});var s=t("./src/base/image_processors_utils.js");class o extends s.ImageProcessor{get_resize_output_image_size(n,i){let{longest_edge:l}=i;if(l===void 0)throw new Error("size must contain 'longest_edge'");let[c,_]=n.size,u=Math.max(c,_)/l,d=c,g=_;u>1&&(d=Math.floor(c/u),g=Math.floor(_/u));let{patch_size:h,spatial_merge_size:x}=this.config;if(!x)throw new Error("config must contain 'spatial_merge_size'");let F=h*x,v=Math.floor((d-1)/F)+1,b=Math.floor((g-1)/F)+1;return[v*F,b*F]}}}),"./src/models/pixtral/processing_pixtral.js":((e,r,t)=>{t.r(r),t.d(r,{PixtralProcessor:()=>n});var s=t("./src/base/processing_utils.js"),o=t("./src/models/auto/image_processing_auto.js"),a=t("./src/tokenizers.js");class n extends s.Processor{static tokenizer_class=a.AutoTokenizer;static image_processor_class=o.AutoImageProcessor;static uses_processor_config=!0;async _call(l,c=null,_={}){let u=await 
this.image_processor(l,_);if(c){let[g,h]=u.pixel_values.dims.slice(-2),{image_token:x,image_break_token:F,image_end_token:v,patch_size:b,spatial_merge_size:C}=this.config,y=b*C,P=Math.floor(g/y),I=Math.floor(h/y);c=structuredClone(c),Array.isArray(c)||(c=[c]);for(let f=0;f<c.length;++f){let E=x.repeat(I),D=E+F,O=E+v,U=D.repeat(P-1)+O;c[f]=c[f].replace(x,U)}}let d=c?this.tokenizer(c,_):{};return{...u,...d}}}}),"./src/models/processors.js":((e,r,t)=>{t.r(r),t.d(r,{Florence2Processor:()=>s.Florence2Processor,Gemma3nProcessor:()=>o.Gemma3nProcessor,GroundingDinoProcessor:()=>a.GroundingDinoProcessor,Idefics3Processor:()=>n.Idefics3Processor,JinaCLIPProcessor:()=>l.JinaCLIPProcessor,LlavaProcessor:()=>c.LlavaProcessor,MgpstrProcessor:()=>_.MgpstrProcessor,MoonshineProcessor:()=>u.MoonshineProcessor,OwlViTProcessor:()=>d.OwlViTProcessor,PaliGemmaProcessor:()=>g.PaliGemmaProcessor,Phi3VProcessor:()=>h.Phi3VProcessor,PixtralProcessor:()=>x.PixtralProcessor,PyAnnoteProcessor:()=>F.PyAnnoteProcessor,Qwen2VLProcessor:()=>v.Qwen2VLProcessor,Sam2Processor:()=>C.Sam2Processor,Sam2VideoProcessor:()=>C.Sam2VideoProcessor,SamProcessor:()=>b.SamProcessor,SmolVLMProcessor:()=>y.SmolVLMProcessor,SpeechT5Processor:()=>P.SpeechT5Processor,UltravoxProcessor:()=>I.UltravoxProcessor,VLChatProcessor:()=>i.VLChatProcessor,VoxtralProcessor:()=>f.VoxtralProcessor,Wav2Vec2Processor:()=>E.Wav2Vec2Processor,Wav2Vec2ProcessorWithLM:()=>D.Wav2Vec2ProcessorWithLM,WhisperProcessor:()=>O.WhisperProcessor});var 
s=t("./src/models/florence2/processing_florence2.js"),o=t("./src/models/gemma3n/processing_gemma3n.js"),a=t("./src/models/grounding_dino/processing_grounding_dino.js"),n=t("./src/models/idefics3/processing_idefics3.js"),i=t("./src/models/janus/processing_janus.js"),l=t("./src/models/jina_clip/processing_jina_clip.js"),c=t("./src/models/llava/processing_llava.js"),_=t("./src/models/mgp_str/processing_mgp_str.js"),u=t("./src/models/moonshine/processing_moonshine.js"),d=t("./src/models/owlvit/processing_owlvit.js"),g=t("./src/models/paligemma/processing_paligemma.js"),h=t("./src/models/phi3_v/processing_phi3_v.js"),x=t("./src/models/pixtral/processing_pixtral.js"),F=t("./src/models/pyannote/processing_pyannote.js"),v=t("./src/models/qwen2_vl/processing_qwen2_vl.js"),b=t("./src/models/sam/processing_sam.js"),C=t("./src/models/sam2/processing_sam2.js"),y=t("./src/models/smolvlm/processing_smolvlm.js"),P=t("./src/models/speecht5/processing_speecht5.js"),I=t("./src/models/ultravox/processing_ultravox.js"),f=t("./src/models/voxtral/processing_voxtral.js"),E=t("./src/models/wav2vec2/processing_wav2vec2.js"),D=t("./src/models/wav2vec2_with_lm/processing_wav2vec2_with_lm.js"),O=t("./src/models/whisper/processing_whisper.js")}),"./src/models/pvt/image_processing_pvt.js":((e,r,t)=>{t.r(r),t.d(r,{PvtImageProcessor:()=>o});var s=t("./src/base/image_processors_utils.js");class o extends s.ImageProcessor{}}),"./src/models/pyannote/feature_extraction_pyannote.js":((e,r,t)=>{t.r(r),t.d(r,{PyAnnoteFeatureExtractor:()=>n});var s=t("./src/base/feature_extraction_utils.js"),o=t("./src/utils/tensor.js"),a=t("./src/utils/maths.js");class n extends s.FeatureExtractor{async _call(l){(0,s.validate_audio_inputs)(l,"PyAnnoteFeatureExtractor"),l instanceof Float64Array&&(l=new Float32Array(l));let c=[1,1,l.length];return{input_values:new o.Tensor("float32",l,c)}}samples_to_frames(l){return(l-this.config.offset)/this.config.step}post_process_speaker_diarization(l,c){let 
_=c/this.samples_to_frames(c)/this.config.sampling_rate,u=[];for(let d of l.tolist()){let g=[],h=-1;for(let x=0;x<d.length;++x){let F=(0,a.softmax)(d[x]),[v,b]=(0,a.max)(F),[C,y]=[x,x+1];b!==h?(h=b,g.push({id:b,start:C,end:y,score:v})):(g.at(-1).end=y,g.at(-1).score+=v)}u.push(g.map(({id:x,start:F,end:v,score:b})=>({id:x,start:F*_,end:v*_,confidence:b/(v-F)})))}return u}}}),"./src/models/pyannote/processing_pyannote.js":((e,r,t)=>{t.r(r),t.d(r,{PyAnnoteProcessor:()=>a});var s=t("./src/base/processing_utils.js"),o=t("./src/models/pyannote/feature_extraction_pyannote.js");class a extends s.Processor{static feature_extractor_class=o.PyAnnoteFeatureExtractor;async _call(i){return await this.feature_extractor(i)}post_process_speaker_diarization(...i){return this.feature_extractor.post_process_speaker_diarization(...i)}get sampling_rate(){return this.feature_extractor.config.sampling_rate}}}),"./src/models/qwen2_vl/image_processing_qwen2_vl.js":((e,r,t)=>{t.r(r),t.d(r,{Qwen2VLImageProcessor:()=>a});var s=t("./src/base/image_processors_utils.js"),o=t("./src/utils/tensor.js");class a extends s.ImageProcessor{async _call(i,...l){let{pixel_values:c,original_sizes:_,reshaped_input_sizes:u}=await super._call(i,...l),d=c,{temporal_patch_size:g,merge_size:h,patch_size:x}=this.config;d.dims[0]===1&&(d=(0,o.cat)(Array.from({length:g},()=>d),0));let F=d.dims[0]/g,v=d.dims[1],b=Math.floor(d.dims[2]/x),C=Math.floor(d.dims[3]/x),y=d.view(F,g,v,Math.floor(b/h),h,x,Math.floor(C/h),h,x).permute(0,3,6,4,7,2,1,5,8).view(F*b*C,v*g*x*x),P=new o.Tensor("int64",[F,b,C],[1,3]);return{pixel_values:y,image_grid_thw:P,original_sizes:_,reshaped_input_sizes:u}}}}),"./src/models/qwen2_vl/processing_qwen2_vl.js":((e,r,t)=>{t.r(r),t.d(r,{Qwen2VLProcessor:()=>i});var s=t("./src/base/processing_utils.js"),o=t("./src/models/auto/image_processing_auto.js"),a=t("./src/tokenizers.js"),n=t("./src/utils/image.js");class i extends s.Processor{static image_processor_class=o.AutoImageProcessor;static 
tokenizer_class=a.AutoTokenizer;async _call(c,_=null,...u){Array.isArray(c)||(c=[c]);let d,g;if(_&&(d=await this.image_processor(_),g=d.image_grid_thw),g){let x=this.image_processor.config.merge_size**2,F=0,v=g.tolist();c=c.map(b=>{for(;b.includes("<|image_pad|>");){let C=Number(v[F++].reduce((y,P)=>y*P,1n));b=b.replace("<|image_pad|>","<|placeholder|>".repeat(Math.floor(C/x)))}return b.replaceAll("<|placeholder|>","<|image_pad|>")})}return{...this.tokenizer(c),...d}}}}),"./src/models/rt_detr/image_processing_rt_detr.js":((e,r,t)=>{t.r(r),t.d(r,{RTDetrImageProcessor:()=>o});var s=t("./src/base/image_processors_utils.js");class o extends s.ImageProcessor{post_process_object_detection(...n){return(0,s.post_process_object_detection)(...n)}}}),"./src/models/sam/image_processing_sam.js":((e,r,t)=>{t.r(r),t.d(r,{SamImageProcessor:()=>n});var s=t("./src/base/image_processors_utils.js"),o=t("./src/utils/core.js"),a=t("./src/utils/tensor.js");class n extends s.ImageProcessor{reshape_input_points(l,c,_,u=!1){l=structuredClone(l);let d=(0,o.calculateDimensions)(l);if(d.length===3)u||(d=[1,...d]),l=[l];else if(d.length!==4)throw Error("The input_points must be a 4D tensor of shape `batch_size`, `point_batch_size`, `nb_points_per_image`, `2`.");for(let g=0;g<l.length;++g){let[h,x]=c[g],[F,v]=_[g],b=[v/x,F/h];for(let C=0;C<l[g].length;++C)for(let y=0;y<l[g][C].length;++y)for(let P=0;P<l[g][C][y].length;++P)l[g][C][y][P]*=b[P%2]}return new a.Tensor("float32",Float32Array.from(l.flat(1/0)),d)}add_input_labels(l,c){let _=(0,o.calculateDimensions)(l);if(_.length===2)_=[1,..._],l=[l];else if(_.length!==3)throw Error("The input_points must be a 4D tensor of shape `batch_size`, `point_batch_size`, `nb_points_per_image`, `2`.");if(_.some((u,d)=>u!==c.dims[d]))throw Error(`The first ${_.length} dimensions of 'input_points' and 'input_labels' must be the same.`);return new a.Tensor("int64",l.flat(1/0).map(BigInt),_)}async 
_call(l,{input_points:c=null,input_labels:_=null,input_boxes:u=null}={}){let d=await super._call(l);if(c&&(d.input_points=this.reshape_input_points(c,d.original_sizes,d.reshaped_input_sizes)),_){if(!d.input_points)throw Error("`input_points` must be provided if `input_labels` are provided.");d.input_labels=this.add_input_labels(_,d.input_points)}return u&&(d.input_boxes=this.reshape_input_points(u,d.original_sizes,d.reshaped_input_sizes,!0)),d}async post_process_masks(l,c,_,{mask_threshold:u=0,binarize:d=!0,pad_size:g=null}={}){let h=[];g=g??this.pad_size??this.size;let x=[g.height,g.width];for(let F=0;F<c.length;++F){let v=c[F],b=_[F],C=await(0,a.interpolate_4d)(l[F],{mode:"bilinear",size:x});if(C=C.slice(null,null,[0,b[0]],[0,b[1]]),C=await(0,a.interpolate_4d)(C,{mode:"bilinear",size:v}),d){let y=C.data,P=new Uint8Array(y.length);for(let I=0;I<y.length;++I)y[I]>u&&(P[I]=1);C=new a.Tensor("bool",P,C.dims)}h.push(C)}return h}generate_crop_boxes(l,c,{crop_n_layers:_=0,overlap_ratio:u=512/1500,points_per_crop:d=32,crop_n_points_downscale_factor:g=1}={}){}}}),"./src/models/sam/processing_sam.js":((e,r,t)=>{t.r(r),t.d(r,{SamProcessor:()=>a});var s=t("./src/base/processing_utils.js"),o=t("./src/models/auto/image_processing_auto.js");class a extends s.Processor{static image_processor_class=o.AutoImageProcessor;async _call(...i){return await this.image_processor(...i)}post_process_masks(...i){return this.image_processor.post_process_masks(...i)}reshape_input_points(...i){return this.image_processor.reshape_input_points(...i)}}}),"./src/models/sam2/image_processing_sam2.js":((e,r,t)=>{t.r(r),t.d(r,{Sam2ImageProcessor:()=>s.SamImageProcessor});var s=t("./src/models/sam/image_processing_sam.js")}),"./src/models/sam2/processing_sam2.js":((e,r,t)=>{t.r(r),t.d(r,{Sam2Processor:()=>o,Sam2VideoProcessor:()=>a});var s=t("./src/models/sam/processing_sam.js");class o extends s.SamProcessor{}class a extends 
o{}}),"./src/models/sam3/image_processing_sam3.js":((e,r,t)=>{t.r(r),t.d(r,{Sam3ImageProcessor:()=>s.Sam2ImageProcessor});var s=t("./src/models/sam2/image_processing_sam2.js")}),"./src/models/seamless_m4t/feature_extraction_seamless_m4t.js":((e,r,t)=>{t.r(r),t.d(r,{SeamlessM4TFeatureExtractor:()=>n});var s=t("./src/base/feature_extraction_utils.js"),o=t("./src/utils/tensor.js"),a=t("./src/utils/audio.js");class n extends s.FeatureExtractor{constructor(l){super(l);let c=this.config.sampling_rate,_=(0,a.mel_filter_bank)(257,this.config.num_mel_bins,20,Math.floor(c/2),c,null,"kaldi",!0);this.mel_filters=_,this.window=(0,a.window_function)(400,"povey",{periodic:!1})}async _extract_fbank_features(l,c){return l=l.map(_=>_*32768),(0,a.spectrogram)(l,this.window,400,160,{fft_length:512,power:2,center:!1,preemphasis:.97,mel_filters:this.mel_filters,log_mel:"log",mel_floor:1192092955078125e-22,remove_dc_offset:!0,max_num_frames:c,transpose:!0})}async _call(l,{padding:c=!0,pad_to_multiple_of:_=2,do_normalize_per_mel_bins:u=!0,return_attention_mask:d=!0}={}){(0,s.validate_audio_inputs)(l,"SeamlessM4TFeatureExtractor");let g=await this._extract_fbank_features(l,this.config.max_length);if(u){let[P,I]=g.dims,f=g.data;for(let E=0;E<I;++E){let D=0;for(let z=0;z<P;++z)D+=f[z*I+E];let O=D/P,U=0;for(let z=0;z<P;++z)U+=(f[z*I+E]-O)**2;U/=P-1;let W=Math.sqrt(U+1e-7);for(let z=0;z<P;++z){let X=z*I+E;f[X]=(f[X]-O)/W}}}let h;if(c){let[P,I]=g.dims,f=g.data,E=P%_;if(E>0){let D=new Float32Array(I*(P+E));D.set(f),D.fill(this.config.padding_value,f.length);let O=P+E;g=new o.Tensor(g.type,D,[O,I]),d&&(h=new o.Tensor("int64",new BigInt64Array(O),[1,O]),h.data.fill(1n,0,P))}}let[x,F]=g.dims,v=this.config.stride;if(x%v!==0)throw new Error(`The number of frames (${x}) must be a multiple of the stride (${v}).`);let C=g.view(1,Math.floor(x/v),F*v),y={input_features:C};if(d){let P=C.dims[1],I=new BigInt64Array(P);if(h){let f=h.data;for(let E=1,D=0;E<x;E+=v,++D)I[D]=f[E]}else 
I.fill(1n);y.attention_mask=new o.Tensor("int64",I,[1,P])}return y}}}),"./src/models/segformer/image_processing_segformer.js":((e,r,t)=>{t.r(r),t.d(r,{SegformerFeatureExtractor:()=>a,SegformerImageProcessor:()=>o});var s=t("./src/base/image_processors_utils.js");class o extends s.ImageProcessor{post_process_semantic_segmentation(...i){return(0,s.post_process_semantic_segmentation)(...i)}}class a extends o{}}),"./src/models/siglip/image_processing_siglip.js":((e,r,t)=>{t.r(r),t.d(r,{SiglipImageProcessor:()=>o});var s=t("./src/base/image_processors_utils.js");class o extends s.ImageProcessor{}}),"./src/models/smolvlm/image_processing_smolvlm.js":((e,r,t)=>{t.r(r),t.d(r,{SmolVLMImageProcessor:()=>s.Idefics3ImageProcessor});var s=t("./src/models/idefics3/image_processing_idefics3.js")}),"./src/models/smolvlm/processing_smolvlm.js":((e,r,t)=>{t.r(r),t.d(r,{SmolVLMProcessor:()=>s.Idefics3Processor});var s=t("./src/models/idefics3/processing_idefics3.js")}),"./src/models/snac/feature_extraction_snac.js":((e,r,t)=>{t.r(r),t.d(r,{SnacFeatureExtractor:()=>o});var s=t("./src/models/dac/feature_extraction_dac.js");class o extends s.DacFeatureExtractor{}}),"./src/models/speecht5/feature_extraction_speecht5.js":((e,r,t)=>{t.r(r),t.d(r,{SpeechT5FeatureExtractor:()=>o});var s=t("./src/base/feature_extraction_utils.js");class o extends s.FeatureExtractor{}}),"./src/models/speecht5/processing_speecht5.js":((e,r,t)=>{t.r(r),t.d(r,{SpeechT5Processor:()=>n});var s=t("./src/base/processing_utils.js"),o=t("./src/tokenizers.js"),a=t("./src/models/auto/feature_extraction_auto.js");class n extends s.Processor{static tokenizer_class=o.AutoTokenizer;static feature_extractor_class=a.AutoFeatureExtractor;async _call(l){return await this.feature_extractor(l)}}}),"./src/models/swin2sr/image_processing_swin2sr.js":((e,r,t)=>{t.r(r),t.d(r,{Swin2SRImageProcessor:()=>o});var s=t("./src/base/image_processors_utils.js");class o extends s.ImageProcessor{pad_image(n,i,l,c={}){let[_,u,d]=i;return 
super.pad_image(n,i,{width:u+(l-u%l)%l,height:_+(l-_%l)%l},{mode:"symmetric",center:!1,constant_values:-1,...c})}}}),"./src/models/ultravox/processing_ultravox.js":((e,r,t)=>{t.r(r),t.d(r,{UltravoxProcessor:()=>n});var s=t("./src/models/auto/feature_extraction_auto.js"),o=t("./src/tokenizers.js"),a=t("./src/base/processing_utils.js");class n extends a.Processor{static tokenizer_class=o.AutoTokenizer;static feature_extractor_class=s.AutoFeatureExtractor;static uses_processor_config=!0;async _call(l,c=null,_={}){if(Array.isArray(l))throw new Error("Batched inputs are not supported yet.");let u={};if(c){let g=c.length,{input_features:h}=await this.feature_extractor(c,{..._,max_length:g}),x=Math.round(g/this.config.encoder_ds_factor+1e-4),F=1+Math.ceil(x/this.config.stack_factor);u.audio_token_len=[F],u.audio_values=h;let v=this.config.audio_placeholder;if(!l.includes(v))throw new Error(`The input text does not contain the image token ${v}.`);l=l.replaceAll(v,v.repeat(F))}return{...this.tokenizer(l,{add_special_tokens:!1,..._}),...u}}}}),"./src/models/vit/image_processing_vit.js":((e,r,t)=>{t.r(r),t.d(r,{ViTFeatureExtractor:()=>a,ViTImageProcessor:()=>o});var s=t("./src/base/image_processors_utils.js");class o extends s.ImageProcessor{}class a extends o{}}),"./src/models/vitmatte/image_processing_vitmatte.js":((e,r,t)=>{t.r(r),t.d(r,{VitMatteImageProcessor:()=>a});var s=t("./src/base/image_processors_utils.js"),o=t("./src/utils/tensor.js");class a extends s.ImageProcessor{async _call(i,l){Array.isArray(i)||(i=[i]),Array.isArray(l)||(l=[l]);let c=await Promise.all(i.map(d=>this.preprocess(d))),_=await 
Promise.all(l.map(d=>this.preprocess(d,{do_normalize:!1,do_convert_rgb:!1,do_convert_grayscale:!0})));return{pixel_values:(0,o.stack)(c.map((d,g)=>(0,o.cat)([d.pixel_values,_[g].pixel_values],0)),0),original_sizes:c.map(d=>d.original_size),reshaped_input_sizes:c.map(d=>d.reshaped_input_size)}}}}),"./src/models/vitpose/image_processing_vitpose.js":((e,r,t)=>{t.r(r),t.d(r,{VitPoseImageProcessor:()=>o});var s=t("./src/base/image_processors_utils.js");class o extends s.ImageProcessor{post_process_pose_estimation(n,i,{threshold:l=null}={}){let c=n.tolist(),[_,u,d,g]=n.dims,h=[];for(let x=0;x<_;++x){let F=c[x],v=i[x],b=[];for(let C=0;C<v.length;++C){let y=v[C],P=[],I=[],f=[],E=y.at(-2)/g,D=y.at(-1)/d;for(let O=0;O<F.length;++O){let[U,W]=[0,0],z=0,X=-1/0,J=F[O];for(let re=0;re<J.length;++re){let oe=J[re];for(let ne=0;ne<oe.length;++ne){let ye=oe[ne];z+=ye,X=Math.max(X,ye),U+=(ne+.5)*ye,W+=re*ye}}if(l!=null&&X<l)continue;let q=[E*U/z,D*W/z];P.push(q),f.push(O),I.push(X)}b.push({bbox:y,scores:I,labels:f,keypoints:P})}h.push(b)}return h}}}),"./src/models/voxtral/processing_voxtral.js":((e,r,t)=>{t.r(r),t.d(r,{VoxtralProcessor:()=>u});var s=t("./src/models/auto/feature_extraction_auto.js"),o=t("./src/tokenizers.js"),a=t("./src/base/processing_utils.js"),n=t("./src/utils/tensor.js");let i="[AUDIO]",l="[BEGIN_AUDIO]",c=375;function _(d,g){let h=[];for(let x=0;x<d.length;x+=g)h.push(d.subarray(x,Math.min(x+g,d.length)));return h}class u extends a.Processor{static tokenizer_class=o.AutoTokenizer;static feature_extractor_class=s.AutoFeatureExtractor;static uses_processor_config=!1;async _call(g,h=null,x={}){if(Array.isArray(g))throw new Error("Batched inputs are not supported yet.");let F={};if(h){if(!g.includes(i))throw new Error(`The input text does not contain the audio token ${i}.`);Array.isArray(h)||(h=[h]);let b=g.split(i),C=b.length-1;if(C!==h.length)throw new Error(`The number of audio inputs (${h.length}) does not match the number of audio tokens in the text (${C}).`);let 
y=this.feature_extractor.config.n_samples,P=h.map(O=>_(O,y)),I=P.map(O=>O.length),f=P.flat(),E=(await Promise.all(f.map(O=>this.feature_extractor(O,x)))).map(O=>O.input_features);F.audio_values=E.length>1?(0,n.cat)(E,0):E[0];let D=b[0];for(let O=0;O<I.length;++O){D+=l;for(let U=0;U<I[O];++U)D+=i.repeat(c);D+=b[O+1]}g=D}return{...this.tokenizer(g,{add_special_tokens:!1,...x}),...F}}}}),"./src/models/wav2vec2/feature_extraction_wav2vec2.js":((e,r,t)=>{t.r(r),t.d(r,{Wav2Vec2FeatureExtractor:()=>a});var s=t("./src/base/feature_extraction_utils.js"),o=t("./src/utils/tensor.js");class a extends s.FeatureExtractor{_zero_mean_unit_var_norm(i){let c=i.reduce((u,d)=>u+d,0)/i.length,_=i.reduce((u,d)=>u+(d-c)**2,0)/i.length;return i.map(u=>(u-c)/Math.sqrt(_+1e-7))}async _call(i){(0,s.validate_audio_inputs)(i,"Wav2Vec2FeatureExtractor"),i instanceof Float64Array&&(i=new Float32Array(i));let l=i;this.config.do_normalize&&(l=this._zero_mean_unit_var_norm(l));let c=[1,l.length];return{input_values:new o.Tensor("float32",l,c),attention_mask:new o.Tensor("int64",new BigInt64Array(l.length).fill(1n),c)}}}}),"./src/models/wav2vec2/processing_wav2vec2.js":((e,r,t)=>{t.r(r),t.d(r,{Wav2Vec2Processor:()=>n});var s=t("./src/tokenizers.js"),o=t("./src/models/auto/feature_extraction_auto.js"),a=t("./src/base/processing_utils.js");class n extends a.Processor{static tokenizer_class=s.AutoTokenizer;static feature_extractor_class=o.AutoFeatureExtractor;async _call(l){return await this.feature_extractor(l)}}}),"./src/models/wav2vec2_with_lm/processing_wav2vec2_with_lm.js":((e,r,t)=>{t.r(r),t.d(r,{Wav2Vec2ProcessorWithLM:()=>n});var s=t("./src/tokenizers.js"),o=t("./src/models/auto/feature_extraction_auto.js"),a=t("./src/base/processing_utils.js");class n extends a.Processor{static tokenizer_class=s.AutoTokenizer;static feature_extractor_class=o.AutoFeatureExtractor;async _call(l){return await 
this.feature_extractor(l)}}}),"./src/models/wespeaker/feature_extraction_wespeaker.js":((e,r,t)=>{t.r(r),t.d(r,{WeSpeakerFeatureExtractor:()=>n});var s=t("./src/base/feature_extraction_utils.js"),o=t("./src/utils/tensor.js"),a=t("./src/utils/audio.js");class n extends s.FeatureExtractor{constructor(l){super(l);let c=this.config.sampling_rate,_=(0,a.mel_filter_bank)(257,this.config.num_mel_bins,20,Math.floor(c/2),c,null,"kaldi",!0);this.mel_filters=_,this.window=(0,a.window_function)(400,"hamming",{periodic:!1}),this.min_num_frames=this.config.min_num_frames}async _extract_fbank_features(l){return l=l.map(c=>c*32768),(0,a.spectrogram)(l,this.window,400,160,{fft_length:512,power:2,center:!1,preemphasis:.97,mel_filters:this.mel_filters,log_mel:"log",mel_floor:1192092955078125e-22,remove_dc_offset:!0,transpose:!0,min_num_frames:this.min_num_frames})}async _call(l){(0,s.validate_audio_inputs)(l,"WeSpeakerFeatureExtractor");let c=(await this._extract_fbank_features(l)).unsqueeze_(0);if(this.config.fbank_centering_span===null){let _=c.mean(1).data,u=c.data,[d,g,h]=c.dims;for(let x=0;x<d;++x){let F=x*g*h,v=x*h;for(let b=0;b<g;++b){let C=F+b*h;for(let y=0;y<h;++y)u[C+y]-=_[v+y]}}}return{input_features:c}}}}),"./src/models/whisper/common_whisper.js":((e,r,t)=>{t.r(r),t.d(r,{WHISPER_LANGUAGE_MAPPING:()=>o,WHISPER_TO_LANGUAGE_CODE_MAPPING:()=>a,whisper_language_to_code:()=>n});let 
s=[["en","english"],["zh","chinese"],["de","german"],["es","spanish"],["ru","russian"],["ko","korean"],["fr","french"],["ja","japanese"],["pt","portuguese"],["tr","turkish"],["pl","polish"],["ca","catalan"],["nl","dutch"],["ar","arabic"],["sv","swedish"],["it","italian"],["id","indonesian"],["hi","hindi"],["fi","finnish"],["vi","vietnamese"],["he","hebrew"],["uk","ukrainian"],["el","greek"],["ms","malay"],["cs","czech"],["ro","romanian"],["da","danish"],["hu","hungarian"],["ta","tamil"],["no","norwegian"],["th","thai"],["ur","urdu"],["hr","croatian"],["bg","bulgarian"],["lt","lithuanian"],["la","latin"],["mi","maori"],["ml","malayalam"],["cy","welsh"],["sk","slovak"],["te","telugu"],["fa","persian"],["lv","latvian"],["bn","bengali"],["sr","serbian"],["az","azerbaijani"],["sl","slovenian"],["kn","kannada"],["et","estonian"],["mk","macedonian"],["br","breton"],["eu","basque"],["is","icelandic"],["hy","armenian"],["ne","nepali"],["mn","mongolian"],["bs","bosnian"],["kk","kazakh"],["sq","albanian"],["sw","swahili"],["gl","galician"],["mr","marathi"],["pa","punjabi"],["si","sinhala"],["km","khmer"],["sn","shona"],["yo","yoruba"],["so","somali"],["af","afrikaans"],["oc","occitan"],["ka","georgian"],["be","belarusian"],["tg","tajik"],["sd","sindhi"],["gu","gujarati"],["am","amharic"],["yi","yiddish"],["lo","lao"],["uz","uzbek"],["fo","faroese"],["ht","haitian creole"],["ps","pashto"],["tk","turkmen"],["nn","nynorsk"],["mt","maltese"],["sa","sanskrit"],["lb","luxembourgish"],["my","myanmar"],["bo","tibetan"],["tl","tagalog"],["mg","malagasy"],["as","assamese"],["tt","tatar"],["haw","hawaiian"],["ln","lingala"],["ha","hausa"],["ba","bashkir"],["jw","javanese"],["su","sundanese"]],o=new Map(s),a=new Map([...s.map(([i,l])=>[l,i]),["burmese","my"],["valencian","ca"],["flemish","nl"],["haitian","ht"],["letzeburgesch","lb"],["pushto","ps"],["panjabi","pa"],["moldavian","ro"],["moldovan","ro"],["sinhalese","si"],["castilian","es"]]);function n(i){i=i.toLowerCase();let 
l=a.get(i);if(l===void 0){let c=i.match(/^<\|([a-z]{2})\|>$/);if(c&&(i=c[1]),o.has(i))l=i;else{let u=i.length===2?o.keys():o.values();throw new Error(`Language "${i}" is not supported. Must be one of: ${JSON.stringify(Array.from(u))}`)}}return l}}),"./src/models/whisper/feature_extraction_whisper.js":((e,r,t)=>{t.r(r),t.d(r,{WhisperFeatureExtractor:()=>i});var s=t("./src/base/feature_extraction_utils.js"),o=t("./src/utils/tensor.js"),a=t("./src/utils/audio.js"),n=t("./src/utils/maths.js");class i extends s.FeatureExtractor{constructor(c){super(c),this.config.mel_filters??=(0,a.mel_filter_bank)(Math.floor(1+this.config.n_fft/2),this.config.feature_size,0,8e3,this.config.sampling_rate,"slaney","slaney"),this.window=(0,a.window_function)(this.config.n_fft,"hann")}async _extract_fbank_features(c){let _=await(0,a.spectrogram)(c,this.window,this.config.n_fft,this.config.hop_length,{power:2,mel_filters:this.config.mel_filters,log_mel:"log10",max_num_frames:Math.min(Math.floor(c.length/this.config.hop_length),this.config.nb_max_frames)}),u=_.data,d=(0,n.max)(u)[0];for(let g=0;g<u.length;++g)u[g]=(Math.max(u[g],d-8)+4)/4;return _}async _call(c,{max_length:_=null}={}){(0,s.validate_audio_inputs)(c,"WhisperFeatureExtractor");let u,d=_??this.config.n_samples;return c.length>d?(c.length>this.config.n_samples&&console.warn("Attempting to extract features for audio longer than 30 seconds. 
If using a pipeline to extract transcript from a long audio clip, remember to specify `chunk_length_s` and/or `stride_length_s`."),u=c.slice(0,d)):(u=new Float32Array(d),u.set(c)),{input_features:(await this._extract_fbank_features(u)).unsqueeze_(0)}}}}),"./src/models/whisper/generation_whisper.js":((e,r,t)=>{t.r(r),t.d(r,{WhisperGenerationConfig:()=>o});var s=t("./src/generation/configuration_utils.js");class o extends s.GenerationConfig{return_timestamps=null;return_token_timestamps=null;num_frames=null;alignment_heads=null;task=null;language=null;no_timestamps_token_id=null;prompt_ids=null;is_multilingual=null;lang_to_id=null;task_to_id=null;max_initial_timestamp_index=1}}),"./src/models/whisper/processing_whisper.js":((e,r,t)=>{t.r(r),t.d(r,{WhisperProcessor:()=>n});var s=t("./src/models/auto/feature_extraction_auto.js"),o=t("./src/tokenizers.js"),a=t("./src/base/processing_utils.js");class n extends a.Processor{static tokenizer_class=o.AutoTokenizer;static feature_extractor_class=s.AutoFeatureExtractor;async _call(l){return await this.feature_extractor(l)}}}),"./src/models/yolos/image_processing_yolos.js":((e,r,t)=>{t.r(r),t.d(r,{YolosFeatureExtractor:()=>a,YolosImageProcessor:()=>o});var s=t("./src/base/image_processors_utils.js");class o extends s.ImageProcessor{post_process_object_detection(...i){return(0,s.post_process_object_detection)(...i)}}class a extends o{}}),"./src/ops/registry.js":((e,r,t)=>{t.r(r),t.d(r,{TensorOpRegistry:()=>n});var s=t("./src/backends/onnx.js"),o=t("./src/utils/tensor.js");let a=async(i,l,c)=>{let _=await(0,s.createInferenceSession)(new Uint8Array(i),l);return(async u=>{let d=(0,s.isONNXProxy)(),g=Object.fromEntries(Object.entries(u).map(([x,F])=>[x,(d?F.clone():F).ort_tensor])),h=await(0,s.runInferenceSession)(_,g);return Array.isArray(c)?c.map(x=>new o.Tensor(h[x])):new o.Tensor(h[c])})};class n{static session_options={};static get nearest_interpolate_4d(){return 
this._nearest_interpolate_4d||(this._nearest_interpolate_4d=a([8,10,18,0,58,129,1,10,41,10,1,120,10,0,10,0,10,1,115,18,1,121,34,6,82,101,115,105,122,101,42,18,10,4,109,111,100,101,34,7,110,101,97,114,101,115,116,160,1,3,18,1,114,90,31,10,1,120,18,26,10,24,8,1,18,20,10,3,18,1,98,10,3,18,1,99,10,3,18,1,104,10,3,18,1,119,90,15,10,1,115,18,10,10,8,8,7,18,4,10,2,8,4,98,31,10,1,121,18,26,10,24,8,1,18,20,10,3,18,1,98,10,3,18,1,99,10,3,18,1,104,10,3,18,1,119,66,2,16,21],this.session_options,"y")),this._nearest_interpolate_4d}static get bilinear_interpolate_4d(){return this._bilinear_interpolate_4d||(this._bilinear_interpolate_4d=a([8,9,18,0,58,128,1,10,40,10,1,120,10,0,10,0,10,1,115,18,1,121,34,6,82,101,115,105,122,101,42,17,10,4,109,111,100,101,34,6,108,105,110,101,97,114,160,1,3,18,1,114,90,31,10,1,120,18,26,10,24,8,1,18,20,10,3,18,1,98,10,3,18,1,99,10,3,18,1,104,10,3,18,1,119,90,15,10,1,115,18,10,10,8,8,7,18,4,10,2,8,4,98,31,10,1,121,18,26,10,24,8,1,18,20,10,3,18,1,98,10,3,18,1,99,10,3,18,1,104,10,3,18,1,119,66,2,16,20],this.session_options,"y")),this._bilinear_interpolate_4d}static get bicubic_interpolate_4d(){return this._bicubic_interpolate_4d||(this._bicubic_interpolate_4d=a([8,9,18,0,58,127,10,39,10,1,120,10,0,10,0,10,1,115,18,1,121,34,6,82,101,115,105,122,101,42,16,10,4,109,111,100,101,34,5,99,117,98,105,99,160,1,3,18,1,114,90,31,10,1,120,18,26,10,24,8,1,18,20,10,3,18,1,98,10,3,18,1,99,10,3,18,1,104,10,3,18,1,119,90,15,10,1,115,18,10,10,8,8,7,18,4,10,2,8,4,98,31,10,1,121,18,26,10,24,8,1,18,20,10,3,18,1,98,10,3,18,1,99,10,3,18,1,104,10,3,18,1,119,66,2,16,20],this.session_options,"y")),this._bicubic_interpolate_4d}static get matmul(){return this._matmul||(this._matmul=a([8,9,18,0,58,55,10,17,10,1,97,10,1,98,18,1,99,34,6,77,97,116,77,117,108,18,1,114,90,9,10,1,97,18,4,10,2,8,1,90,9,10,1,98,18,4,10,2,8,1,98,9,10,1,99,18,4,10,2,8,1,66,2,16,20],this.session_options,"c")),this._matmul}static get stft(){return 
this._stft||(this._stft=a([8,7,18,0,58,148,1,10,38,10,1,115,10,1,106,10,1,119,10,1,108,18,1,111,34,4,83,84,70,84,42,15,10,8,111,110,101,115,105,100,101,100,24,1,160,1,2,18,1,115,90,26,10,1,115,18,21,10,19,8,1,18,15,10,3,18,1,98,10,3,18,1,115,10,3,18,1,99,90,11,10,1,106,18,6,10,4,8,7,18,0,90,16,10,1,119,18,11,10,9,8,1,18,5,10,3,18,1,119,90,11,10,1,108,18,6,10,4,8,7,18,0,98,31,10,1,111,18,26,10,24,8,1,18,20,10,3,18,1,98,10,3,18,1,102,10,3,18,1,100,10,3,18,1,99,66,2,16,17],this.session_options,"o")),this._stft}static get rfft(){return this._rfft||(this._rfft=a([8,9,18,0,58,97,10,33,10,1,120,10,0,10,1,97,18,1,121,34,3,68,70,84,42,15,10,8,111,110,101,115,105,100,101,100,24,1,160,1,2,18,1,100,90,21,10,1,120,18,16,10,14,8,1,18,10,10,3,18,1,115,10,3,18,1,99,90,11,10,1,97,18,6,10,4,8,7,18,0,98,21,10,1,121,18,16,10,14,8,1,18,10,10,3,18,1,115,10,3,18,1,99,66,2,16,20],this.session_options,"y")),this._rfft}static get top_k(){return this._top_k||(this._top_k=a([8,10,18,0,58,73,10,18,10,1,120,10,1,107,18,1,118,18,1,105,34,4,84,111,112,75,18,1,116,90,9,10,1,120,18,4,10,2,8,1,90,15,10,1,107,18,10,10,8,8,7,18,4,10,2,8,1,98,9,10,1,118,18,4,10,2,8,1,98,9,10,1,105,18,4,10,2,8,7,66,2,16,21],this.session_options,["v","i"])),this._top_k}static get slice(){return 
this._slice||(this._slice=a([8,7,18,0,58,96,10,25,10,1,120,10,1,115,10,1,101,10,1,97,10,1,116,18,1,121,34,5,83,108,105,99,101,18,1,114,90,9,10,1,120,18,4,10,2,8,1,90,9,10,1,115,18,4,10,2,8,7,90,9,10,1,101,18,4,10,2,8,7,90,9,10,1,97,18,4,10,2,8,7,90,9,10,1,116,18,4,10,2,8,7,98,9,10,1,121,18,4,10,2,8,1,66,2,16,13],this.session_options,"y")),this._slice}}}),"./src/pipelines.js":((e,r,t)=>{t.r(r),t.d(r,{AudioClassificationPipeline:()=>z,AutomaticSpeechRecognitionPipeline:()=>J,BackgroundRemovalPipeline:()=>ne,DepthEstimationPipeline:()=>ue,DocumentQuestionAnsweringPipeline:()=>R,FeatureExtractionPipeline:()=>U,FillMaskPipeline:()=>y,ImageClassificationPipeline:()=>re,ImageFeatureExtractionPipeline:()=>W,ImageSegmentationPipeline:()=>oe,ImageToImagePipeline:()=>ee,ImageToTextPipeline:()=>q,ObjectDetectionPipeline:()=>Y,Pipeline:()=>F,QuestionAnsweringPipeline:()=>C,SummarizationPipeline:()=>I,Text2TextGenerationPipeline:()=>P,TextClassificationPipeline:()=>v,TextGenerationPipeline:()=>D,TextToAudioPipeline:()=>L,TokenClassificationPipeline:()=>b,TranslationPipeline:()=>f,ZeroShotAudioClassificationPipeline:()=>X,ZeroShotClassificationPipeline:()=>O,ZeroShotImageClassificationPipeline:()=>ye,ZeroShotObjectDetectionPipeline:()=>H,pipeline:()=>Le});var s=t("./src/tokenizers.js"),o=t("./src/models.js"),a=t("./src/models/auto/processing_auto.js"),n=t("./src/base/processing_utils.js"),i=t("./src/utils/generic.js"),l=t("./src/utils/core.js"),c=t("./src/utils/maths.js"),_=t("./src/utils/audio.js"),u=t("./src/utils/tensor.js"),d=t("./src/utils/image.js");async function g(we){return Array.isArray(we)||(we=[we]),await Promise.all(we.map(A=>d.RawImage.read(A)))}async function h(we,A){return Array.isArray(we)||(we=[we]),await Promise.all(we.map(le=>typeof le=="string"||le instanceof URL?(0,_.read_audio)(le,A):le instanceof Float64Array?new Float32Array(le):le))}function x(we,A){A&&(we=we.map(ve=>ve|0));let[le,ge,be,Ae]=we;return{xmin:le,ymin:ge,xmax:be,ymax:Ae}}class F extends 
i.Callable{constructor({task:A,model:le,tokenizer:ge=null,processor:be=null}){super(),this.task=A,this.model=le,this.tokenizer=ge,this.processor=be}async dispose(){await this.model.dispose()}}class v extends F{constructor(A){super(A)}async _call(A,{top_k:le=1}={}){let ge=this.tokenizer(A,{padding:!0,truncation:!0}),be=await this.model(ge),Ae=this.model.config.problem_type==="multi_label_classification"?Pe=>Pe.sigmoid():Pe=>new u.Tensor("float32",(0,c.softmax)(Pe.data),Pe.dims),ve=this.model.config.id2label,pe=[];for(let Pe of be.logits){let fe=Ae(Pe),Te=await(0,u.topk)(fe,le),We=Te[0].tolist(),Re=Te[1].tolist().map((Ne,ot)=>({label:ve?ve[Ne]:`LABEL_${Ne}`,score:We[ot]}));le===1?pe.push(...Re):pe.push(Re)}return Array.isArray(A)||le===1?pe:pe[0]}}class b extends F{constructor(A){super(A)}async _call(A,{ignore_labels:le=["O"]}={}){let ge=Array.isArray(A),be=this.tokenizer(ge?A:[A],{padding:!0,truncation:!0}),ve=(await this.model(be)).logits,pe=this.model.config.id2label,Pe=[];for(let fe=0;fe<ve.dims[0];++fe){let Te=be.input_ids[fe],We=ve[fe],$e=[];for(let Re=0;Re<We.dims[0];++Re){let Ne=We[Re],ot=(0,c.max)(Ne.data)[1],De=pe?pe[ot]:`LABEL_${ot}`;if(le.includes(De))continue;let Qe=this.tokenizer.decode([Te[Re].item()],{skip_special_tokens:!0});if(Qe==="")continue;let je=(0,c.softmax)(Ne.data);$e.push({entity:De,score:je[ot],index:Re,word:Qe})}Pe.push($e)}return ge?Pe:Pe[0]}}class C extends F{constructor(A){super(A)}async _call(A,le,{top_k:ge=1}={}){let be=this.tokenizer(A,{text_pair:le,padding:!0,truncation:!0}),{start_logits:Ae,end_logits:ve}=await this.model(be),pe=be.input_ids.tolist(),Pe=be.attention_mask.tolist(),fe=this.tokenizer.all_special_ids,Te=[];for(let We=0;We<Ae.dims[0];++We){let $e=pe[We],Re=$e.findIndex(Ke=>Ke==this.tokenizer.sep_token_id),Ne=Pe[We].map((Ke,bt)=>Ke==1&&(bt===0||bt>Re&&fe.findIndex(At=>At==$e[bt])===-1)),ot=Ae[We].tolist(),De=ve[We].tolist();for(let 
Ke=1;Ke<ot.length;++Ke)(Pe[We]==0||Ke<=Re||fe.findIndex(bt=>bt==$e[Ke])!==-1)&&(ot[Ke]=-1/0,De[Ke]=-1/0);let Qe=(0,c.softmax)(ot).map((Ke,bt)=>[Ke,bt]),je=(0,c.softmax)(De).map((Ke,bt)=>[Ke,bt]);Qe[0][0]=0,je[0][0]=0;let pt=(0,l.product)(Qe,je).filter(Ke=>Ke[0][1]<=Ke[1][1]).map(Ke=>[Ke[0][1],Ke[1][1],Ke[0][0]*Ke[1][0]]).sort((Ke,bt)=>bt[2]-Ke[2]);for(let Ke=0;Ke<Math.min(pt.length,ge);++Ke){let[bt,At,Lt]=pt[Ke],fr=$e.slice(bt,At+1),zt=this.tokenizer.decode(fr,{skip_special_tokens:!0});Te.push({answer:zt,score:Lt})}}return ge===1?Te[0]:Te}}class y extends F{constructor(A){super(A)}async _call(A,{top_k:le=5}={}){let ge=this.tokenizer(A,{padding:!0,truncation:!0}),{logits:be}=await this.model(ge),Ae=[],ve=ge.input_ids.tolist();for(let pe=0;pe<ve.length;++pe){let Pe=ve[pe],fe=Pe.findIndex(Ne=>Ne==this.tokenizer.mask_token_id);if(fe===-1)throw Error(`Mask token (${this.tokenizer.mask_token}) not found in text.`);let Te=be[pe][fe],We=await(0,u.topk)(new u.Tensor("float32",(0,c.softmax)(Te.data),Te.dims),le),$e=We[0].tolist(),Re=We[1].tolist();Ae.push(Re.map((Ne,ot)=>{let De=Pe.slice();return De[fe]=Ne,{score:$e[ot],token:Number(Ne),token_str:this.tokenizer.decode([Ne]),sequence:this.tokenizer.decode(De,{skip_special_tokens:!0})}}))}return Array.isArray(A)?Ae:Ae[0]}}class P extends F{_key="generated_text";constructor(A){super(A)}async _call(A,le={}){Array.isArray(A)||(A=[A]),this.model.config.prefix&&(A=A.map(Pe=>this.model.config.prefix+Pe));let ge=this.model.config.task_specific_params;ge&&ge[this.task]&&ge[this.task].prefix&&(A=A.map(Pe=>ge[this.task].prefix+Pe));let be=this.tokenizer,Ae={padding:!0,truncation:!0},ve;this instanceof f&&"_build_translation_inputs"in be?ve=be._build_translation_inputs(A,Ae,le):ve=be(A,Ae);let pe=await this.model.generate({...ve,...le});return be.batch_decode(pe,{skip_special_tokens:!0}).map(Pe=>({[this._key]:Pe}))}}class I extends P{_key="summary_text";constructor(A){super(A)}}class f extends 
P{_key="translation_text";constructor(A){super(A)}}function E(we){return Array.isArray(we)&&we.every(A=>"role"in A&&"content"in A)}class D extends F{constructor(A){super(A)}async _call(A,le={}){let ge=!1,be=!1,Ae=le.add_special_tokens??(this.tokenizer.add_bos_token||this.tokenizer.add_eos_token)??!1,ve;if(typeof A=="string")ve=A=[A];else if(Array.isArray(A)&&A.every(Re=>typeof Re=="string"))ge=!0,ve=A;else{if(E(A))A=[A];else if(Array.isArray(A)&&A.every(E))ge=!0;else throw new Error("Input must be a string, an array of strings, a Chat, or an array of Chats");be=!0,ve=A.map(Re=>this.tokenizer.apply_chat_template(Re,{tokenize:!1,add_generation_prompt:!0})),Ae=!1}let pe=be?!1:le.return_full_text??!0;this.tokenizer.padding_side="left";let Pe=this.tokenizer(ve,{add_special_tokens:Ae,padding:!0,truncation:!0}),fe=await this.model.generate({...Pe,...le}),Te=this.tokenizer.batch_decode(fe,{skip_special_tokens:!0}),We;!pe&&Pe.input_ids.dims.at(-1)>0&&(We=this.tokenizer.batch_decode(Pe.input_ids,{skip_special_tokens:!0}).map(Re=>Re.length));let $e=Array.from({length:A.length},Re=>[]);for(let Re=0;Re<Te.length;++Re){let Ne=Math.floor(Re/fe.dims[0]*A.length);We&&(Te[Re]=Te[Re].slice(We[Ne])),$e[Ne].push({generated_text:be?[...A[Ne],{role:"assistant",content:Te[Re]}]:Te[Re]})}return!ge&&$e.length===1?$e[0]:$e}}class O extends F{constructor(A){super(A),this.label2id=Object.fromEntries(Object.entries(this.model.config.label2id).map(([le,ge])=>[le.toLowerCase(),ge])),this.entailment_id=this.label2id.entailment,this.entailment_id===void 0&&(console.warn("Could not find 'entailment' in label2id mapping. Using 2 as entailment_id."),this.entailment_id=2),this.contradiction_id=this.label2id.contradiction??this.label2id.not_entailment,this.contradiction_id===void 0&&(console.warn("Could not find 'contradiction' in label2id mapping. 
Using 0 as contradiction_id."),this.contradiction_id=0)}async _call(A,le,{hypothesis_template:ge="This example is {}.",multi_label:be=!1}={}){let Ae=Array.isArray(A);Ae||(A=[A]),Array.isArray(le)||(le=[le]);let ve=le.map(fe=>ge.replace("{}",fe)),pe=be||le.length===1,Pe=[];for(let fe of A){let Te=[];for(let Re of ve){let Ne=this.tokenizer(fe,{text_pair:Re,padding:!0,truncation:!0}),ot=await this.model(Ne);pe?Te.push([ot.logits.data[this.contradiction_id],ot.logits.data[this.entailment_id]]):Te.push(ot.logits.data[this.entailment_id])}let $e=(pe?Te.map(Re=>(0,c.softmax)(Re)[1]):(0,c.softmax)(Te)).map((Re,Ne)=>[Re,Ne]).sort((Re,Ne)=>Ne[0]-Re[0]);Pe.push({sequence:fe,labels:$e.map(Re=>le[Re[1]]),scores:$e.map(Re=>Re[0])})}return Ae?Pe:Pe[0]}}class U extends F{constructor(A){super(A)}async _call(A,{pooling:le="none",normalize:ge=!1,quantize:be=!1,precision:Ae="binary"}={}){let ve=this.tokenizer(A,{padding:!0,truncation:!0}),pe=await this.model(ve),Pe=pe.last_hidden_state??pe.logits??pe.token_embeddings;switch(le){case"none":break;case"mean":Pe=(0,u.mean_pooling)(Pe,ve.attention_mask);break;case"first_token":case"cls":Pe=Pe.slice(null,0);break;case"last_token":case"eos":Pe=Pe.slice(null,-1);break;default:throw Error(`Pooling method '${le}' not supported.`)}return ge&&(Pe=Pe.normalize(2,-1)),be&&(Pe=(0,u.quantize_embeddings)(Pe,Ae)),Pe}}class W extends F{constructor(A){super(A)}async _call(A,{pool:le=null}={}){let ge=await g(A),{pixel_values:be}=await this.processor(ge),Ae=await this.model({pixel_values:be}),ve;if(le){if(!("pooler_output"in Ae))throw Error("No pooled output was returned. 
Make sure the model has a 'pooler' layer when using the 'pool' option.");ve=Ae.pooler_output}else ve=Ae.last_hidden_state??Ae.logits??Ae.image_embeds;return ve}}class z extends F{constructor(A){super(A)}async _call(A,{top_k:le=5}={}){let ge=this.processor.feature_extractor.config.sampling_rate,be=await h(A,ge),Ae=this.model.config.id2label,ve=[];for(let pe of be){let Pe=await this.processor(pe),Te=(await this.model(Pe)).logits[0],We=await(0,u.topk)(new u.Tensor("float32",(0,c.softmax)(Te.data),Te.dims),le),$e=We[0].tolist(),Ne=We[1].tolist().map((ot,De)=>({label:Ae?Ae[ot]:`LABEL_${ot}`,score:$e[De]}));ve.push(Ne)}return Array.isArray(A)?ve:ve[0]}}class X extends F{constructor(A){super(A)}async _call(A,le,{hypothesis_template:ge="This is a sound of {}."}={}){let be=!Array.isArray(A);be&&(A=[A]);let Ae=le.map(Te=>ge.replace("{}",Te)),ve=this.tokenizer(Ae,{padding:!0,truncation:!0}),pe=this.processor.feature_extractor.config.sampling_rate,Pe=await h(A,pe),fe=[];for(let Te of Pe){let We=await this.processor(Te),$e=await this.model({...ve,...We}),Re=(0,c.softmax)($e.logits_per_audio.data);fe.push([...Re].map((Ne,ot)=>({score:Ne,label:le[ot]})))}return be?fe[0]:fe}}class J extends F{constructor(A){super(A)}async _call(A,le={}){switch(this.model.config.model_type){case"whisper":case"lite-whisper":return this._call_whisper(A,le);case"wav2vec2":case"wav2vec2-bert":case"unispeech":case"unispeech-sat":case"hubert":case"parakeet_ctc":return this._call_wav2vec2(A,le);case"moonshine":return this._call_moonshine(A,le);default:throw new Error(`AutomaticSpeechRecognitionPipeline does not support model type '${this.model.config.model_type}'.`)}}async _call_wav2vec2(A,le){le.language&&console.warn('`language` parameter is not yet supported for `wav2vec2` models, defaulting to "English".'),le.task&&console.warn('`task` parameter is not yet supported for `wav2vec2` models, defaulting to "transcribe".');let ge=!Array.isArray(A);ge&&(A=[A]);let 
be=this.processor.feature_extractor.config.sampling_rate,Ae=await h(A,be),ve=[];for(let pe of Ae){let Pe=await this.processor(pe),Te=(await this.model(Pe)).logits[0],We=[];for(let Re of Te)We.push((0,c.max)(Re.data)[1]);let $e=this.tokenizer.decode(We,{skip_special_tokens:!0}).trim();ve.push({text:$e})}return ge?ve[0]:ve}async _call_whisper(A,le){let ge=le.return_timestamps??!1,be=le.chunk_length_s??0,Ae=le.force_full_sequences??!1,ve=le.stride_length_s??null,pe={...le};ge==="word"&&(pe.return_token_timestamps=!0,pe.return_timestamps=!1);let Pe=!Array.isArray(A);Pe&&(A=[A]);let fe=this.processor.feature_extractor.config.chunk_length/this.model.config.max_source_positions,Te=this.processor.feature_extractor.config.hop_length,We=this.processor.feature_extractor.config.sampling_rate,$e=await h(A,We),Re=[];for(let Ne of $e){let ot=[];if(be>0){if(ve===null)ve=be/6;else if(be<=ve)throw Error("`chunk_length_s` must be larger than `stride_length_s`.");let je=We*be,pt=We*ve,Ke=je-2*pt,bt=0;for(;;){let At=bt+je,Lt=Ne.subarray(bt,At),fr=await this.processor(Lt),zt=bt===0,yr=At>=Ne.length;if(ot.push({stride:[Lt.length,zt?0:pt,yr?0:pt],input_features:fr.input_features,is_last:yr}),yr)break;bt+=Ke}}else ot=[{stride:[Ne.length,0,0],input_features:(await this.processor(Ne)).input_features,is_last:!0}];for(let je of ot){pe.num_frames=Math.floor(je.stride[0]/Te);let pt=await this.model.generate({inputs:je.input_features,...pe});ge==="word"?(je.tokens=pt.sequences.tolist()[0],je.token_timestamps=pt.token_timestamps.tolist()[0].map(Ke=>(0,c.round)(Ke,2))):je.tokens=pt[0].tolist(),je.stride=je.stride.map(Ke=>Ke/We)}let[De,Qe]=this.tokenizer._decode_asr(ot,{time_precision:fe,return_timestamps:ge,force_full_sequences:Ae});Re.push({text:De,...Qe})}return Pe?Re[0]:Re}async _call_moonshine(A,le){let ge=!Array.isArray(A);ge&&(A=[A]);let be=this.processor.feature_extractor.config.sampling_rate,Ae=await h(A,be),ve=[];for(let pe of Ae){let Pe=await 
this.processor(pe),fe=Math.floor(pe.length/be)*6,Te=await this.model.generate({max_new_tokens:fe,...le,...Pe}),We=this.processor.batch_decode(Te,{skip_special_tokens:!0})[0];ve.push({text:We})}return ge?ve[0]:ve}}class q extends F{constructor(A){super(A)}async _call(A,le={}){let ge=Array.isArray(A),be=await g(A),{pixel_values:Ae}=await this.processor(be),ve=[];for(let pe of Ae){pe.dims=[1,...pe.dims];let Pe=await this.model.generate({inputs:pe,...le}),fe=this.tokenizer.batch_decode(Pe,{skip_special_tokens:!0}).map(Te=>({generated_text:Te.trim()}));ve.push(fe)}return ge?ve:ve[0]}}class re extends F{constructor(A){super(A)}async _call(A,{top_k:le=5}={}){let ge=await g(A),{pixel_values:be}=await this.processor(ge),Ae=await this.model({pixel_values:be}),ve=this.model.config.id2label,pe=[];for(let Pe of Ae.logits){let fe=await(0,u.topk)(new u.Tensor("float32",(0,c.softmax)(Pe.data),Pe.dims),le),Te=fe[0].tolist(),$e=fe[1].tolist().map((Re,Ne)=>({label:ve?ve[Re]:`LABEL_${Re}`,score:Te[Ne]}));pe.push($e)}return Array.isArray(A)?pe:pe[0]}}class oe extends F{constructor(A){super(A),this.subtasks_mapping={panoptic:"post_process_panoptic_segmentation",instance:"post_process_instance_segmentation",semantic:"post_process_semantic_segmentation"}}async _call(A,{threshold:le=.5,mask_threshold:ge=.5,overlap_mask_area_threshold:be=.8,label_ids_to_fuse:Ae=null,target_sizes:ve=null,subtask:pe=null}={}){if(Array.isArray(A)&&A.length!==1)throw Error("Image segmentation pipeline currently only supports a batch size of 1.");let fe=await g(A),Te=fe.map(je=>[je.height,je.width]),We=await this.processor(fe),{inputNames:$e,outputNames:Re}=this.model.sessions.model;if(!$e.includes("pixel_values")){if($e.length!==1)throw Error(`Expected a single input name, but got ${$e.length} inputs: ${$e}.`);let je=$e[0];if(je in We)throw Error(`Input name ${je} already exists in the inputs.`);We[je]=We.pixel_values}let Ne=await this.model(We),ot=null;if(pe!==null)ot=this.subtasks_mapping[pe];else 
if(this.processor.image_processor){for(let[je,pt]of Object.entries(this.subtasks_mapping))if(pt in this.processor.image_processor){ot=this.processor.image_processor[pt].bind(this.processor.image_processor),pe=je;break}}let De=this.model.config.id2label,Qe=[];if(pe)if(pe==="panoptic"||pe==="instance"){let je=ot(Ne,le,ge,be,Ae,ve??Te)[0],pt=je.segmentation;for(let Ke of je.segments_info){let bt=new Uint8ClampedArray(pt.data.length);for(let Lt=0;Lt<pt.data.length;++Lt)pt.data[Lt]===Ke.id&&(bt[Lt]=255);let At=new d.RawImage(bt,pt.dims[1],pt.dims[0],1);Qe.push({score:Ke.score,label:De[Ke.label_id],mask:At})}}else if(pe==="semantic"){let{segmentation:je,labels:pt}=ot(Ne,ve??Te)[0];for(let Ke of pt){let bt=new Uint8ClampedArray(je.data.length);for(let Lt=0;Lt<je.data.length;++Lt)je.data[Lt]===Ke&&(bt[Lt]=255);let At=new d.RawImage(bt,je.dims[1],je.dims[0],1);Qe.push({score:null,label:De[Ke],mask:At})}}else throw Error(`Subtask ${pe} not supported.`);else{let pt=Ne[Re[0]];for(let Ke=0;Ke<Te.length;++Ke){let bt=Te[Ke],At=pt[Ke];At.data.some(fr=>fr<-1e-5||fr>1+1e-5)&&At.sigmoid_();let Lt=await d.RawImage.fromTensor(At.mul_(255).to("uint8")).resize(bt[1],bt[0]);Qe.push({label:null,score:null,mask:Lt})}}return Qe}}class ne extends oe{constructor(A){super(A)}async _call(A,le={}){if(Array.isArray(A)&&A.length!==1)throw Error("Background removal pipeline currently only supports a batch size of 1.");let be=await g(A),Ae=await super._call(A,le);return be.map((pe,Pe)=>{let fe=pe.clone();return fe.putAlpha(Ae[Pe].mask),fe})}}class ye extends F{constructor(A){super(A)}async _call(A,le,{hypothesis_template:ge="This is a photo of {}"}={}){let be=Array.isArray(A),Ae=await g(A),ve=le.map($e=>ge.replace("{}",$e)),pe=this.tokenizer(ve,{padding:this.model.config.model_type==="siglip"?"max_length":!0,truncation:!0}),{pixel_values:Pe}=await this.processor(Ae),fe=await 
this.model({...pe,pixel_values:Pe}),Te=this.model.config.model_type==="siglip"?$e=>$e.sigmoid().data:$e=>(0,c.softmax)($e.data),We=[];for(let $e of fe.logits_per_image){let Ne=[...Te($e)].map((ot,De)=>({score:ot,label:le[De]}));Ne.sort((ot,De)=>De.score-ot.score),We.push(Ne)}return be?We:We[0]}}class Y extends F{constructor(A){super(A)}async _call(A,{threshold:le=.9,percentage:ge=!1}={}){let be=Array.isArray(A);if(be&&A.length!==1)throw Error("Object detection pipeline currently only supports a batch size of 1.");let Ae=await g(A),ve=ge?null:Ae.map(Re=>[Re.height,Re.width]),{pixel_values:pe,pixel_mask:Pe}=await this.processor(Ae),fe=await this.model({pixel_values:pe,pixel_mask:Pe}),Te=this.processor.image_processor.post_process_object_detection(fe,le,ve),We=this.model.config.id2label,$e=Te.map(Re=>Re.boxes.map((Ne,ot)=>({score:Re.scores[ot],label:We[Re.classes[ot]],box:x(Ne,!ge)})));return be?$e:$e[0]}}class H extends F{constructor(A){super(A)}async _call(A,le,{threshold:ge=.1,top_k:be=null,percentage:Ae=!1}={}){let ve=Array.isArray(A),pe=await g(A),Pe=this.tokenizer(le,{padding:!0,truncation:!0}),fe=await this.processor(pe),Te=[];for(let We=0;We<pe.length;++We){let $e=pe[We],Re=Ae?null:[[$e.height,$e.width]],Ne=fe.pixel_values[We].unsqueeze_(0),ot=await this.model({...Pe,pixel_values:Ne}),De;if("post_process_grounded_object_detection"in this.processor){let Qe=this.processor.post_process_grounded_object_detection(ot,Pe.input_ids,{box_threshold:ge,text_threshold:ge,target_sizes:Re})[0];De=Qe.boxes.map((je,pt)=>({score:Qe.scores[pt],label:Qe.labels[pt],box:x(je,!Ae)}))}else{let Qe=this.processor.image_processor.post_process_object_detection(ot,ge,Re,!0)[0];De=Qe.boxes.map((je,pt)=>({score:Qe.scores[pt],label:le[Qe.classes[pt]],box:x(je,!Ae)}))}De.sort((Qe,je)=>je.score-Qe.score),be!==null&&(De=De.slice(0,be)),Te.push(De)}return ve?Te:Te[0]}}class R extends F{constructor(A){super(A)}async _call(A,le,ge={}){let be=(await g(A))[0],{pixel_values:Ae}=await 
this.processor(be),ve=`<s_docvqa><s_question>${le}</s_question><s_answer>`,pe=this.tokenizer(ve,{add_special_tokens:!1,padding:!0,truncation:!0}).input_ids,Pe=await this.model.generate({inputs:Ae,max_length:this.model.config.decoder.max_position_embeddings,decoder_input_ids:pe,...ge}),Te=this.tokenizer.batch_decode(Pe)[0].match(/<s_answer>(.*?)<\/s_answer>/),We=null;return Te&&Te.length>=2&&(We=Te[1].trim()),[{answer:We}]}}class L extends F{DEFAULT_VOCODER_ID="Xenova/speecht5_hifigan";constructor(A){super(A),this.vocoder=A.vocoder??null}async _prepare_speaker_embeddings(A){if((typeof A=="string"||A instanceof URL)&&(A=new Float32Array(await(await fetch(A)).arrayBuffer())),A instanceof Float32Array)A=new u.Tensor("float32",A,[A.length]);else if(!(A instanceof u.Tensor))throw new Error("Speaker embeddings must be a `Tensor`, `Float32Array`, `string`, or `URL`.");return A}async _call(A,{speaker_embeddings:le=null,num_inference_steps:ge,speed:be}={}){return this.processor?this._call_text_to_spectrogram(A,{speaker_embeddings:le}):this.model.config.model_type==="supertonic"?this._call_supertonic(A,{speaker_embeddings:le,num_inference_steps:ge,speed:be}):this._call_text_to_waveform(A)}async _call_supertonic(A,{speaker_embeddings:le,num_inference_steps:ge,speed:be}){if(!le)throw new Error("Speaker embeddings must be provided for Supertonic models.");le=await this._prepare_speaker_embeddings(le);let{sampling_rate:Ae,style_dim:ve}=this.model.config;le=le.view(1,-1,ve);let pe=this.tokenizer(A,{padding:!0,truncation:!0}),{waveform:Pe}=await this.model.generate_speech({...pe,style:le,num_inference_steps:ge,speed:be});return new _.RawAudio(Pe.data,Ae)}async _call_text_to_waveform(A){let le=this.tokenizer(A,{padding:!0,truncation:!0}),{waveform:ge}=await this.model(le),be=this.model.config.sampling_rate;return new _.RawAudio(ge.data,be)}async _call_text_to_spectrogram(A,{speaker_embeddings:le}){this.vocoder||(console.log("No vocoder specified, using default HifiGan 
vocoder."),this.vocoder=await o.AutoModel.from_pretrained(this.DEFAULT_VOCODER_ID,{dtype:"fp32"}));let{input_ids:ge}=this.tokenizer(A,{padding:!0,truncation:!0});le=await this._prepare_speaker_embeddings(le),le=le.view(1,-1);let{waveform:be}=await this.model.generate_speech(ge,le,{vocoder:this.vocoder}),Ae=this.processor.feature_extractor.config.sampling_rate;return new _.RawAudio(be.data,Ae)}}class ee extends F{constructor(A){super(A)}async _call(A){let le=await g(A),ge=await this.processor(le),be=await this.model(ge),Ae=[];for(let ve of be.reconstruction){let pe=ve.squeeze().clamp_(0,1).mul_(255).round_().to("uint8");Ae.push(d.RawImage.fromTensor(pe))}return Ae.length>1?Ae:Ae[0]}}class ue extends F{constructor(A){super(A)}async _call(A){let le=await g(A),ge=await this.processor(le),{predicted_depth:be}=await this.model(ge),Ae=[];for(let ve=0;ve<le.length;++ve){let pe=be[ve],[Pe,fe]=pe.dims.slice(-2),[Te,We]=le[ve].size,$e=(await(0,u.interpolate_4d)(pe.view(1,1,Pe,fe),{size:[We,Te],mode:"bilinear"})).view(We,Te),Re=$e.min().item(),Ne=$e.max().item(),ot=$e.sub(Re).div_(Ne-Re).mul_(255).to("uint8").unsqueeze(0),De=d.RawImage.fromTensor(ot);Ae.push({predicted_depth:$e,depth:De})}return Ae.length>1?Ae:Ae[0]}}let 
ke=Object.freeze({"text-classification":{tokenizer:s.AutoTokenizer,pipeline:v,model:o.AutoModelForSequenceClassification,default:{model:"Xenova/distilbert-base-uncased-finetuned-sst-2-english"},type:"text"},"token-classification":{tokenizer:s.AutoTokenizer,pipeline:b,model:o.AutoModelForTokenClassification,default:{model:"Xenova/bert-base-multilingual-cased-ner-hrl"},type:"text"},"question-answering":{tokenizer:s.AutoTokenizer,pipeline:C,model:o.AutoModelForQuestionAnswering,default:{model:"Xenova/distilbert-base-cased-distilled-squad"},type:"text"},"fill-mask":{tokenizer:s.AutoTokenizer,pipeline:y,model:o.AutoModelForMaskedLM,default:{model:"Xenova/bert-base-uncased"},type:"text"},summarization:{tokenizer:s.AutoTokenizer,pipeline:I,model:o.AutoModelForSeq2SeqLM,default:{model:"Xenova/distilbart-cnn-6-6"},type:"text"},translation:{tokenizer:s.AutoTokenizer,pipeline:f,model:o.AutoModelForSeq2SeqLM,default:{model:"Xenova/t5-small"},type:"text"},"text2text-generation":{tokenizer:s.AutoTokenizer,pipeline:P,model:o.AutoModelForSeq2SeqLM,default:{model:"Xenova/flan-t5-small"},type:"text"},"text-generation":{tokenizer:s.AutoTokenizer,pipeline:D,model:o.AutoModelForCausalLM,default:{model:"Xenova/gpt2"},type:"text"},"zero-shot-classification":{tokenizer:s.AutoTokenizer,pipeline:O,model:o.AutoModelForSequenceClassification,default:{model:"Xenova/distilbert-base-uncased-mnli"},type:"text"},"audio-classification":{pipeline:z,model:o.AutoModelForAudioClassification,processor:a.AutoProcessor,default:{model:"Xenova/wav2vec2-base-superb-ks"},type:"audio"},"zero-shot-audio-classification":{tokenizer:s.AutoTokenizer,pipeline:X,model:o.AutoModel,processor:a.AutoProcessor,default:{model:"Xenova/clap-htsat-unfused"},type:"multimodal"},"automatic-speech-recognition":{tokenizer:s.AutoTokenizer,pipeline:J,model:[o.AutoModelForSpeechSeq2Seq,o.AutoModelForCTC],processor:a.AutoProcessor,default:{model:"Xenova/whisper-tiny.en"},type:"multimodal"},"text-to-audio":{tokenizer:s.AutoTokenizer,pip
eline:L,model:[o.AutoModelForTextToWaveform,o.AutoModelForTextToSpectrogram],processor:[a.AutoProcessor,null],default:{model:"Xenova/speecht5_tts"},type:"text"},"image-to-text":{tokenizer:s.AutoTokenizer,pipeline:q,model:o.AutoModelForVision2Seq,processor:a.AutoProcessor,default:{model:"Xenova/vit-gpt2-image-captioning"},type:"multimodal"},"image-classification":{pipeline:re,model:o.AutoModelForImageClassification,processor:a.AutoProcessor,default:{model:"Xenova/vit-base-patch16-224"},type:"multimodal"},"image-segmentation":{pipeline:oe,model:[o.AutoModelForImageSegmentation,o.AutoModelForSemanticSegmentation,o.AutoModelForUniversalSegmentation],processor:a.AutoProcessor,default:{model:"Xenova/detr-resnet-50-panoptic"},type:"multimodal"},"background-removal":{pipeline:ne,model:[o.AutoModelForImageSegmentation,o.AutoModelForSemanticSegmentation,o.AutoModelForUniversalSegmentation],processor:a.AutoProcessor,default:{model:"Xenova/modnet"},type:"image"},"zero-shot-image-classification":{tokenizer:s.AutoTokenizer,pipeline:ye,model:o.AutoModel,processor:a.AutoProcessor,default:{model:"Xenova/clip-vit-base-patch32"},type:"multimodal"},"object-detection":{pipeline:Y,model:o.AutoModelForObjectDetection,processor:a.AutoProcessor,default:{model:"Xenova/detr-resnet-50"},type:"multimodal"},"zero-shot-object-detection":{tokenizer:s.AutoTokenizer,pipeline:H,model:o.AutoModelForZeroShotObjectDetection,processor:a.AutoProcessor,default:{model:"Xenova/owlvit-base-patch32"},type:"multimodal"},"document-question-answering":{tokenizer:s.AutoTokenizer,pipeline:R,model:o.AutoModelForDocumentQuestionAnswering,processor:a.AutoProcessor,default:{model:"Xenova/donut-base-finetuned-docvqa"},type:"multimodal"},"image-to-image":{pipeline:ee,model:o.AutoModelForImageToImage,processor:a.AutoProcessor,default:{model:"Xenova/swin2SR-classical-sr-x2-64"},type:"image"},"depth-estimation":{pipeline:ue,model:o.AutoModelForDepthEstimation,processor:a.AutoProcessor,default:{model:"Xenova/dpt-large"},type
:"image"},"feature-extraction":{tokenizer:s.AutoTokenizer,pipeline:U,model:o.AutoModel,default:{model:"Xenova/all-MiniLM-L6-v2"},type:"text"},"image-feature-extraction":{processor:a.AutoProcessor,pipeline:W,model:[o.AutoModelForImageFeatureExtraction,o.AutoModel],default:{model:"Xenova/vit-base-patch16-224-in21k"},type:"image"}}),Ie=Object.freeze({"sentiment-analysis":"text-classification",ner:"token-classification",asr:"automatic-speech-recognition","text-to-speech":"text-to-audio",embeddings:"feature-extraction"});async function Le(we,A=null,{progress_callback:le=null,config:ge=null,cache_dir:be=null,local_files_only:Ae=!1,revision:ve="main",device:pe=null,dtype:Pe=null,subfolder:fe="onnx",use_external_data_format:Te=null,model_file_name:We=null,session_options:$e={}}={}){we=Ie[we]??we;let Re=ke[we.split("_",1)[0]];if(!Re)throw Error(`Unsupported pipeline: ${we}. Must be one of [${Object.keys(ke)}]`);A||(A=Re.default.model,console.log(`No model specified. Using default model: "${A}".`));let Ne={progress_callback:le,config:ge,cache_dir:be,local_files_only:Ae,revision:ve,device:pe,dtype:Pe,subfolder:fe,use_external_data_format:Te,model_file_name:We,session_options:$e},ot=new Map([["tokenizer",Re.tokenizer],["model",Re.model],["processor",Re.processor]]),De=await rt(ot,A,Ne);De.task=we,(0,l.dispatchCallback)(le,{status:"ready",task:we,model:A});let Qe=Re.pipeline;return new Qe(De)}async function rt(we,A,le){let ge=Object.create(null),be=[];for(let[Ae,ve]of we.entries()){if(!ve)continue;let pe;Array.isArray(ve)?pe=new Promise(async(Pe,fe)=>{let Te;for(let We of ve){if(We===null){Pe(null);return}try{Pe(await We.from_pretrained(A,le));return}catch($e){if($e.message?.includes("Unsupported model type"))Te=$e;else if($e.message?.includes("Could not locate file"))Te=$e;else{fe($e);return}}}fe(Te)}):pe=ve.from_pretrained(A,le),ge[Ae]=pe,be.push(pe)}await Promise.all(be);for(let[Ae,ve]of Object.entries(ge))ge[Ae]=await ve;return 
ge}}),"./src/tokenizers.js":((e,r,t)=>{t.r(r),t.d(r,{AlbertTokenizer:()=>qt,AutoTokenizer:()=>Wo,BartTokenizer:()=>qe,BertTokenizer:()=>Cs,BlenderbotSmallTokenizer:()=>Ue,BlenderbotTokenizer:()=>ze,BloomTokenizer:()=>Nt,CLIPTokenizer:()=>As,CamembertTokenizer:()=>Z,CodeGenTokenizer:()=>Is,CodeLlamaTokenizer:()=>Or,CohereTokenizer:()=>Ds,ConvBertTokenizer:()=>Q,DebertaTokenizer:()=>St,DebertaV2Tokenizer:()=>Xr,DistilBertTokenizer:()=>K,ElectraTokenizer:()=>xe,EsmTokenizer:()=>gr,FalconTokenizer:()=>_s,GPT2Tokenizer:()=>ut,GPTNeoXTokenizer:()=>Fs,GemmaTokenizer:()=>as,Grok1Tokenizer:()=>Nr,HerbertTokenizer:()=>k,LlamaTokenizer:()=>ur,M2M100Tokenizer:()=>_r,MBart50Tokenizer:()=>tt,MBartTokenizer:()=>wt,MPNetTokenizer:()=>Lr,MarianTokenizer:()=>ns,MgpstrTokenizer:()=>Vs,MobileBertTokenizer:()=>Ss,NllbTokenizer:()=>ar,NougatTokenizer:()=>Ht,PreTrainedTokenizer:()=>ft,Qwen2Tokenizer:()=>Ns,RoFormerTokenizer:()=>N,RobertaTokenizer:()=>gt,SiglipTokenizer:()=>$s,SpeechT5Tokenizer:()=>at,SqueezeBertTokenizer:()=>Qr,T5Tokenizer:()=>et,TokenizerModel:()=>U,VitsTokenizer:()=>js,Wav2Vec2CTCTokenizer:()=>Wr,WhisperTokenizer:()=>ps,XLMRobertaTokenizer:()=>Cr,XLMTokenizer:()=>ce,is_chinese_char:()=>C});var s=t("./src/utils/generic.js"),o=t("./src/utils/core.js"),a=t("./src/utils/hub.js"),n=t("./src/utils/maths.js"),i=t("./src/utils/tensor.js"),l=t("./src/utils/data-structures.js"),c=t("./node_modules/@huggingface/jinja/dist/index.js"),_=t("./src/models/whisper/common_whisper.js");async function u(de,S){let G=await Promise.all([(0,a.getModelJSON)(de,"tokenizer.json",!0,S),(0,a.getModelJSON)(de,"tokenizer_config.json",!0,S)]);return S.legacy!==null&&(G[1].legacy=S.legacy),G}function d(de,S){let G=[],te=0;for(let se of de.matchAll(S)){let me=se[0];te<se.index&&G.push(de.slice(te,se.index)),me.length>0&&G.push(me),te=se.index+me.length}return te<de.length&&G.push(de.slice(te)),G}function g(de,S=!0){if(de.Regex!==void 0){let G=de.Regex.replace(/\\([#&~])/g,"$1");for(let[te,se]of 
D)G=G.replaceAll(te,se);return new RegExp(G,"gu")}else if(de.String!==void 0){let G=(0,o.escapeRegExp)(de.String);return new RegExp(S?G:`(${G})`,"gu")}else return console.warn("Unknown pattern type:",de),null}function h(de){return new Map(Object.entries(de))}function x(de){let S=de.dims;switch(S.length){case 1:return de.tolist();case 2:if(S[0]!==1)throw new Error("Unable to decode tensor with `batch size !== 1`. Use `tokenizer.batch_decode(...)` for batched inputs.");return de.tolist()[0];default:throw new Error(`Expected tensor to have 1-2 dimensions, got ${S.length}.`)}}function F(de){return de.replace(/ \./g,".").replace(/ \?/g,"?").replace(/ \!/g,"!").replace(/ ,/g,",").replace(/ \' /g,"'").replace(/ n\'t/g,"n't").replace(/ \'m/g,"'m").replace(/ \'s/g,"'s").replace(/ \'ve/g,"'ve").replace(/ \'re/g,"'re")}function v(de){return de.replace(/\p{M}/gu,"")}function b(de){return v(de.toLowerCase())}function C(de){return de>=19968&&de<=40959||de>=13312&&de<=19903||de>=131072&&de<=173791||de>=173824&&de<=177983||de>=177984&&de<=178207||de>=178208&&de<=183983||de>=63744&&de<=64255||de>=194560&&de<=195103}function y(de,S,G){let te=[],se=0;for(;se<de.length;){if(te.push(de[se]),(S.get(de[se])??G)!==G){++se;continue}for(;++se<de.length&&(S.get(de[se])??G)===G;)S.get(te.at(-1))!==G&&(te[te.length-1]+=de[se])}return te}function P(de){return de.match(/\S+/g)||[]}let I="\\p{P}\\u0021-\\u002F\\u003A-\\u0040\\u005B-\\u0060\\u007B-\\u007E",f=new RegExp(`^[${I}]+$`,"gu"),E=".,!?\u2026\u3002\uFF0C\u3001\u0964\u06D4\u060C",D=new Map([["(?i:'s|'t|'re|'ve|'m|'ll|'d)","(?:'([sS]|[tT]|[rR][eE]|[vV][eE]|[mM]|[lL][lL]|[dD]))"],["(?i:[sdmt]|ll|ve|re)","(?:[sS]|[dD]|[mM]|[tT]|[lL][lL]|[vV][eE]|[rR][eE])"],["[^\\r\\n\\p{L}\\p{N}]?+","[^\\r\\n\\p{L}\\p{N}]?"],["[^\\s\\p{L}\\p{N}]++","[^\\s\\p{L}\\p{N}]+"],[` ?[^(\\s|[${E}])]+`,` ?[^\\s${E}]+`]]);class 
O{constructor(S){this.content=S.content,this.id=S.id,this.single_word=S.single_word??!1,this.lstrip=S.lstrip??!1,this.rstrip=S.rstrip??!1,this.special=S.special??!1,this.normalized=S.normalized??null}}class U extends s.Callable{constructor(S){super(),this.config=S,this.vocab=[],this.tokens_to_ids=new Map,this.unk_token_id=void 0,this.unk_token=void 0,this.end_of_word_suffix=void 0,this.fuse_unk=this.config.fuse_unk??!1}static fromConfig(S,...G){switch(S.type){case"WordPiece":return new W(S);case"Unigram":return new z(S,...G);case"BPE":return new q(S);default:if(S.vocab)return Array.isArray(S.vocab)?new z(S,...G):Object.hasOwn(S,"continuing_subword_prefix")&&Object.hasOwn(S,"unk_token")?Object.hasOwn(S,"merges")?new q(S):new W(S):new re(S,...G);throw new Error(`Unknown TokenizerModel type: ${S.type}`)}}_call(S){return S=this.encode(S),this.fuse_unk&&(S=y(S,this.tokens_to_ids,this.unk_token_id)),S}encode(S){throw Error("encode should be implemented in subclass.")}convert_tokens_to_ids(S){return S.map(G=>this.tokens_to_ids.get(G)??this.unk_token_id)}convert_ids_to_tokens(S){return S.map(G=>this.vocab[G]??this.unk_token)}}class W extends U{constructor(S){super(S),this.tokens_to_ids=h(S.vocab),this.unk_token_id=this.tokens_to_ids.get(S.unk_token),this.unk_token=S.unk_token,this.max_input_chars_per_word=S.max_input_chars_per_word??100,this.vocab=new Array(this.tokens_to_ids.size);for(let[G,te]of this.tokens_to_ids)this.vocab[te]=G}encode(S){let G=[];for(let te of S){let se=[...te];if(se.length>this.max_input_chars_per_word){G.push(this.unk_token);continue}let me=!1,Ce=0,Ye=[];for(;Ce<se.length;){let Xe=se.length,Ze=null;for(;Ce<Xe;){let He=se.slice(Ce,Xe).join("");if(Ce>0&&(He=this.config.continuing_subword_prefix+He),this.tokens_to_ids.has(He)){Ze=He;break}--Xe}if(Ze===null){me=!0;break}Ye.push(Ze),Ce=Xe}me?G.push(this.unk_token):G.push(...Ye)}return G}}class z extends U{constructor(S,G){super(S);let te=S.vocab.length;this.vocab=new Array(te),this.scores=new 
Array(te);for(let se=0;se<te;++se)[this.vocab[se],this.scores[se]]=S.vocab[se];this.unk_token_id=S.unk_id,this.unk_token=this.vocab[S.unk_id],this.tokens_to_ids=new Map(this.vocab.map((se,me)=>[se,me])),this.bos_token=" ",this.bos_token_id=this.tokens_to_ids.get(this.bos_token),this.eos_token=G.eos_token,this.eos_token_id=this.tokens_to_ids.get(this.eos_token),this.unk_token=this.vocab[this.unk_token_id],this.minScore=(0,n.min)(this.scores)[0],this.unk_score=this.minScore-10,this.scores[this.unk_token_id]=this.unk_score,this.trie=new l.CharTrie,this.trie.extend(this.vocab),this.fuse_unk=!0}populateNodes(S){let G=S.chars,te=1,se=0;for(;se<G.length;){let me=!1,Ce=[],Ye=G.slice(se).join(""),Xe=this.trie.commonPrefixSearch(Ye);for(let Ze of Xe){Ce.push(Ze);let He=this.tokens_to_ids.get(Ze),It=this.scores[He],yt=(0,o.len)(Ze);S.insert(se,yt,It,He),!me&&yt===te&&(me=!0)}me||S.insert(se,te,this.unk_score,this.unk_token_id),se+=te}}tokenize(S){let G=new l.TokenLattice(S,this.bos_token_id,this.eos_token_id);return this.populateNodes(G),G.tokens()}encode(S){let G=[];for(let te of S){let se=this.tokenize(te);G.push(...se)}return G}}let X=(()=>{let de=[...Array.from({length:94},(se,me)=>me+33),...Array.from({length:12},(se,me)=>me+161),...Array.from({length:82},(se,me)=>me+174)],S=de.slice(),G=0;for(let se=0;se<256;++se)de.includes(se)||(de.push(se),S.push(256+G),G+=1);let te=S.map(se=>String.fromCharCode(se));return Object.fromEntries(de.map((se,me)=>[se,te[me]]))})(),J=(0,o.reverseDictionary)(X);class q extends U{constructor(S){super(S),this.tokens_to_ids=h(S.vocab),this.unk_token_id=this.tokens_to_ids.get(S.unk_token),this.unk_token=S.unk_token,this.vocab=new Array(this.tokens_to_ids.size);for(let[te,se]of this.tokens_to_ids)this.vocab[se]=te;let G=Array.isArray(S.merges[0]);this.merges=G?S.merges:S.merges.map(te=>te.split(" ",2)),this.bpe_ranks=new 
Map(this.merges.map((te,se)=>[JSON.stringify(te),se])),this.end_of_word_suffix=S.end_of_word_suffix,this.continuing_subword_suffix=S.continuing_subword_suffix??null,this.byte_fallback=this.config.byte_fallback??!1,this.byte_fallback&&(this.text_encoder=new TextEncoder),this.ignore_merges=this.config.ignore_merges??!1,this.max_length_to_cache=256,this.cache_capacity=1e4,this.cache=new l.LRUCache(this.cache_capacity)}clear_cache(){this.cache.clear()}bpe(S){if(S.length===0)return[];let G=this.cache.get(S);if(G!==void 0)return G;let te=Array.from(S);this.end_of_word_suffix&&(te[te.length-1]+=this.end_of_word_suffix);let se=[];if(te.length>1){let me=new l.PriorityQueue((Xe,Ze)=>Xe.score<Ze.score),Ce={token:te[0],bias:0,prev:null,next:null},Ye=Ce;for(let Xe=1;Xe<te.length;++Xe){let Ze={bias:Xe/te.length,token:te[Xe],prev:Ye,next:null};Ye.next=Ze,this._add_node(me,Ye),Ye=Ze}for(;!me.isEmpty();){let Xe=me.pop();if(Xe.deleted||!Xe.next||Xe.next.deleted)continue;if(Xe.deleted=!0,Xe.next.deleted=!0,Xe.prev){let He={...Xe.prev};Xe.prev.deleted=!0,Xe.prev=He,He.prev?He.prev.next=He:Ce=He}let Ze={token:Xe.token+Xe.next.token,bias:Xe.bias,prev:Xe.prev,next:Xe.next.next};Ze.prev?(Ze.prev.next=Ze,this._add_node(me,Ze.prev)):Ce=Ze,Ze.next&&(Ze.next.prev=Ze,this._add_node(me,Ze))}for(let Xe=Ce;Xe!==null;Xe=Xe.next)se.push(Xe.token)}else se=te;if(this.continuing_subword_suffix)for(let me=0;me<se.length-1;++me)se[me]+=this.continuing_subword_suffix;return S.length<this.max_length_to_cache&&this.cache.put(S,se),se}_add_node(S,G){let te=this.bpe_ranks.get(JSON.stringify([G.token,G.next.token]));te!==void 0&&(G.score=te+G.bias,S.push(G))}encode(S){let G=[];for(let te of S){if(this.ignore_merges&&this.tokens_to_ids.has(te)){G.push(te);continue}let se=this.bpe(te);for(let me of se)if(this.tokens_to_ids.has(me))G.push(me);else if(this.byte_fallback){let 
Ce=Array.from(this.text_encoder.encode(me)).map(Ye=>`<0x${Ye.toString(16).toUpperCase().padStart(2,"0")}>`);Ce.every(Ye=>this.tokens_to_ids.has(Ye))?G.push(...Ce):G.push(this.unk_token)}else G.push(this.unk_token)}return G}}class re extends U{constructor(S,G){super(S),this.tokens_to_ids=h(G.target_lang?S.vocab[G.target_lang]:S.vocab),this.bos_token=G.bos_token,this.bos_token_id=this.tokens_to_ids.get(this.bos_token),this.eos_token=G.eos_token,this.eos_token_id=this.tokens_to_ids.get(this.eos_token),this.pad_token=G.pad_token,this.pad_token_id=this.tokens_to_ids.get(this.pad_token),this.unk_token=G.unk_token,this.unk_token_id=this.tokens_to_ids.get(this.unk_token),this.vocab=new Array(this.tokens_to_ids.size);for(let[te,se]of this.tokens_to_ids)this.vocab[se]=te}encode(S){return S}}class oe extends s.Callable{constructor(S){super(),this.config=S}static fromConfig(S){if(S===null)return null;switch(S.type){case"BertNormalizer":return new rt(S);case"Precompiled":return new zt(S);case"Sequence":return new Le(S);case"Replace":return new ne(S);case"NFC":return new Y(S);case"NFD":return new H(S);case"NFKC":return new R(S);case"NFKD":return new L(S);case"Strip":return new ee(S);case"StripAccents":return new ue(S);case"Lowercase":return new ke(S);case"Prepend":return new Ie(S);default:throw new Error(`Unknown Normalizer type: ${S.type}`)}}normalize(S){throw Error("normalize should be implemented in subclass.")}_call(S){return this.normalize(S)}}class ne extends oe{normalize(S){let G=g(this.config.pattern);return G===null?S:S.replaceAll(G,this.config.content)}}class ye extends oe{form=void 0;normalize(S){return S=S.normalize(this.form),S}}class Y extends ye{form="NFC"}class H extends ye{form="NFD"}class R extends ye{form="NFKC"}class L extends ye{form="NFKD"}class ee extends oe{normalize(S){return this.config.strip_left&&this.config.strip_right?S=S.trim():(this.config.strip_left&&(S=S.trimStart()),this.config.strip_right&&(S=S.trimEnd())),S}}class ue extends 
/**
 * BERT-style text normalizer.
 *
 * Driven by `this.config` flags: `clean_text`, `handle_chinese_chars`,
 * `lowercase` and `strip_accents`.
 */
class rt extends oe {
  /**
   * Surrounds every character accepted by the external predicate `C` with
   * spaces.
   *
   * Iterates by Unicode code point (not UTF-16 code unit) so that characters
   * outside the Basic Multilingual Plane reach `C` as a single code point
   * instead of as two surrogate halves.
   * NOTE(review): `C` is defined elsewhere in the bundle; it is presumably the
   * CJK code-point check — confirm.
   *
   * @param {string} S Input text.
   * @returns {string} Text with matched characters padded by spaces.
   */
  _tokenize_chinese_chars(S) {
    const pieces = [];
    for (const ch of S) {
      if (C(ch.codePointAt(0))) {
        pieces.push(" ", ch, " ");
      } else {
        pieces.push(ch);
      }
    }
    return pieces.join("");
  }

  /**
   * Removes combining marks (Unicode category Mn) after NFD decomposition.
   *
   * @param {string} S Input text.
   * @returns {string} Text without combining marks.
   */
  stripAccents(S) {
    return S.normalize("NFD").replace(/\p{Mn}/gu, "");
  }

  /**
   * Tells whether a single character is a control character.
   *
   * Tab, newline and carriage return are deliberately reported as
   * non-control so that `_clean_text` can turn them into spaces.
   *
   * @param {string} S A single character.
   * @returns {boolean} True for characters in categories Cc, Cf, Co or Cs.
   */
  _is_control(S) {
    switch (S) {
      case "\t":
      case "\n":
      case "\r":
        return false;
      default:
        // The alternation is grouped so both anchors apply to every category.
        return /^(?:\p{Cc}|\p{Cf}|\p{Co}|\p{Cs})$/u.test(S);
    }
  }

  /**
   * Drops NUL, U+FFFD and control characters, and maps every whitespace
   * character to a plain space.
   *
   * @param {string} S Input text.
   * @returns {string} Cleaned text.
   */
  _clean_text(S) {
    const kept = [];
    for (const ch of S) {
      const code = ch.charCodeAt(0);
      if (code === 0 || code === 65533 || this._is_control(ch)) {
        continue;
      }
      kept.push(/^\s$/.test(ch) ? " " : ch);
    }
    return kept.join("");
  }

  /**
   * Applies the configured normalization steps in order: clean, pad
   * characters matched by `C`, lowercase, strip accents.
   *
   * When `lowercase` is set, accents are stripped unless `strip_accents` is
   * explicitly `false`; otherwise accents are stripped only when
   * `strip_accents` is truthy.
   *
   * @param {string} S Input text.
   * @returns {string} Normalized text.
   */
  normalize(S) {
    if (this.config.clean_text) {
      S = this._clean_text(S);
    }
    if (this.config.handle_chinese_chars) {
      S = this._tokenize_chinese_chars(S);
    }
    if (this.config.lowercase) {
      S = S.toLowerCase();
      if (this.config.strip_accents !== false) {
        S = this.stripAccents(S);
      }
    } else if (this.config.strip_accents) {
      S = this.stripAccents(S);
    }
    return S;
  }
}
"+S),(this.use_regex?S.match(this.pattern)||[]:[S]).map(se=>Array.from(this.text_encoder.encode(se),me=>this.byte_encoder[me]).join(""))}}class ge extends we{constructor(S){super(),this.config=S,this.pattern=g(this.config.pattern,this.config.invert)}pre_tokenize_text(S,G){return this.pattern===null?[]:this.config.invert?S.match(this.pattern)||[]:this.config.behavior?.toLowerCase()==="removed"?S.split(this.pattern).filter(te=>te):d(S,this.pattern)}}class be extends we{constructor(S){super(),this.config=S,this.pattern=new RegExp(`[^${I}]+|[${I}]+`,"gu")}pre_tokenize_text(S,G){return S.match(this.pattern)||[]}}class Ae extends we{constructor(S){super(),this.config=S;let G=`[^\\d]+|\\d${this.config.individual_digits?"":"+"}`;this.pattern=new RegExp(G,"gu")}pre_tokenize_text(S,G){return S.match(this.pattern)||[]}}class ve extends s.Callable{constructor(S){super(),this.config=S}static fromConfig(S){if(S===null)return null;switch(S.type){case"TemplateProcessing":return new fe(S);case"ByteLevel":return new Te(S);case"RobertaProcessing":return new Pe(S);case"BertProcessing":return new pe(S);case"Sequence":return new We(S);default:throw new Error(`Unknown PostProcessor type: ${S.type}`)}}post_process(S,...G){throw Error("post_process should be implemented in subclass.")}_call(S,...G){return this.post_process(S,...G)}}class pe extends ve{constructor(S){super(S),this.cls=S.cls[0],this.sep=S.sep[0]}post_process(S,G=null,{add_special_tokens:te=!0}={}){te&&(S=(0,o.mergeArrays)([this.cls],S,[this.sep]));let se=new Array(S.length).fill(0);if(G!==null){let me=te&&this instanceof Pe?[this.sep]:[],Ce=te?[this.sep]:[];S=(0,o.mergeArrays)(S,me,G,Ce),se=(0,o.mergeArrays)(se,new Array(G.length+me.length+Ce.length).fill(1))}return{tokens:S,token_type_ids:se}}}class Pe extends pe{}class fe extends ve{constructor(S){super(S),this.single=S.single,this.pair=S.pair}post_process(S,G=null,{add_special_tokens:te=!0}={}){let se=G===null?this.single:this.pair,me=[],Ce=[];for(let Ye of 
/**
 * Byte-fallback decoder.
 *
 * Consecutive tokens of the exact form `<0xHH>` (two hexadecimal digits) are
 * collected as raw bytes and decoded together with a `TextDecoder`; every
 * other token is passed through unchanged.
 */
class Ne extends $e {
  constructor(S) {
    super(S);
    this.text_decoder = new TextDecoder();
  }

  /**
   * @param {string[]} S Tokens to decode.
   * @returns {string[]} Tokens with each run of byte tokens replaced by the
   *   decoded string for that run.
   */
  decode_chain(S) {
    // Strict match: `parseInt` alone would accept malformed payloads such as
    // "1G" (-> 1) or "-1" (-> 255 once stored in a Uint8Array).
    const byteToken = /^<0x([0-9A-Fa-f]{2})>$/;
    const decoded = [];
    let pendingBytes = [];

    const flushPending = () => {
      if (pendingBytes.length > 0) {
        decoded.push(this.text_decoder.decode(Uint8Array.from(pendingBytes)));
        pendingBytes = [];
      }
    };

    for (const token of S) {
      const match = byteToken.exec(token);
      if (match !== null) {
        pendingBytes.push(Number.parseInt(match[1], 16));
      } else {
        // A regular token ends the current byte run.
        flushPending();
        decoded.push(token);
      }
    }
    flushPending();
    return decoded;
  }
}
/**
 * Metaspace decoder: turns the configured replacement character back into
 * spaces and drops one leading space from the first token.
 */
class fr extends $e {
  constructor(S) {
    super(S);
    this.replacement = S.replacement;
  }

  /**
   * @param {string[]} S Tokens to decode.
   * @returns {string[]} Tokens with `this.replacement` replaced by " ".
   */
  decode_chain(S) {
    const result = [];
    S.forEach((token, position) => {
      const text = token.replaceAll(this.replacement, " ");
      const isLeadingSpace = position == 0 && text.startsWith(" ");
      result.push(isLeadingSpace ? text.substring(1) : text);
    });
    return result;
  }
}
/**
 * Truncates, in place, every array stored on `de` to length `S` by assigning
 * to each array's `length`.
 *
 * @param {Object<string, any[]>} de Object whose own enumerable values are arrays.
 * @param {number} S New length for every array.
 * @returns {void}
 */
function Rs(de, S) {
  Object.keys(de).forEach((key) => {
    de[key].length = S;
  });
}
Map(this.added_tokens.map(te=>[te.content,te])),this.mask_token=this.getToken("mask_token"),this.mask_token_id=this.model.tokens_to_ids.get(this.mask_token),this.pad_token=this.getToken("pad_token","eos_token"),this.pad_token_id=this.model.tokens_to_ids.get(this.pad_token),this.sep_token=this.getToken("sep_token"),this.sep_token_id=this.model.tokens_to_ids.get(this.sep_token),this.unk_token=this.getToken("unk_token"),this.unk_token_id=this.model.tokens_to_ids.get(this.unk_token),this.bos_token=this.getToken("bos_token"),this.bos_token_id=this.model.tokens_to_ids.get(this.bos_token),this.eos_token=this.getToken("eos_token"),this.eos_token_id=this.model.tokens_to_ids.get(this.eos_token),this.model_max_length=G.model_max_length,this.remove_space=G.remove_space,this.clean_up_tokenization_spaces=G.clean_up_tokenization_spaces??!0,this.do_lowercase_and_remove_accent=G.do_lowercase_and_remove_accent??!1,G.padding_side&&(this.padding_side=G.padding_side),this.add_bos_token=G.add_bos_token,this.add_eos_token=G.add_eos_token,this.legacy=!1,this.chat_template=G.chat_template??null,Array.isArray(this.chat_template)){let te=Object.create(null);for(let{name:se,template:me}of this.chat_template){if(typeof se!="string"||typeof me!="string")throw new Error('Chat template must be a list of objects with "name" and "template" properties');te[se]=me}this.chat_template=te}this._compiled_template_cache=new Map}getToken(...S){for(let G of S){let te=this.config[G];if(te)if(typeof te=="object"){if(te.__type==="AddedToken")return te.content;throw Error(`Unknown token: ${te}`)}else return te}return null}static async from_pretrained(S,{progress_callback:G=null,config:te=null,cache_dir:se=null,local_files_only:me=!1,revision:Ce="main",legacy:Ye=null}={}){let Xe=await u(S,{progress_callback:G,config:te,cache_dir:se,local_files_only:me,revision:Ce,legacy:Ye});return new 
this(...Xe)}_call(S,{text_pair:G=null,add_special_tokens:te=!0,padding:se=!1,truncation:me=null,max_length:Ce=null,return_tensor:Ye=!0,return_token_type_ids:Xe=null}={}){let Ze=Array.isArray(S),He;if(Ze){if(S.length===0)throw Error("text array must be non-empty");if(G!==null){if(Array.isArray(G)){if(S.length!==G.length)throw Error("text and text_pair must have the same length")}else throw Error("text_pair must also be an array");He=S.map((yt,Xt)=>this._encode_plus(yt,{text_pair:G[Xt],add_special_tokens:te,return_token_type_ids:Xe}))}else He=S.map(yt=>this._encode_plus(yt,{add_special_tokens:te,return_token_type_ids:Xe}))}else{if(S==null)throw Error("text may not be null or undefined");if(Array.isArray(G))throw Error("When specifying `text_pair`, since `text` is a string, `text_pair` must also be a string (i.e., not an array).");He=[this._encode_plus(S,{text_pair:G,add_special_tokens:te,return_token_type_ids:Xe})]}if(Ce===null?Ce=this.model_max_length:me===null&&(se===!0?(console.warn("`max_length` is ignored when `padding: true` and there is no truncation strategy. 
To pad to max length, use `padding: 'max_length'`."),Ce=this.model_max_length):se===!1&&(console.warn("Truncation was not explicitly activated but `max_length` is provided a specific value, please use `truncation: true` to explicitly truncate examples to max length."),me=!0)),se===!0&&(Ce=Math.min((0,n.max)(He.map(yt=>yt.input_ids.length))[0],Ce??1/0)),Ce=Math.min(Ce,this.model_max_length??1/0),se||me)for(let yt=0;yt<He.length;++yt)He[yt].input_ids.length!==Ce&&(He[yt].input_ids.length>Ce?me&&Rs(He[yt],Ce):se&&Yr(He[yt],Ce,Xt=>Xt==="input_ids"?this.pad_token_id:0,this.padding_side));let It={};if(Ye){if(!(se&&me)&&He.some(Xt=>{for(let Mr of Object.keys(Xt))if(Xt[Mr].length!==He[0][Mr]?.length)return!0;return!1}))throw Error("Unable to create tensor, you should probably activate truncation and/or padding with 'padding=true' and 'truncation=true' to have batched tensors with the same length.");let yt=[He.length,He[0].input_ids.length];for(let Xt of Object.keys(He[0]))It[Xt]=new i.Tensor("int64",BigInt64Array.from(He.flatMap(Mr=>Mr[Xt]).map(BigInt)),yt)}else{for(let yt of Object.keys(He[0]))It[yt]=He.map(Xt=>Xt[yt]);if(!Ze)for(let yt of Object.keys(It))It[yt]=It[yt][0]}return It}_encode_text(S){if(S===null)return null;let G=this.added_tokens_splitter.split(S);for(let se=0;se<G.length;++se){let me=this.added_tokens_map.get(G[se]);me&&(me.lstrip&&se>0&&(G[se-1]=G[se-1].trimEnd()),me.rstrip&&se<G.length-1&&(G[se+1]=G[se+1].trimStart()))}return G.flatMap((se,me)=>{if(se.length===0)return[];if(this.added_tokens_map.has(se))return[se];if(this.remove_space===!0&&(se=se.trim().split(/\s+/).join(" ")),this.do_lowercase_and_remove_accent&&(se=b(se)),this.normalizer!==null&&(se=this.normalizer(se)),se.length===0)return[];let Ce=this.pre_tokenizer!==null?this.pre_tokenizer(se,{section_index:me}):[se];return 
this.model(Ce)})}_encode_plus(S,{text_pair:G=null,add_special_tokens:te=!0,return_token_type_ids:se=null}={}){let{tokens:me,token_type_ids:Ce}=this._tokenize_helper(S,{pair:G,add_special_tokens:te}),Ye=this.model.convert_tokens_to_ids(me),Xe={input_ids:Ye,attention_mask:new Array(Ye.length).fill(1)};return(se??this.return_token_type_ids)&&Ce&&(Xe.token_type_ids=Ce),Xe}_tokenize_helper(S,{pair:G=null,add_special_tokens:te=!1}={}){let se=this._encode_text(S),me=this._encode_text(G);return this.post_processor?this.post_processor(se,me,{add_special_tokens:te}):{tokens:(0,o.mergeArrays)(se??[],me??[])}}tokenize(S,{pair:G=null,add_special_tokens:te=!1}={}){return this._tokenize_helper(S,{pair:G,add_special_tokens:te}).tokens}encode(S,{text_pair:G=null,add_special_tokens:te=!0,return_token_type_ids:se=null}={}){return this._encode_plus(S,{text_pair:G,add_special_tokens:te,return_token_type_ids:se}).input_ids}batch_decode(S,G={}){return S instanceof i.Tensor&&(S=S.tolist()),S.map(te=>this.decode(te,G))}decode(S,G={}){if(S instanceof i.Tensor&&(S=x(S)),!Array.isArray(S)||S.length===0||!(0,o.isIntegralNumber)(S[0]))throw Error("token_ids must be a non-empty array of integers.");return this.decode_single(S,G)}decode_single(S,{skip_special_tokens:G=!1,clean_up_tokenization_spaces:te=null}){let se=this.model.convert_ids_to_tokens(S);G&&(se=se.filter(Ce=>!this.special_tokens.includes(Ce)));let me=this.decoder?this.decoder(se):se.join(" ");return this.decoder&&this.decoder.end_of_word_suffix&&(me=me.replaceAll(this.decoder.end_of_word_suffix," "),G&&(me=me.trim())),(te??this.clean_up_tokenization_spaces)&&(me=F(me)),me}get_chat_template({chat_template:S=null,tools:G=null}={}){if(this.chat_template&&typeof this.chat_template=="object"){let te=this.chat_template;if(S!==null&&Object.hasOwn(te,S))S=te[S];else if(S===null)if(G!==null&&"tool_use"in te)S=te.tool_use;else if("default"in te)S=te.default;else throw Error(`This model has multiple chat templates with no default specified! 
Please either pass a chat template or the name of the template you wish to use to the 'chat_template' argument. Available template names are ${Object.keys(te).sort()}.`)}else if(S===null)if(this.chat_template)S=this.chat_template;else throw Error("Cannot use apply_chat_template() because tokenizer.chat_template is not set and no template argument was passed! For information about writing templates and setting the tokenizer.chat_template attribute, please see the documentation at https://huggingface.co/docs/transformers/main/en/chat_templating");return S}apply_chat_template(S,{tools:G=null,documents:te=null,chat_template:se=null,add_generation_prompt:me=!1,tokenize:Ce=!0,padding:Ye=!1,truncation:Xe=!1,max_length:Ze=null,return_tensor:He=!0,return_dict:It=!1,tokenizer_kwargs:yt={},...Xt}={}){if(se=this.get_chat_template({chat_template:se,tools:G}),typeof se!="string")throw Error(`chat_template must be a string, but got ${typeof se}`);let Mr=this._compiled_template_cache.get(se);Mr===void 0&&(Mr=new c.Template(se),this._compiled_template_cache.set(se,Mr));let nr=Object.create(null);for(let ir of Dr){let Tr=this.getToken(ir);Tr&&(nr[ir]=Tr)}let Br=Mr.render({messages:S,add_generation_prompt:me,tools:G,documents:te,...nr,...Xt});if(Ce){let ir=this._call(Br,{add_special_tokens:!1,padding:Ye,truncation:Xe,max_length:Ze,return_tensor:He,...yt});return It?ir:ir.input_ids}return Br}}class Cs extends ft{return_token_type_ids=!0}class qt extends ft{return_token_type_ids=!0}class Ss extends ft{return_token_type_ids=!0}class Qr extends ft{return_token_type_ids=!0}class St extends ft{return_token_type_ids=!0}class Xr extends ft{return_token_type_ids=!0}class k extends ft{return_token_type_ids=!0}class Q extends ft{return_token_type_ids=!0}class N extends ft{return_token_type_ids=!0}class K extends ft{}class Z extends ft{}class ce extends ft{return_token_type_ids=!0;constructor(S,G){super(S,G),console.warn('WARNING: `XLMTokenizer` is not yet supported by Hugging Face\'s "fast" 
/**
 * Shared implementation behind the `_build_translation_inputs` methods.
 *
 * Validates that the tokenizer exposes `language_codes`, `languageRegex` and
 * `lang_to_token`, checks the requested languages, then:
 *  - when `te.src_lang` is given, rewrites the id of the first `SpecialToken`
 *    in `de.post_processor.config.single` whose id matches `languageRegex`;
 *  - stores the id of the target-language token on `te.forced_bos_token_id`;
 *  - returns `de._call(S, G)`.
 *
 * @param {Object} de Tokenizer instance.
 * @param {*} S Text forwarded to `de._call`.
 * @param {Object} G Options forwarded to `de._call`.
 * @param {Object} te Generation settings; reads `src_lang` / `tgt_lang` and
 *   receives `forced_bos_token_id`.
 * @returns {*} Whatever `de._call(S, G)` returns.
 * @throws {Error} When a required attribute is missing or a language code is
 *   not in `de.language_codes`.
 */
function Gr(de, S, G, te) {
  const hasCodes = "language_codes" in de && Array.isArray(de.language_codes);
  if (!hasCodes) {
    throw new Error("Tokenizer must have `language_codes` attribute set and it should be an array of language ids.");
  }
  const hasRegex = "languageRegex" in de && de.languageRegex instanceof RegExp;
  if (!hasRegex) {
    throw new Error("Tokenizer must have `languageRegex` attribute set and it should be a regular expression.");
  }
  const hasMapper = "lang_to_token" in de && typeof de.lang_to_token == "function";
  if (!hasMapper) {
    throw new Error("Tokenizer must have `lang_to_token` attribute set and it should be a function.");
  }

  const sourceLang = te.src_lang;
  const targetLang = te.tgt_lang;

  if (!de.language_codes.includes(targetLang)) {
    throw new Error(`Target language code "${targetLang}" is not valid. Must be one of: {${de.language_codes.join(", ")}}`);
  }

  if (sourceLang !== void 0) {
    if (!de.language_codes.includes(sourceLang)) {
      throw new Error(`Source language code "${sourceLang}" is not valid. Must be one of: {${de.language_codes.join(", ")}}`);
    }
    // Only the first language-looking special token of the template is rewritten.
    for (const entry of de.post_processor.config.single) {
      if (!("SpecialToken" in entry)) {
        continue;
      }
      if (!de.languageRegex.test(entry.SpecialToken.id)) {
        continue;
      }
      entry.SpecialToken.id = de.lang_to_token(sourceLang);
      break;
    }
  }

  const targetToken = de.lang_to_token(targetLang);
  te.forced_bos_token_id = de.model.convert_tokens_to_ids([targetToken])[0];
  return de._call(S, G);
}
wr=(pr-yt)*se+It,er=(0,n.round)(wr,2);if(Jr!==null&&pr>=Jr)ir=!0;else if(ir||nr.length>0&&pr<ms)ir=!1;else if(He.timestamp[0]===null)He.timestamp[0]=er;else if(er!==He.timestamp[0]){He.timestamp[1]=er,nr.push(Fr),Ye&&Br.push(is);let[Kr,Ws]=this.findLongestCommonSequence(nr,Br),Os=this.decode(Kr);He.text=Os,Ye&&(He.words=this.collateWordTimestamps(Kr,Ws,Ce)),Ze.push(He),nr=[],Fr=[],Br=[],is=[],He=Xe()}}else if(Fr.push(pr),Ye){let wr=(0,n.round)(Sr[lr]+It,2),er;if(lr+1<Sr.length){er=(0,n.round)(Sr[lr+1]+It,2);let Kr=this.decode([pr]);f.test(Kr)&&(er=(0,n.round)(Math.min(wr+se,er),2))}else er=null;is.push([wr,er])}}if("stride"in Yt){let[lr,pr,wr]=Yt.stride;It+=lr-wr}Fr.length>0?(nr.push(Fr),Ye&&Br.push(is)):nr.every(lr=>lr.length===0)&&(He=Xe(),nr=[],Fr=[],Br=[],is=[])}if(nr.length>0){if(me&&G)throw new Error("Whisper did not predict an ending timestamp, which can happen if audio is cut off in the middle of a word. Also make sure WhisperTimeStampLogitsProcessor was used during generation.");let[Yt,vr]=this.findLongestCommonSequence(nr,Br),Sr=this.decode(Yt);He.text=Sr,Ye&&(He.words=this.collateWordTimestamps(Yt,vr,Ce)),Ze.push(He)}let Pr=Object.create(null),Zr=Ze.map(Yt=>Yt.text).join("");if(G||te){for(let Yt=0;Yt<Ze.length;++Yt){let vr=Ze[Yt];G||delete vr.timestamp,te||delete vr.language}if(Ye){let Yt=[];for(let vr of Ze)for(let Sr of vr.words)Yt.push(Sr);Pr={chunks:Yt}}else Pr={chunks:Ze}}return[Zr,Pr]}findLongestCommonSequence(S,G=null){let te=S[0],se=te.length,me=[],Ce=Array.isArray(G)&&G.length>0,Ye=Ce?[]:null,Xe=Ce?G[0]:null;for(let Ze=1;Ze<S.length;++Ze){let He=S[Ze],It=0,yt=[se,se,0,0],Xt=He.length;for(let Pr=1;Pr<se+Xt;++Pr){let Zr=Math.max(0,se-Pr),Yt=Math.min(se,se+Xt-Pr),vr=te.slice(Zr,Yt),Sr=Math.max(0,Pr-se),Jr=Math.min(Xt,Pr),ms=He.slice(Sr,Jr);if(vr.length!==ms.length)throw new Error("There is a bug within whisper `decode_asr` function, please report it. 
Dropping to prevent bad inference.");let Fr;Ce?Fr=vr.filter((pr,wr)=>pr===ms[wr]&&Xe[Zr+wr]<=G[Ze][Sr+wr]).length:Fr=vr.filter((pr,wr)=>pr===ms[wr]).length;let is=Pr/1e4,lr=Fr/Pr+is;Fr>1&&lr>It&&(It=lr,yt=[Zr,Yt,Sr,Jr])}let[Mr,nr,Br,ir]=yt,Tr=Math.floor((nr+Mr)/2),zr=Math.floor((ir+Br)/2);me.push(...te.slice(0,Tr)),te=He.slice(zr),se=te.length,Ce&&(Ye.push(...Xe.slice(0,Tr)),Xe=G[Ze].slice(zr))}return me.push(...te),Ce?(Ye.push(...Xe),[me,Ye]):[me,[]]}collateWordTimestamps(S,G,te){let[se,me,Ce]=this.combineTokensIntoWords(S,te),Ye=[];for(let Xe=0;Xe<se.length;++Xe){let Ze=Ce[Xe];Ye.push({text:se[Xe],timestamp:[G[Ze.at(0)][0],G[Ze.at(-1)][1]]})}return Ye}combineTokensIntoWords(S,G,te=`"'\u201C\xA1\xBF([{-`,se=`"'.\u3002,\uFF0C!\uFF01?\uFF1F:\uFF1A\u201D)]}\u3001`){G=G??"english";let me,Ce,Ye;return["chinese","japanese","thai","lao","myanmar"].includes(G)?[me,Ce,Ye]=this.splitTokensOnUnicode(S):[me,Ce,Ye]=this.splitTokensOnSpaces(S),this.mergePunctuations(me,Ce,Ye,te,se)}decode(S,G){let te;return G?.decode_with_timestamps?(S instanceof i.Tensor&&(S=x(S)),te=this.decodeWithTimestamps(S,G)):te=super.decode(S,G),te}decodeWithTimestamps(S,G){let te=G?.time_precision??.02,se=Array.from(this.all_special_ids).at(-1)+1,me=[[]];for(let Ce of S)if(Ce=Number(Ce),Ce>=se){let Ye=((Ce-se)*te).toFixed(2);me.push(`<|${Ye}|>`),me.push([])}else me[me.length-1].push(Ce);return me=me.map(Ce=>typeof Ce=="string"?Ce:super.decode(Ce,G)),me.join("")}splitTokensOnUnicode(S){let G=this.decode(S,{decode_with_timestamps:!0}),te="\uFFFD",se=[],me=[],Ce=[],Ye=[],Xe=[],Ze=0;for(let He=0;He<S.length;++He){let It=S[He];Ye.push(It),Xe.push(He);let yt=this.decode(Ye,{decode_with_timestamps:!0});(!yt.includes(te)||G[Ze+yt.indexOf(te)]===te)&&(se.push(yt),me.push(Ye),Ce.push(Xe),Ye=[],Xe=[],Ze+=yt.length)}return[se,me,Ce]}splitTokensOnSpaces(S){let[G,te,se]=this.splitTokensOnUnicode(S),me=[],Ce=[],Ye=[],Xe=new RegExp(`^[${I}]$`,"gu");for(let Ze=0;Ze<G.length;++Ze){let 
/**
 * Marian tokenizer.
 *
 * Recognises an optional leading language marker of the form `>>xx<<` in the
 * input text and emits it as its own token in front of the encoded remainder.
 */
class ns extends ft {
  constructor(S, G) {
    super(S, G);
    // Deliberately NOT global: a `g` regex keeps `lastIndex` between `.test()`
    // calls, which made the filter below skip the vocabulary entry that
    // immediately follows every match. `String.prototype.split` does not
    // depend on the `g` flag, so `_encode_text` is unaffected.
    this.languageRegex = /^(>>\w+<<)\s*/;
    this.supported_language_codes = this.model.vocab.filter((token) => this.languageRegex.test(token));
    console.warn('WARNING: `MarianTokenizer` is not yet supported by Hugging Face\'s "fast" tokenizers library. Therefore, you may experience slightly inaccurate results.');
  }

  /**
   * Encodes text, splitting off a leading `>>lang<<` marker when present.
   *
   * @param {string|null} S Text to encode.
   * @returns {string[]|null} `null` for `null` input; otherwise the tokens
   *   produced by the parent `_encode_text`, prefixed with the language marker
   *   when one was found.
   */
  _encode_text(S) {
    if (S === null) {
      return null;
    }
    // With one capture group the split yields either [text] (no marker) or
    // ["", marker, rest].
    const [head, ...tail] = S.trim().split(this.languageRegex);
    if (tail.length === 0) {
      return super._encode_text(head);
    }
    if (tail.length === 2) {
      const [language, text] = tail;
      if (!this.supported_language_codes.includes(language)) {
        console.warn(`Unsupported language code "${language}" detected, which may lead to unexpected behavior. Should be one of: ${JSON.stringify(this.supported_language_codes)}`);
      }
      return (0, o.mergeArrays)([language], super._encode_text(text));
    }
  }
}
/**
 * Builds a generalized cosine window: sample k is
 * `X - (1 - X) * cos(2*pi*k / (z - 1))`.
 *
 * @param {number} z Number of samples in the window.
 * @param {number} X Window coefficient (0.5 and 0.54 are used by the two
 *   wrappers defined right after this function).
 * @returns {Float64Array} Empty for `z < 1`, `[1]` for `z === 1`, otherwise
 *   `z` window samples.
 */
function _(z, X) {
  if (z < 1) {
    return new Float64Array();
  }
  if (z === 1) {
    return new Float64Array([1]);
  }

  const complement = 1 - X;
  const step = (2 * Math.PI) / (z - 1);
  return Float64Array.from({ length: z }, (unused, k) => X - complement * Math.cos(k * step));
}
/**
 * Converts a spectrogram to decibels in place:
 * `factor * (log10(max(min_value, x)) - log10(reference))`.
 *
 * The two wrappers that follow this function call it with factors 20 and 10.
 *
 * @param {Float32Array|Float64Array|number[]} z Spectrogram values; overwritten.
 * @param {number} X Multiplicative factor applied to the log ratio.
 * @param {number} J Reference value; must be > 0 and is clamped up to `q`.
 * @param {number} q Minimum value the input is clamped to; must be > 0.
 * @param {number|null} re Optional dynamic range in dB. When given, every
 *   value is raised to at least `max(z) - re`.
 * @returns {typeof z} The same `z` that was passed in.
 * @throws {Error} If `J`, `q` or a non-null `re` is not strictly positive.
 */
function P(z, X, J, q, re) {
  if (J <= 0) throw new Error("reference must be greater than zero");
  if (q <= 0) throw new Error("min_value must be greater than zero");

  const reference = Math.max(q, J);
  const logReference = Math.log10(reference);

  for (let i = 0; i < z.length; ++i) {
    // The reference is subtracted in the log domain. The previous code
    // subtracted log10(reference) from the linear value before taking the
    // log, which is only right when the reference is exactly 1.
    z[i] = X * (Math.log10(Math.max(q, z[i])) - logReference);
  }

  if (re !== null) {
    if (re <= 0) throw new Error("db_range must be greater than zero");
    const floor = (0, o.max)(z)[0] - re;
    for (let i = 0; i < z.length; ++i) {
      z[i] = Math.max(z[i], floor);
    }
  }

  return z;
}
E(z,X,J,q,{fft_length:re=null,power:oe=1,center:ne=!0,pad_mode:ye="reflect",onesided:Y=!0,preemphasis:H=null,preemphasis_htk_flavor:R=!0,mel_filters:L=null,mel_floor:ee=1e-10,log_mel:ue=null,reference:ke=1,min_value:Ie=1e-10,db_range:Le=null,remove_dc_offset:rt=null,min_num_frames:we=null,max_num_frames:A=null,do_pad:le=!0,transpose:ge=!1,mel_offset:be=0}={}){let Ae=X.length;if(re===null&&(re=J),J>re)throw Error(`frame_length (${J}) may not be larger than fft_length (${re})`);if(Ae!==J)throw new Error(`Length of the window (${Ae}) must equal frame_length (${J})`);if(q<=0)throw new Error("hop_length must be greater than zero");if(oe===null&&L!==null)throw new Error("You have provided `mel_filters` but `power` is `None`. Mel spectrogram computation is not yet supported for complex-valued spectrogram. Specify `power` to fix this issue.");if(!R)throw new Error("`preemphasis_htk_flavor=false` is not currently supported.");if(ne)switch(ye){case"reflect":{let Qe=Math.floor((re-1)/2)+1;z=y(z,Qe,Qe);break}case"constant":{let Qe=Math.floor(re/2),je=new z.constructor(z.length+2*Qe);je.set(z,Qe),z=je;break}default:throw new Error(`pad_mode="${ye}" not implemented yet.`)}let ve=Math.floor(1+Math.floor((z.length-J)/q));we!==null&&ve<we&&(ve=we);let pe=Y?Math.floor(re/2)+1:re,Pe=ve,fe=ve;A!==null&&(A>ve?le&&(fe=A):fe=Pe=A);let Te=new o.FFT(re),We=new Float64Array(re),$e=new Float64Array(Te.outputBufferSize),Re=new Float32Array(pe*fe);for(let Qe=0;Qe<Pe;++Qe){let je=Qe*q,pt=Math.min(z.length-je,J);pt!==J&&We.fill(0,0,J);for(let Ke=0;Ke<pt;++Ke)We[Ke]=z[je+Ke];if(rt){let Ke=0;for(let At=0;At<pt;++At)Ke+=We[At];let bt=Ke/pt;for(let At=0;At<pt;++At)We[At]-=bt}if(H!==null){for(let Ke=pt-1;Ke>=1;--Ke)We[Ke]-=H*We[Ke-1];We[0]*=1-H}for(let Ke=0;Ke<X.length;++Ke)We[Ke]*=X[Ke];Te.realTransform($e,We);for(let Ke=0;Ke<pe;++Ke){let bt=Ke<<1;Re[Ke*fe+Qe]=$e[bt]**2+$e[bt+1]**2}}if(oe!==null&&oe!==2){let Qe=oe/2;for(let je=0;je<Re.length;++je)Re[je]**=Qe}let Ne=L.length,ot=await(0,i.matmul)(new 
/**
 * Serializes samples into a WAV container: a 44-byte header followed by one
 * little-endian 32-bit float per sample.
 *
 * Header fields written: format tag 3, 1 channel, sample rate `X`, byte rate
 * `X * 4`, block align 4, 32 bits per sample.
 *
 * @param {ArrayLike<number>} z Samples to write.
 * @param {number} X Sampling rate stored in the header.
 * @returns {ArrayBuffer} The encoded file contents.
 */
function O(z, X) {
  const HEADER_BYTES = 44;
  const BYTES_PER_SAMPLE = 4;
  const payloadBytes = z.length * BYTES_PER_SAMPLE;

  const buffer = new ArrayBuffer(HEADER_BYTES + payloadBytes);
  const view = new DataView(buffer);

  // RIFF chunk descriptor
  U(view, 0, "RIFF");
  view.setUint32(4, 36 + payloadBytes, true);
  U(view, 8, "WAVE");

  // "fmt " sub-chunk
  U(view, 12, "fmt ");
  view.setUint32(16, 16, true);
  view.setUint16(20, 3, true);
  view.setUint16(22, 1, true);
  view.setUint32(24, X, true);
  view.setUint32(28, X * 4, true);
  view.setUint16(32, 4, true);
  view.setUint16(34, 32, true);

  // "data" sub-chunk
  U(view, 36, "data");
  view.setUint32(40, payloadBytes, true);

  for (let index = 0; index < z.length; ++index) {
    view.setFloat32(HEADER_BYTES + index * BYTES_PER_SAMPLE, z[index], true);
  }

  return buffer;
}

/**
 * Writes the UTF-16 code units of `J` as consecutive bytes starting at `X`.
 *
 * @param {DataView} z Destination view.
 * @param {number} X Byte offset of the first character.
 * @param {string} J Text to write.
 */
function U(z, X, J) {
  let cursor = X;
  for (let k = 0; k < J.length; ++k) {
    z.setUint8(cursor, J.charCodeAt(k));
    cursor += 1;
  }
}
/**
 * Returns a new object holding only the listed keys of `b` whose value is
 * not `undefined`.
 *
 * @param {Object} b Source object.
 * @param {string[]} C Keys to copy.
 * @returns {Object} Fresh object with the selected entries.
 */
function x(b, C) {
  const picked = {};
  C.forEach((key) => {
    if (b[key] !== undefined) {
      picked[key] = b[key];
    }
  });
  return picked;
}
/**
 * Array-backed binary heap ordered by a comparator, with an optional cap on
 * the number of stored elements.
 *
 * `comparator(a, b)` returning true means `a` belongs closer to the front
 * than `b`; with the default `a > b` the largest element is at the front.
 */
class s {
  /**
   * @param {(a: any, b: any) => boolean} u Ordering predicate.
   * @param {number} d Maximum number of elements kept in the heap.
   */
  constructor(u = (g, h) => g > h, d = Infinity) {
    this._heap = [];
    this._comparator = u;
    this._maxSize = d;
  }

  /** Number of stored elements. */
  get size() {
    return this._heap.length;
  }

  /** @returns {boolean} Whether the heap holds no elements. */
  isEmpty() {
    return this.size === 0;
  }

  /** @returns {any} The front element, or `undefined` when empty. */
  peek() {
    return this._heap[0];
  }

  /**
   * Adds every argument to the heap.
   * @returns {number} The size after insertion.
   */
  push(...u) {
    return this.extend(u);
  }

  /**
   * Adds every element of an iterable. Once the heap is at `_maxSize`, a new
   * element replaces the element at `_smallest()` only if the comparator
   * ranks the new element ahead of it; otherwise it is discarded.
   *
   * @param {Iterable<any>} u Elements to add.
   * @returns {number} The size after insertion.
   */
  extend(u) {
    for (const item of u) {
      if (this.size < this._maxSize) {
        this._heap.push(item);
        this._siftUp();
        continue;
      }
      const victim = this._smallest();
      if (this._comparator(item, this._heap[victim])) {
        this._heap[victim] = item;
        this._siftUpFrom(victim);
      }
    }
    return this.size;
  }

  /**
   * Removes and returns the front element.
   * @returns {any} The removed element, or `undefined` when empty.
   */
  pop() {
    const front = this.peek();
    const tail = this.size - 1;
    if (tail > 0) {
      this._swap(0, tail);
    }
    this._heap.pop();
    this._siftDown();
    return front;
  }

  /**
   * Overwrites the front element with `u` and restores heap order.
   * @returns {any} The element that was at the front.
   */
  replace(u) {
    const front = this.peek();
    this._heap[0] = u;
    this._siftDown();
    return front;
  }

  /** Index of the parent of node `u`. */
  _parent(u) {
    return ((u + 1) >>> 1) - 1;
  }

  /** Index of the left child of node `u`. */
  _left(u) {
    return (u << 1) + 1;
  }

  /** Index of the right child of node `u`. */
  _right(u) {
    return (u + 1) << 1;
  }

  /** Whether the element at index `u` ranks ahead of the one at index `d`. */
  _greater(u, d) {
    return this._comparator(this._heap[u], this._heap[d]);
  }

  /** Exchanges the elements at indices `u` and `d`. */
  _swap(u, d) {
    [this._heap[u], this._heap[d]] = [this._heap[d], this._heap[u]];
  }

  /** Restores heap order for the most recently appended element. */
  _siftUp() {
    this._siftUpFrom(this.size - 1);
  }

  /** Moves the element at index `u` toward the front while it outranks its parent. */
  _siftUpFrom(u) {
    let node = u;
    while (node > 0 && this._greater(node, this._parent(node))) {
      this._swap(node, this._parent(node));
      node = this._parent(node);
    }
  }

  /** Moves the front element down until neither child outranks it. */
  _siftDown() {
    let node = 0;
    while (true) {
      const childOutranks =
        (this._left(node) < this.size && this._greater(this._left(node), node)) ||
        (this._right(node) < this.size && this._greater(this._right(node), node));
      if (!childOutranks) {
        break;
      }
      const useRight = this._right(node) < this.size && this._greater(this._right(node), this._left(node));
      const child = useRight ? this._right(node) : this._left(node);
      this._swap(node, child);
      node = child;
    }
  }

  /** Index used as the replacement candidate when the heap is full. */
  _smallest() {
    return 2 ** Math.floor(Math.log2(this.size)) - 1;
  }
}
/**
 * Splits text around occurrences of dictionary words, preferring the longest
 * word that matches at each position.
 */
class l {
  /**
   * @param {Iterable<string>} u Words to recognise.
   */
  constructor(u) {
    this.trie = this._buildTrie(u);
  }

  /**
   * Builds a prototype-less nested-object trie keyed by single characters.
   * The node reached at the end of a word stores that word under `end`.
   *
   * @param {Iterable<string>} u Words to insert.
   * @returns {Object} Root node of the trie.
   */
  _buildTrie(u) {
    const root = Object.create(null);
    for (const word of u) {
      let node = root;
      for (let pos = 0; pos < word.length; ++pos) {
        const ch = word[pos];
        node[ch] ??= Object.create(null);
        node = node[ch];
      }
      node.end = word;
    }
    return root;
  }

  /**
   * @param {string} u Text to split.
   * @returns {string[]} Alternating unmatched stretches and matched words,
   *   in input order; empty unmatched stretches are omitted.
   */
  split(u) {
    const pieces = [];
    const total = u.length;
    let pending = 0; // start of the not-yet-emitted unmatched stretch
    let cursor = 0;

    while (cursor < total) {
      // Walk the trie from `cursor`, remembering the last complete word seen.
      let node = this.trie;
      let longest = null;
      let probe = cursor;
      while (probe < total) {
        node = node[u[probe]];
        if (!node) {
          break;
        }
        if (node.end) {
          longest = node.end;
        }
        ++probe;
      }

      if (!longest) {
        ++cursor;
        continue;
      }

      if (cursor > pending) {
        pieces.push(u.slice(pending, cursor));
      }
      pieces.push(longest);
      cursor += longest.length;
      pending = cursor;
    }

    if (pending < total) {
      pieces.push(u.slice(pending));
    }
    return pieces;
  }
}
/**
 * Base class whose instances can be invoked like functions. Calling an
 * instance forwards all arguments to its `_call` method.
 */
let s = class {
  /**
   * Returns a function object (not a plain `this`) whose prototype is the
   * prototype of the class being constructed, so subclass methods are
   * reachable from it.
   */
  constructor() {
    // The function expression stays named `o` so the returned callable
    // exposes the same `name` as before.
    const callable = function o(...args) {
      return callable._call(...args);
    };
    Object.setPrototypeOf(callable, new.target.prototype);
    return callable;
  }

  /**
   * Invoked when the instance is called; subclasses must override it.
   * @throws {Error} Always, in this base implementation.
   */
  _call(...o) {
    throw Error("Must implement _call method in subclass");
  }
};
/**
 * Checks whether a value parses as a URL and, optionally, whether its
 * protocol and hostname are in the given allow-lists.
 *
 * @param {string|URL} f Candidate URL.
 * @param {string[]|null} E Allowed protocols, including the trailing colon
 *   (e.g. "https:"); any protocol is accepted when falsy.
 * @param {string[]|null} D Allowed hostnames; any hostname is accepted when
 *   falsy.
 * @returns {boolean} True when `f` parses and passes both filters.
 */
function _(f, E = null, D = null) {
  let parsed;
  try {
    parsed = new URL(f);
  } catch {
    // Not parseable as an absolute URL.
    return false;
  }

  if (E && !E.includes(parsed.protocol)) {
    return false;
  }
  if (D && !D.includes(parsed.hostname)) {
    return false;
  }
  return true;
}
/**
 * Looks up several keys in a cache, in order, and returns the first truthy
 * hit. A lookup that throws is treated as a miss for that key.
 *
 * @param {{match: (key: string) => any}} f Cache exposing a `match` method.
 * @param {...string} E Keys to try, in priority order.
 * @returns {Promise<any>} The first truthy match, or `undefined` if none.
 */
async function v(f, ...E) {
  for (const key of E) {
    let hit;
    try {
      hit = await f.match(key);
    } catch {
      // A failing lookup must not stop the remaining keys from being tried.
      hit = undefined;
    }
    if (hit) {
      return hit;
    }
  }
  return undefined;
}
For more information, see https://developer.mozilla.org/en-US/docs/Web/API/Cache");W=a.env.customCache}if(!W&&a.env.useBrowserCache){if(typeof caches>"u")throw Error("Browser cache is not available in this environment.");try{W=await caches.open("transformers-cache")}catch(ee){console.warn("An error occurred while opening the browser cache:",ee)}}if(!W&&a.env.useFSCache){if(!a.apis.IS_FS_AVAILABLE)throw Error("File System Cache is not available in this environment.");W=new F(O.cache_dir??a.env.cacheDir)}let z=O.revision??"main",X=I(f,E),J=d(f),q=J?I(a.env.localModelPath,X):X,re=I(a.env.remoteHost,a.env.remotePathTemplate.replaceAll("{model}",f).replaceAll("{revision}",encodeURIComponent(z)),E),oe,ne=W instanceof F?z==="main"?X:I(f,z,E):re,ye=!1,Y;W&&(Y=await v(W,q,ne));let H=Y!==void 0;if(Y===void 0){if(a.env.allowLocalModels)if(_(X,["http:","https:"])){if(O.local_files_only)throw new Error(`\`local_files_only=true\`, but attempted to load a remote file from: ${X}.`);if(!a.env.allowRemoteModels)throw new Error(`\`env.allowRemoteModels=false\`, but attempted to load a remote file from: ${X}.`)}else try{Y=await g(q),oe=q}catch(ue){console.warn(`Unable to load from local path "${q}": "${ue}"`)}if(Y===void 0||Y.status===404){if(O.local_files_only||!a.env.allowRemoteModels){if(D)throw Error(`\`local_files_only=true\` or \`env.allowRemoteModels=false\` and file was not found locally at "${q}".`);return null}if(!J)throw Error(`Local file missing at "${q}" and download aborted due to invalid model ID "${f}".`);if(Y=await g(re),Y.status!==200)return x(Y.status,re,D);oe=ne}ye=W&&typeof Response<"u"&&Y instanceof Response&&Y.status===200}(0,n.dispatchCallback)(O.progress_callback,{status:"download",name:f,file:E});let R;if(!(a.apis.IS_NODE_ENV&&U)){let ee;O.progress_callback?H&&typeof navigator<"u"&&/firefox/i.test(navigator.userAgent)?(ee=new Uint8Array(await 
/**
 * Fetches a model file as text and parses it as JSON.
 *
 * @param {string} f Forwarded to the text loader as its first argument.
 * @param {string} E Forwarded to the text loader as its second argument.
 * @param {boolean} D Forwarded to the text loader as its third argument.
 * @param {Object} O Forwarded to the text loader as its fourth argument.
 * @returns {Promise<Object>} The parsed JSON, or an empty object when the
 *   text loader resolves to `null`.
 */
async function y(f, E, D = true, O = {}) {
  const text = await C(f, E, D, O);
  if (text === null) {
    return {};
  }
  return JSON.parse(text);
}
/**
 * Joins path segments with "/". One leading slash is removed from every
 * segment except the first, and one trailing slash from every segment except
 * the last, so the joined segments do not produce doubled separators.
 *
 * @param {...string} f Path segments.
 * @returns {string} The joined path.
 */
function I(...f) {
  const finalIndex = f.length - 1;
  const segments = f.map((segment, index) => {
    let cleaned = segment;
    if (index !== 0) {
      cleaned = cleaned.replace(/^\//, "");
    }
    if (index !== finalIndex) {
      cleaned = cleaned.replace(/\/$/, "");
    }
    return cleaned;
  });
  return segments.join("/");
}
environments.");let C=v.getContext("2d").getImageData(0,0,v.width,v.height).data;return new h(C,v.width,v.height,4)}static async fromURL(v){let b=await(0,o.getFile)(v);if(b.status!==200)throw new Error(`Unable to read image from "${v}" (${b.status} ${b.statusText})`);let C=await b.blob();return this.fromBlob(C)}static async fromBlob(v){if(u){let b=await _(v),C=l(b.width,b.height).getContext("2d");return C.drawImage(b,0,0),new this(C.getImageData(0,0,b.width,b.height).data,b.width,b.height,4)}else{let b=i(await v.arrayBuffer());return await _(b)}}static fromTensor(v,b="CHW"){if(v.dims.length!==3)throw new Error(`Tensor should have 3 dimensions, but has ${v.dims.length} dimensions.`);if(b==="CHW")v=v.transpose(1,2,0);else if(b!=="HWC")throw new Error(`Unsupported channel format: ${b}`);if(!(v.data instanceof Uint8ClampedArray||v.data instanceof Uint8Array))throw new Error(`Unsupported tensor type: ${v.type}`);switch(v.dims[2]){case 1:case 2:case 3:case 4:return new h(v.data,v.dims[1],v.dims[0],v.dims[2]);default:throw new Error(`Unsupported number of channels: ${v.dims[2]}`)}}grayscale(){if(this.channels===1)return this;let v=new Uint8ClampedArray(this.width*this.height*1);switch(this.channels){case 3:case 4:for(let b=0,C=0;b<this.data.length;b+=this.channels){let y=this.data[b],P=this.data[b+1],I=this.data[b+2];v[C++]=Math.round(.2989*y+.587*P+.114*I)}break;default:throw new Error(`Conversion failed due to unsupported number of channels: ${this.channels}`)}return this._update(v,this.width,this.height,1)}rgb(){if(this.channels===3)return this;let v=new Uint8ClampedArray(this.width*this.height*3);switch(this.channels){case 1:for(let b=0,C=0;b<this.data.length;++b)v[C++]=this.data[b],v[C++]=this.data[b],v[C++]=this.data[b];break;case 4:for(let b=0,C=0;b<this.data.length;b+=4)v[C++]=this.data[b],v[C++]=this.data[b+1],v[C++]=this.data[b+2];break;default:throw new Error(`Conversion failed due to unsupported number of channels: ${this.channels}`)}return 
this._update(v,this.width,this.height,3)}rgba(){if(this.channels===4)return this;let v=new Uint8ClampedArray(this.width*this.height*4);switch(this.channels){case 1:for(let b=0,C=0;b<this.data.length;++b)v[C++]=this.data[b],v[C++]=this.data[b],v[C++]=this.data[b],v[C++]=255;break;case 3:for(let b=0,C=0;b<this.data.length;b+=3)v[C++]=this.data[b],v[C++]=this.data[b+1],v[C++]=this.data[b+2],v[C++]=255;break;default:throw new Error(`Conversion failed due to unsupported number of channels: ${this.channels}`)}return this._update(v,this.width,this.height,4)}putAlpha(v){if(v.width!==this.width||v.height!==this.height)throw new Error(`Expected mask size to be ${this.width}x${this.height}, but got ${v.width}x${v.height}`);if(v.channels!==1)throw new Error(`Expected mask to have 1 channel, but got ${v.channels}`);let b=this.data,C=v.data,y=this.width*this.height;if(this.channels===3){let P=new Uint8ClampedArray(y*4);for(let I=0,f=0,E=0;I<y;++I)P[E++]=b[f++],P[E++]=b[f++],P[E++]=b[f++],P[E++]=C[I];return this._update(P,this.width,this.height,4)}else if(this.channels===4){for(let P=0;P<y;++P)b[4*P+3]=C[P];return this}throw new Error(`Expected image to have 3 or 4 channels, but got ${this.channels}`)}async resize(v,b,{resample:C=2}={}){if(this.width===v&&this.height===b)return this;let y=d[C]??C,P=(0,s.isNullishDimension)(v),I=(0,s.isNullishDimension)(b);if(P&&I)return this;if(P?v=b/this.height*this.width:I&&(b=v/this.width*this.height),u){let f=this.channels,E=this.toCanvas(),D=l(v,b).getContext("2d");return D.drawImage(E,0,0,v,b),new h(D.getImageData(0,0,v,b).data,v,b,4).convert(f)}else{let f=this.toSharp();switch(y){case"box":case"hamming":(y==="box"||y==="hamming")&&(console.warn(`Resampling method ${y} is not yet supported. 
Using bilinear instead.`),y="bilinear");case"nearest":case"bilinear":case"bicubic":f=f.affine([v/this.width,0,0,b/this.height],{interpolator:y});break;case"lanczos":f=f.resize({width:v,height:b,fit:"fill",kernel:"lanczos3"});break;default:throw new Error(`Resampling method ${y} is not supported.`)}return await _(f)}}async pad([v,b,C,y]){if(v=Math.max(v,0),b=Math.max(b,0),C=Math.max(C,0),y=Math.max(y,0),v===0&&b===0&&C===0&&y===0)return this;if(u){let P=this.channels,I=this.toCanvas(),f=this.width+v+b,E=this.height+C+y,D=l(f,E).getContext("2d");return D.drawImage(I,0,0,this.width,this.height,v,C,this.width,this.height),new h(D.getImageData(0,0,f,E).data,f,E,4).convert(P)}else{let P=this.toSharp().extend({left:v,right:b,top:C,bottom:y});return await _(P)}}async crop([v,b,C,y]){if(v=Math.max(v,0),b=Math.max(b,0),C=Math.min(C,this.width-1),y=Math.min(y,this.height-1),v===0&&b===0&&C===this.width-1&&y===this.height-1)return this;let P=C-v+1,I=y-b+1;if(u){let f=this.channels,E=this.toCanvas(),D=l(P,I).getContext("2d");return D.drawImage(E,v,b,P,I,0,0,P,I),new h(D.getImageData(0,0,P,I).data,P,I,4).convert(f)}else{let f=this.toSharp().extract({left:v,top:b,width:P,height:I});return await _(f)}}async center_crop(v,b){if(this.width===v&&this.height===b)return this;let C=(this.width-v)/2,y=(this.height-b)/2;if(u){let P=this.channels,I=this.toCanvas(),f=l(v,b).getContext("2d"),E=0,D=0,O=0,U=0;return C>=0?E=C:O=-C,y>=0?D=y:U=-y,f.drawImage(I,E,D,v,b,O,U,v,b),new h(f.getImageData(0,0,v,b).data,v,b,4).convert(P)}else{let P=this.toSharp();if(C>=0&&y>=0)P=P.extract({left:Math.floor(C),top:Math.floor(y),width:v,height:b});else if(C<=0&&y<=0){let I=Math.floor(-y),f=Math.floor(-C);P=P.extend({top:I,left:f,right:v-this.width-f,bottom:b-this.height-I})}else{let I=[0,0],f=0;y<0?(I[0]=Math.floor(-y),I[1]=b-this.height-I[0]):f=Math.floor(y);let 
E=[0,0],D=0;C<0?(E[0]=Math.floor(-C),E[1]=v-this.width-E[0]):D=Math.floor(C),P=P.extend({top:I[0],bottom:I[1],left:E[0],right:E[1]}).extract({left:D,top:f,width:v,height:b})}return await _(P)}}async toBlob(v="image/png",b=1){if(!u)throw new Error("toBlob() is only supported in browser environments.");return await this.toCanvas().convertToBlob({type:v,quality:b})}toTensor(v="CHW"){let b=new n.Tensor("uint8",new Uint8Array(this.data),[this.height,this.width,this.channels]);if(v!=="HWC")if(v==="CHW")b=b.permute(2,0,1);else throw new Error(`Unsupported channel format: ${v}`);return b}toCanvas(){if(!u)throw new Error("toCanvas() is only supported in browser environments.");let v=this.clone().rgba(),b=l(v.width,v.height),C=new c(v.data,v.width,v.height);return b.getContext("2d").putImageData(C,0,0),b}split(){let{data:v,width:b,height:C,channels:y}=this,P=v.constructor,I=v.length/y,f=Array.from({length:y},()=>new P(I));for(let E=0;E<I;++E){let D=y*E;for(let O=0;O<y;++O)f[O][E]=v[D+O]}return f.map(E=>new h(E,b,C,1))}_update(v,b,C,y=null){return this.data=v,this.width=b,this.height=C,y!==null&&(this.channels=y),this}clone(){return new h(this.data.slice(),this.width,this.height,this.channels)}convert(v){if(this.channels===v)return this;switch(v){case 1:this.grayscale();break;case 3:this.rgb();break;case 4:this.rgba();break;default:throw new Error(`Conversion failed due to unsupported number of channels: ${this.channels}`)}return this}async save(v){if(u){if(a.apis.IS_WEBWORKER_ENV)throw new Error("Unable to save an image from a Web Worker.");let b=v.split(".").pop().toLowerCase(),C=g.get(b)??"image/png",y=await this.toBlob(C);(0,s.saveBlob)(v,y)}else{if(a.apis.IS_FS_AVAILABLE)return await this.toSharp().toFile(v);throw new Error("Unable to save the image because filesystem is disabled in this environment.")}}toSharp(){if(u)throw new Error("toSharp() is only supported in server-side environments.");return 
/**
 * Permute the axes of a flat, row-major buffer (exported as `permute_data`).
 *
 * @param {Array|TypedArray} y Flat input data.
 * @param {number[]} P Shape of the input.
 * @param {number[]} I Axis order: output axis `k` is input axis `I[k]`.
 * @returns {[Array|TypedArray, number[]]} The permuted buffer (same constructor
 *   as `y`) and the permuted shape.
 */
function o(y, P, I) {
  const rank = I.length;
  const permutedShape = new Array(rank);
  const permutedStrides = new Array(rank);

  // Row-major strides of the *output* layout, built from the last axis backwards.
  let running = 1;
  for (let axis = rank - 1; axis >= 0; --axis) {
    permutedStrides[axis] = running;
    permutedShape[axis] = P[I[axis]];
    running *= permutedShape[axis];
  }

  // For every input axis, the stride it has in the output buffer.
  const destinationStride = I.map((_, inputAxis) => permutedStrides[I.indexOf(inputAxis)]);

  const permuted = new y.constructor(y.length);
  for (let source = 0; source < y.length; ++source) {
    let destination = 0;
    let remainder = source;
    // Decompose the flat input index into coordinates, last axis first.
    for (let axis = P.length - 1; axis >= 0; --axis) {
      const extent = P[axis];
      destination += (remainder % extent) * destinationStride[axis];
      remainder = Math.floor(remainder / extent);
    }
    permuted[destination] = y[source];
  }

  return [permuted, permutedShape];
}
/* Class `g`: FFT helper that only accepts sizes that are a power of two greater than 1. Buffers are flat Float64 arrays of `2 * size` entries; toComplexArray() below writes each value at an even index followed by 0, i.e. presumably interleaved [re, im] pairs. */
g{
/* constructor(P): stores `size = P|0` and throws unless it is > 1 and passes `d` (the power-of-two test defined earlier in this module). Precomputes `table` as (cos(t), -sin(t)) pairs with t = PI * f / size for even f, `_width` from the number of doublings needed to reach `size`, and the `_bitrev` index table used by the first transform pass. */
constructor(P){if(this.size=P|0,this.size<=1||!d(this.size))throw new Error("FFT size must be a power of two larger than 1");this._csize=P<<1,this.table=new Float64Array(this.size*2);for(let f=0;f<this.table.length;f+=2){let E=Math.PI*f/this.size;this.table[f]=Math.cos(E),this.table[f+1]=-Math.sin(E)}let I=0;for(let f=1;this.size>f;f<<=1)++I;this._width=I%2===0?I-1:I,this._bitrev=new Int32Array(1<<this._width);for(let f=0;f<this._bitrev.length;++f){this._bitrev[f]=0;for(let E=0;E<this._width;E+=2){let D=this._width-E-2;this._bitrev[f]|=(f>>>E&3)<<D}}}
/* createComplexArray(): returns a new Float64Array with `_csize` (= 2 * P) entries. */
createComplexArray(){return new Float64Array(this._csize)}
/* fromComplexArray(P, I): copies every even-indexed entry of P into I (or into a new Array of half the length when I is falsy) and returns it. */
fromComplexArray(P,I){let f=I||new Array(P.length>>>1);for(let E=0;E<P.length;E+=2)f[E>>>1]=P[E];return f}
/* toComplexArray(P, I): writes P[k] to index 2k and 0 to index 2k+1 of I (or of a fresh complex array when I is falsy) and returns it. */
toComplexArray(P,I){let f=I||this.createComplexArray();for(let E=0;E<f.length;E+=2)f[E]=P[E>>>1],f[E+1]=0;return f}
/* transform(P, I): forward transform. P is the buffer that gets written, I the buffer that gets read; throws when both are the same object. */
transform(P,I){if(P===I)throw new Error("Input and output buffers must be different");this._transform4(P,I,1)}
/* realTransform(P, I): same buffer contract as transform(), but runs the `_realTransform4` path. */
realTransform(P,I){if(P===I)throw new Error("Input and output buffers must be different");this._realTransform4(P,I,1)}
/* inverseTransform(P, I): runs `_transform4` with sign -1, then divides every entry of P by `size`. */
inverseTransform(P,I){if(P===I)throw new Error("Input and output buffers must be different");this._transform4(P,I,-1);for(let f=0;f<P.length;++f)P[f]/=this.size}
/* _transform4(P, I, f): core transform. P is written, I is read, f is the sign (+1 or -1) applied to the table's sine terms. The first pass reads I through `_bitrev` using 2-point or 4-point butterflies; the following passes combine groups of four in place inside P using `table`. */
_transform4(P,I,f){let E=this._csize,O=1<<this._width,U=E/O<<1,W,z,X=this._bitrev;if(U===4)for(W=0,z=0;W<E;W+=U,++z){let q=X[z];this._singleTransform2(I,P,W,q,O)}else for(W=0,z=0;W<E;W+=U,++z){let q=X[z];this._singleTransform4(I,P,W,q,O,f)}let J=this.table;for(O>>=2;O>=2;O>>=2){U=E/O<<1;let q=U>>>2;for(W=0;W<E;W+=U){let re=W+q-1;for(let oe=W,ne=0;oe<re;oe+=2,ne+=O){let 
ye=oe,Y=ye+q,H=Y+q,R=H+q,L=P[ye],ee=P[ye+1],ue=P[Y],ke=P[Y+1],Ie=P[H],Le=P[H+1],rt=P[R],we=P[R+1],A=J[ne],le=f*J[ne+1],ge=ue*A-ke*le,be=ue*le+ke*A,Ae=J[2*ne],ve=f*J[2*ne+1],pe=Ie*Ae-Le*ve,Pe=Ie*ve+Le*Ae,fe=J[3*ne],Te=f*J[3*ne+1],We=rt*fe-we*Te,$e=rt*Te+we*fe,Re=L+pe,Ne=ee+Pe,ot=L-pe,De=ee-Pe,Qe=ge+We,je=be+$e,pt=f*(ge-We),Ke=f*(be-$e);P[ye]=Re+Qe,P[ye+1]=Ne+je,P[Y]=ot+Ke,P[Y+1]=De-pt,P[H]=Re-Qe,P[H+1]=Ne-je,P[R]=ot-Ke,P[R+1]=De+pt}}}}
/* _singleTransform2(P, I, f, E, D): 2-point butterfly. Reads the pairs at P[E] and P[E+D]; writes their sum to I[f..f+1] and their difference to I[f+2..f+3]. Note that here P is the source and I the destination. */
_singleTransform2(P,I,f,E,D){let O=P[E],U=P[E+1],W=P[E+D],z=P[E+D+1];I[f]=O+W,I[f+1]=U+z,I[f+2]=O-W,I[f+3]=U-z}
/* _singleTransform4(P, I, f, E, D, O): 4-point butterfly. Reads the pairs at P[E], P[E+D], P[E+2D], P[E+3D] and writes eight values to I[f..f+7]; O is the +1/-1 sign. */
_singleTransform4(P,I,f,E,D,O){let U=D*2,W=D*3,z=P[E],X=P[E+1],J=P[E+D],q=P[E+D+1],re=P[E+U],oe=P[E+U+1],ne=P[E+W],ye=P[E+W+1],Y=z+re,H=X+oe,R=z-re,L=X-oe,ee=J+ne,ue=q+ye,ke=O*(J-ne),Ie=O*(q-ye);I[f]=Y+ee,I[f+1]=H+ue,I[f+2]=R+Ie,I[f+3]=L-ke,I[f+4]=Y-ee,I[f+5]=H-ue,I[f+6]=R-Ie,I[f+7]=L+ke}
/* _realTransform4(P, I, f): variant of `_transform4` whose first pass uses the `_singleReal*` butterflies with halved read offsets (`>>> 1`), i.e. it reads one value per sample from I. The combine loop only computes part of each group and fills mirrored slots directly; the final loop fills the upper half of P from the lower half with the odd-index entry negated. */
_realTransform4(P,I,f){let E=this._csize,O=1<<this._width,U=E/O<<1,W,z,X=this._bitrev;if(U===4)for(W=0,z=0;W<E;W+=U,++z){let re=X[z];this._singleRealTransform2(I,P,W,re>>>1,O>>>1)}else for(W=0,z=0;W<E;W+=U,++z){let re=X[z];this._singleRealTransform4(I,P,W,re>>>1,O>>>1,f)}let J=this.table;for(O>>=2;O>=2;O>>=2){U=E/O<<1;let re=U>>>1,oe=re>>>1,ne=oe>>>1;for(W=0;W<E;W+=U)for(let ye=0,Y=0;ye<=ne;ye+=2,Y+=O){let H=W+ye,R=H+oe,L=R+oe,ee=L+oe,ue=P[H],ke=P[H+1],Ie=P[R],Le=P[R+1],rt=P[L],we=P[L+1],A=P[ee],le=P[ee+1],ge=ue,be=ke,Ae=J[Y],ve=f*J[Y+1],pe=Ie*Ae-Le*ve,Pe=Ie*ve+Le*Ae,fe=J[2*Y],Te=f*J[2*Y+1],We=rt*fe-we*Te,$e=rt*Te+we*fe,Re=J[3*Y],Ne=f*J[3*Y+1],ot=A*Re-le*Ne,De=A*Ne+le*Re,Qe=ge+We,je=be+$e,pt=ge-We,Ke=be-$e,bt=pe+ot,At=Pe+De,Lt=f*(pe-ot),fr=f*(Pe-De);if(P[H]=Qe+bt,P[H+1]=je+At,P[R]=pt+fr,P[R+1]=Ke-Lt,ye===0){P[L]=Qe-bt,P[L+1]=je-At;continue}if(ye===ne)continue;let zt=W+oe-ye,yr=W+re-ye;P[zt]=pt-f*fr,P[zt+1]=-Ke-f*Lt,P[yr]=Qe-f*bt,P[yr+1]=-je+f*At}}let q=E>>>1;for(let re=2;re<q;re+=2)P[E-re]=P[re],P[E-re+1]=-P[re+1]}
/* _singleRealTransform2(P, I, f, E, D): 2-point butterfly for real input. Reads the single values P[E] and P[E+D]; writes (sum, 0, difference, 0) to I[f..f+3]. */
_singleRealTransform2(P,I,f,E,D){let O=P[E],U=P[E+D];I[f]=O+U,I[f+1]=0,I[f+2]=O-U,I[f+3]=0}
/* _singleRealTransform4(P, I, f, E, D, O): 4-point butterfly for real input; its body continues past this point. */
_singleRealTransform4(P,I,f,E,D,O){let 
/**
 * Median-filter a 1-D sequence (exported as `medianFilter`).
 *
 * For every position the window of `P` neighbouring samples is collected,
 * sorted numerically, and its middle element becomes the output value.
 * Indices falling outside the data are reflected: a negative index `k` reads
 * `|k|`, and an index `k >= length` reads `2 * (length - 1) - k`.
 *
 * @param {Array<number>|TypedArray} y Input samples.
 * @param {number} P Window size; must be a positive odd number.
 * @returns {Array<number>|TypedArray} Filtered data, built with the same constructor as `y`.
 * @throws {Error} If `P` is even or not positive.
 */
function F(y, P) {
  if (P % 2 === 0 || P <= 0) {
    throw new Error("Window size must be a positive odd number");
  }

  const filtered = new y.constructor(y.length);
  const windowBuffer = new y.constructor(P);
  const halfWindow = Math.floor(P / 2);

  // Typed arrays already sort numerically. Plain arrays sort as strings unless
  // given a comparator, which would put 10 before 9 and yield a wrong median.
  const sortWindow = ArrayBuffer.isView(windowBuffer)
    ? () => windowBuffer.sort()
    : () => windowBuffer.sort((left, right) => left - right);

  for (let center = 0; center < y.length; ++center) {
    let filled = 0;
    for (let offset = -halfWindow; offset <= halfWindow; ++offset) {
      let index = center + offset;
      if (index < 0) {
        index = Math.abs(index);
      } else if (index >= y.length) {
        index = 2 * (y.length - 1) - index;
      }
      windowBuffer[filled++] = y[index];
    }
    sortWindow();
    filtered[center] = windowBuffer[halfWindow];
  }

  return filtered;
}
location(){return this.ort_tensor.location}ort_tensor;constructor(...R){return(0,o.isONNXTensor)(R[0])?this.ort_tensor=R[0]:this.ort_tensor=new o.Tensor(R[0],R[1],R[2]),new Proxy(this,{get:(L,ee)=>{if(typeof ee=="string"){let ue=Number(ee);if(Number.isInteger(ue))return L._getitem(ue)}return L[ee]},set:(L,ee,ue)=>L[ee]=ue})}dispose(){this.ort_tensor.dispose()}*[Symbol.iterator](){let[R,...L]=this.dims;if(L.length>0){let ee=L.reduce((ue,ke)=>ue*ke);for(let ue=0;ue<R;++ue)yield this._subarray(ue,ee,L)}else yield*this.data}_getitem(R){let[L,...ee]=this.dims;if(R=P(R,L),ee.length>0){let ue=ee.reduce((ke,Ie)=>ke*Ie);return this._subarray(R,ue,ee)}else return new i(this.type,[this.data[R]],ee)}indexOf(R){let L=this.data;for(let ee=0;ee<L.length;++ee)if(L[ee]==R)return ee;return-1}_subarray(R,L,ee){let ue=R*L,ke=(R+1)*L,Ie="subarray"in this.data?this.data.subarray(ue,ke):this.data.slice(ue,ke);return new i(this.type,Ie,ee)}item(){let R=this.data;if(R.length!==1)throw new Error(`a Tensor with ${R.length} elements cannot be converted to Scalar`);return R[0]}tolist(){return l(this.data,this.dims)}sigmoid(){return this.clone().sigmoid_()}sigmoid_(){let R=this.data;for(let L=0;L<R.length;++L)R[L]=1/(1+Math.exp(-R[L]));return this}map(R){return this.clone().map_(R)}map_(R){let L=this.data;for(let ee=0;ee<L.length;++ee)L[ee]=R(L[ee],ee,L);return this}mul(R){return this.clone().mul_(R)}mul_(R){let L=this.data;for(let ee=0;ee<L.length;++ee)L[ee]*=R;return this}div(R){return this.clone().div_(R)}div_(R){let L=this.data;for(let ee=0;ee<L.length;++ee)L[ee]/=R;return this}add(R){return this.clone().add_(R)}add_(R){let L=this.data;for(let ee=0;ee<L.length;++ee)L[ee]+=R;return this}sub(R){return this.clone().sub_(R)}sub_(R){let L=this.data;for(let ee=0;ee<L.length;++ee)L[ee]-=R;return this}clone(){return new i(this.type,this.data.slice(),this.dims.slice())}slice(...R){let L=[],ee=[];for(let A=0;A<this.dims.length;++A){let 
le=R[A];if(le==null)ee.push([0,this.dims[A]]),L.push(this.dims[A]);else if(typeof le=="number")le=P(le,this.dims[A],A),ee.push([le,le+1]);else if(Array.isArray(le)&&le.length===2){let[ge,be]=le;if(ge=ge===null?0:P(ge,this.dims[A],A,!1),be=be===null?this.dims[A]:P(be,this.dims[A],A,!1),ge>be)throw new Error(`Invalid slice: ${le}`);let Ae=[Math.max(ge,0),Math.min(be,this.dims[A])];ee.push(Ae),L.push(Ae[1]-Ae[0])}else throw new Error(`Invalid slice: ${le}`)}let ue=ee.map(([A,le])=>le-A),ke=ue.reduce((A,le)=>A*le),Ie=this.data,Le=new Ie.constructor(ke),rt=this.stride(),we=!0;for(let A=1;A<ue.length;++A)if(ee[A][0]!==0||ee[A][1]!==this.dims[A]){we=!1;break}if(we){let A=ee[0][0]*rt[0],le=ee[0][1]*rt[0];if(ArrayBuffer.isView(Ie))Le.set(Ie.subarray(A,le));else if(Array.isArray(Ie)){let ge=Ie.slice(A,le);for(let be=0;be<ge.length;++be)Le[be]=ge[be]}else throw new Error("Unsupported data type for slicing")}else for(let A=0;A<ke;++A){let le=0;for(let ge=ue.length-1,be=A;ge>=0;--ge){let Ae=ue[ge];le+=(be%Ae+ee[ge][0])*rt[ge],be=Math.floor(be/Ae)}Le[A]=Ie[le]}return new i(this.type,Le,L)}permute(...R){return c(this,R)}transpose(...R){return this.permute(...R)}sum(R=null,L=!1){return this.norm(1,R,L)}norm(R="fro",L=null,ee=!1){if(R==="fro")R=2;else if(typeof R=="string")throw Error(`Unsupported norm: ${R}`);let ue=this.data,ke=(we,A)=>we+A**R;if(L===null){let we=ue.reduce(ke,0)**(1/R);return new i(this.type,[we],[])}let[Ie,Le,rt]=E(ke,this,L,ee);if(R!==1)for(let we=0;we<Le.length;++we)Le[we]=Le[we]**(1/R);return new i(Ie,Le,rt)}normalize_(R=2,L=1){L=P(L,this.dims.length);let ee=this.norm(R,L,!0),ue=this.data,ke=ee.data;for(let Ie=0;Ie<ue.length;++Ie){let Le=0;for(let rt=this.dims.length-1,we=Ie,A=1;rt>=0;--rt){let le=this.dims[rt];if(rt!==L){let ge=we%le;Le+=ge*A,A*=this.dims[rt]}we=Math.floor(we/le)}ue[Ie]/=ke[Le]}return this}normalize(R=2,L=1){return this.clone().normalize_(R,L)}stride(){return U(this.dims)}squeeze(R=null){return new 
i(this.type,this.data,C(this.dims,R))}squeeze_(R=null){return this.dims=C(this.dims,R),this}unsqueeze(R=null){return new i(this.type,this.data,y(this.dims,R))}unsqueeze_(R=null){return this.dims=y(this.dims,R),this}flatten_(R=0,L=-1){L=(L+this.dims.length)%this.dims.length;let ee=this.dims.slice(0,R),ue=this.dims.slice(R,L+1),ke=this.dims.slice(L+1);return this.dims=[...ee,ue.reduce((Ie,Le)=>Ie*Le,1),...ke],this}flatten(R=0,L=-1){return this.clone().flatten_(R,L)}view(...R){let L=-1;for(let ue=0;ue<R.length;++ue)if(R[ue]===-1){if(L!==-1)throw new Error("Only one dimension can be inferred");L=ue}let ee=this.data;if(L!==-1){let ue=R.reduce((ke,Ie,Le)=>Le!==L?ke*Ie:ke,1);R[L]=ee.length/ue}return new i(this.type,ee,R)}neg_(){let R=this.data;for(let L=0;L<R.length;++L)R[L]=-R[L];return this}neg(){return this.clone().neg_()}gt(R){let L=new Uint8Array(this.data.length),ee=this.data;for(let ue=0;ue<ee.length;++ue)L[ue]=ee[ue]>R?1:0;return new i("bool",L,this.dims)}lt(R){let L=new Uint8Array(this.data.length),ee=this.data;for(let ue=0;ue<ee.length;++ue)L[ue]=ee[ue]<R?1:0;return new i("bool",L,this.dims)}clamp_(R,L){let ee=this.data;for(let ue=0;ue<ee.length;++ue)ee[ue]=Math.min(Math.max(ee[ue],R),L);return this}clamp(R,L){return this.clone().clamp_(R,L)}round_(){let R=this.data;for(let L=0;L<R.length;++L)R[L]=Math.round(R[L]);return this}round(){return this.clone().round_()}mean(R=null,L=!1){return O(this,R,L)}min(R=null,L=!1){if(R===null){let Ie=(0,s.min)(this.data)[0];return new i(this.type,[Ie],[])}let[ee,ue,ke]=E((Ie,Le)=>Math.min(Ie,Le),this,R,L,1/0);return new i(ee,ue,ke)}max(R=null,L=!1){if(R===null){let Ie=(0,s.max)(this.data)[0];return new i(this.type,[Ie],[])}let[ee,ue,ke]=E((Ie,Le)=>Math.max(Ie,Le),this,R,L,-1/0);return new i(ee,ue,ke)}argmin(R=null,L=!1){if(R!==null)throw new Error("`dim !== null` not yet implemented.");let ee=(0,s.min)(this.data)[1];return new i("int64",[BigInt(ee)],[])}argmax(R=null,L=!1){if(R!==null)throw new Error("`dim !== null` not yet 
/**
 * Reshape a flat sequence into nested arrays with the given shape
 * (used by `tolist()`).
 *
 * @param {Array|TypedArray} H Flat data.
 * @param {number[]} R Target shape. An empty shape denotes a scalar and
 *   returns the single element itself.
 * @returns {*} Nested arrays of depth `R.length`, or the bare element for `R = []`.
 * @throws {Error} If the number of elements does not match the shape.
 */
function l(H, R) {
  const totalElements = H.length;
  // Start the product at 1 so an empty shape (0-d tensor) is a one-element
  // shape instead of a "reduce of empty array" TypeError.
  const expectedElements = R.reduce((product, extent) => product * extent, 1);
  if (totalElements !== expectedElements) {
    throw Error(`cannot reshape array of size ${totalElements} into shape (${R})`);
  }

  let nested = H;
  // Group from the innermost dimension outwards; each pass wraps one more level.
  for (let axis = R.length - 1; axis >= 0; axis--) {
    nested = nested.reduce(
      (groups, item) => {
        const current = groups[groups.length - 1];
        if (current.length < R[axis]) {
          current.push(item);
        } else {
          groups.push([item]);
        }
        return groups;
      },
      [[]],
    );
  }
  return nested[0];
}
/**
 * Compute the shape that results from squeezing size-1 dimensions.
 *
 * The input shape is never mutated.
 *
 * @param {number[]} H Current shape.
 * @param {number|number[]|null} R Which axes to squeeze:
 *   - `null`: remove every dimension of size 1;
 *   - a number: remove that axis if its size is 1;
 *   - an array: remove each listed axis whose size is 1.
 *   Negative axes count from the end (`-1` is the last axis), matching how the
 *   unsqueeze helper in this module treats negative indices. Axes that are
 *   out of range, or whose size is not 1, are left untouched.
 * @returns {number[]} The squeezed shape (a new array).
 */
function C(H, R) {
  const dims = H.slice();
  const rank = dims.length;
  const normalizeAxis = (axis) => (typeof axis === "number" && axis < 0 ? axis + rank : axis);

  if (R === null) {
    return dims.filter((extent) => extent !== 1);
  }

  if (typeof R == "number") {
    const axis = normalizeAxis(R);
    if (dims[axis] === 1) {
      dims.splice(axis, 1);
    }
    return dims;
  }

  if (Array.isArray(R)) {
    const axes = new Set(R.map(normalizeAxis));
    return dims.filter((extent, axis) => extent !== 1 || !axes.has(axis));
  }

  return dims;
}
/**
 * Compute row-major strides for a shape.
 *
 * The last axis gets stride 1 and every earlier axis gets the product of the
 * extents that follow it.
 *
 * @param {number[]} H Shape.
 * @returns {number[]} Strides, one per axis.
 */
function U(H) {
  const strides = new Array(H.length);
  let step = 1;
  let axis = H.length;
  while (axis-- > 0) {
    strides[axis] = step;
    step *= H[axis];
  }
  return strides;
}
/**
 * Load a video in the browser and sample frames from it (exported as `load_video`).
 *
 * A detached `<video>` element is pointed at the source, then seeked to each
 * sample time; every frame is drawn onto a canvas and captured as a 4-channel
 * `RawImage` wrapped in a frame object carrying its timestamp.
 *
 * Sampling: with `num_frames` the samples are spread evenly from 0 to the
 * duration (a single frame is taken at the midpoint); otherwise one sample is
 * taken every `1 / fps` seconds.
 *
 * @param {string|Blob|HTMLVideoElement} l Video URL, blob, or an existing video element (its `src` is reused).
 * @param {object} [options]
 * @param {number|null} [options.num_frames=null] Number of frames to sample.
 * @param {number|null} [options.fps=null] Sampling rate, used when `num_frames` is not given.
 * @returns {Promise<object>} The sampled frames together with the video duration.
 * @throws {Error} Outside the browser, when neither option is given, for an
 *   unsupported source type, or when the media fails to load or seek.
 */
async function i(l, { num_frames: c = null, fps: _ = null } = {}) {
  if (!o.apis.IS_BROWSER_ENV) {
    throw new Error("`load_video` is currently only supported in browser environments.");
  }
  if (c == null && _ == null) {
    throw new Error("Either num_frames or fps must be provided.");
  }

  const frames = [];
  const video = document.createElement("video");
  video.crossOrigin = "anonymous";
  video.muted = true;

  // Object URLs created here keep their blobs alive until revoked, so track
  // them and release them once sampling is finished (or has failed).
  const ownedUrls = [];
  const createOwnedUrl = (blob) => {
    const url = URL.createObjectURL(blob);
    ownedUrls.push(url);
    return url;
  };

  // Wait for one media event, rejecting on a media error so that a broken
  // source surfaces as an exception instead of a promise that never settles.
  const nextEvent = (handlerName, action) =>
    new Promise((resolve, reject) => {
      video[handlerName] = resolve;
      video.onerror = () => reject(new Error(`Failed to ${action} video.`));
    });

  try {
    if (typeof l == "string") {
      video.src = l;
    } else if (l instanceof Blob) {
      video.src = createOwnedUrl(l);
    } else if (l instanceof HTMLVideoElement) {
      video.src = l.src;
    } else {
      throw new Error("Invalid URL or video element provided.");
    }

    await nextEvent("onloadedmetadata", "load");

    // An empty seekable range means the source cannot be seeked as-is;
    // download it fully and play it back from a local blob instead.
    if (video.seekable.start(0) === video.seekable.end(0)) {
      const response = await fetch(video.src);
      const blob = await response.blob();
      video.src = createOwnedUrl(blob);
      await nextEvent("onloadedmetadata", "load");
    }

    const duration = video.duration;
    let frameCount;
    let step;
    if (c != null) {
      frameCount = c;
      step = c === 1 ? 0 : duration / (c - 1);
    } else {
      step = 1 / _;
      frameCount = Math.floor(duration / step);
    }

    const sampleTimes = [];
    for (let index = 0; index < frameCount; ++index) {
      sampleTimes.push(c === 1 ? duration / 2 : index * step);
    }

    const canvas = document.createElement("canvas");
    canvas.width = video.videoWidth;
    canvas.height = video.videoHeight;
    const context = canvas.getContext("2d", { willReadFrequently: true });

    for (const time of sampleTimes) {
      video.currentTime = time;
      await nextEvent("onseeked", "seek");
      context.drawImage(video, 0, 0, canvas.width, canvas.height);
      const pixels = context.getImageData(0, 0, canvas.width, canvas.height);
      const image = new s.RawImage(pixels.data, canvas.width, canvas.height, 4);
      frames.push(new a(image, time));
    }

    return new n(frames, duration);
  } finally {
    video.remove();
    for (const url of ownedUrls) {
      URL.revokeObjectURL(url);
    }
  }
}
p={};(()=>{Vt.r(p),Vt.d(p,{ASTFeatureExtractor:()=>u.ASTFeatureExtractor,ASTForAudioClassification:()=>t.ASTForAudioClassification,ASTModel:()=>t.ASTModel,ASTPreTrainedModel:()=>t.ASTPreTrainedModel,AlbertForMaskedLM:()=>t.AlbertForMaskedLM,AlbertForQuestionAnswering:()=>t.AlbertForQuestionAnswering,AlbertForSequenceClassification:()=>t.AlbertForSequenceClassification,AlbertModel:()=>t.AlbertModel,AlbertPreTrainedModel:()=>t.AlbertPreTrainedModel,AlbertTokenizer:()=>s.AlbertTokenizer,ArceeForCausalLM:()=>t.ArceeForCausalLM,ArceeModel:()=>t.ArceeModel,ArceePreTrainedModel:()=>t.ArceePreTrainedModel,AudioClassificationPipeline:()=>r.AudioClassificationPipeline,AutoConfig:()=>o.AutoConfig,AutoFeatureExtractor:()=>d.AutoFeatureExtractor,AutoImageProcessor:()=>x.AutoImageProcessor,AutoModel:()=>t.AutoModel,AutoModelForAudioClassification:()=>t.AutoModelForAudioClassification,AutoModelForAudioFrameClassification:()=>t.AutoModelForAudioFrameClassification,AutoModelForAudioTextToText:()=>t.AutoModelForAudioTextToText,AutoModelForCTC:()=>t.AutoModelForCTC,AutoModelForCausalLM:()=>t.AutoModelForCausalLM,AutoModelForDepthEstimation:()=>t.AutoModelForDepthEstimation,AutoModelForDocumentQuestionAnswering:()=>t.AutoModelForDocumentQuestionAnswering,AutoModelForImageClassification:()=>t.AutoModelForImageClassification,AutoModelForImageFeatureExtraction:()=>t.AutoModelForImageFeatureExtraction,AutoModelForImageMatting:()=>t.AutoModelForImageMatting,AutoModelForImageSegmentation:()=>t.AutoModelForImageSegmentation,AutoModelForImageTextToText:()=>t.AutoModelForImageTextToText,AutoModelForImageToImage:()=>t.AutoModelForImageToImage,AutoModelForMaskGeneration:()=>t.AutoModelForMaskGeneration,AutoModelForMaskedLM:()=>t.AutoModelForMaskedLM,AutoModelForNormalEstimation:()=>t.AutoModelForNormalEstimation,AutoModelForObjectDetection:()=>t.AutoModelForObjectDetection,AutoModelForPoseEstimation:()=>t.AutoModelForPoseEstimation,AutoModelForQuestionAnswering:()=>t.AutoModelForQuestionAnswering
,AutoModelForSemanticSegmentation:()=>t.AutoModelForSemanticSegmentation,AutoModelForSeq2SeqLM:()=>t.AutoModelForSeq2SeqLM,AutoModelForSequenceClassification:()=>t.AutoModelForSequenceClassification,AutoModelForSpeechSeq2Seq:()=>t.AutoModelForSpeechSeq2Seq,AutoModelForTextToSpectrogram:()=>t.AutoModelForTextToSpectrogram,AutoModelForTextToWaveform:()=>t.AutoModelForTextToWaveform,AutoModelForTokenClassification:()=>t.AutoModelForTokenClassification,AutoModelForUniversalSegmentation:()=>t.AutoModelForUniversalSegmentation,AutoModelForVision2Seq:()=>t.AutoModelForVision2Seq,AutoModelForXVector:()=>t.AutoModelForXVector,AutoModelForZeroShotObjectDetection:()=>t.AutoModelForZeroShotObjectDetection,AutoProcessor:()=>b.AutoProcessor,AutoTokenizer:()=>s.AutoTokenizer,AutomaticSpeechRecognitionPipeline:()=>r.AutomaticSpeechRecognitionPipeline,BackgroundRemovalPipeline:()=>r.BackgroundRemovalPipeline,BartForConditionalGeneration:()=>t.BartForConditionalGeneration,BartForSequenceClassification:()=>t.BartForSequenceClassification,BartModel:()=>t.BartModel,BartPretrainedModel:()=>t.BartPretrainedModel,BartTokenizer:()=>s.BartTokenizer,BaseModelOutput:()=>t.BaseModelOutput,BaseStreamer:()=>C.BaseStreamer,BeitFeatureExtractor:()=>h.BeitFeatureExtractor,BeitForImageClassification:()=>t.BeitForImageClassification,BeitModel:()=>t.BeitModel,BeitPreTrainedModel:()=>t.BeitPreTrainedModel,BertForMaskedLM:()=>t.BertForMaskedLM,BertForQuestionAnswering:()=>t.BertForQuestionAnswering,BertForSequenceClassification:()=>t.BertForSequenceClassification,BertForTokenClassification:()=>t.BertForTokenClassification,BertModel:()=>t.BertModel,BertPreTrainedModel:()=>t.BertPreTrainedModel,BertTokenizer:()=>s.BertTokenizer,BitImageProcessor:()=>h.BitImageProcessor,BlenderbotForConditionalGeneration:()=>t.BlenderbotForConditionalGeneration,BlenderbotModel:()=>t.BlenderbotModel,BlenderbotPreTrainedModel:()=>t.BlenderbotPreTrainedModel,BlenderbotSmallForConditionalGeneration:()=>t.BlenderbotSmallForCondi
tionalGeneration,BlenderbotSmallModel:()=>t.BlenderbotSmallModel,BlenderbotSmallPreTrainedModel:()=>t.BlenderbotSmallPreTrainedModel,BlenderbotSmallTokenizer:()=>s.BlenderbotSmallTokenizer,BlenderbotTokenizer:()=>s.BlenderbotTokenizer,BloomForCausalLM:()=>t.BloomForCausalLM,BloomModel:()=>t.BloomModel,BloomPreTrainedModel:()=>t.BloomPreTrainedModel,BloomTokenizer:()=>s.BloomTokenizer,CLIPFeatureExtractor:()=>h.CLIPFeatureExtractor,CLIPImageProcessor:()=>h.CLIPImageProcessor,CLIPModel:()=>t.CLIPModel,CLIPPreTrainedModel:()=>t.CLIPPreTrainedModel,CLIPSegForImageSegmentation:()=>t.CLIPSegForImageSegmentation,CLIPSegModel:()=>t.CLIPSegModel,CLIPSegPreTrainedModel:()=>t.CLIPSegPreTrainedModel,CLIPTextModel:()=>t.CLIPTextModel,CLIPTextModelWithProjection:()=>t.CLIPTextModelWithProjection,CLIPTokenizer:()=>s.CLIPTokenizer,CLIPVisionModel:()=>t.CLIPVisionModel,CLIPVisionModelWithProjection:()=>t.CLIPVisionModelWithProjection,CamembertForMaskedLM:()=>t.CamembertForMaskedLM,CamembertForQuestionAnswering:()=>t.CamembertForQuestionAnswering,CamembertForSequenceClassification:()=>t.CamembertForSequenceClassification,CamembertForTokenClassification:()=>t.CamembertForTokenClassification,CamembertModel:()=>t.CamembertModel,CamembertPreTrainedModel:()=>t.CamembertPreTrainedModel,CamembertTokenizer:()=>s.CamembertTokenizer,CausalLMOutput:()=>t.CausalLMOutput,CausalLMOutputWithPast:()=>t.CausalLMOutputWithPast,ChineseCLIPFeatureExtractor:()=>h.ChineseCLIPFeatureExtractor,ChineseCLIPModel:()=>t.ChineseCLIPModel,ChineseCLIPPreTrainedModel:()=>t.ChineseCLIPPreTrainedModel,ClapAudioModelWithProjection:()=>t.ClapAudioModelWithProjection,ClapFeatureExtractor:()=>u.ClapFeatureExtractor,ClapModel:()=>t.ClapModel,ClapPreTrainedModel:()=>t.ClapPreTrainedModel,ClapTextModelWithProjection:()=>t.ClapTextModelWithProjection,ClassifierFreeGuidanceLogitsProcessor:()=>P.ClassifierFreeGuidanceLogitsProcessor,CodeGenForCausalLM:()=>t.CodeGenForCausalLM,CodeGenModel:()=>t.CodeGenModel,CodeGenPreTrainedMo
del:()=>t.CodeGenPreTrainedModel,CodeGenTokenizer:()=>s.CodeGenTokenizer,CodeLlamaTokenizer:()=>s.CodeLlamaTokenizer,CohereForCausalLM:()=>t.CohereForCausalLM,CohereModel:()=>t.CohereModel,CoherePreTrainedModel:()=>t.CoherePreTrainedModel,CohereTokenizer:()=>s.CohereTokenizer,ConvBertForMaskedLM:()=>t.ConvBertForMaskedLM,ConvBertForQuestionAnswering:()=>t.ConvBertForQuestionAnswering,ConvBertForSequenceClassification:()=>t.ConvBertForSequenceClassification,ConvBertForTokenClassification:()=>t.ConvBertForTokenClassification,ConvBertModel:()=>t.ConvBertModel,ConvBertPreTrainedModel:()=>t.ConvBertPreTrainedModel,ConvBertTokenizer:()=>s.ConvBertTokenizer,ConvNextFeatureExtractor:()=>h.ConvNextFeatureExtractor,ConvNextForImageClassification:()=>t.ConvNextForImageClassification,ConvNextImageProcessor:()=>h.ConvNextImageProcessor,ConvNextModel:()=>t.ConvNextModel,ConvNextPreTrainedModel:()=>t.ConvNextPreTrainedModel,ConvNextV2ForImageClassification:()=>t.ConvNextV2ForImageClassification,ConvNextV2Model:()=>t.ConvNextV2Model,ConvNextV2PreTrainedModel:()=>t.ConvNextV2PreTrainedModel,DFineForObjectDetection:()=>t.DFineForObjectDetection,DFineModel:()=>t.DFineModel,DFinePreTrainedModel:()=>t.DFinePreTrainedModel,DINOv3ConvNextModel:()=>t.DINOv3ConvNextModel,DINOv3ConvNextPreTrainedModel:()=>t.DINOv3ConvNextPreTrainedModel,DINOv3ViTImageProcessor:()=>h.DINOv3ViTImageProcessor,DINOv3ViTModel:()=>t.DINOv3ViTModel,DINOv3ViTPreTrainedModel:()=>t.DINOv3ViTPreTrainedModel,DPTFeatureExtractor:()=>h.DPTFeatureExtractor,DPTForDepthEstimation:()=>t.DPTForDepthEstimation,DPTImageProcessor:()=>h.DPTImageProcessor,DPTModel:()=>t.DPTModel,DPTPreTrainedModel:()=>t.DPTPreTrainedModel,DacDecoderModel:()=>t.DacDecoderModel,DacDecoderOutput:()=>t.DacDecoderOutput,DacEncoderModel:()=>t.DacEncoderModel,DacEncoderOutput:()=>t.DacEncoderOutput,DacFeatureExtractor:()=>u.DacFeatureExtractor,DacModel:()=>t.DacModel,DacPreTrainedModel:()=>t.DacPreTrainedModel,DataTypeMap:()=>l.DataTypeMap,DebertaForMaske
dLM:()=>t.DebertaForMaskedLM,DebertaForQuestionAnswering:()=>t.DebertaForQuestionAnswering,DebertaForSequenceClassification:()=>t.DebertaForSequenceClassification,DebertaForTokenClassification:()=>t.DebertaForTokenClassification,DebertaModel:()=>t.DebertaModel,DebertaPreTrainedModel:()=>t.DebertaPreTrainedModel,DebertaTokenizer:()=>s.DebertaTokenizer,DebertaV2ForMaskedLM:()=>t.DebertaV2ForMaskedLM,DebertaV2ForQuestionAnswering:()=>t.DebertaV2ForQuestionAnswering,DebertaV2ForSequenceClassification:()=>t.DebertaV2ForSequenceClassification,DebertaV2ForTokenClassification:()=>t.DebertaV2ForTokenClassification,DebertaV2Model:()=>t.DebertaV2Model,DebertaV2PreTrainedModel:()=>t.DebertaV2PreTrainedModel,DebertaV2Tokenizer:()=>s.DebertaV2Tokenizer,DecisionTransformerModel:()=>t.DecisionTransformerModel,DecisionTransformerPreTrainedModel:()=>t.DecisionTransformerPreTrainedModel,DeiTFeatureExtractor:()=>h.DeiTFeatureExtractor,DeiTForImageClassification:()=>t.DeiTForImageClassification,DeiTImageProcessor:()=>h.DeiTImageProcessor,DeiTModel:()=>t.DeiTModel,DeiTPreTrainedModel:()=>t.DeiTPreTrainedModel,DepthAnythingForDepthEstimation:()=>t.DepthAnythingForDepthEstimation,DepthAnythingPreTrainedModel:()=>t.DepthAnythingPreTrainedModel,DepthEstimationPipeline:()=>r.DepthEstimationPipeline,DepthProForDepthEstimation:()=>t.DepthProForDepthEstimation,DepthProPreTrainedModel:()=>t.DepthProPreTrainedModel,DetrFeatureExtractor:()=>h.DetrFeatureExtractor,DetrForObjectDetection:()=>t.DetrForObjectDetection,DetrForSegmentation:()=>t.DetrForSegmentation,DetrImageProcessor:()=>h.DetrImageProcessor,DetrModel:()=>t.DetrModel,DetrObjectDetectionOutput:()=>t.DetrObjectDetectionOutput,DetrPreTrainedModel:()=>t.DetrPreTrainedModel,DetrSegmentationOutput:()=>t.DetrSegmentationOutput,Dinov2ForImageClassification:()=>t.Dinov2ForImageClassification,Dinov2Model:()=>t.Dinov2Model,Dinov2PreTrainedModel:()=>t.Dinov2PreTrainedModel,Dinov2WithRegistersForImageClassification:()=>t.Dinov2WithRegistersForImageCl
assification,Dinov2WithRegistersModel:()=>t.Dinov2WithRegistersModel,Dinov2WithRegistersPreTrainedModel:()=>t.Dinov2WithRegistersPreTrainedModel,DistilBertForMaskedLM:()=>t.DistilBertForMaskedLM,DistilBertForQuestionAnswering:()=>t.DistilBertForQuestionAnswering,DistilBertForSequenceClassification:()=>t.DistilBertForSequenceClassification,DistilBertForTokenClassification:()=>t.DistilBertForTokenClassification,DistilBertModel:()=>t.DistilBertModel,DistilBertPreTrainedModel:()=>t.DistilBertPreTrainedModel,DistilBertTokenizer:()=>s.DistilBertTokenizer,DocumentQuestionAnsweringPipeline:()=>r.DocumentQuestionAnsweringPipeline,DonutFeatureExtractor:()=>h.DonutFeatureExtractor,DonutImageProcessor:()=>h.DonutImageProcessor,DonutSwinModel:()=>t.DonutSwinModel,DonutSwinPreTrainedModel:()=>t.DonutSwinPreTrainedModel,EdgeTamModel:()=>t.EdgeTamModel,EfficientNetForImageClassification:()=>t.EfficientNetForImageClassification,EfficientNetImageProcessor:()=>h.EfficientNetImageProcessor,EfficientNetModel:()=>t.EfficientNetModel,EfficientNetPreTrainedModel:()=>t.EfficientNetPreTrainedModel,ElectraForMaskedLM:()=>t.ElectraForMaskedLM,ElectraForQuestionAnswering:()=>t.ElectraForQuestionAnswering,ElectraForSequenceClassification:()=>t.ElectraForSequenceClassification,ElectraForTokenClassification:()=>t.ElectraForTokenClassification,ElectraModel:()=>t.ElectraModel,ElectraPreTrainedModel:()=>t.ElectraPreTrainedModel,ElectraTokenizer:()=>s.ElectraTokenizer,EncodecFeatureExtractor:()=>u.EncodecFeatureExtractor,EosTokenCriteria:()=>y.EosTokenCriteria,Ernie4_5ForCausalLM:()=>t.Ernie4_5ForCausalLM,Ernie4_5Model:()=>t.Ernie4_5Model,Ernie4_5PreTrainedModel:()=>t.Ernie4_5PreTrainedModel,EsmForMaskedLM:()=>t.EsmForMaskedLM,EsmForSequenceClassification:()=>t.EsmForSequenceClassification,EsmForTokenClassification:()=>t.EsmForTokenClassification,EsmModel:()=>t.EsmModel,EsmPreTrainedModel:()=>t.EsmPreTrainedModel,EsmTokenizer:()=>s.EsmTokenizer,ExaoneForCausalLM:()=>t.ExaoneForCausalLM,ExaoneModel:()=
>t.ExaoneModel,ExaonePreTrainedModel:()=>t.ExaonePreTrainedModel,FFT:()=>c.FFT,FalconForCausalLM:()=>t.FalconForCausalLM,FalconModel:()=>t.FalconModel,FalconPreTrainedModel:()=>t.FalconPreTrainedModel,FalconTokenizer:()=>s.FalconTokenizer,FastViTForImageClassification:()=>t.FastViTForImageClassification,FastViTModel:()=>t.FastViTModel,FastViTPreTrainedModel:()=>t.FastViTPreTrainedModel,FeatureExtractionPipeline:()=>r.FeatureExtractionPipeline,FeatureExtractor:()=>_.FeatureExtractor,FillMaskPipeline:()=>r.FillMaskPipeline,Florence2ForConditionalGeneration:()=>t.Florence2ForConditionalGeneration,Florence2PreTrainedModel:()=>t.Florence2PreTrainedModel,Florence2Processor:()=>v.Florence2Processor,ForcedBOSTokenLogitsProcessor:()=>P.ForcedBOSTokenLogitsProcessor,ForcedEOSTokenLogitsProcessor:()=>P.ForcedEOSTokenLogitsProcessor,GLPNFeatureExtractor:()=>h.GLPNFeatureExtractor,GLPNForDepthEstimation:()=>t.GLPNForDepthEstimation,GLPNModel:()=>t.GLPNModel,GLPNPreTrainedModel:()=>t.GLPNPreTrainedModel,GPT2LMHeadModel:()=>t.GPT2LMHeadModel,GPT2Model:()=>t.GPT2Model,GPT2PreTrainedModel:()=>t.GPT2PreTrainedModel,GPT2Tokenizer:()=>s.GPT2Tokenizer,GPTBigCodeForCausalLM:()=>t.GPTBigCodeForCausalLM,GPTBigCodeModel:()=>t.GPTBigCodeModel,GPTBigCodePreTrainedModel:()=>t.GPTBigCodePreTrainedModel,GPTJForCausalLM:()=>t.GPTJForCausalLM,GPTJModel:()=>t.GPTJModel,GPTJPreTrainedModel:()=>t.GPTJPreTrainedModel,GPTNeoForCausalLM:()=>t.GPTNeoForCausalLM,GPTNeoModel:()=>t.GPTNeoModel,GPTNeoPreTrainedModel:()=>t.GPTNeoPreTrainedModel,GPTNeoXForCausalLM:()=>t.GPTNeoXForCausalLM,GPTNeoXModel:()=>t.GPTNeoXModel,GPTNeoXPreTrainedModel:()=>t.GPTNeoXPreTrainedModel,GPTNeoXTokenizer:()=>s.GPTNeoXTokenizer,Gemma2ForCausalLM:()=>t.Gemma2ForCausalLM,Gemma2Model:()=>t.Gemma2Model,Gemma2PreTrainedModel:()=>t.Gemma2PreTrainedModel,Gemma3ForCausalLM:()=>t.Gemma3ForCausalLM,Gemma3Model:()=>t.Gemma3Model,Gemma3PreTrainedModel:()=>t.Gemma3PreTrainedModel,Gemma3nAudioFeatureExtractor:()=>u.Gemma3nAudioFeatureExtract
or,Gemma3nForConditionalGeneration:()=>t.Gemma3nForConditionalGeneration,Gemma3nPreTrainedModel:()=>t.Gemma3nPreTrainedModel,Gemma3nProcessor:()=>v.Gemma3nProcessor,GemmaForCausalLM:()=>t.GemmaForCausalLM,GemmaModel:()=>t.GemmaModel,GemmaPreTrainedModel:()=>t.GemmaPreTrainedModel,GemmaTokenizer:()=>s.GemmaTokenizer,GlmForCausalLM:()=>t.GlmForCausalLM,GlmModel:()=>t.GlmModel,GlmPreTrainedModel:()=>t.GlmPreTrainedModel,GraniteForCausalLM:()=>t.GraniteForCausalLM,GraniteModel:()=>t.GraniteModel,GraniteMoeHybridForCausalLM:()=>t.GraniteMoeHybridForCausalLM,GraniteMoeHybridModel:()=>t.GraniteMoeHybridModel,GraniteMoeHybridPreTrainedModel:()=>t.GraniteMoeHybridPreTrainedModel,GranitePreTrainedModel:()=>t.GranitePreTrainedModel,Grok1Tokenizer:()=>s.Grok1Tokenizer,GroundingDinoForObjectDetection:()=>t.GroundingDinoForObjectDetection,GroundingDinoImageProcessor:()=>h.GroundingDinoImageProcessor,GroundingDinoPreTrainedModel:()=>t.GroundingDinoPreTrainedModel,GroundingDinoProcessor:()=>v.GroundingDinoProcessor,GroupViTModel:()=>t.GroupViTModel,GroupViTPreTrainedModel:()=>t.GroupViTPreTrainedModel,HeliumForCausalLM:()=>t.HeliumForCausalLM,HeliumModel:()=>t.HeliumModel,HeliumPreTrainedModel:()=>t.HeliumPreTrainedModel,HerbertTokenizer:()=>s.HerbertTokenizer,HieraForImageClassification:()=>t.HieraForImageClassification,HieraModel:()=>t.HieraModel,HieraPreTrainedModel:()=>t.HieraPreTrainedModel,HubertForCTC:()=>t.HubertForCTC,HubertForSequenceClassification:()=>t.HubertForSequenceClassification,HubertModel:()=>t.HubertModel,HubertPreTrainedModel:()=>t.HubertPreTrainedModel,IJepaForImageClassification:()=>t.IJepaForImageClassification,IJepaModel:()=>t.IJepaModel,IJepaPreTrainedModel:()=>t.IJepaPreTrainedModel,Idefics3ForConditionalGeneration:()=>t.Idefics3ForConditionalGeneration,Idefics3ImageProcessor:()=>h.Idefics3ImageProcessor,Idefics3PreTrainedModel:()=>t.Idefics3PreTrainedModel,Idefics3Processor:()=>v.Idefics3Processor,ImageClassificationPipeline:()=>r.ImageClassificationPipe
line,ImageFeatureExtractionPipeline:()=>r.ImageFeatureExtractionPipeline,ImageFeatureExtractor:()=>u.ImageFeatureExtractor,ImageMattingOutput:()=>t.ImageMattingOutput,ImageProcessor:()=>g.ImageProcessor,ImageSegmentationPipeline:()=>r.ImageSegmentationPipeline,ImageToImagePipeline:()=>r.ImageToImagePipeline,ImageToTextPipeline:()=>r.ImageToTextPipeline,InterruptableStoppingCriteria:()=>y.InterruptableStoppingCriteria,JAISLMHeadModel:()=>t.JAISLMHeadModel,JAISModel:()=>t.JAISModel,JAISPreTrainedModel:()=>t.JAISPreTrainedModel,JinaCLIPImageProcessor:()=>h.JinaCLIPImageProcessor,JinaCLIPModel:()=>t.JinaCLIPModel,JinaCLIPPreTrainedModel:()=>t.JinaCLIPPreTrainedModel,JinaCLIPProcessor:()=>v.JinaCLIPProcessor,JinaCLIPTextModel:()=>t.JinaCLIPTextModel,JinaCLIPVisionModel:()=>t.JinaCLIPVisionModel,Lfm2ForCausalLM:()=>t.Lfm2ForCausalLM,Lfm2Model:()=>t.Lfm2Model,Lfm2PreTrainedModel:()=>t.Lfm2PreTrainedModel,LiteWhisperForConditionalGeneration:()=>t.LiteWhisperForConditionalGeneration,Llama4ForCausalLM:()=>t.Llama4ForCausalLM,Llama4PreTrainedModel:()=>t.Llama4PreTrainedModel,LlamaForCausalLM:()=>t.LlamaForCausalLM,LlamaModel:()=>t.LlamaModel,LlamaPreTrainedModel:()=>t.LlamaPreTrainedModel,LlamaTokenizer:()=>s.LlamaTokenizer,LlavaForConditionalGeneration:()=>t.LlavaForConditionalGeneration,LlavaOnevisionForConditionalGeneration:()=>t.LlavaOnevisionForConditionalGeneration,LlavaOnevisionImageProcessor:()=>h.LlavaOnevisionImageProcessor,LlavaPreTrainedModel:()=>t.LlavaPreTrainedModel,LlavaProcessor:()=>v.LlavaProcessor,LlavaQwen2ForCausalLM:()=>t.LlavaQwen2ForCausalLM,LogitsProcessor:()=>P.LogitsProcessor,LogitsProcessorList:()=>P.LogitsProcessorList,LogitsWarper:()=>P.LogitsWarper,LongT5ForConditionalGeneration:()=>t.LongT5ForConditionalGeneration,LongT5Model:()=>t.LongT5Model,LongT5PreTrainedModel:()=>t.LongT5PreTrainedModel,M2M100ForConditionalGeneration:()=>t.M2M100ForConditionalGeneration,M2M100Model:()=>t.M2M100Model,M2M100PreTrainedModel:()=>t.M2M100PreTrainedModel,M2M100T
okenizer:()=>s.M2M100Tokenizer,MBart50Tokenizer:()=>s.MBart50Tokenizer,MBartForCausalLM:()=>t.MBartForCausalLM,MBartForConditionalGeneration:()=>t.MBartForConditionalGeneration,MBartForSequenceClassification:()=>t.MBartForSequenceClassification,MBartModel:()=>t.MBartModel,MBartPreTrainedModel:()=>t.MBartPreTrainedModel,MBartTokenizer:()=>s.MBartTokenizer,MPNetForMaskedLM:()=>t.MPNetForMaskedLM,MPNetForQuestionAnswering:()=>t.MPNetForQuestionAnswering,MPNetForSequenceClassification:()=>t.MPNetForSequenceClassification,MPNetForTokenClassification:()=>t.MPNetForTokenClassification,MPNetModel:()=>t.MPNetModel,MPNetPreTrainedModel:()=>t.MPNetPreTrainedModel,MPNetTokenizer:()=>s.MPNetTokenizer,MT5ForConditionalGeneration:()=>t.MT5ForConditionalGeneration,MT5Model:()=>t.MT5Model,MT5PreTrainedModel:()=>t.MT5PreTrainedModel,MarianMTModel:()=>t.MarianMTModel,MarianModel:()=>t.MarianModel,MarianPreTrainedModel:()=>t.MarianPreTrainedModel,MarianTokenizer:()=>s.MarianTokenizer,Mask2FormerImageProcessor:()=>h.Mask2FormerImageProcessor,MaskFormerFeatureExtractor:()=>h.MaskFormerFeatureExtractor,MaskFormerForInstanceSegmentation:()=>t.MaskFormerForInstanceSegmentation,MaskFormerImageProcessor:()=>h.MaskFormerImageProcessor,MaskFormerModel:()=>t.MaskFormerModel,MaskFormerPreTrainedModel:()=>t.MaskFormerPreTrainedModel,MaskedLMOutput:()=>t.MaskedLMOutput,MaxLengthCriteria:()=>y.MaxLengthCriteria,Metric3DForDepthEstimation:()=>t.Metric3DForDepthEstimation,Metric3DPreTrainedModel:()=>t.Metric3DPreTrainedModel,Metric3Dv2ForDepthEstimation:()=>t.Metric3Dv2ForDepthEstimation,Metric3Dv2PreTrainedModel:()=>t.Metric3Dv2PreTrainedModel,MgpstrForSceneTextRecognition:()=>t.MgpstrForSceneTextRecognition,MgpstrModelOutput:()=>t.MgpstrModelOutput,MgpstrPreTrainedModel:()=>t.MgpstrPreTrainedModel,MgpstrProcessor:()=>v.MgpstrProcessor,MgpstrTokenizer:()=>s.MgpstrTokenizer,MimiDecoderModel:()=>t.MimiDecoderModel,MimiDecoderOutput:()=>t.MimiDecoderOutput,MimiEncoderModel:()=>t.MimiEncoderModel,MimiEnc
oderOutput:()=>t.MimiEncoderOutput,MimiModel:()=>t.MimiModel,MimiPreTrainedModel:()=>t.MimiPreTrainedModel,MinLengthLogitsProcessor:()=>P.MinLengthLogitsProcessor,MinNewTokensLengthLogitsProcessor:()=>P.MinNewTokensLengthLogitsProcessor,Ministral3ForCausalLM:()=>t.Ministral3ForCausalLM,Ministral3Model:()=>t.Ministral3Model,Ministral3PreTrainedModel:()=>t.Ministral3PreTrainedModel,MinistralForCausalLM:()=>t.MinistralForCausalLM,MinistralModel:()=>t.MinistralModel,MinistralPreTrainedModel:()=>t.MinistralPreTrainedModel,Mistral3ForConditionalGeneration:()=>t.Mistral3ForConditionalGeneration,MistralForCausalLM:()=>t.MistralForCausalLM,MistralModel:()=>t.MistralModel,MistralPreTrainedModel:()=>t.MistralPreTrainedModel,MobileBertForMaskedLM:()=>t.MobileBertForMaskedLM,MobileBertForQuestionAnswering:()=>t.MobileBertForQuestionAnswering,MobileBertForSequenceClassification:()=>t.MobileBertForSequenceClassification,MobileBertModel:()=>t.MobileBertModel,MobileBertPreTrainedModel:()=>t.MobileBertPreTrainedModel,MobileBertTokenizer:()=>s.MobileBertTokenizer,MobileLLMForCausalLM:()=>t.MobileLLMForCausalLM,MobileLLMModel:()=>t.MobileLLMModel,MobileLLMPreTrainedModel:()=>t.MobileLLMPreTrainedModel,MobileNetV1FeatureExtractor:()=>h.MobileNetV1FeatureExtractor,MobileNetV1ForImageClassification:()=>t.MobileNetV1ForImageClassification,MobileNetV1ForSemanticSegmentation:()=>t.MobileNetV1ForSemanticSegmentation,MobileNetV1ImageProcessor:()=>h.MobileNetV1ImageProcessor,MobileNetV1Model:()=>t.MobileNetV1Model,MobileNetV1PreTrainedModel:()=>t.MobileNetV1PreTrainedModel,MobileNetV2FeatureExtractor:()=>h.MobileNetV2FeatureExtractor,MobileNetV2ForImageClassification:()=>t.MobileNetV2ForImageClassification,MobileNetV2ForSemanticSegmentation:()=>t.MobileNetV2ForSemanticSegmentation,MobileNetV2ImageProcessor:()=>h.MobileNetV2ImageProcessor,MobileNetV2Model:()=>t.MobileNetV2Model,MobileNetV2PreTrainedModel:()=>t.MobileNetV2PreTrainedModel,MobileNetV3FeatureExtractor:()=>h.MobileNetV3FeatureExtract
or,MobileNetV3ForImageClassification:()=>t.MobileNetV3ForImageClassification,MobileNetV3ForSemanticSegmentation:()=>t.MobileNetV3ForSemanticSegmentation,MobileNetV3ImageProcessor:()=>h.MobileNetV3ImageProcessor,MobileNetV3Model:()=>t.MobileNetV3Model,MobileNetV3PreTrainedModel:()=>t.MobileNetV3PreTrainedModel,MobileNetV4FeatureExtractor:()=>h.MobileNetV4FeatureExtractor,MobileNetV4ForImageClassification:()=>t.MobileNetV4ForImageClassification,MobileNetV4ForSemanticSegmentation:()=>t.MobileNetV4ForSemanticSegmentation,MobileNetV4ImageProcessor:()=>h.MobileNetV4ImageProcessor,MobileNetV4Model:()=>t.MobileNetV4Model,MobileNetV4PreTrainedModel:()=>t.MobileNetV4PreTrainedModel,MobileViTFeatureExtractor:()=>h.MobileViTFeatureExtractor,MobileViTForImageClassification:()=>t.MobileViTForImageClassification,MobileViTImageProcessor:()=>h.MobileViTImageProcessor,MobileViTModel:()=>t.MobileViTModel,MobileViTPreTrainedModel:()=>t.MobileViTPreTrainedModel,MobileViTV2ForImageClassification:()=>t.MobileViTV2ForImageClassification,MobileViTV2Model:()=>t.MobileViTV2Model,MobileViTV2PreTrainedModel:()=>t.MobileViTV2PreTrainedModel,ModelOutput:()=>t.ModelOutput,ModernBertDecoderForCausalLM:()=>t.ModernBertDecoderForCausalLM,ModernBertDecoderModel:()=>t.ModernBertDecoderModel,ModernBertDecoderPreTrainedModel:()=>t.ModernBertDecoderPreTrainedModel,ModernBertForMaskedLM:()=>t.ModernBertForMaskedLM,ModernBertForSequenceClassification:()=>t.ModernBertForSequenceClassification,ModernBertForTokenClassification:()=>t.ModernBertForTokenClassification,ModernBertModel:()=>t.ModernBertModel,ModernBertPreTrainedModel:()=>t.ModernBertPreTrainedModel,Moondream1ForConditionalGeneration:()=>t.Moondream1ForConditionalGeneration,MoonshineFeatureExtractor:()=>u.MoonshineFeatureExtractor,MoonshineForConditionalGeneration:()=>t.MoonshineForConditionalGeneration,MoonshineModel:()=>t.MoonshineModel,MoonshinePreTrainedModel:()=>t.MoonshinePreTrainedModel,MoonshineProcessor:()=>v.MoonshineProcessor,MptForCausalL
M:()=>t.MptForCausalLM,MptModel:()=>t.MptModel,MptPreTrainedModel:()=>t.MptPreTrainedModel,MultiModalityCausalLM:()=>t.MultiModalityCausalLM,MultiModalityPreTrainedModel:()=>t.MultiModalityPreTrainedModel,MusicgenForCausalLM:()=>t.MusicgenForCausalLM,MusicgenForConditionalGeneration:()=>t.MusicgenForConditionalGeneration,MusicgenModel:()=>t.MusicgenModel,MusicgenPreTrainedModel:()=>t.MusicgenPreTrainedModel,NanoChatForCausalLM:()=>t.NanoChatForCausalLM,NanoChatModel:()=>t.NanoChatModel,NanoChatPreTrainedModel:()=>t.NanoChatPreTrainedModel,NeoBertForMaskedLM:()=>t.NeoBertForMaskedLM,NeoBertForQuestionAnswering:()=>t.NeoBertForQuestionAnswering,NeoBertForSequenceClassification:()=>t.NeoBertForSequenceClassification,NeoBertForTokenClassification:()=>t.NeoBertForTokenClassification,NeoBertModel:()=>t.NeoBertModel,NeoBertPreTrainedModel:()=>t.NeoBertPreTrainedModel,NllbTokenizer:()=>s.NllbTokenizer,NoBadWordsLogitsProcessor:()=>P.NoBadWordsLogitsProcessor,NoRepeatNGramLogitsProcessor:()=>P.NoRepeatNGramLogitsProcessor,NomicBertModel:()=>t.NomicBertModel,NomicBertPreTrainedModel:()=>t.NomicBertPreTrainedModel,NougatImageProcessor:()=>h.NougatImageProcessor,NougatTokenizer:()=>s.NougatTokenizer,OPTForCausalLM:()=>t.OPTForCausalLM,OPTModel:()=>t.OPTModel,OPTPreTrainedModel:()=>t.OPTPreTrainedModel,ObjectDetectionPipeline:()=>r.ObjectDetectionPipeline,Olmo2ForCausalLM:()=>t.Olmo2ForCausalLM,Olmo2Model:()=>t.Olmo2Model,Olmo2PreTrainedModel:()=>t.Olmo2PreTrainedModel,OlmoForCausalLM:()=>t.OlmoForCausalLM,OlmoModel:()=>t.OlmoModel,OlmoPreTrainedModel:()=>t.OlmoPreTrainedModel,OpenELMForCausalLM:()=>t.OpenELMForCausalLM,OpenELMModel:()=>t.OpenELMModel,OpenELMPreTrainedModel:()=>t.OpenELMPreTrainedModel,OwlViTFeatureExtractor:()=>h.OwlViTFeatureExtractor,OwlViTForObjectDetection:()=>t.OwlViTForObjectDetection,OwlViTImageProcessor:()=>h.OwlViTImageProcessor,OwlViTModel:()=>t.OwlViTModel,OwlViTPreTrainedModel:()=>t.OwlViTPreTrainedModel,OwlViTProcessor:()=>v.OwlViTProcessor,Owlv2Fo
rObjectDetection:()=>t.Owlv2ForObjectDetection,Owlv2ImageProcessor:()=>h.Owlv2ImageProcessor,Owlv2Model:()=>t.Owlv2Model,Owlv2PreTrainedModel:()=>t.Owlv2PreTrainedModel,PaliGemmaForConditionalGeneration:()=>t.PaliGemmaForConditionalGeneration,PaliGemmaPreTrainedModel:()=>t.PaliGemmaPreTrainedModel,PaliGemmaProcessor:()=>v.PaliGemmaProcessor,ParakeetFeatureExtractor:()=>u.ParakeetFeatureExtractor,ParakeetForCTC:()=>t.ParakeetForCTC,ParakeetPreTrainedModel:()=>t.ParakeetPreTrainedModel,PatchTSMixerForPrediction:()=>t.PatchTSMixerForPrediction,PatchTSMixerModel:()=>t.PatchTSMixerModel,PatchTSMixerPreTrainedModel:()=>t.PatchTSMixerPreTrainedModel,PatchTSTForPrediction:()=>t.PatchTSTForPrediction,PatchTSTModel:()=>t.PatchTSTModel,PatchTSTPreTrainedModel:()=>t.PatchTSTPreTrainedModel,Phi3ForCausalLM:()=>t.Phi3ForCausalLM,Phi3Model:()=>t.Phi3Model,Phi3PreTrainedModel:()=>t.Phi3PreTrainedModel,Phi3VForCausalLM:()=>t.Phi3VForCausalLM,Phi3VImageProcessor:()=>h.Phi3VImageProcessor,Phi3VPreTrainedModel:()=>t.Phi3VPreTrainedModel,Phi3VProcessor:()=>v.Phi3VProcessor,PhiForCausalLM:()=>t.PhiForCausalLM,PhiModel:()=>t.PhiModel,PhiPreTrainedModel:()=>t.PhiPreTrainedModel,Pipeline:()=>r.Pipeline,PixtralImageProcessor:()=>h.PixtralImageProcessor,PixtralProcessor:()=>v.PixtralProcessor,PreTrainedModel:()=>t.PreTrainedModel,PreTrainedTokenizer:()=>s.PreTrainedTokenizer,PretrainedConfig:()=>o.PretrainedConfig,PretrainedMixin:()=>t.PretrainedMixin,Processor:()=>F.Processor,PvtForImageClassification:()=>t.PvtForImageClassification,PvtImageProcessor:()=>h.PvtImageProcessor,PvtModel:()=>t.PvtModel,PvtPreTrainedModel:()=>t.PvtPreTrainedModel,PyAnnoteFeatureExtractor:()=>u.PyAnnoteFeatureExtractor,PyAnnoteForAudioFrameClassification:()=>t.PyAnnoteForAudioFrameClassification,PyAnnoteModel:()=>t.PyAnnoteModel,PyAnnotePreTrainedModel:()=>t.PyAnnotePreTrainedModel,PyAnnoteProcessor:()=>v.PyAnnoteProcessor,QuestionAnsweringModelOutput:()=>t.QuestionAnsweringModelOutput,QuestionAnsweringPipeline:()=
>r.QuestionAnsweringPipeline,Qwen2ForCausalLM:()=>t.Qwen2ForCausalLM,Qwen2Model:()=>t.Qwen2Model,Qwen2PreTrainedModel:()=>t.Qwen2PreTrainedModel,Qwen2Tokenizer:()=>s.Qwen2Tokenizer,Qwen2VLForConditionalGeneration:()=>t.Qwen2VLForConditionalGeneration,Qwen2VLImageProcessor:()=>h.Qwen2VLImageProcessor,Qwen2VLPreTrainedModel:()=>t.Qwen2VLPreTrainedModel,Qwen2VLProcessor:()=>v.Qwen2VLProcessor,Qwen3ForCausalLM:()=>t.Qwen3ForCausalLM,Qwen3Model:()=>t.Qwen3Model,Qwen3PreTrainedModel:()=>t.Qwen3PreTrainedModel,RFDetrForObjectDetection:()=>t.RFDetrForObjectDetection,RFDetrModel:()=>t.RFDetrModel,RFDetrObjectDetectionOutput:()=>t.RFDetrObjectDetectionOutput,RFDetrPreTrainedModel:()=>t.RFDetrPreTrainedModel,RTDetrForObjectDetection:()=>t.RTDetrForObjectDetection,RTDetrImageProcessor:()=>h.RTDetrImageProcessor,RTDetrModel:()=>t.RTDetrModel,RTDetrObjectDetectionOutput:()=>t.RTDetrObjectDetectionOutput,RTDetrPreTrainedModel:()=>t.RTDetrPreTrainedModel,RTDetrV2ForObjectDetection:()=>t.RTDetrV2ForObjectDetection,RTDetrV2Model:()=>t.RTDetrV2Model,RTDetrV2ObjectDetectionOutput:()=>t.RTDetrV2ObjectDetectionOutput,RTDetrV2PreTrainedModel:()=>t.RTDetrV2PreTrainedModel,RawAudio:()=>a.RawAudio,RawImage:()=>n.RawImage,RawVideo:()=>i.RawVideo,RawVideoFrame:()=>i.RawVideoFrame,RepetitionPenaltyLogitsProcessor:()=>P.RepetitionPenaltyLogitsProcessor,ResNetForImageClassification:()=>t.ResNetForImageClassification,ResNetModel:()=>t.ResNetModel,ResNetPreTrainedModel:()=>t.ResNetPreTrainedModel,RoFormerForMaskedLM:()=>t.RoFormerForMaskedLM,RoFormerForQuestionAnswering:()=>t.RoFormerForQuestionAnswering,RoFormerForSequenceClassification:()=>t.RoFormerForSequenceClassification,RoFormerForTokenClassification:()=>t.RoFormerForTokenClassification,RoFormerModel:()=>t.RoFormerModel,RoFormerPreTrainedModel:()=>t.RoFormerPreTrainedModel,RoFormerTokenizer:()=>s.RoFormerTokenizer,RobertaForMaskedLM:()=>t.RobertaForMaskedLM,RobertaForQuestionAnswering:()=>t.RobertaForQuestionAnswering,RobertaForSequenceClass
ification:()=>t.RobertaForSequenceClassification,RobertaForTokenClassification:()=>t.RobertaForTokenClassification,RobertaModel:()=>t.RobertaModel,RobertaPreTrainedModel:()=>t.RobertaPreTrainedModel,RobertaTokenizer:()=>s.RobertaTokenizer,Sam2ImageProcessor:()=>h.Sam2ImageProcessor,Sam2ImageSegmentationOutput:()=>t.Sam2ImageSegmentationOutput,Sam2Model:()=>t.Sam2Model,Sam2PreTrainedModel:()=>t.Sam2PreTrainedModel,Sam2Processor:()=>v.Sam2Processor,Sam2VideoProcessor:()=>v.Sam2VideoProcessor,Sam3ImageProcessor:()=>h.Sam3ImageProcessor,Sam3TrackerModel:()=>t.Sam3TrackerModel,SamImageProcessor:()=>h.SamImageProcessor,SamImageSegmentationOutput:()=>t.SamImageSegmentationOutput,SamModel:()=>t.SamModel,SamPreTrainedModel:()=>t.SamPreTrainedModel,SamProcessor:()=>v.SamProcessor,SapiensForDepthEstimation:()=>t.SapiensForDepthEstimation,SapiensForNormalEstimation:()=>t.SapiensForNormalEstimation,SapiensForSemanticSegmentation:()=>t.SapiensForSemanticSegmentation,SapiensPreTrainedModel:()=>t.SapiensPreTrainedModel,SeamlessM4TFeatureExtractor:()=>u.SeamlessM4TFeatureExtractor,SegformerFeatureExtractor:()=>h.SegformerFeatureExtractor,SegformerForImageClassification:()=>t.SegformerForImageClassification,SegformerForSemanticSegmentation:()=>t.SegformerForSemanticSegmentation,SegformerImageProcessor:()=>h.SegformerImageProcessor,SegformerModel:()=>t.SegformerModel,SegformerPreTrainedModel:()=>t.SegformerPreTrainedModel,Seq2SeqLMOutput:()=>t.Seq2SeqLMOutput,SequenceClassifierOutput:()=>t.SequenceClassifierOutput,SiglipImageProcessor:()=>h.SiglipImageProcessor,SiglipModel:()=>t.SiglipModel,SiglipPreTrainedModel:()=>t.SiglipPreTrainedModel,SiglipTextModel:()=>t.SiglipTextModel,SiglipTokenizer:()=>s.SiglipTokenizer,SiglipVisionModel:()=>t.SiglipVisionModel,SmolLM3ForCausalLM:()=>t.SmolLM3ForCausalLM,SmolLM3Model:()=>t.SmolLM3Model,SmolLM3PreTrainedModel:()=>t.SmolLM3PreTrainedModel,SmolVLMForConditionalGeneration:()=>t.SmolVLMForConditionalGeneration,SmolVLMImageProcessor:()=>h.SmolVLM
ImageProcessor,SmolVLMProcessor:()=>v.SmolVLMProcessor,SnacDecoderModel:()=>t.SnacDecoderModel,SnacEncoderModel:()=>t.SnacEncoderModel,SnacFeatureExtractor:()=>u.SnacFeatureExtractor,SnacModel:()=>t.SnacModel,SnacPreTrainedModel:()=>t.SnacPreTrainedModel,SpeechT5FeatureExtractor:()=>u.SpeechT5FeatureExtractor,SpeechT5ForSpeechToText:()=>t.SpeechT5ForSpeechToText,SpeechT5ForTextToSpeech:()=>t.SpeechT5ForTextToSpeech,SpeechT5HifiGan:()=>t.SpeechT5HifiGan,SpeechT5Model:()=>t.SpeechT5Model,SpeechT5PreTrainedModel:()=>t.SpeechT5PreTrainedModel,SpeechT5Processor:()=>v.SpeechT5Processor,SpeechT5Tokenizer:()=>s.SpeechT5Tokenizer,SqueezeBertForMaskedLM:()=>t.SqueezeBertForMaskedLM,SqueezeBertForQuestionAnswering:()=>t.SqueezeBertForQuestionAnswering,SqueezeBertForSequenceClassification:()=>t.SqueezeBertForSequenceClassification,SqueezeBertModel:()=>t.SqueezeBertModel,SqueezeBertPreTrainedModel:()=>t.SqueezeBertPreTrainedModel,SqueezeBertTokenizer:()=>s.SqueezeBertTokenizer,StableLmForCausalLM:()=>t.StableLmForCausalLM,StableLmModel:()=>t.StableLmModel,StableLmPreTrainedModel:()=>t.StableLmPreTrainedModel,Starcoder2ForCausalLM:()=>t.Starcoder2ForCausalLM,Starcoder2Model:()=>t.Starcoder2Model,Starcoder2PreTrainedModel:()=>t.Starcoder2PreTrainedModel,StoppingCriteria:()=>y.StoppingCriteria,StoppingCriteriaList:()=>y.StoppingCriteriaList,StyleTextToSpeech2Model:()=>t.StyleTextToSpeech2Model,StyleTextToSpeech2PreTrainedModel:()=>t.StyleTextToSpeech2PreTrainedModel,SummarizationPipeline:()=>r.SummarizationPipeline,SupertonicForConditionalGeneration:()=>t.SupertonicForConditionalGeneration,SupertonicPreTrainedModel:()=>t.SupertonicPreTrainedModel,SuppressTokensAtBeginLogitsProcessor:()=>P.SuppressTokensAtBeginLogitsProcessor,Swin2SRForImageSuperResolution:()=>t.Swin2SRForImageSuperResolution,Swin2SRImageProcessor:()=>h.Swin2SRImageProcessor,Swin2SRModel:()=>t.Swin2SRModel,Swin2SRPreTrainedModel:()=>t.Swin2SRPreTrainedModel,SwinForImageClassification:()=>t.SwinForImageClassification
,SwinForSemanticSegmentation:()=>t.SwinForSemanticSegmentation,SwinModel:()=>t.SwinModel,SwinPreTrainedModel:()=>t.SwinPreTrainedModel,T5ForConditionalGeneration:()=>t.T5ForConditionalGeneration,T5Model:()=>t.T5Model,T5PreTrainedModel:()=>t.T5PreTrainedModel,T5Tokenizer:()=>s.T5Tokenizer,TableTransformerForObjectDetection:()=>t.TableTransformerForObjectDetection,TableTransformerModel:()=>t.TableTransformerModel,TableTransformerObjectDetectionOutput:()=>t.TableTransformerObjectDetectionOutput,TableTransformerPreTrainedModel:()=>t.TableTransformerPreTrainedModel,TemperatureLogitsWarper:()=>P.TemperatureLogitsWarper,Tensor:()=>l.Tensor,Text2TextGenerationPipeline:()=>r.Text2TextGenerationPipeline,TextClassificationPipeline:()=>r.TextClassificationPipeline,TextGenerationPipeline:()=>r.TextGenerationPipeline,TextStreamer:()=>C.TextStreamer,TextToAudioPipeline:()=>r.TextToAudioPipeline,TokenClassificationPipeline:()=>r.TokenClassificationPipeline,TokenClassifierOutput:()=>t.TokenClassifierOutput,TokenizerModel:()=>s.TokenizerModel,TopKLogitsWarper:()=>P.TopKLogitsWarper,TopPLogitsWarper:()=>P.TopPLogitsWarper,TrOCRForCausalLM:()=>t.TrOCRForCausalLM,TrOCRPreTrainedModel:()=>t.TrOCRPreTrainedModel,TranslationPipeline:()=>r.TranslationPipeline,UltravoxModel:()=>t.UltravoxModel,UltravoxPreTrainedModel:()=>t.UltravoxPreTrainedModel,UltravoxProcessor:()=>v.UltravoxProcessor,UniSpeechForCTC:()=>t.UniSpeechForCTC,UniSpeechForSequenceClassification:()=>t.UniSpeechForSequenceClassification,UniSpeechModel:()=>t.UniSpeechModel,UniSpeechPreTrainedModel:()=>t.UniSpeechPreTrainedModel,UniSpeechSatForAudioFrameClassification:()=>t.UniSpeechSatForAudioFrameClassification,UniSpeechSatForCTC:()=>t.UniSpeechSatForCTC,UniSpeechSatForSequenceClassification:()=>t.UniSpeechSatForSequenceClassification,UniSpeechSatModel:()=>t.UniSpeechSatModel,UniSpeechSatPreTrainedModel:()=>t.UniSpeechSatPreTrainedModel,VLChatProcessor:()=>v.VLChatProcessor,VLMImageProcessor:()=>h.VLMImageProcessor,VaultGemmaFor
CausalLM:()=>t.VaultGemmaForCausalLM,VaultGemmaModel:()=>t.VaultGemmaModel,VaultGemmaPreTrainedModel:()=>t.VaultGemmaPreTrainedModel,ViTFeatureExtractor:()=>h.ViTFeatureExtractor,ViTForImageClassification:()=>t.ViTForImageClassification,ViTImageProcessor:()=>h.ViTImageProcessor,ViTMAEModel:()=>t.ViTMAEModel,ViTMAEPreTrainedModel:()=>t.ViTMAEPreTrainedModel,ViTMSNForImageClassification:()=>t.ViTMSNForImageClassification,ViTMSNModel:()=>t.ViTMSNModel,ViTMSNPreTrainedModel:()=>t.ViTMSNPreTrainedModel,ViTModel:()=>t.ViTModel,ViTPreTrainedModel:()=>t.ViTPreTrainedModel,VisionEncoderDecoderModel:()=>t.VisionEncoderDecoderModel,VitMatteForImageMatting:()=>t.VitMatteForImageMatting,VitMatteImageProcessor:()=>h.VitMatteImageProcessor,VitMattePreTrainedModel:()=>t.VitMattePreTrainedModel,VitPoseForPoseEstimation:()=>t.VitPoseForPoseEstimation,VitPoseImageProcessor:()=>h.VitPoseImageProcessor,VitPosePreTrainedModel:()=>t.VitPosePreTrainedModel,VitsModel:()=>t.VitsModel,VitsModelOutput:()=>t.VitsModelOutput,VitsPreTrainedModel:()=>t.VitsPreTrainedModel,VitsTokenizer:()=>s.VitsTokenizer,VoxtralForConditionalGeneration:()=>t.VoxtralForConditionalGeneration,VoxtralProcessor:()=>v.VoxtralProcessor,Wav2Vec2BertForCTC:()=>t.Wav2Vec2BertForCTC,Wav2Vec2BertForSequenceClassification:()=>t.Wav2Vec2BertForSequenceClassification,Wav2Vec2BertModel:()=>t.Wav2Vec2BertModel,Wav2Vec2BertPreTrainedModel:()=>t.Wav2Vec2BertPreTrainedModel,Wav2Vec2CTCTokenizer:()=>s.Wav2Vec2CTCTokenizer,Wav2Vec2FeatureExtractor:()=>u.Wav2Vec2FeatureExtractor,Wav2Vec2ForAudioFrameClassification:()=>t.Wav2Vec2ForAudioFrameClassification,Wav2Vec2ForCTC:()=>t.Wav2Vec2ForCTC,Wav2Vec2ForSequenceClassification:()=>t.Wav2Vec2ForSequenceClassification,Wav2Vec2Model:()=>t.Wav2Vec2Model,Wav2Vec2PreTrainedModel:()=>t.Wav2Vec2PreTrainedModel,Wav2Vec2Processor:()=>v.Wav2Vec2Processor,Wav2Vec2ProcessorWithLM:()=>v.Wav2Vec2ProcessorWithLM,WavLMForAudioFrameClassification:()=>t.WavLMForAudioFrameClassification,WavLMForCTC:()=>t.Wav
LMForCTC,WavLMForSequenceClassification:()=>t.WavLMForSequenceClassification,WavLMForXVector:()=>t.WavLMForXVector,WavLMModel:()=>t.WavLMModel,WavLMPreTrainedModel:()=>t.WavLMPreTrainedModel,WeSpeakerFeatureExtractor:()=>u.WeSpeakerFeatureExtractor,WeSpeakerResNetModel:()=>t.WeSpeakerResNetModel,WeSpeakerResNetPreTrainedModel:()=>t.WeSpeakerResNetPreTrainedModel,WhisperFeatureExtractor:()=>u.WhisperFeatureExtractor,WhisperForConditionalGeneration:()=>t.WhisperForConditionalGeneration,WhisperModel:()=>t.WhisperModel,WhisperPreTrainedModel:()=>t.WhisperPreTrainedModel,WhisperProcessor:()=>v.WhisperProcessor,WhisperTextStreamer:()=>C.WhisperTextStreamer,WhisperTimeStampLogitsProcessor:()=>P.WhisperTimeStampLogitsProcessor,WhisperTokenizer:()=>s.WhisperTokenizer,XLMForQuestionAnswering:()=>t.XLMForQuestionAnswering,XLMForSequenceClassification:()=>t.XLMForSequenceClassification,XLMForTokenClassification:()=>t.XLMForTokenClassification,XLMModel:()=>t.XLMModel,XLMPreTrainedModel:()=>t.XLMPreTrainedModel,XLMRobertaForMaskedLM:()=>t.XLMRobertaForMaskedLM,XLMRobertaForQuestionAnswering:()=>t.XLMRobertaForQuestionAnswering,XLMRobertaForSequenceClassification:()=>t.XLMRobertaForSequenceClassification,XLMRobertaForTokenClassification:()=>t.XLMRobertaForTokenClassification,XLMRobertaModel:()=>t.XLMRobertaModel,XLMRobertaPreTrainedModel:()=>t.XLMRobertaPreTrainedModel,XLMRobertaTokenizer:()=>s.XLMRobertaTokenizer,XLMTokenizer:()=>s.XLMTokenizer,XLMWithLMHeadModel:()=>t.XLMWithLMHeadModel,XVectorOutput:()=>t.XVectorOutput,YolosFeatureExtractor:()=>h.YolosFeatureExtractor,YolosForObjectDetection:()=>t.YolosForObjectDetection,YolosImageProcessor:()=>h.YolosImageProcessor,YolosModel:()=>t.YolosModel,YolosObjectDetectionOutput:()=>t.YolosObjectDetectionOutput,YolosPreTrainedModel:()=>t.YolosPreTrainedModel,ZeroShotAudioClassificationPipeline:()=>r.ZeroShotAudioClassificationPipeline,ZeroShotClassificationPipeline:()=>r.ZeroShotClassificationPipeline,ZeroShotImageClassificationPipeline
:()=>r.ZeroShotImageClassificationPipeline,ZeroShotObjectDetectionPipeline:()=>r.ZeroShotObjectDetectionPipeline,bankers_round:()=>c.bankers_round,cat:()=>l.cat,cos_sim:()=>c.cos_sim,dot:()=>c.dot,dynamic_time_warping:()=>c.dynamic_time_warping,env:()=>e.env,full:()=>l.full,full_like:()=>l.full_like,getCacheShapes:()=>o.getCacheShapes,hamming:()=>a.hamming,hanning:()=>a.hanning,interpolate:()=>l.interpolate,interpolate_4d:()=>l.interpolate_4d,interpolate_data:()=>c.interpolate_data,is_chinese_char:()=>s.is_chinese_char,layer_norm:()=>l.layer_norm,load_image:()=>n.load_image,load_video:()=>i.load_video,log_softmax:()=>c.log_softmax,magnitude:()=>c.magnitude,matmul:()=>l.matmul,max:()=>c.max,mean:()=>l.mean,mean_pooling:()=>l.mean_pooling,medianFilter:()=>c.medianFilter,mel_filter_bank:()=>a.mel_filter_bank,min:()=>c.min,ones:()=>l.ones,ones_like:()=>l.ones_like,permute:()=>l.permute,permute_data:()=>c.permute_data,pipeline:()=>r.pipeline,quantize_embeddings:()=>l.quantize_embeddings,rand:()=>l.rand,randn:()=>l.randn,read_audio:()=>a.read_audio,rfft:()=>l.rfft,round:()=>c.round,slice:()=>l.slice,softmax:()=>c.softmax,spectrogram:()=>a.spectrogram,stack:()=>l.stack,std_mean:()=>l.std_mean,topk:()=>l.topk,window_function:()=>a.window_function,zeros:()=>l.zeros,zeros_like:()=>l.zeros_like});var 
e=Vt("./src/env.js"),r=Vt("./src/pipelines.js"),t=Vt("./src/models.js"),s=Vt("./src/tokenizers.js"),o=Vt("./src/configs.js"),a=Vt("./src/utils/audio.js"),n=Vt("./src/utils/image.js"),i=Vt("./src/utils/video.js"),l=Vt("./src/utils/tensor.js"),c=Vt("./src/utils/maths.js"),_=Vt("./src/base/feature_extraction_utils.js"),u=Vt("./src/models/feature_extractors.js"),d=Vt("./src/models/auto/feature_extraction_auto.js"),g=Vt("./src/base/image_processors_utils.js"),h=Vt("./src/models/image_processors.js"),x=Vt("./src/models/auto/image_processing_auto.js"),F=Vt("./src/base/processing_utils.js"),v=Vt("./src/models/processors.js"),b=Vt("./src/models/auto/processing_auto.js"),C=Vt("./src/generation/streamers.js"),y=Vt("./src/generation/stopping_criteria.js"),P=Vt("./src/generation/logits_process.js")})();var VS=p.ASTFeatureExtractor,WS=p.ASTForAudioClassification,US=p.ASTModel,GS=p.ASTPreTrainedModel,KS=p.AlbertForMaskedLM,HS=p.AlbertForQuestionAnswering,qS=p.AlbertForSequenceClassification,QS=p.AlbertModel,XS=p.AlbertPreTrainedModel,JS=p.AlbertTokenizer,YS=p.ArceeForCausalLM,ZS=p.ArceeModel,eF=p.ArceePreTrainedModel,tF=p.AudioClassificationPipeline,rF=p.AutoConfig,sF=p.AutoFeatureExtractor,oF=p.AutoImageProcessor,aF=p.AutoModel,nF=p.AutoModelForAudioClassification,iF=p.AutoModelForAudioFrameClassification,lF=p.AutoModelForAudioTextToText,cF=p.AutoModelForCTC,dF=p.AutoModelForCausalLM,uF=p.AutoModelForDepthEstimation,_F=p.AutoModelForDocumentQuestionAnswering,pF=p.AutoModelForImageClassification,mF=p.AutoModelForImageFeatureExtraction,hF=p.AutoModelForImageMatting,fF=p.AutoModelForImageSegmentation,gF=p.AutoModelForImageTextToText,MF=p.AutoModelForImageToImage,wF=p.AutoModelForMaskGeneration,bF=p.AutoModelForMaskedLM,vF=p.AutoModelForNormalEstimation,xF=p.AutoModelForObjectDetection,yF=p.AutoModelForPoseEstimation,TF=p.AutoModelForQuestionAnswering,PF=p.AutoModelForSemanticSegmentation,EF=p.AutoModelForSeq2SeqLM,kF=p.AutoModelForSequenceClassification,CF=p.AutoModelForSpeechSeq2Se
q,SF=p.AutoModelForTextToSpectrogram,FF=p.AutoModelForTextToWaveform,IF=p.AutoModelForTokenClassification,AF=p.AutoModelForUniversalSegmentation,$F=p.AutoModelForVision2Seq,DF=p.AutoModelForXVector,OF=p.AutoModelForZeroShotObjectDetection,LF=p.AutoProcessor,BF=p.AutoTokenizer,zF=p.AutomaticSpeechRecognitionPipeline,RF=p.BackgroundRemovalPipeline,NF=p.BartForConditionalGeneration,jF=p.BartForSequenceClassification,VF=p.BartModel,WF=p.BartPretrainedModel,UF=p.BartTokenizer,GF=p.BaseModelOutput,KF=p.BaseStreamer,HF=p.BeitFeatureExtractor,qF=p.BeitForImageClassification,QF=p.BeitModel,XF=p.BeitPreTrainedModel,JF=p.BertForMaskedLM,YF=p.BertForQuestionAnswering,ZF=p.BertForSequenceClassification,eI=p.BertForTokenClassification,tI=p.BertModel,rI=p.BertPreTrainedModel,sI=p.BertTokenizer,oI=p.BitImageProcessor,aI=p.BlenderbotForConditionalGeneration,nI=p.BlenderbotModel,iI=p.BlenderbotPreTrainedModel,lI=p.BlenderbotSmallForConditionalGeneration,cI=p.BlenderbotSmallModel,dI=p.BlenderbotSmallPreTrainedModel,uI=p.BlenderbotSmallTokenizer,_I=p.BlenderbotTokenizer,pI=p.BloomForCausalLM,mI=p.BloomModel,hI=p.BloomPreTrainedModel,fI=p.BloomTokenizer,gI=p.CLIPFeatureExtractor,MI=p.CLIPImageProcessor,wI=p.CLIPModel,bI=p.CLIPPreTrainedModel,vI=p.CLIPSegForImageSegmentation,xI=p.CLIPSegModel,yI=p.CLIPSegPreTrainedModel,TI=p.CLIPTextModel,PI=p.CLIPTextModelWithProjection,EI=p.CLIPTokenizer,kI=p.CLIPVisionModel,CI=p.CLIPVisionModelWithProjection,SI=p.CamembertForMaskedLM,FI=p.CamembertForQuestionAnswering,II=p.CamembertForSequenceClassification,AI=p.CamembertForTokenClassification,$I=p.CamembertModel,DI=p.CamembertPreTrainedModel,OI=p.CamembertTokenizer,LI=p.CausalLMOutput,BI=p.CausalLMOutputWithPast,zI=p.ChineseCLIPFeatureExtractor,RI=p.ChineseCLIPModel,NI=p.ChineseCLIPPreTrainedModel,jI=p.ClapAudioModelWithProjection,VI=p.ClapFeatureExtractor,WI=p.ClapModel,UI=p.ClapPreTrainedModel,GI=p.ClapTextModelWithProjection,KI=p.ClassifierFreeGuidanceLogitsProcessor,HI=p.CodeGenForCausalLM,qI=p.C
odeGenModel,QI=p.CodeGenPreTrainedModel,XI=p.CodeGenTokenizer,JI=p.CodeLlamaTokenizer,YI=p.CohereForCausalLM,ZI=p.CohereModel,eA=p.CoherePreTrainedModel,tA=p.CohereTokenizer,rA=p.ConvBertForMaskedLM,sA=p.ConvBertForQuestionAnswering,oA=p.ConvBertForSequenceClassification,aA=p.ConvBertForTokenClassification,nA=p.ConvBertModel,iA=p.ConvBertPreTrainedModel,lA=p.ConvBertTokenizer,cA=p.ConvNextFeatureExtractor,dA=p.ConvNextForImageClassification,uA=p.ConvNextImageProcessor,_A=p.ConvNextModel,pA=p.ConvNextPreTrainedModel,mA=p.ConvNextV2ForImageClassification,hA=p.ConvNextV2Model,fA=p.ConvNextV2PreTrainedModel,gA=p.DFineForObjectDetection,MA=p.DFineModel,wA=p.DFinePreTrainedModel,bA=p.DINOv3ConvNextModel,vA=p.DINOv3ConvNextPreTrainedModel,xA=p.DINOv3ViTImageProcessor,yA=p.DINOv3ViTModel,TA=p.DINOv3ViTPreTrainedModel,PA=p.DPTFeatureExtractor,EA=p.DPTForDepthEstimation,kA=p.DPTImageProcessor,CA=p.DPTModel,SA=p.DPTPreTrainedModel,FA=p.DacDecoderModel,IA=p.DacDecoderOutput,AA=p.DacEncoderModel,$A=p.DacEncoderOutput,DA=p.DacFeatureExtractor,OA=p.DacModel,LA=p.DacPreTrainedModel,BA=p.DataTypeMap,zA=p.DebertaForMaskedLM,RA=p.DebertaForQuestionAnswering,NA=p.DebertaForSequenceClassification,jA=p.DebertaForTokenClassification,VA=p.DebertaModel,WA=p.DebertaPreTrainedModel,UA=p.DebertaTokenizer,GA=p.DebertaV2ForMaskedLM,KA=p.DebertaV2ForQuestionAnswering,HA=p.DebertaV2ForSequenceClassification,qA=p.DebertaV2ForTokenClassification,QA=p.DebertaV2Model,XA=p.DebertaV2PreTrainedModel,JA=p.DebertaV2Tokenizer,YA=p.DecisionTransformerModel,ZA=p.DecisionTransformerPreTrainedModel,e$=p.DeiTFeatureExtractor,t$=p.DeiTForImageClassification,r$=p.DeiTImageProcessor,s$=p.DeiTModel,o$=p.DeiTPreTrainedModel,a$=p.DepthAnythingForDepthEstimation,n$=p.DepthAnythingPreTrainedModel,i$=p.DepthEstimationPipeline,l$=p.DepthProForDepthEstimation,c$=p.DepthProPreTrainedModel,d$=p.DetrFeatureExtractor,u$=p.DetrForObjectDetection,_$=p.DetrForSegmentation,p$=p.DetrImageProcessor,m$=p.DetrModel,h$=p.DetrObjectDete
ctionOutput,f$=p.DetrPreTrainedModel,g$=p.DetrSegmentationOutput,M$=p.Dinov2ForImageClassification,w$=p.Dinov2Model,b$=p.Dinov2PreTrainedModel,v$=p.Dinov2WithRegistersForImageClassification,x$=p.Dinov2WithRegistersModel,y$=p.Dinov2WithRegistersPreTrainedModel,T$=p.DistilBertForMaskedLM,P$=p.DistilBertForQuestionAnswering,E$=p.DistilBertForSequenceClassification,k$=p.DistilBertForTokenClassification,C$=p.DistilBertModel,S$=p.DistilBertPreTrainedModel,F$=p.DistilBertTokenizer,I$=p.DocumentQuestionAnsweringPipeline,A$=p.DonutFeatureExtractor,$$=p.DonutImageProcessor,D$=p.DonutSwinModel,O$=p.DonutSwinPreTrainedModel,L$=p.EdgeTamModel,B$=p.EfficientNetForImageClassification,z$=p.EfficientNetImageProcessor,R$=p.EfficientNetModel,N$=p.EfficientNetPreTrainedModel,j$=p.ElectraForMaskedLM,V$=p.ElectraForQuestionAnswering,W$=p.ElectraForSequenceClassification,U$=p.ElectraForTokenClassification,G$=p.ElectraModel,K$=p.ElectraPreTrainedModel,H$=p.ElectraTokenizer,q$=p.EncodecFeatureExtractor,Q$=p.EosTokenCriteria,X$=p.Ernie4_5ForCausalLM,J$=p.Ernie4_5Model,Y$=p.Ernie4_5PreTrainedModel,Z$=p.EsmForMaskedLM,eD=p.EsmForSequenceClassification,tD=p.EsmForTokenClassification,rD=p.EsmModel,sD=p.EsmPreTrainedModel,oD=p.EsmTokenizer,aD=p.ExaoneForCausalLM,nD=p.ExaoneModel,iD=p.ExaonePreTrainedModel,lD=p.FFT,cD=p.FalconForCausalLM,dD=p.FalconModel,uD=p.FalconPreTrainedModel,_D=p.FalconTokenizer,pD=p.FastViTForImageClassification,mD=p.FastViTModel,hD=p.FastViTPreTrainedModel,fD=p.FeatureExtractionPipeline,gD=p.FeatureExtractor,MD=p.FillMaskPipeline,wD=p.Florence2ForConditionalGeneration,bD=p.Florence2PreTrainedModel,vD=p.Florence2Processor,xD=p.ForcedBOSTokenLogitsProcessor,yD=p.ForcedEOSTokenLogitsProcessor,TD=p.GLPNFeatureExtractor,PD=p.GLPNForDepthEstimation,ED=p.GLPNModel,kD=p.GLPNPreTrainedModel,CD=p.GPT2LMHeadModel,SD=p.GPT2Model,FD=p.GPT2PreTrainedModel,ID=p.GPT2Tokenizer,AD=p.GPTBigCodeForCausalLM,$D=p.GPTBigCodeModel,DD=p.GPTBigCodePreTrainedModel,OD=p.GPTJForCausalLM,LD=p.GPTJModel
,BD=p.GPTJPreTrainedModel,zD=p.GPTNeoForCausalLM,RD=p.GPTNeoModel,ND=p.GPTNeoPreTrainedModel,jD=p.GPTNeoXForCausalLM,VD=p.GPTNeoXModel,WD=p.GPTNeoXPreTrainedModel,UD=p.GPTNeoXTokenizer,GD=p.Gemma2ForCausalLM,KD=p.Gemma2Model,HD=p.Gemma2PreTrainedModel,qD=p.Gemma3ForCausalLM,QD=p.Gemma3Model,XD=p.Gemma3PreTrainedModel,JD=p.Gemma3nAudioFeatureExtractor,YD=p.Gemma3nForConditionalGeneration,ZD=p.Gemma3nPreTrainedModel,eO=p.Gemma3nProcessor,tO=p.GemmaForCausalLM,rO=p.GemmaModel,sO=p.GemmaPreTrainedModel,oO=p.GemmaTokenizer,aO=p.GlmForCausalLM,nO=p.GlmModel,iO=p.GlmPreTrainedModel,lO=p.GraniteForCausalLM,cO=p.GraniteModel,dO=p.GraniteMoeHybridForCausalLM,uO=p.GraniteMoeHybridModel,_O=p.GraniteMoeHybridPreTrainedModel,pO=p.GranitePreTrainedModel,mO=p.Grok1Tokenizer,hO=p.GroundingDinoForObjectDetection,fO=p.GroundingDinoImageProcessor,gO=p.GroundingDinoPreTrainedModel,MO=p.GroundingDinoProcessor,wO=p.GroupViTModel,bO=p.GroupViTPreTrainedModel,vO=p.HeliumForCausalLM,xO=p.HeliumModel,yO=p.HeliumPreTrainedModel,TO=p.HerbertTokenizer,PO=p.HieraForImageClassification,EO=p.HieraModel,kO=p.HieraPreTrainedModel,CO=p.HubertForCTC,SO=p.HubertForSequenceClassification,FO=p.HubertModel,IO=p.HubertPreTrainedModel,AO=p.IJepaForImageClassification,$O=p.IJepaModel,DO=p.IJepaPreTrainedModel,OO=p.Idefics3ForConditionalGeneration,LO=p.Idefics3ImageProcessor,BO=p.Idefics3PreTrainedModel,zO=p.Idefics3Processor,RO=p.ImageClassificationPipeline,NO=p.ImageFeatureExtractionPipeline,jO=p.ImageFeatureExtractor,VO=p.ImageMattingOutput,WO=p.ImageProcessor,UO=p.ImageSegmentationPipeline,GO=p.ImageToImagePipeline,KO=p.ImageToTextPipeline,HO=p.InterruptableStoppingCriteria,qO=p.JAISLMHeadModel,QO=p.JAISModel,XO=p.JAISPreTrainedModel,JO=p.JinaCLIPImageProcessor,YO=p.JinaCLIPModel,ZO=p.JinaCLIPPreTrainedModel,eL=p.JinaCLIPProcessor,tL=p.JinaCLIPTextModel,rL=p.JinaCLIPVisionModel,sL=p.Lfm2ForCausalLM,oL=p.Lfm2Model,aL=p.Lfm2PreTrainedModel,nL=p.LiteWhisperForConditionalGeneration,iL=p.Llama4ForCausalLM,lL=p.
Llama4PreTrainedModel,cL=p.LlamaForCausalLM,dL=p.LlamaModel,uL=p.LlamaPreTrainedModel,_L=p.LlamaTokenizer,pL=p.LlavaForConditionalGeneration,mL=p.LlavaOnevisionForConditionalGeneration,hL=p.LlavaOnevisionImageProcessor,fL=p.LlavaPreTrainedModel,gL=p.LlavaProcessor,ML=p.LlavaQwen2ForCausalLM,wL=p.LogitsProcessor,bL=p.LogitsProcessorList,vL=p.LogitsWarper,xL=p.LongT5ForConditionalGeneration,yL=p.LongT5Model,TL=p.LongT5PreTrainedModel,PL=p.M2M100ForConditionalGeneration,EL=p.M2M100Model,kL=p.M2M100PreTrainedModel,CL=p.M2M100Tokenizer,SL=p.MBart50Tokenizer,FL=p.MBartForCausalLM,IL=p.MBartForConditionalGeneration,AL=p.MBartForSequenceClassification,$L=p.MBartModel,DL=p.MBartPreTrainedModel,OL=p.MBartTokenizer,LL=p.MPNetForMaskedLM,BL=p.MPNetForQuestionAnswering,zL=p.MPNetForSequenceClassification,RL=p.MPNetForTokenClassification,NL=p.MPNetModel,jL=p.MPNetPreTrainedModel,VL=p.MPNetTokenizer,WL=p.MT5ForConditionalGeneration,UL=p.MT5Model,GL=p.MT5PreTrainedModel,KL=p.MarianMTModel,HL=p.MarianModel,qL=p.MarianPreTrainedModel,QL=p.MarianTokenizer,XL=p.Mask2FormerImageProcessor,JL=p.MaskFormerFeatureExtractor,YL=p.MaskFormerForInstanceSegmentation,ZL=p.MaskFormerImageProcessor,e3=p.MaskFormerModel,t3=p.MaskFormerPreTrainedModel,r3=p.MaskedLMOutput,s3=p.MaxLengthCriteria,o3=p.Metric3DForDepthEstimation,a3=p.Metric3DPreTrainedModel,n3=p.Metric3Dv2ForDepthEstimation,i3=p.Metric3Dv2PreTrainedModel,l3=p.MgpstrForSceneTextRecognition,c3=p.MgpstrModelOutput,d3=p.MgpstrPreTrainedModel,u3=p.MgpstrProcessor,_3=p.MgpstrTokenizer,p3=p.MimiDecoderModel,m3=p.MimiDecoderOutput,h3=p.MimiEncoderModel,f3=p.MimiEncoderOutput,g3=p.MimiModel,M3=p.MimiPreTrainedModel,w3=p.MinLengthLogitsProcessor,b3=p.MinNewTokensLengthLogitsProcessor,v3=p.Ministral3ForCausalLM,x3=p.Ministral3Model,y3=p.Ministral3PreTrainedModel,T3=p.MinistralForCausalLM,P3=p.MinistralModel,E3=p.MinistralPreTrainedModel,k3=p.Mistral3ForConditionalGeneration,C3=p.MistralForCausalLM,S3=p.MistralModel,F3=p.MistralPreTrainedModel,I3=p.
MobileBertForMaskedLM,A3=p.MobileBertForQuestionAnswering,$3=p.MobileBertForSequenceClassification,D3=p.MobileBertModel,O3=p.MobileBertPreTrainedModel,L3=p.MobileBertTokenizer,B3=p.MobileLLMForCausalLM,z3=p.MobileLLMModel,R3=p.MobileLLMPreTrainedModel,N3=p.MobileNetV1FeatureExtractor,j3=p.MobileNetV1ForImageClassification,V3=p.MobileNetV1ForSemanticSegmentation,W3=p.MobileNetV1ImageProcessor,U3=p.MobileNetV1Model,G3=p.MobileNetV1PreTrainedModel,K3=p.MobileNetV2FeatureExtractor,H3=p.MobileNetV2ForImageClassification,q3=p.MobileNetV2ForSemanticSegmentation,Q3=p.MobileNetV2ImageProcessor,X3=p.MobileNetV2Model,J3=p.MobileNetV2PreTrainedModel,Y3=p.MobileNetV3FeatureExtractor,Z3=p.MobileNetV3ForImageClassification,eB=p.MobileNetV3ForSemanticSegmentation,tB=p.MobileNetV3ImageProcessor,rB=p.MobileNetV3Model,sB=p.MobileNetV3PreTrainedModel,oB=p.MobileNetV4FeatureExtractor,aB=p.MobileNetV4ForImageClassification,nB=p.MobileNetV4ForSemanticSegmentation,iB=p.MobileNetV4ImageProcessor,lB=p.MobileNetV4Model,cB=p.MobileNetV4PreTrainedModel,dB=p.MobileViTFeatureExtractor,uB=p.MobileViTForImageClassification,_B=p.MobileViTImageProcessor,pB=p.MobileViTModel,mB=p.MobileViTPreTrainedModel,hB=p.MobileViTV2ForImageClassification,fB=p.MobileViTV2Model,gB=p.MobileViTV2PreTrainedModel,MB=p.ModelOutput,wB=p.ModernBertDecoderForCausalLM,bB=p.ModernBertDecoderModel,vB=p.ModernBertDecoderPreTrainedModel,xB=p.ModernBertForMaskedLM,yB=p.ModernBertForSequenceClassification,TB=p.ModernBertForTokenClassification,PB=p.ModernBertModel,EB=p.ModernBertPreTrainedModel,kB=p.Moondream1ForConditionalGeneration,CB=p.MoonshineFeatureExtractor,SB=p.MoonshineForConditionalGeneration,FB=p.MoonshineModel,IB=p.MoonshinePreTrainedModel,AB=p.MoonshineProcessor,$B=p.MptForCausalLM,DB=p.MptModel,OB=p.MptPreTrainedModel,LB=p.MultiModalityCausalLM,BB=p.MultiModalityPreTrainedModel,zB=p.MusicgenForCausalLM,RB=p.MusicgenForConditionalGeneration,NB=p.MusicgenModel,jB=p.MusicgenPreTrainedModel,VB=p.NanoChatForCausalLM,WB=p.N
anoChatModel,UB=p.NanoChatPreTrainedModel,GB=p.NeoBertForMaskedLM,KB=p.NeoBertForQuestionAnswering,HB=p.NeoBertForSequenceClassification,qB=p.NeoBertForTokenClassification,QB=p.NeoBertModel,XB=p.NeoBertPreTrainedModel,JB=p.NllbTokenizer,YB=p.NoBadWordsLogitsProcessor,ZB=p.NoRepeatNGramLogitsProcessor,ez=p.NomicBertModel,tz=p.NomicBertPreTrainedModel,rz=p.NougatImageProcessor,sz=p.NougatTokenizer,oz=p.OPTForCausalLM,az=p.OPTModel,nz=p.OPTPreTrainedModel,iz=p.ObjectDetectionPipeline,lz=p.Olmo2ForCausalLM,cz=p.Olmo2Model,dz=p.Olmo2PreTrainedModel,uz=p.OlmoForCausalLM,_z=p.OlmoModel,pz=p.OlmoPreTrainedModel,mz=p.OpenELMForCausalLM,hz=p.OpenELMModel,fz=p.OpenELMPreTrainedModel,gz=p.OwlViTFeatureExtractor,Mz=p.OwlViTForObjectDetection,wz=p.OwlViTImageProcessor,bz=p.OwlViTModel,vz=p.OwlViTPreTrainedModel,xz=p.OwlViTProcessor,yz=p.Owlv2ForObjectDetection,Tz=p.Owlv2ImageProcessor,Pz=p.Owlv2Model,Ez=p.Owlv2PreTrainedModel,kz=p.PaliGemmaForConditionalGeneration,Cz=p.PaliGemmaPreTrainedModel,Sz=p.PaliGemmaProcessor,Fz=p.ParakeetFeatureExtractor,Iz=p.ParakeetForCTC,Az=p.ParakeetPreTrainedModel,$z=p.PatchTSMixerForPrediction,Dz=p.PatchTSMixerModel,Oz=p.PatchTSMixerPreTrainedModel,Lz=p.PatchTSTForPrediction,Bz=p.PatchTSTModel,zz=p.PatchTSTPreTrainedModel,Rz=p.Phi3ForCausalLM,Nz=p.Phi3Model,jz=p.Phi3PreTrainedModel,Vz=p.Phi3VForCausalLM,Wz=p.Phi3VImageProcessor,Uz=p.Phi3VPreTrainedModel,Gz=p.Phi3VProcessor,Kz=p.PhiForCausalLM,Hz=p.PhiModel,qz=p.PhiPreTrainedModel,Qz=p.Pipeline,Xz=p.PixtralImageProcessor,Jz=p.PixtralProcessor,Yz=p.PreTrainedModel,Zz=p.PreTrainedTokenizer,eR=p.PretrainedConfig,tR=p.PretrainedMixin,rR=p.Processor,sR=p.PvtForImageClassification,oR=p.PvtImageProcessor,aR=p.PvtModel,nR=p.PvtPreTrainedModel,iR=p.PyAnnoteFeatureExtractor,lR=p.PyAnnoteForAudioFrameClassification,cR=p.PyAnnoteModel,dR=p.PyAnnotePreTrainedModel,uR=p.PyAnnoteProcessor,_R=p.QuestionAnsweringModelOutput,pR=p.QuestionAnsweringPipeline,mR=p.Qwen2ForCausalLM,hR=p.Qwen2Model,fR=p.Qwen2PreTrainedMode
l,gR=p.Qwen2Tokenizer,MR=p.Qwen2VLForConditionalGeneration,wR=p.Qwen2VLImageProcessor,bR=p.Qwen2VLPreTrainedModel,vR=p.Qwen2VLProcessor,xR=p.Qwen3ForCausalLM,yR=p.Qwen3Model,TR=p.Qwen3PreTrainedModel,PR=p.RFDetrForObjectDetection,ER=p.RFDetrModel,kR=p.RFDetrObjectDetectionOutput,CR=p.RFDetrPreTrainedModel,SR=p.RTDetrForObjectDetection,FR=p.RTDetrImageProcessor,IR=p.RTDetrModel,AR=p.RTDetrObjectDetectionOutput,$R=p.RTDetrPreTrainedModel,DR=p.RTDetrV2ForObjectDetection,OR=p.RTDetrV2Model,LR=p.RTDetrV2ObjectDetectionOutput,BR=p.RTDetrV2PreTrainedModel,zR=p.RawAudio,RR=p.RawImage,NR=p.RawVideo,jR=p.RawVideoFrame,VR=p.RepetitionPenaltyLogitsProcessor,WR=p.ResNetForImageClassification,UR=p.ResNetModel,GR=p.ResNetPreTrainedModel,KR=p.RoFormerForMaskedLM,HR=p.RoFormerForQuestionAnswering,qR=p.RoFormerForSequenceClassification,QR=p.RoFormerForTokenClassification,XR=p.RoFormerModel,JR=p.RoFormerPreTrainedModel,YR=p.RoFormerTokenizer,ZR=p.RobertaForMaskedLM,eN=p.RobertaForQuestionAnswering,tN=p.RobertaForSequenceClassification,rN=p.RobertaForTokenClassification,sN=p.RobertaModel,oN=p.RobertaPreTrainedModel,aN=p.RobertaTokenizer,nN=p.Sam2ImageProcessor,iN=p.Sam2ImageSegmentationOutput,lN=p.Sam2Model,cN=p.Sam2PreTrainedModel,dN=p.Sam2Processor,uN=p.Sam2VideoProcessor,_N=p.Sam3ImageProcessor,pN=p.Sam3TrackerModel,mN=p.SamImageProcessor,hN=p.SamImageSegmentationOutput,fN=p.SamModel,gN=p.SamPreTrainedModel,MN=p.SamProcessor,wN=p.SapiensForDepthEstimation,bN=p.SapiensForNormalEstimation,vN=p.SapiensForSemanticSegmentation,xN=p.SapiensPreTrainedModel,yN=p.SeamlessM4TFeatureExtractor,TN=p.SegformerFeatureExtractor,PN=p.SegformerForImageClassification,EN=p.SegformerForSemanticSegmentation,kN=p.SegformerImageProcessor,CN=p.SegformerModel,SN=p.SegformerPreTrainedModel,FN=p.Seq2SeqLMOutput,IN=p.SequenceClassifierOutput,AN=p.SiglipImageProcessor,$N=p.SiglipModel,DN=p.SiglipPreTrainedModel,ON=p.SiglipTextModel,LN=p.SiglipTokenizer,BN=p.SiglipVisionModel,zN=p.SmolLM3ForCausalLM,RN=p.SmolLM3M
odel,NN=p.SmolLM3PreTrainedModel,jN=p.SmolVLMForConditionalGeneration,VN=p.SmolVLMImageProcessor,WN=p.SmolVLMProcessor,UN=p.SnacDecoderModel,GN=p.SnacEncoderModel,KN=p.SnacFeatureExtractor,HN=p.SnacModel,qN=p.SnacPreTrainedModel,QN=p.SpeechT5FeatureExtractor,XN=p.SpeechT5ForSpeechToText,JN=p.SpeechT5ForTextToSpeech,YN=p.SpeechT5HifiGan,ZN=p.SpeechT5Model,ej=p.SpeechT5PreTrainedModel,tj=p.SpeechT5Processor,rj=p.SpeechT5Tokenizer,sj=p.SqueezeBertForMaskedLM,oj=p.SqueezeBertForQuestionAnswering,aj=p.SqueezeBertForSequenceClassification,nj=p.SqueezeBertModel,ij=p.SqueezeBertPreTrainedModel,lj=p.SqueezeBertTokenizer,cj=p.StableLmForCausalLM,dj=p.StableLmModel,uj=p.StableLmPreTrainedModel,_j=p.Starcoder2ForCausalLM,pj=p.Starcoder2Model,mj=p.Starcoder2PreTrainedModel,hj=p.StoppingCriteria,fj=p.StoppingCriteriaList,gj=p.StyleTextToSpeech2Model,Mj=p.StyleTextToSpeech2PreTrainedModel,wj=p.SummarizationPipeline,bj=p.SupertonicForConditionalGeneration,vj=p.SupertonicPreTrainedModel,xj=p.SuppressTokensAtBeginLogitsProcessor,yj=p.Swin2SRForImageSuperResolution,Tj=p.Swin2SRImageProcessor,Pj=p.Swin2SRModel,Ej=p.Swin2SRPreTrainedModel,kj=p.SwinForImageClassification,Cj=p.SwinForSemanticSegmentation,Sj=p.SwinModel,Fj=p.SwinPreTrainedModel,Ij=p.T5ForConditionalGeneration,Aj=p.T5Model,$j=p.T5PreTrainedModel,Dj=p.T5Tokenizer,Oj=p.TableTransformerForObjectDetection,Lj=p.TableTransformerModel,Bj=p.TableTransformerObjectDetectionOutput,zj=p.TableTransformerPreTrainedModel,Rj=p.TemperatureLogitsWarper,Nj=p.Tensor,jj=p.Text2TextGenerationPipeline,Vj=p.TextClassificationPipeline,Wj=p.TextGenerationPipeline,Uj=p.TextStreamer,Gj=p.TextToAudioPipeline,Kj=p.TokenClassificationPipeline,Hj=p.TokenClassifierOutput,qj=p.TokenizerModel,Qj=p.TopKLogitsWarper,Xj=p.TopPLogitsWarper,Jj=p.TrOCRForCausalLM,Yj=p.TrOCRPreTrainedModel,Zj=p.TranslationPipeline,eV=p.UltravoxModel,tV=p.UltravoxPreTrainedModel,rV=p.UltravoxProcessor,sV=p.UniSpeechForCTC,oV=p.UniSpeechForSequenceClassification,aV=p.UniSpeechModel,n
V=p.UniSpeechPreTrainedModel,iV=p.UniSpeechSatForAudioFrameClassification,lV=p.UniSpeechSatForCTC,cV=p.UniSpeechSatForSequenceClassification,dV=p.UniSpeechSatModel,uV=p.UniSpeechSatPreTrainedModel,_V=p.VLChatProcessor,pV=p.VLMImageProcessor,mV=p.VaultGemmaForCausalLM,hV=p.VaultGemmaModel,fV=p.VaultGemmaPreTrainedModel,gV=p.ViTFeatureExtractor,MV=p.ViTForImageClassification,wV=p.ViTImageProcessor,bV=p.ViTMAEModel,vV=p.ViTMAEPreTrainedModel,xV=p.ViTMSNForImageClassification,yV=p.ViTMSNModel,TV=p.ViTMSNPreTrainedModel,PV=p.ViTModel,EV=p.ViTPreTrainedModel,kV=p.VisionEncoderDecoderModel,CV=p.VitMatteForImageMatting,SV=p.VitMatteImageProcessor,FV=p.VitMattePreTrainedModel,IV=p.VitPoseForPoseEstimation,AV=p.VitPoseImageProcessor,$V=p.VitPosePreTrainedModel,DV=p.VitsModel,OV=p.VitsModelOutput,LV=p.VitsPreTrainedModel,BV=p.VitsTokenizer,zV=p.VoxtralForConditionalGeneration,RV=p.VoxtralProcessor,NV=p.Wav2Vec2BertForCTC,jV=p.Wav2Vec2BertForSequenceClassification,VV=p.Wav2Vec2BertModel,WV=p.Wav2Vec2BertPreTrainedModel,UV=p.Wav2Vec2CTCTokenizer,GV=p.Wav2Vec2FeatureExtractor,KV=p.Wav2Vec2ForAudioFrameClassification,HV=p.Wav2Vec2ForCTC,qV=p.Wav2Vec2ForSequenceClassification,QV=p.Wav2Vec2Model,XV=p.Wav2Vec2PreTrainedModel,JV=p.Wav2Vec2Processor,YV=p.Wav2Vec2ProcessorWithLM,ZV=p.WavLMForAudioFrameClassification,e4=p.WavLMForCTC,t4=p.WavLMForSequenceClassification,r4=p.WavLMForXVector,s4=p.WavLMModel,o4=p.WavLMPreTrainedModel,a4=p.WeSpeakerFeatureExtractor,n4=p.WeSpeakerResNetModel,i4=p.WeSpeakerResNetPreTrainedModel,l4=p.WhisperFeatureExtractor,c4=p.WhisperForConditionalGeneration,d4=p.WhisperModel,u4=p.WhisperPreTrainedModel,_4=p.WhisperProcessor,A0=p.WhisperTextStreamer,p4=p.WhisperTimeStampLogitsProcessor,m4=p.WhisperTokenizer,h4=p.XLMForQuestionAnswering,f4=p.XLMForSequenceClassification,g4=p.XLMForTokenClassification,M4=p.XLMModel,w4=p.XLMPreTrainedModel,b4=p.XLMRobertaForMaskedLM,v4=p.XLMRobertaForQuestionAnswering,x4=p.XLMRobertaForSequenceClassification,y4=p.XLMRobertaForTo
/**
 * Builds the speech-recognition pipeline described by `spec`.
 *
 * `$0` is the bundle's alias for the Transformers.js `pipeline` factory.
 *
 * @param {{spec: {model: *, device: *, dtype: *}, onLoading: Function}} e
 *   `onLoading` is invoked with `{total, progress}` copied from every
 *   progress event the factory emits while loading.
 * @returns {Promise<*>} The value resolved by the pipeline factory.
 */
async function D0(e) {
  const { spec, onLoading } = e;
  return await $0("automatic-speech-recognition", spec.model, {
    device: spec.device,
    dtype: spec.dtype,
    progress_callback: (event) => {
      onLoading({ total: event.total, progress: event.progress });
    },
  });
}

/**
 * Transcribes one audio request with a prepared pipeline, streaming partial
 * text and throughput/progress reports through `callbacks`.
 *
 * @param {{pipe: Function, spec: Object, request: Object, callbacks: Object}} e
 *   - `pipe`: callable pipeline exposing `processor`, `model` and `tokenizer`.
 *   - `spec`: reads `chunkLength` and `strideLength` (passed on as seconds).
 *   - `request`: reads `audio`, `duration` and `language`.
 *   - `callbacks`: `onTranscription(text)` and
 *     `onReport({tokensPerSecond, progress})`.
 * @returns {Promise<{text: *, chunks: *}>} `text` and `chunks` of the pipeline output.
 * @throws {Error} "no feature_extractor" when the processor has none.
 */
async function O0(e) {
  const { pipe, spec, request, callbacks } = e;

  const featureExtractor = pipe.processor.feature_extractor;
  if (!featureExtractor) throw new Error("no feature_extractor");

  const timePrecision =
    featureExtractor.config.chunk_length / pipe.model.config.max_source_positions;

  let finishedChunks = 0;
  let firstTokenAt = null;
  let tokenCount = 0;
  let tokensPerSecond = 0;

  // The Transformers.js ASR pipeline slides its window by
  // chunk_length_s - 2 * stride_length_s (the stride is applied on both
  // sides), so window k starts at k * windowStep and is chunkLength long.
  // After n finished windows the decoded audio therefore reaches
  // (n - 1) * windowStep + chunkLength seconds. The previous estimate
  // (n * (chunkLength - strideLength)) ran ahead of the real position.
  const windowStep = spec.chunkLength - 2 * spec.strideLength;
  const progress = () => {
    if (finishedChunks === 0) return 0;
    const decodedSeconds = (finishedChunks - 1) * windowStep + spec.chunkLength;
    return Math.min(decodedSeconds / request.duration, 1);
  };

  const streamer = new A0(pipe.tokenizer, {
    time_precision: timePrecision,
    token_callback_function: () => {
      // Throughput is measured from the first token of the current window.
      firstTokenAt ??= performance.now();
      tokenCount += 1;
      if (tokenCount > 1) {
        tokensPerSecond = (tokenCount / (performance.now() - firstTokenAt)) * 1e3;
      }
    },
    callback_function: (text) => {
      callbacks.onTranscription(text);
      callbacks.onReport({ tokensPerSecond, progress: progress() });
    },
    on_finalize: () => {
      // One window is done: reset the per-window counters, keep the last rate.
      firstTokenAt = null;
      tokenCount = 0;
      finishedChunks += 1;
      callbacks.onReport({ tokensPerSecond, progress: progress() });
    },
  });

  const output = await pipe(new Float32Array(request.audio), {
    top_k: 0,
    do_sample: false,
    chunk_length_s: spec.chunkLength,
    stride_length_s: spec.strideLength,
    language: request.language,
    task: "transcribe",
    return_timestamps: "word",
    force_full_sequences: false,
    streamer,
  });

  return { text: output.text, chunks: output.chunks };
}

// Deferred holding `{spec, pipe}` once `prepare` has loaded the pipeline.
// NOTE(review): if D0 rejects, this deferred is never settled, so a later
// `transcribe` call would wait forever — confirm whether `ls()` exposes a
// reject hook that should be used here.
const L0 = ls();

// Wraps pipeline loading in `Of`; load progress is forwarded to `host.loading`.
const ME = (host) =>
  Of(async (spec) => {
    const pipe = await D0({ spec, onLoading: (info) => host.loading(info) });
    L0.resolve({ spec, pipe });
  });

// Worker entry point: exposes `prepare` and `transcribe` to the host side.
await Yf.worker((shell) => ({
  prepare: ME(shell.host),
  async transcribe(request) {
    const { pipe, spec } = await L0.promise;
    return O0({
      pipe,
      spec,
      request,
      callbacks: {
        onReport: (report) => shell.host.deliverReport(report),
        onTranscription: (text) => shell.host.deliverTranscription(text),
      },
    });
  },
}));
|
|
2851
|
+
/**
 * Base class for pre-tokenizers: callable objects that split text into
 * pieces. Subclasses supply `pre_tokenize_text`.
 */
class we extends s.Callable {
  /**
   * Instantiates the pre-tokenizer subclass named by `config.type`.
   *
   * @param {Object|null} config Pre-tokenizer configuration, or `null`.
   * @returns {we|null} The matching instance, or `null` for a `null` config.
   * @throws {Error} When `config.type` is not a known pre-tokenizer type.
   */
  static fromConfig(config) {
    if (config === null) {
      return null;
    }

    // Thunks keep construction lazy: only the selected class is instantiated.
    const builders = new Map([
      ["BertPreTokenizer", () => new A(config)],
      ["Sequence", () => new yr(config)],
      ["Whitespace", () => new zs(config)],
      ["WhitespaceSplit", () => new Ys(config)],
      ["Metaspace", () => new Lt(config)],
      ["ByteLevel", () => new le(config)],
      ["Split", () => new ge(config)],
      ["Punctuation", () => new be(config)],
      ["Digits", () => new Ae(config)],
      ["Replace", () => new Zs(config)],
      ["FixedLength", () => new or(config)],
    ]);

    const build = builders.get(config.type);
    if (build === undefined) {
      throw new Error(`Unknown PreTokenizer type: ${config.type}`);
    }
    return build();
  }

  /**
   * Splits a single string; must be overridden.
   *
   * @param {string} text Text to split.
   * @param {Object} [options] Extra options passed through by `pre_tokenize`.
   * @throws {Error} Always, in this base implementation.
   */
  pre_tokenize_text(text, options) {
    throw Error("pre_tokenize_text should be implemented in subclass.");
  }

  /**
   * Pre-tokenizes a string or an array of strings and flattens the result
   * by one level.
   *
   * @param {string|string[]} text Input text(s).
   * @param {Object} [options] Forwarded to `pre_tokenize_text`.
   * @returns {string[]} The flattened pieces.
   */
  pre_tokenize(text, options) {
    let pieces;
    if (Array.isArray(text)) {
      pieces = text.map((entry) => this.pre_tokenize_text(entry, options));
    } else {
      pieces = this.pre_tokenize_text(text, options);
    }
    return pieces.flat();
  }

  /** Call hook: delegates to `pre_tokenize`. */
  _call(text, options) {
    return this.pre_tokenize(text, options);
  }
}
/**
 * Digits pre-tokenizer: separates numeric characters from everything else.
 *
 * Numeric characters are matched with the Unicode `\p{N}` class rather than
 * the ASCII-only `\d`, so digits from other scripts are split out too
 * (the reference tokenizer splits on any Unicode numeric character).
 */
class Ae extends we {
  /**
   * @param {Object} S Configuration. When `individual_digits` is truthy every
   *   digit becomes its own piece; otherwise runs of digits stay together.
   */
  constructor(S) {
    super();
    this.config = S;
    const digitQuantifier = this.config.individual_digits ? "" : "+";
    this.pattern = new RegExp(`[^\\p{N}]+|\\p{N}${digitQuantifier}`, "gu");
  }

  /**
   * @param {string} S Text to split.
   * @param {Object} [G] Unused options.
   * @returns {string[]} Alternating non-digit and digit pieces (empty for "").
   */
  pre_tokenize_text(S, G) {
    return S.match(this.pattern) || [];
  }
}
/**
 * Base class for decoders, which turn a list of tokens back into text.
 * Subclasses supply `decode_chain`.
 */
class $e extends s.Callable {
  /**
   * @param {Object} config Decoder configuration; `config.trim_offsets` is
   *   copied onto the instance.
   */
  constructor(config) {
    super();
    this.config = config;
    this.added_tokens = [];
    this.end_of_word_suffix = null;
    this.trim_offsets = config.trim_offsets;
  }

  /**
   * Instantiates the decoder subclass named by `config.type`.
   *
   * @param {Object|null} config Decoder configuration, or `null`.
   * @returns {$e|null} The matching instance, or `null` for a `null` config.
   * @throws {Error} When `config.type` is not a known decoder type.
   */
  static fromConfig(config) {
    if (config === null) {
      return null;
    }

    // Thunks keep construction lazy: only the selected class is instantiated.
    const builders = new Map([
      ["WordPiece", () => new Qe(config)],
      ["Metaspace", () => new fr(config)],
      ["ByteLevel", () => new je(config)],
      ["Replace", () => new Re(config)],
      ["ByteFallback", () => new Ne(config)],
      ["Fuse", () => new ot(config)],
      ["Strip", () => new De(config)],
      ["Sequence", () => new Ke(config)],
      ["CTC", () => new pt(config)],
      ["BPEDecoder", () => new bt(config)],
    ]);

    const build = builders.get(config.type);
    if (build === undefined) {
      throw new Error(`Unknown Decoder type: ${config.type}`);
    }
    return build();
  }

  /** Call hook: delegates to `decode`. */
  _call(tokens) {
    return this.decode(tokens);
  }

  /**
   * @param {string[]} tokens Tokens to decode.
   * @returns {string} The pieces produced by `decode_chain`, concatenated.
   */
  decode(tokens) {
    const pieces = this.decode_chain(tokens);
    return pieces.join("");
  }

  /**
   * Transforms the token list; must be overridden.
   *
   * @param {string[]} tokens Tokens to decode.
   * @throws {Error} Always, in this base implementation.
   */
  decode_chain(tokens) {
    throw Error("`decode_chain` should be implemented in subclass.");
  }
}
/**
 * Byte-level decoder: maps each character of the joined tokens back to a
 * byte through `byte_decoder` and decodes the bytes as UTF-8. Tokens whose
 * text equals the `content` of an entry in `added_tokens` are passed
 * through untouched.
 */
class je extends $e {
  /** @param {Object} S Decoder configuration, forwarded to the base class. */
  constructor(S) {
    super(S);
    this.byte_decoder = J;
    // Non-fatal decoding: malformed byte sequences do not throw.
    this.text_decoder = new TextDecoder("utf-8", { fatal: false, ignoreBOM: true });
    this.end_of_word_suffix = null;
  }

  /**
   * @param {string[]} S Byte-level tokens.
   * @returns {string} The decoded text.
   */
  convert_tokens_to_string(S) {
    const joined = S.join("");
    const bytes = new Uint8Array([...joined].map((ch) => this.byte_decoder[ch]));
    return this.text_decoder.decode(bytes);
  }

  /**
   * @param {string[]} S Tokens to decode.
   * @returns {string[]} Decoded runs of ordinary tokens, with added tokens
   *   kept verbatim between them.
   */
  decode_chain(S) {
    // Build the lookup once per call instead of scanning `added_tokens`
    // for every token.
    const addedContents = new Set(this.added_tokens.map((token) => token.content));

    const pieces = [];
    let pending = [];
    const flushPending = () => {
      if (pending.length > 0) {
        pieces.push(this.convert_tokens_to_string(pending));
        pending = [];
      }
    };

    for (const token of S) {
      if (addedContents.has(token)) {
        flushPending();
        pieces.push(token);
      } else {
        pending.push(token);
      }
    }
    flushPending();
    return pieces;
  }
}
/**
 * Decoder that turns the configured replacement character back into spaces.
 */
class fr extends $e {
  /**
   * @param {Object} S Decoder config; `S.replacement` is the character standing in for a space.
   */
  constructor(S) {
    super(S);
    this.replacement = S.replacement;
  }

  /**
   * @param {string[]} S Tokens to decode.
   * @returns {string[]} Tokens with the replacement swapped for spaces; the
   *   very first token also loses one leading space.
   */
  decode_chain(S) {
    return Array.from(S, (token, index) => {
      const text = token.replaceAll(this.replacement, " ");
      const isFirst = index === 0;
      return isFirst && text.startsWith(" ") ? text.substring(1) : text;
    });
  }
}
/**
 * Truncates, in place, every array stored on `de` to at most `S` items.
 *
 * @param {Object<string, Array>} de Object whose values are arrays (mutated).
 * @param {number} S Maximum number of items to keep in each array.
 * @returns {void}
 */
function Rs(de, S) {
  for (const key of Object.keys(de)) {
    const sequence = de[key];
    // Assigning a larger `length` would pad the array with empty slots,
    // so a truncation helper must only ever shrink.
    if (sequence.length > S) {
      sequence.length = S;
    }
  }
}
Map(this.added_tokens.map(te=>[te.content,te])),this.mask_token=this.getToken("mask_token"),this.mask_token_id=this.model.tokens_to_ids.get(this.mask_token),this.pad_token=this.getToken("pad_token","eos_token"),this.pad_token_id=this.model.tokens_to_ids.get(this.pad_token),this.sep_token=this.getToken("sep_token"),this.sep_token_id=this.model.tokens_to_ids.get(this.sep_token),this.unk_token=this.getToken("unk_token"),this.unk_token_id=this.model.tokens_to_ids.get(this.unk_token),this.bos_token=this.getToken("bos_token"),this.bos_token_id=this.model.tokens_to_ids.get(this.bos_token),this.eos_token=this.getToken("eos_token"),this.eos_token_id=this.model.tokens_to_ids.get(this.eos_token),this.model_max_length=G.model_max_length,this.remove_space=G.remove_space,this.clean_up_tokenization_spaces=G.clean_up_tokenization_spaces??!0,this.do_lowercase_and_remove_accent=G.do_lowercase_and_remove_accent??!1,G.padding_side&&(this.padding_side=G.padding_side),this.add_bos_token=G.add_bos_token,this.add_eos_token=G.add_eos_token,this.legacy=!1,this.chat_template=G.chat_template??null,Array.isArray(this.chat_template)){let te=Object.create(null);for(let{name:se,template:me}of this.chat_template){if(typeof se!="string"||typeof me!="string")throw new Error('Chat template must be a list of objects with "name" and "template" properties');te[se]=me}this.chat_template=te}this._compiled_template_cache=new Map}getToken(...S){for(let G of S){let te=this.config[G];if(te)if(typeof te=="object"){if(te.__type==="AddedToken")return te.content;throw Error(`Unknown token: ${te}`)}else return te}return null}static async from_pretrained(S,{progress_callback:G=null,config:te=null,cache_dir:se=null,local_files_only:me=!1,revision:Ce="main",legacy:Ye=null}={}){let Xe=await u(S,{progress_callback:G,config:te,cache_dir:se,local_files_only:me,revision:Ce,legacy:Ye});return new 
/**
 * Encodes one text or a batch of texts, then optionally truncates, pads and
 * packs the encodings into tensors.
 *
 * @param {string|string[]} S Text, or array of texts, to encode.
 * @param {Object} [options]
 * @param {string|string[]|null} [options.text_pair=null] Second sequence(s). Must be an
 *   array of the same length when `S` is an array, and must not be an array otherwise.
 * @param {boolean} [options.add_special_tokens=true] Forwarded to `_encode_plus`.
 * @param {boolean|string} [options.padding=false] `true` pads to the longest encoding
 *   (capped by the resolved max length); any other truthy value pads to the resolved max length.
 * @param {boolean|null} [options.truncation=null] Whether encodings longer than the resolved
 *   max length are cut.
 * @param {number|null} [options.max_length=null] Falls back to `this.model_max_length` when null.
 * @param {boolean} [options.return_tensor=true] Pack each key into an int64 `i.Tensor`.
 * @param {boolean|null} [options.return_token_type_ids=null] Forwarded to `_encode_plus`.
 * @returns {Object} One entry per key of the encodings: tensors of dims
 *   `[batch, length]` when `return_tensor` is set, otherwise plain arrays
 *   (unwrapped to the single item when `S` was not an array).
 * @throws {Error} On empty/nullish input, mismatched `text_pair`, or ragged
 *   encodings when tensors are requested.
 */
_call(S,{text_pair:G=null,add_special_tokens:te=!0,padding:se=!1,truncation:me=null,max_length:Ce=null,return_tensor:Ye=!0,return_token_type_ids:Xe=null}={}){
    // Ze: input is a batch; He: one encoding object per input text.
    let Ze=Array.isArray(S),He;
    if(Ze){
        if(S.length===0)throw Error("text array must be non-empty");
        if(G!==null){
            if(Array.isArray(G)){
                if(S.length!==G.length)throw Error("text and text_pair must have the same length")
            }else throw Error("text_pair must also be an array");
            He=S.map((yt,Xt)=>this._encode_plus(yt,{text_pair:G[Xt],add_special_tokens:te,return_token_type_ids:Xe}))
        }else He=S.map(yt=>this._encode_plus(yt,{add_special_tokens:te,return_token_type_ids:Xe}))
    }else{
        if(S==null)throw Error("text may not be null or undefined");
        if(Array.isArray(G))throw Error("When specifying `text_pair`, since `text` is a string, `text_pair` must also be a string (i.e., not an array).");
        He=[this._encode_plus(S,{text_pair:G,add_special_tokens:te,return_token_type_ids:Xe})]
    }
    if(
        // Step 1: resolve the max length. With no explicit max_length the model's
        // limit is used; with one but no truncation setting, `padding: true`
        // ignores it (warning) and `padding: false` turns truncation on (warning).
        Ce===null?Ce=this.model_max_length:me===null&&(se===!0?(console.warn("`max_length` is ignored when `padding: true` and there is no truncation strategy. To pad to max length, use `padding: 'max_length'`."),Ce=this.model_max_length):se===!1&&(console.warn("Truncation was not explicitly activated but `max_length` is provided a specific value, please use `truncation: true` to explicitly truncate examples to max length."),me=!0)),
        // Step 2: `padding: true` targets the longest encoding in the batch.
        se===!0&&(Ce=Math.min((0,n.max)(He.map(yt=>yt.input_ids.length))[0],Ce??1/0)),
        // Step 3: never exceed the model's own limit.
        Ce=Math.min(Ce,this.model_max_length??1/0),
        // The loop below only runs when padding or truncation is active.
        se||me
    )for(let yt=0;yt<He.length;++yt)
        // Longer encodings are truncated (if enabled) by `Rs`; shorter ones are padded
        // (if enabled) by `Yr`, using the pad token id for `input_ids` and 0 for every other key.
        He[yt].input_ids.length!==Ce&&(He[yt].input_ids.length>Ce?me&&Rs(He[yt],Ce):se&&Yr(He[yt],Ce,Xt=>Xt==="input_ids"?this.pad_token_id:0,this.padding_side));
    let It={};
    if(Ye){
        // Unless both padding and truncation are on, verify that every key has the
        // same length across the batch before packing into tensors.
        if(!(se&&me)&&He.some(Xt=>{for(let Mr of Object.keys(Xt))if(Xt[Mr].length!==He[0][Mr]?.length)return!0;return!1}))throw Error("Unable to create tensor, you should probably activate truncation and/or padding with 'padding=true' and 'truncation=true' to have batched tensors with the same length.");
        // Tensor dims: [number of encodings, length of the first encoding].
        let yt=[He.length,He[0].input_ids.length];
        for(let Xt of Object.keys(He[0]))It[Xt]=new i.Tensor("int64",BigInt64Array.from(He.flatMap(Mr=>Mr[Xt]).map(BigInt)),yt)
    }else{
        for(let yt of Object.keys(He[0]))It[yt]=He.map(Xt=>Xt[yt]);
        // A non-batched input gets its single item back rather than a one-element list.
        if(!Ze)for(let yt of Object.keys(It))It[yt]=It[yt][0]
    }
    return It
}
this.model(Ce)})}_encode_plus(S,{text_pair:G=null,add_special_tokens:te=!0,return_token_type_ids:se=null}={}){let{tokens:me,token_type_ids:Ce}=this._tokenize_helper(S,{pair:G,add_special_tokens:te}),Ye=this.model.convert_tokens_to_ids(me),Xe={input_ids:Ye,attention_mask:new Array(Ye.length).fill(1)};return(se??this.return_token_type_ids)&&Ce&&(Xe.token_type_ids=Ce),Xe}_tokenize_helper(S,{pair:G=null,add_special_tokens:te=!1}={}){let se=this._encode_text(S),me=this._encode_text(G);return this.post_processor?this.post_processor(se,me,{add_special_tokens:te}):{tokens:(0,o.mergeArrays)(se??[],me??[])}}tokenize(S,{pair:G=null,add_special_tokens:te=!1}={}){return this._tokenize_helper(S,{pair:G,add_special_tokens:te}).tokens}encode(S,{text_pair:G=null,add_special_tokens:te=!0,return_token_type_ids:se=null}={}){return this._encode_plus(S,{text_pair:G,add_special_tokens:te,return_token_type_ids:se}).input_ids}batch_decode(S,G={}){return S instanceof i.Tensor&&(S=S.tolist()),S.map(te=>this.decode(te,G))}decode(S,G={}){if(S instanceof i.Tensor&&(S=x(S)),!Array.isArray(S)||S.length===0||!(0,o.isIntegralNumber)(S[0]))throw Error("token_ids must be a non-empty array of integers.");return this.decode_single(S,G)}decode_single(S,{skip_special_tokens:G=!1,clean_up_tokenization_spaces:te=null}){let se=this.model.convert_ids_to_tokens(S);G&&(se=se.filter(Ce=>!this.special_tokens.includes(Ce)));let me=this.decoder?this.decoder(se):se.join(" ");return this.decoder&&this.decoder.end_of_word_suffix&&(me=me.replaceAll(this.decoder.end_of_word_suffix," "),G&&(me=me.trim())),(te??this.clean_up_tokenization_spaces)&&(me=F(me)),me}get_chat_template({chat_template:S=null,tools:G=null}={}){if(this.chat_template&&typeof this.chat_template=="object"){let te=this.chat_template;if(S!==null&&Object.hasOwn(te,S))S=te[S];else if(S===null)if(G!==null&&"tool_use"in te)S=te.tool_use;else if("default"in te)S=te.default;else throw Error(`This model has multiple chat templates with no default specified! 
Please either pass a chat template or the name of the template you wish to use to the 'chat_template' argument. Available template names are ${Object.keys(te).sort()}.`)}else if(S===null)if(this.chat_template)S=this.chat_template;else throw Error("Cannot use apply_chat_template() because tokenizer.chat_template is not set and no template argument was passed! For information about writing templates and setting the tokenizer.chat_template attribute, please see the documentation at https://huggingface.co/docs/transformers/main/en/chat_templating");return S}apply_chat_template(S,{tools:G=null,documents:te=null,chat_template:se=null,add_generation_prompt:me=!1,tokenize:Ce=!0,padding:Ye=!1,truncation:Xe=!1,max_length:Ze=null,return_tensor:He=!0,return_dict:It=!1,tokenizer_kwargs:yt={},...Xt}={}){if(se=this.get_chat_template({chat_template:se,tools:G}),typeof se!="string")throw Error(`chat_template must be a string, but got ${typeof se}`);let Mr=this._compiled_template_cache.get(se);Mr===void 0&&(Mr=new c.Template(se),this._compiled_template_cache.set(se,Mr));let nr=Object.create(null);for(let ir of Dr){let Tr=this.getToken(ir);Tr&&(nr[ir]=Tr)}let Br=Mr.render({messages:S,add_generation_prompt:me,tools:G,documents:te,...nr,...Xt});if(Ce){let ir=this._call(Br,{add_special_tokens:!1,padding:Ye,truncation:Xe,max_length:Ze,return_tensor:He,...yt});return It?ir:ir.input_ids}return Br}}class Cs extends ft{return_token_type_ids=!0}class qt extends ft{return_token_type_ids=!0}class Ss extends ft{return_token_type_ids=!0}class Qr extends ft{return_token_type_ids=!0}class St extends ft{return_token_type_ids=!0}class Xr extends ft{return_token_type_ids=!0}class k extends ft{return_token_type_ids=!0}class Q extends ft{return_token_type_ids=!0}class N extends ft{return_token_type_ids=!0}class K extends ft{}class Z extends ft{}class ce extends ft{return_token_type_ids=!0;constructor(S,G){super(S,G),console.warn('WARNING: `XLMTokenizer` is not yet supported by Hugging Face\'s "fast" 
/**
 * Shared helper for translation tokenizers: validates the requested language
 * codes, rewrites the source-language special token of the post-processor,
 * stores the forced target-language token id on `te`, and tokenizes.
 *
 * @param {Object} de Tokenizer exposing `language_codes`, `languageRegex` and `lang_to_token`.
 * @param {string|string[]} S Text(s) forwarded to `de._call`.
 * @param {Object} G Tokenizer options forwarded to `de._call`.
 * @param {Object} te Generation options; reads `src_lang` / `tgt_lang`, writes `forced_bos_token_id`.
 * @returns {*} Whatever `de._call(S, G)` returns.
 * @throws {Error} When the tokenizer lacks the required attributes or a language code is invalid.
 */
function Gr(de, S, G, te) {
  if (!("language_codes" in de) || !Array.isArray(de.language_codes)) {
    throw new Error("Tokenizer must have `language_codes` attribute set and it should be an array of language ids.");
  }
  if (!("languageRegex" in de) || !(de.languageRegex instanceof RegExp)) {
    throw new Error("Tokenizer must have `languageRegex` attribute set and it should be a regular expression.");
  }
  if (!("lang_to_token" in de) || typeof de.lang_to_token !== "function") {
    throw new Error("Tokenizer must have `lang_to_token` attribute set and it should be a function.");
  }

  const { src_lang: sourceLang, tgt_lang: targetLang } = te;

  if (!de.language_codes.includes(targetLang)) {
    throw new Error(`Target language code "${targetLang}" is not valid. Must be one of: {${de.language_codes.join(", ")}}`);
  }

  if (sourceLang !== undefined) {
    if (!de.language_codes.includes(sourceLang)) {
      throw new Error(`Source language code "${sourceLang}" is not valid. Must be one of: {${de.language_codes.join(", ")}}`);
    }
    // Only the first language-looking special token of the single-sequence template is replaced.
    for (const item of de.post_processor.config.single) {
      if ("SpecialToken" in item && de.languageRegex.test(item.SpecialToken.id)) {
        item.SpecialToken.id = de.lang_to_token(sourceLang);
        break;
      }
    }
  }

  const [targetTokenId] = de.model.convert_tokens_to_ids([de.lang_to_token(targetLang)]);
  te.forced_bos_token_id = targetTokenId;
  return de._call(S, G);
}
/**
 * Merges consecutive, overlapping token sequences into one sequence by
 * finding, for each neighbouring pair, the overlap with the best match ratio
 * and cutting both sides at the midpoint of that overlap.
 *
 * @param {Array<Array>} S Token sequences, in order.
 * @param {Array<Array>|null} [G=null] Per-token timestamp sequences parallel to `S`;
 *   only used when it is a non-empty array.
 * @returns {[Array, Array]} The merged tokens and the merged timestamps
 *   (an empty array when no timestamps were supplied).
 * @throws {Error} When the two compared slices differ in length.
 */
findLongestCommonSequence(S,G=null){
    // te/se: current left sequence and its length; me: merged tokens so far;
    // Ce: timestamps in use; Ye/Xe: merged timestamps and current left timestamps.
    let te=S[0],se=te.length,me=[],Ce=Array.isArray(G)&&G.length>0,Ye=Ce?[]:null,Xe=Ce?G[0]:null;
    for(let Ze=1;Ze<S.length;++Ze){
        // It: best score so far; yt: [leftStart, leftStop, rightStart, rightStop] of the best overlap.
        // The initial value means "no overlap": keep all of the left, all of the right.
        let He=S[Ze],It=0,yt=[se,se,0,0],Xt=He.length;
        // Slide the right sequence over the left one; Pr is the number of positions shifted in.
        for(let Pr=1;Pr<se+Xt;++Pr){
            let Zr=Math.max(0,se-Pr),Yt=Math.min(se,se+Xt-Pr),vr=te.slice(Zr,Yt),Sr=Math.max(0,Pr-se),Jr=Math.min(Xt,Pr),ms=He.slice(Sr,Jr);
            if(vr.length!==ms.length)throw new Error("There is a bug within whisper `decode_asr` function, please report it. Dropping to prevent bad inference.");
            // Fr: number of positions where both slices hold the same token (and, with
            // timestamps, where the left timestamp entry is <= the right one).
            // NOTE(review): `_decode_asr` pushes `[start, end]` arrays as timestamp entries,
            // so this `<=` compares their string forms rather than numbers - confirm intended.
            let Fr;
            Ce?Fr=vr.filter((pr,wr)=>pr===ms[wr]&&Xe[Zr+wr]<=G[Ze][Sr+wr]).length:Fr=vr.filter((pr,wr)=>pr===ms[wr]).length;
            // Score is the match ratio plus a small bonus (Pr/1e4) that grows with the shift.
            // An overlap needs at least two matches to be accepted.
            let is=Pr/1e4,lr=Fr/Pr+is;
            Fr>1&&lr>It&&(It=lr,yt=[Zr,Yt,Sr,Jr])
        }
        // Cut both sequences at the midpoint of the chosen overlap.
        let[Mr,nr,Br,ir]=yt,Tr=Math.floor((nr+Mr)/2),zr=Math.floor((ir+Br)/2);
        me.push(...te.slice(0,Tr)),te=He.slice(zr),se=te.length,Ce&&(Ye.push(...Xe.slice(0,Tr)),Xe=G[Ze].slice(zr))
    }
    // Flush what is left of the last sequence.
    return me.push(...te),Ce?(Ye.push(...Xe),[me,Ye]):[me,[]]
}
/**
 * Tokenizer for Marian translation models. Text may start with a
 * `>>lang<<` prefix, which is split off and emitted as its own token.
 */
class ns extends ft {
  /**
   * @param {Object} S Tokenizer JSON, forwarded to the base class.
   * @param {Object} G Tokenizer config, forwarded to the base class.
   */
  constructor(S, G) {
    super(S, G);
    this.languageRegex = /^(>>\w+<<)\s*/g;

    // `.test()` on a global regex is stateful: after a match `lastIndex` stays
    // non-zero, so the next string is searched from the middle and an anchored
    // pattern fails. Filtering the vocabulary with the `/g` regex therefore
    // dropped every language token that directly followed another one. Use a
    // non-global copy of the same pattern for membership tests.
    const languageTokenPattern = new RegExp(this.languageRegex.source);
    this.supported_language_codes = this.model.vocab.filter((token) => languageTokenPattern.test(token));

    console.warn('WARNING: `MarianTokenizer` is not yet supported by Hugging Face\'s "fast" tokenizers library. Therefore, you may experience slightly inaccurate results.');
  }

  /**
   * Encodes text, treating a leading `>>lang<<` marker as a separate token.
   *
   * @param {string|null} S Text to encode.
   * @returns {string[]|null|undefined} The tokens; null for null input.
   */
  _encode_text(S) {
    if (S === null) {
      return null;
    }

    // Splitting on a regex with one capture group yields [before, marker, rest]
    // when the marker is present, and [text] otherwise.
    const [head, ...remainder] = S.trim().split(this.languageRegex);
    if (remainder.length === 0) {
      return super._encode_text(head);
    }

    if (remainder.length === 2) {
      const [language, text] = remainder;
      if (!this.supported_language_codes.includes(language)) {
        console.warn(`Unsupported language code "${language}" detected, which may lead to unexpected behavior. Should be one of: ${JSON.stringify(this.supported_language_codes)}`);
      }
      return (0, o.mergeArrays)([language], super._encode_text(text));
    }
  }
}
/**
 * Generalized cosine window: sample `k` is `X - (1 - X) * cos(2*pi*k / (z - 1))`.
 * Called with `X = 0.5` by `u` and `X = 0.54` by `d`.
 *
 * @param {number} z Number of samples in the window.
 * @param {number} X Window coefficient.
 * @returns {Float64Array} The window: empty when `z < 1`, `[1]` when `z === 1`.
 */
function _(z, X) {
  if (z < 1) {
    return new Float64Array();
  }
  if (z === 1) {
    return new Float64Array([1]);
  }

  const cosineWeight = 1 - X;
  const step = (2 * Math.PI) / (z - 1);
  return Float64Array.from({ length: z }, (unused, k) => X - cosineWeight * Math.cos(k * step));
}
/**
 * Converts a spectrogram to decibels in place:
 * `factor * (log10(max(min_value, x)) - log10(reference))`.
 * Called by `I` with a factor of 20 and by `f` with a factor of 10.
 *
 * @param {Float32Array|Float64Array|number[]} z Spectrogram values (overwritten).
 * @param {number} X Multiplicative factor applied to the log ratio.
 * @param {number} J Reference value that maps to 0 dB; must be > 0.
 * @param {number} q Floor applied to the values and the reference before the log; must be > 0.
 * @param {number|null} re Dynamic range in dB; when not null, values are clamped
 *   to at least `max - re`. Must be > 0.
 * @returns {Float32Array|Float64Array|number[]} The same array `z`.
 * @throws {Error} When `J`, `q` or a non-null `re` is not greater than zero.
 */
function P(z, X, J, q, re) {
  if (J <= 0) {
    throw new Error("reference must be greater than zero");
  }
  if (q <= 0) {
    throw new Error("min_value must be greater than zero");
  }

  const logReference = Math.log10(Math.max(q, J));
  for (let k = 0; k < z.length; ++k) {
    // The reference is subtracted in the log domain. Subtracting it inside the
    // `log10` argument (as before) is only correct when the reference is 1.
    z[k] = X * (Math.log10(Math.max(q, z[k])) - logReference);
  }

  if (re !== null) {
    if (re <= 0) {
      throw new Error("db_range must be greater than zero");
    }
    const lowest = (0, o.max)(z)[0] - re;
    for (let k = 0; k < z.length; ++k) {
      z[k] = Math.max(z[k], lowest);
    }
  }
  return z;
}
/**
 * Computes a mel spectrogram of a waveform: frames the signal, applies the
 * window, takes the FFT of each frame, projects the power/magnitude spectrum
 * through the mel filter bank and optionally converts to a log scale.
 *
 * @param {Float32Array|Float64Array} z Input waveform.
 * @param {Float32Array|Float64Array} X Window; its length must equal `J`.
 * @param {number} J Frame length in samples.
 * @param {number} q Hop length in samples; must be > 0.
 * @param {Object} [options]
 * @param {number|null} [options.fft_length=null] FFT size; defaults to `J` and may not be smaller.
 * @param {number|null} [options.power=1] Exponent applied to the magnitude (2 keeps the squared magnitude).
 * @param {boolean} [options.center=true] Pad the waveform on both sides before framing.
 * @param {string} [options.pad_mode="reflect"] "reflect" or "constant".
 * @param {boolean} [options.onesided=true] Keep `fft_length / 2 + 1` bins instead of `fft_length`.
 * @param {number|null} [options.preemphasis=null] Pre-emphasis coefficient applied per frame.
 * @param {boolean} [options.preemphasis_htk_flavor=true] Only `true` is supported.
 * @param {Array<Array<number>>} [options.mel_filters=null] Mel filter bank; required.
 * @param {number} [options.mel_floor=1e-10] Lower bound applied to the mel values.
 * @param {string|null} [options.log_mel=null] One of null, "log", "log10" or "dB".
 * @param {number} [options.reference=1] Reference for the "dB" conversion.
 * @param {number} [options.min_value=1e-10] Floor for the "dB" conversion.
 * @param {number|null} [options.db_range=null] Dynamic range for the "dB" conversion.
 * @param {boolean|null} [options.remove_dc_offset=null] Subtract each frame's mean before windowing.
 * @param {number|null} [options.min_num_frames=null] Lower bound on the number of frames.
 * @param {number|null} [options.max_num_frames=null] Upper bound on the number of frames.
 * @param {boolean} [options.do_pad=true] With `max_num_frames`, widen the output to that many frames.
 * @param {boolean} [options.transpose=false] Transpose the result before the floor/log steps.
 * @param {number} [options.mel_offset=0] Constant added to every floored mel value.
 * @returns {Promise<Object>} The tensor produced by `i.matmul` (transposed when requested).
 * @throws {Error} On inconsistent lengths, unsupported options, or missing `mel_filters`.
 */
async function E(z, X, J, q, {
  fft_length: fftLength = null,
  power = 1,
  center = true,
  pad_mode: padMode = "reflect",
  onesided = true,
  preemphasis = null,
  preemphasis_htk_flavor: preemphasisHtkFlavor = true,
  mel_filters: melFilters = null,
  mel_floor: melFloor = 1e-10,
  log_mel: logMel = null,
  reference = 1,
  min_value: minValue = 1e-10,
  db_range: dbRange = null,
  remove_dc_offset: removeDcOffset = null,
  min_num_frames: minNumFrames = null,
  max_num_frames: maxNumFrames = null,
  do_pad: doPad = true,
  transpose = false,
  mel_offset: melOffset = 0,
} = {}) {
  const windowLength = X.length;
  if (fftLength === null) {
    fftLength = J;
  }
  if (J > fftLength) {
    throw Error(`frame_length (${J}) may not be larger than fft_length (${fftLength})`);
  }
  if (windowLength !== J) {
    throw new Error(`Length of the window (${windowLength}) must equal frame_length (${J})`);
  }
  if (q <= 0) {
    throw new Error("hop_length must be greater than zero");
  }
  if (power === null && melFilters !== null) {
    throw new Error("You have provided `mel_filters` but `power` is `None`. Mel spectrogram computation is not yet supported for complex-valued spectrogram. Specify `power` to fix this issue.");
  }
  if (!preemphasisHtkFlavor) {
    throw new Error("`preemphasis_htk_flavor=false` is not currently supported.");
  }
  // The mel projection below always dereferences the filter bank, so a missing
  // one can never succeed. Fail here with a clear message instead of an opaque
  // TypeError after the whole STFT has been computed.
  if (melFilters === null) {
    throw new Error("`mel_filters` must be provided: computing a spectrogram without a mel filter bank is not currently supported.");
  }

  let waveform = z;
  if (center) {
    switch (padMode) {
      case "reflect": {
        const halfWindow = Math.floor((fftLength - 1) / 2) + 1;
        waveform = y(waveform, halfWindow, halfWindow);
        break;
      }
      case "constant": {
        const halfWindow = Math.floor(fftLength / 2);
        const padded = new waveform.constructor(waveform.length + 2 * halfWindow);
        padded.set(waveform, halfWindow);
        waveform = padded;
        break;
      }
      default:
        throw new Error(`pad_mode="${padMode}" not implemented yet.`);
    }
  }

  let numFrames = Math.floor(1 + Math.floor((waveform.length - J) / q));
  if (minNumFrames !== null && numFrames < minNumFrames) {
    numFrames = minNumFrames;
  }
  const numFrequencyBins = onesided ? Math.floor(fftLength / 2) + 1 : fftLength;

  // `framesToCompute` frames are transformed; the output is `framesInOutput` frames wide.
  let framesToCompute = numFrames;
  let framesInOutput = numFrames;
  if (maxNumFrames !== null) {
    if (maxNumFrames > numFrames) {
      if (doPad) {
        framesInOutput = maxNumFrames;
      }
    } else {
      framesInOutput = framesToCompute = maxNumFrames;
    }
  }

  const fft = new o.FFT(fftLength);
  const inputBuffer = new Float64Array(fftLength);
  const outputBuffer = new Float64Array(fft.outputBufferSize);
  // Laid out as [frequency bin][frame].
  const magnitudes = new Float32Array(numFrequencyBins * framesInOutput);

  for (let frame = 0; frame < framesToCompute; ++frame) {
    const offset = frame * q;
    const available = Math.min(waveform.length - offset, J);
    if (available !== J) {
      // Short frame: clear what the previous frame left behind.
      inputBuffer.fill(0, 0, J);
    }
    for (let k = 0; k < available; ++k) {
      inputBuffer[k] = waveform[offset + k];
    }

    if (removeDcOffset) {
      let sum = 0;
      for (let k = 0; k < available; ++k) {
        sum += inputBuffer[k];
      }
      const mean = sum / available;
      for (let k = 0; k < available; ++k) {
        inputBuffer[k] -= mean;
      }
    }

    if (preemphasis !== null) {
      // Backwards, so each sample still sees its unmodified predecessor.
      for (let k = available - 1; k >= 1; --k) {
        inputBuffer[k] -= preemphasis * inputBuffer[k - 1];
      }
      inputBuffer[0] *= 1 - preemphasis;
    }

    for (let k = 0; k < X.length; ++k) {
      inputBuffer[k] *= X[k];
    }

    fft.realTransform(outputBuffer, inputBuffer);
    for (let bin = 0; bin < numFrequencyBins; ++bin) {
      // Output is interleaved: even index real part, odd index imaginary part.
      const idx = bin << 1;
      magnitudes[bin * framesInOutput + frame] = outputBuffer[idx] ** 2 + outputBuffer[idx + 1] ** 2;
    }
  }

  if (power !== null && power !== 2) {
    // Values are squared magnitudes, so raise to power / 2.
    const exponent = power / 2;
    for (let k = 0; k < magnitudes.length; ++k) {
      magnitudes[k] **= exponent;
    }
  }

  const numMelFilters = melFilters.length;
  let melSpec = await (0, i.matmul)(
    new i.Tensor("float32", melFilters.flat(), [numMelFilters, numFrequencyBins]),
    new i.Tensor("float32", magnitudes, [numFrequencyBins, framesInOutput]),
  );
  if (transpose) {
    melSpec = melSpec.transpose(1, 0);
  }

  const melData = melSpec.data;
  for (let k = 0; k < melData.length; ++k) {
    melData[k] = melOffset + Math.max(melFloor, melData[k]);
  }

  if (power !== null && logMel !== null) {
    const limit = Math.min(melData.length, framesToCompute * numMelFilters);
    switch (logMel) {
      case "log":
        for (let k = 0; k < limit; ++k) {
          melData[k] = Math.log(melData[k]);
        }
        break;
      case "log10":
        for (let k = 0; k < limit; ++k) {
          melData[k] = Math.log10(melData[k]);
        }
        break;
      case "dB":
        if (power === 1) {
          I(melData, reference, minValue, dbRange);
        } else if (power === 2) {
          f(melData, reference, minValue, dbRange);
        } else {
          throw new Error(`Cannot use log_mel option '${logMel}' with power ${power}`);
        }
        break;
      default:
        throw new Error(`log_mel must be one of null, 'log', 'log10' or 'dB'. Got '${logMel}'`);
    }
  }

  return melSpec;
}
/**
 * Copies the listed keys of `b` into a fresh object, leaving out keys whose
 * value is `undefined`.
 *
 * @param {Object} b Source object.
 * @param {string[]} C Keys to copy.
 * @returns {Object} A new object holding the selected key/value pairs.
 */
function x(b, C) {
  const picked = {};
  C.forEach((key) => {
    const value = b[key];
    if (value !== undefined) {
      picked[key] = value;
    }
  });
  return picked;
}
b)P===C&&++y;return y}}),"./src/utils/data-structures.js":((e,r,t)=>{t.r(r),t.d(r,{CharTrie:()=>o,DictionarySplitter:()=>l,LRUCache:()=>c,PriorityQueue:()=>s,TokenLattice:()=>n});class s{constructor(u=(g,h)=>g>h,d=1/0){this._heap=[],this._comparator=u,this._maxSize=d}get size(){return this._heap.length}isEmpty(){return this.size===0}peek(){return this._heap[0]}push(...u){return this.extend(u)}extend(u){for(let d of u)if(this.size<this._maxSize)this._heap.push(d),this._siftUp();else{let g=this._smallest();this._comparator(d,this._heap[g])&&(this._heap[g]=d,this._siftUpFrom(g))}return this.size}pop(){let u=this.peek(),d=this.size-1;return d>0&&this._swap(0,d),this._heap.pop(),this._siftDown(),u}replace(u){let d=this.peek();return this._heap[0]=u,this._siftDown(),d}_parent(u){return(u+1>>>1)-1}_left(u){return(u<<1)+1}_right(u){return u+1<<1}_greater(u,d){return this._comparator(this._heap[u],this._heap[d])}_swap(u,d){let g=this._heap[u];this._heap[u]=this._heap[d],this._heap[d]=g}_siftUp(){this._siftUpFrom(this.size-1)}_siftUpFrom(u){for(;u>0&&this._greater(u,this._parent(u));)this._swap(u,this._parent(u)),u=this._parent(u)}_siftDown(){let u=0;for(;this._left(u)<this.size&&this._greater(this._left(u),u)||this._right(u)<this.size&&this._greater(this._right(u),u);){let d=this._right(u)<this.size&&this._greater(this._right(u),this._left(u))?this._right(u):this._left(u);this._swap(u,d),u=d}}_smallest(){return 2**Math.floor(Math.log2(this.size))-1}}class o{constructor(){this.root=a.default()}extend(u){for(let d of u)this.push(d)}push(u){let d=this.root;for(let g of u){let h=d.children.get(g);h===void 0&&(h=a.default(),d.children.set(g,h)),d=h}d.isLeaf=!0}*commonPrefixSearch(u){let d=this.root;if(d===void 0)return;let g="";for(let h of u){if(g+=h,d=d.children.get(h),d===void 0)return;d.isLeaf&&(yield g)}}}class a{constructor(u,d){this.isLeaf=u,this.children=d}static default(){return new a(!1,new Map)}}class 
n{constructor(u,d,g){this.chars=Array.from(u),this.len=this.chars.length,this.bosTokenId=d,this.eosTokenId=g,this.nodes=[],this.beginNodes=Array.from({length:this.len+1},()=>[]),this.endNodes=Array.from({length:this.len+1},()=>[]);let h=new i(this.bosTokenId,0,0,0,0),x=new i(this.eosTokenId,1,this.len,0,0);this.nodes.push(h.clone()),this.nodes.push(x.clone()),this.beginNodes[this.len].push(x),this.endNodes[0].push(h)}insert(u,d,g,h){let x=this.nodes.length,F=new i(h,x,u,d,g);this.beginNodes[u].push(F),this.endNodes[u+d].push(F),this.nodes.push(F)}viterbi(){let u=this.len,d=0;for(;d<=u;){if(this.beginNodes[d].length==0)return[];for(let v of this.beginNodes[d]){v.prev=null;let b=0,C=null;for(let y of this.endNodes[d]){let P=y.backtraceScore+v.score;(C===null||P>b)&&(C=y.clone(),b=P)}if(C!==null)v.prev=C,v.backtraceScore=b;else return[]}++d}let g=[],x=this.beginNodes[u][0].prev;if(x===null)return[];let F=x.clone();for(;F.prev!==null;)g.push(F.clone()),F=F.clone().prev.clone();return g.reverse(),g}piece(u){return this.chars.slice(u.pos,u.pos+u.length).join("")}tokens(){return this.viterbi().map(d=>this.piece(d))}tokenIds(){return this.viterbi().map(d=>d.tokenId)}}class i{constructor(u,d,g,h,x){this.tokenId=u,this.nodeId=d,this.pos=g,this.length=h,this.score=x,this.prev=null,this.backtraceScore=0}clone(){let u=new i(this.tokenId,this.nodeId,this.pos,this.length,this.score);return u.prev=this.prev,u.backtraceScore=this.backtraceScore,u}}class l{constructor(u){this.trie=this._buildTrie(u)}_buildTrie(u){let d=Object.create(null);for(let g of u){let h=d;for(let x=0;x<g.length;++x)h=h[g[x]]??=Object.create(null);h.end=g}return d}split(u){let d=[],g=u.length,h=0,x=0;for(;x<g;){let F=this.trie,v=null,b=x;for(;b<g&&(F=F[u[b]]);)F.end&&(v=F.end),++b;v?(x>h&&d.push(u.slice(h,x)),d.push(v),x+=v.length,h=x):++x}return h<g&&d.push(u.slice(h)),d}}class c{constructor(u){this.capacity=u,this.cache=new Map}get(u){if(!this.cache.has(u))return;let d=this.cache.get(u);return 
this.cache.delete(u),this.cache.set(u,d),d}put(u,d){this.cache.has(u)&&this.cache.delete(u),this.cache.set(u,d),this.cache.size>this.capacity&&this.cache.delete(this.cache.keys().next().value)}clear(){this.cache.clear()}}}),"./src/utils/devices.js":((e,r,t)=>{t.r(r),t.d(r,{DEVICE_TYPES:()=>s});let s=Object.freeze({auto:"auto",gpu:"gpu",cpu:"cpu",wasm:"wasm",webgpu:"webgpu",cuda:"cuda",dml:"dml",webnn:"webnn","webnn-npu":"webnn-npu","webnn-gpu":"webnn-gpu","webnn-cpu":"webnn-cpu"})}),"./src/utils/dtypes.js":((e,r,t)=>{t.r(r),t.d(r,{DATA_TYPES:()=>n,DEFAULT_DEVICE_DTYPE_MAPPING:()=>i,DEFAULT_DTYPE_SUFFIX_MAPPING:()=>l,isWebGpuFp16Supported:()=>a});var s=t("./src/env.js"),o=t("./src/utils/devices.js");let a=(function(){let c;return async function(){if(c===void 0)if(!s.apis.IS_WEBGPU_AVAILABLE)c=!1;else try{c=(await navigator.gpu.requestAdapter()).features.has("shader-f16")}catch{c=!1}return c}})(),n=Object.freeze({auto:"auto",fp32:"fp32",fp16:"fp16",q8:"q8",int8:"int8",uint8:"uint8",q4:"q4",bnb4:"bnb4",q4f16:"q4f16"}),i=Object.freeze({[o.DEVICE_TYPES.wasm]:n.q8}),l=Object.freeze({[n.fp32]:"",[n.fp16]:"_fp16",[n.int8]:"_int8",[n.uint8]:"_uint8",[n.q8]:"_quantized",[n.q4]:"_q4",[n.q4f16]:"_q4f16",[n.bnb4]:"_bnb4"})}),"./src/utils/generic.js":((e,r,t)=>{t.r(r),t.d(r,{Callable:()=>s});let s=class{constructor(){let o=function(...a){return o._call(...a)};return Object.setPrototypeOf(o,new.target.prototype)}_call(...o){throw Error("Must implement _call method in subclass")}}}),"./src/utils/hub.js":((e,r,t)=>{t.r(r),t.d(r,{MAX_EXTERNAL_DATA_CHUNKS:()=>i,getFile:()=>g,getModelFile:()=>b,getModelJSON:()=>y,getModelText:()=>C});var s=t("?7992"),o=t("?5af5"),a=t("./src/env.js"),n=t("./src/utils/core.js");let i=100,l={txt:"text/plain",html:"text/html",css:"text/css",js:"text/javascript",json:"application/json",png:"image/png",jpg:"image/jpeg",jpeg:"image/jpeg",gif:"image/gif"};class c{constructor(E){if(this.filePath=E,this.headers=new 
Headers,this.exists=s.existsSync(E),this.exists){this.status=200,this.statusText="OK";let D=s.statSync(E);this.headers.set("content-length",D.size.toString()),this.updateContentType();let O=s.createReadStream(E);this.body=new ReadableStream({start(U){O.on("data",W=>U.enqueue(W)),O.on("end",()=>U.close()),O.on("error",W=>U.error(W))},cancel(){O.destroy()}})}else this.status=404,this.statusText="Not Found",this.body=null}updateContentType(){let E=this.filePath.toString().split(".").pop().toLowerCase();this.headers.set("content-type",l[E]??"application/octet-stream")}clone(){let E=new c(this.filePath);return E.exists=this.exists,E.status=this.status,E.statusText=this.statusText,E.headers=new Headers(this.headers),E}async arrayBuffer(){return(await s.promises.readFile(this.filePath)).buffer}async blob(){let E=await s.promises.readFile(this.filePath);return new Blob([E],{type:this.headers.get("content-type")})}async text(){return await s.promises.readFile(this.filePath,"utf8")}async json(){return JSON.parse(await this.text())}}function _(f,E=null,D=null){let O;try{O=new URL(f)}catch{return!1}return!(E&&!E.includes(O.protocol)||D&&!D.includes(O.hostname))}let u=/^(\b[\w\-.]+\b\/)?\b[\w\-.]{1,96}\b$/;function d(f){return!(!u.test(f)||f.includes("..")||f.includes("--")||f.endsWith(".git")||f.endsWith(".ipynb"))}async function g(f){if(a.env.useFS&&!_(f,["http:","https:","blob:"]))return new c(f instanceof URL?f.protocol==="file:"?f.pathname:f.toString():f);if(typeof process<"u"&&process?.release?.name==="node"){let E=!!process.env?.TESTING_REMOTELY,D=a.env.version,O=new Headers;if(O.set("User-Agent",`transformers.js/${D}; is_ci/${E};`),_(f,["http:","https:"],["huggingface.co","hf.co"])){let W=process.env?.HF_TOKEN??process.env?.HF_ACCESS_TOKEN;W&&O.set("Authorization",`Bearer ${W}`)}return fetch(f,{headers:O})}else return fetch(f)}let h={400:"Bad request error occurred while trying to load file",401:"Unauthorized access to file",403:"Forbidden access to file",404:"Could not 
locate file",408:"Request timeout error occurred while trying to load file",500:"Internal server error error occurred while trying to load file",502:"Bad gateway error occurred while trying to load file",503:"Service unavailable error occurred while trying to load file",504:"Gateway timeout error occurred while trying to load file"};function x(f,E,D){if(!D)return null;let O=h[f]??`Error (${f}) occurred while trying to load file`;throw Error(`${O}: "${E}".`)}class F{constructor(E){this.path=E}async match(E){let D=o.join(this.path,E),O=new c(D);if(O.exists)return O}async put(E,D,O=void 0){let U=o.join(this.path,E);try{let W=D.headers.get("Content-Length"),z=parseInt(W??"0"),X=0;await s.promises.mkdir(o.dirname(U),{recursive:!0});let J=s.createWriteStream(U),q=D.body.getReader();for(;;){let{done:re,value:oe}=await q.read();if(re)break;await new Promise((ye,Y)=>{J.write(oe,H=>{if(H){Y(H);return}ye()})}),X+=oe.length;let ne=z?X/z*100:0;O?.({progress:ne,loaded:X,total:z})}J.close()}catch(W){try{await s.promises.unlink(U)}catch{}throw W}}}async function v(f,...E){for(let D of E)try{let O=await f.match(D);if(O)return O}catch{continue}}async function b(f,E,D=!0,O={},U=!1){if(!a.env.allowLocalModels){if(O.local_files_only)throw Error("Invalid configuration detected: local models are disabled (`env.allowLocalModels=false`) but you have requested to only use local models (`local_files_only=true`).");if(!a.env.allowRemoteModels)throw Error("Invalid configuration detected: both local and remote models are disabled. Fix by setting `env.allowLocalModels` or `env.allowRemoteModels` to `true`.")}(0,n.dispatchCallback)(O.progress_callback,{status:"initiate",name:f,file:E});let W;if(!W&&a.env.useCustomCache){if(!a.env.customCache)throw Error("`env.useCustomCache=true`, but `env.customCache` is not defined.");if(!a.env.customCache.match||!a.env.customCache.put)throw new Error("`env.customCache` must be an object which implements the `match` and `put` functions of the Web Cache API. 
For more information, see https://developer.mozilla.org/en-US/docs/Web/API/Cache");W=a.env.customCache}if(!W&&a.env.useBrowserCache){if(typeof caches>"u")throw Error("Browser cache is not available in this environment.");try{W=await caches.open("transformers-cache")}catch(ee){console.warn("An error occurred while opening the browser cache:",ee)}}if(!W&&a.env.useFSCache){if(!a.apis.IS_FS_AVAILABLE)throw Error("File System Cache is not available in this environment.");W=new F(O.cache_dir??a.env.cacheDir)}let z=O.revision??"main",X=I(f,E),J=d(f),q=J?I(a.env.localModelPath,X):X,re=I(a.env.remoteHost,a.env.remotePathTemplate.replaceAll("{model}",f).replaceAll("{revision}",encodeURIComponent(z)),E),oe,ne=W instanceof F?z==="main"?X:I(f,z,E):re,ye=!1,Y;W&&(Y=await v(W,q,ne));let H=Y!==void 0;if(Y===void 0){if(a.env.allowLocalModels)if(_(X,["http:","https:"])){if(O.local_files_only)throw new Error(`\`local_files_only=true\`, but attempted to load a remote file from: ${X}.`);if(!a.env.allowRemoteModels)throw new Error(`\`env.allowRemoteModels=false\`, but attempted to load a remote file from: ${X}.`)}else try{Y=await g(q),oe=q}catch(ue){console.warn(`Unable to load from local path "${q}": "${ue}"`)}if(Y===void 0||Y.status===404){if(O.local_files_only||!a.env.allowRemoteModels){if(D)throw Error(`\`local_files_only=true\` or \`env.allowRemoteModels=false\` and file was not found locally at "${q}".`);return null}if(!J)throw Error(`Local file missing at "${q}" and download aborted due to invalid model ID "${f}".`);if(Y=await g(re),Y.status!==200)return x(Y.status,re,D);oe=ne}ye=W&&typeof Response<"u"&&Y instanceof Response&&Y.status===200}(0,n.dispatchCallback)(O.progress_callback,{status:"download",name:f,file:E});let R;if(!(a.apis.IS_NODE_ENV&&U)){let ee;O.progress_callback?H&&typeof navigator<"u"&&/firefox/i.test(navigator.userAgent)?(ee=new Uint8Array(await 
Y.arrayBuffer()),(0,n.dispatchCallback)(O.progress_callback,{status:"progress",name:f,file:E,progress:100,loaded:ee.length,total:ee.length})):ee=await P(Y,ue=>{(0,n.dispatchCallback)(O.progress_callback,{status:"progress",name:f,file:E,...ue})}):ee=new Uint8Array(await Y.arrayBuffer()),R=ee}if(ye&&oe&&await W.match(oe)===void 0)if(R)await W.put(oe,new Response(R,{headers:Y.headers})).catch(ee=>{console.warn(`Unable to add response to browser cache: ${ee}.`)});else{let ee=O.progress_callback?ue=>(0,n.dispatchCallback)(O.progress_callback,{status:"progress",name:f,file:E,...ue}):void 0;await W.put(oe,Y,ee)}if((0,n.dispatchCallback)(O.progress_callback,{status:"done",name:f,file:E}),R){if(!a.apis.IS_NODE_ENV&&U)throw new Error("Cannot return path in a browser environment.");return R}if(Y instanceof c)return Y.filePath;let L=await W?.match(oe);if(L instanceof c)return L.filePath;if(L instanceof Response)return new Uint8Array(await L.arrayBuffer());if(typeof L=="string")return L;throw new Error("Unable to get model file path or buffer.")}async function C(f,E,D=!0,O={}){let U=await b(f,E,D,O,!1);return U===null?null:new TextDecoder("utf-8").decode(U)}async function y(f,E,D=!0,O={}){let U=await C(f,E,D,O);return U===null?{}:JSON.parse(U)}async function P(f,E){let D=f.headers.get("Content-Length");D===null&&console.warn("Unable to determine content-length from response headers. 
Will expand buffer when needed.");let O=parseInt(D??"0"),U=new Uint8Array(O),W=0,z=f.body.getReader();async function X(){let{done:J,value:q}=await z.read();if(J)return;let re=W+q.length;if(re>O){O=re;let ne=new Uint8Array(O);ne.set(U),U=ne}U.set(q,W),W=re;let oe=W/O*100;return E({progress:oe,loaded:W,total:O}),X()}return await X(),U}function I(...f){return f=f.map((E,D)=>(D&&(E=E.replace(new RegExp("^/"),"")),D!==f.length-1&&(E=E.replace(new RegExp("/$"),"")),E)),f.join("/")}}),"./src/utils/image.js":((e,r,t)=>{t.r(r),t.d(r,{RawImage:()=>h,load_image:()=>x});var s=t("./src/utils/core.js"),o=t("./src/utils/hub.js"),a=t("./src/env.js"),n=t("./src/utils/tensor.js"),i=t("?2b25");let l,c,_,u=a.apis.IS_BROWSER_ENV||a.apis.IS_WEBWORKER_ENV;if(u)l=(F,v)=>{if(!self.OffscreenCanvas)throw new Error("OffscreenCanvas not supported by this browser.");return new self.OffscreenCanvas(F,v)},_=self.createImageBitmap,c=self.ImageData;else if(i)_=async F=>{let b=(await F.metadata()).channels,{data:C,info:y}=await F.rotate().raw().toBuffer({resolveWithObject:!0}),P=new h(new Uint8ClampedArray(C),y.width,y.height,y.channels);return b!==void 0&&b!==y.channels&&P.convert(b),P};else throw new Error("Unable to load image processing library.");let d={0:"nearest",1:"lanczos",2:"bilinear",3:"bicubic",4:"box",5:"hamming"},g=new Map([["png","image/png"],["jpg","image/jpeg"],["jpeg","image/jpeg"],["gif","image/gif"]]);class h{constructor(v,b,C,y){this.data=v,this.width=b,this.height=C,this.channels=y}get size(){return[this.width,this.height]}static async read(v){if(v instanceof h)return v;if(typeof v=="string"||v instanceof URL)return await this.fromURL(v);if(v instanceof Blob)return await this.fromBlob(v);if(typeof HTMLCanvasElement<"u"&&v instanceof HTMLCanvasElement||typeof OffscreenCanvas<"u"&&v instanceof OffscreenCanvas)return this.fromCanvas(v);throw new Error(`Unsupported input type: ${typeof v}`)}static fromCanvas(v){if(!u)throw new Error("fromCanvas() is only supported in browser 
environments.");let C=v.getContext("2d").getImageData(0,0,v.width,v.height).data;return new h(C,v.width,v.height,4)}static async fromURL(v){let b=await(0,o.getFile)(v);if(b.status!==200)throw new Error(`Unable to read image from "${v}" (${b.status} ${b.statusText})`);let C=await b.blob();return this.fromBlob(C)}static async fromBlob(v){if(u){let b=await _(v),C=l(b.width,b.height).getContext("2d");return C.drawImage(b,0,0),new this(C.getImageData(0,0,b.width,b.height).data,b.width,b.height,4)}else{let b=i(await v.arrayBuffer());return await _(b)}}static fromTensor(v,b="CHW"){if(v.dims.length!==3)throw new Error(`Tensor should have 3 dimensions, but has ${v.dims.length} dimensions.`);if(b==="CHW")v=v.transpose(1,2,0);else if(b!=="HWC")throw new Error(`Unsupported channel format: ${b}`);if(!(v.data instanceof Uint8ClampedArray||v.data instanceof Uint8Array))throw new Error(`Unsupported tensor type: ${v.type}`);switch(v.dims[2]){case 1:case 2:case 3:case 4:return new h(v.data,v.dims[1],v.dims[0],v.dims[2]);default:throw new Error(`Unsupported number of channels: ${v.dims[2]}`)}}grayscale(){if(this.channels===1)return this;let v=new Uint8ClampedArray(this.width*this.height*1);switch(this.channels){case 3:case 4:for(let b=0,C=0;b<this.data.length;b+=this.channels){let y=this.data[b],P=this.data[b+1],I=this.data[b+2];v[C++]=Math.round(.2989*y+.587*P+.114*I)}break;default:throw new Error(`Conversion failed due to unsupported number of channels: ${this.channels}`)}return this._update(v,this.width,this.height,1)}rgb(){if(this.channels===3)return this;let v=new Uint8ClampedArray(this.width*this.height*3);switch(this.channels){case 1:for(let b=0,C=0;b<this.data.length;++b)v[C++]=this.data[b],v[C++]=this.data[b],v[C++]=this.data[b];break;case 4:for(let b=0,C=0;b<this.data.length;b+=4)v[C++]=this.data[b],v[C++]=this.data[b+1],v[C++]=this.data[b+2];break;default:throw new Error(`Conversion failed due to unsupported number of channels: ${this.channels}`)}return 
this._update(v,this.width,this.height,3)}rgba(){if(this.channels===4)return this;let v=new Uint8ClampedArray(this.width*this.height*4);switch(this.channels){case 1:for(let b=0,C=0;b<this.data.length;++b)v[C++]=this.data[b],v[C++]=this.data[b],v[C++]=this.data[b],v[C++]=255;break;case 3:for(let b=0,C=0;b<this.data.length;b+=3)v[C++]=this.data[b],v[C++]=this.data[b+1],v[C++]=this.data[b+2],v[C++]=255;break;default:throw new Error(`Conversion failed due to unsupported number of channels: ${this.channels}`)}return this._update(v,this.width,this.height,4)}putAlpha(v){if(v.width!==this.width||v.height!==this.height)throw new Error(`Expected mask size to be ${this.width}x${this.height}, but got ${v.width}x${v.height}`);if(v.channels!==1)throw new Error(`Expected mask to have 1 channel, but got ${v.channels}`);let b=this.data,C=v.data,y=this.width*this.height;if(this.channels===3){let P=new Uint8ClampedArray(y*4);for(let I=0,f=0,E=0;I<y;++I)P[E++]=b[f++],P[E++]=b[f++],P[E++]=b[f++],P[E++]=C[I];return this._update(P,this.width,this.height,4)}else if(this.channels===4){for(let P=0;P<y;++P)b[4*P+3]=C[P];return this}throw new Error(`Expected image to have 3 or 4 channels, but got ${this.channels}`)}async resize(v,b,{resample:C=2}={}){if(this.width===v&&this.height===b)return this;let y=d[C]??C,P=(0,s.isNullishDimension)(v),I=(0,s.isNullishDimension)(b);if(P&&I)return this;if(P?v=b/this.height*this.width:I&&(b=v/this.width*this.height),u){let f=this.channels,E=this.toCanvas(),D=l(v,b).getContext("2d");return D.drawImage(E,0,0,v,b),new h(D.getImageData(0,0,v,b).data,v,b,4).convert(f)}else{let f=this.toSharp();switch(y){case"box":case"hamming":(y==="box"||y==="hamming")&&(console.warn(`Resampling method ${y} is not yet supported. 
Using bilinear instead.`),y="bilinear");case"nearest":case"bilinear":case"bicubic":f=f.affine([v/this.width,0,0,b/this.height],{interpolator:y});break;case"lanczos":f=f.resize({width:v,height:b,fit:"fill",kernel:"lanczos3"});break;default:throw new Error(`Resampling method ${y} is not supported.`)}return await _(f)}}async pad([v,b,C,y]){if(v=Math.max(v,0),b=Math.max(b,0),C=Math.max(C,0),y=Math.max(y,0),v===0&&b===0&&C===0&&y===0)return this;if(u){let P=this.channels,I=this.toCanvas(),f=this.width+v+b,E=this.height+C+y,D=l(f,E).getContext("2d");return D.drawImage(I,0,0,this.width,this.height,v,C,this.width,this.height),new h(D.getImageData(0,0,f,E).data,f,E,4).convert(P)}else{let P=this.toSharp().extend({left:v,right:b,top:C,bottom:y});return await _(P)}}async crop([v,b,C,y]){if(v=Math.max(v,0),b=Math.max(b,0),C=Math.min(C,this.width-1),y=Math.min(y,this.height-1),v===0&&b===0&&C===this.width-1&&y===this.height-1)return this;let P=C-v+1,I=y-b+1;if(u){let f=this.channels,E=this.toCanvas(),D=l(P,I).getContext("2d");return D.drawImage(E,v,b,P,I,0,0,P,I),new h(D.getImageData(0,0,P,I).data,P,I,4).convert(f)}else{let f=this.toSharp().extract({left:v,top:b,width:P,height:I});return await _(f)}}async center_crop(v,b){if(this.width===v&&this.height===b)return this;let C=(this.width-v)/2,y=(this.height-b)/2;if(u){let P=this.channels,I=this.toCanvas(),f=l(v,b).getContext("2d"),E=0,D=0,O=0,U=0;return C>=0?E=C:O=-C,y>=0?D=y:U=-y,f.drawImage(I,E,D,v,b,O,U,v,b),new h(f.getImageData(0,0,v,b).data,v,b,4).convert(P)}else{let P=this.toSharp();if(C>=0&&y>=0)P=P.extract({left:Math.floor(C),top:Math.floor(y),width:v,height:b});else if(C<=0&&y<=0){let I=Math.floor(-y),f=Math.floor(-C);P=P.extend({top:I,left:f,right:v-this.width-f,bottom:b-this.height-I})}else{let I=[0,0],f=0;y<0?(I[0]=Math.floor(-y),I[1]=b-this.height-I[0]):f=Math.floor(y);let 
E=[0,0],D=0;C<0?(E[0]=Math.floor(-C),E[1]=v-this.width-E[0]):D=Math.floor(C),P=P.extend({top:I[0],bottom:I[1],left:E[0],right:E[1]}).extract({left:D,top:f,width:v,height:b})}return await _(P)}}async toBlob(v="image/png",b=1){if(!u)throw new Error("toBlob() is only supported in browser environments.");return await this.toCanvas().convertToBlob({type:v,quality:b})}toTensor(v="CHW"){let b=new n.Tensor("uint8",new Uint8Array(this.data),[this.height,this.width,this.channels]);if(v!=="HWC")if(v==="CHW")b=b.permute(2,0,1);else throw new Error(`Unsupported channel format: ${v}`);return b}toCanvas(){if(!u)throw new Error("toCanvas() is only supported in browser environments.");let v=this.clone().rgba(),b=l(v.width,v.height),C=new c(v.data,v.width,v.height);return b.getContext("2d").putImageData(C,0,0),b}split(){let{data:v,width:b,height:C,channels:y}=this,P=v.constructor,I=v.length/y,f=Array.from({length:y},()=>new P(I));for(let E=0;E<I;++E){let D=y*E;for(let O=0;O<y;++O)f[O][E]=v[D+O]}return f.map(E=>new h(E,b,C,1))}_update(v,b,C,y=null){return this.data=v,this.width=b,this.height=C,y!==null&&(this.channels=y),this}clone(){return new h(this.data.slice(),this.width,this.height,this.channels)}convert(v){if(this.channels===v)return this;switch(v){case 1:this.grayscale();break;case 3:this.rgb();break;case 4:this.rgba();break;default:throw new Error(`Conversion failed due to unsupported number of channels: ${this.channels}`)}return this}async save(v){if(u){if(a.apis.IS_WEBWORKER_ENV)throw new Error("Unable to save an image from a Web Worker.");let b=v.split(".").pop().toLowerCase(),C=g.get(b)??"image/png",y=await this.toBlob(C);(0,s.saveBlob)(v,y)}else{if(a.apis.IS_FS_AVAILABLE)return await this.toSharp().toFile(v);throw new Error("Unable to save the image because filesystem is disabled in this environment.")}}toSharp(){if(u)throw new Error("toSharp() is only supported in server-side environments.");return 
i(this.data,{raw:{width:this.width,height:this.height,channels:this.channels}})}}let x=h.read.bind(h)}),"./src/utils/maths.js":((e,r,t)=>{t.r(r),t.d(r,{FFT:()=>x,bankers_round:()=>b,cos_sim:()=>l,dot:()=>i,dynamic_time_warping:()=>C,interpolate_data:()=>s,log_softmax:()=>n,magnitude:()=>c,max:()=>u,medianFilter:()=>F,min:()=>_,permute_data:()=>o,round:()=>v,softmax:()=>a});function s(y,[P,I,f],[E,D],O="bilinear",U=!1){let W=D/f,z=E/I,X=new y.constructor(E*D*P),J=I*f,q=E*D;for(let re=0;re<E;++re)for(let oe=0;oe<D;++oe){let ne=re*D+oe,ye=(oe+.5)/W-.5,Y=(re+.5)/z-.5,H=Math.floor(ye),R=Math.floor(Y),L=Math.min(H+1,f-1),ee=Math.min(R+1,I-1);H=Math.max(H,0),R=Math.max(R,0);let ue=ye-H,ke=Y-R,Ie=(1-ue)*(1-ke),Le=ue*(1-ke),rt=(1-ue)*ke,we=ue*ke,A=R*f,le=ee*f,ge=A+H,be=A+L,Ae=le+H,ve=le+L;for(let pe=0;pe<P;++pe){let Pe=pe*J;X[pe*q+ne]=Ie*y[Pe+ge]+Le*y[Pe+be]+rt*y[Pe+Ae]+we*y[Pe+ve]}}return X}function o(y,P,I){let f=new Array(I.length),E=new Array(I.length);for(let U=I.length-1,W=1;U>=0;--U)E[U]=W,f[U]=P[I[U]],W*=f[U];let D=I.map((U,W)=>E[I.indexOf(W)]),O=new y.constructor(y.length);for(let U=0;U<y.length;++U){let W=0;for(let z=P.length-1,X=U;z>=0;--z)W+=X%P[z]*D[z],X=Math.floor(X/P[z]);O[W]=y[U]}return[O,f]}function a(y){let P=u(y)[0],I=y.map(D=>Math.exp(D-P)),f=I.reduce((D,O)=>D+O,0);return I.map(D=>D/f)}function n(y){let P=u(y)[0],I=0;for(let D=0;D<y.length;++D)I+=Math.exp(y[D]-P);let f=Math.log(I);return y.map(D=>D-P-f)}function i(y,P){let I=0;for(let f=0;f<y.length;++f)I+=y[f]*P[f];return I}function l(y,P){let I=i(y,P),f=c(y),E=c(P);return I/(f*E)}function c(y){return Math.sqrt(y.reduce((P,I)=>P+I*I,0))}function _(y){if(y.length===0)throw Error("Array must not be empty");let P=y[0],I=0;for(let f=1;f<y.length;++f)y[f]<P&&(P=y[f],I=f);return[P,I]}function u(y){if(y.length===0)throw Error("Array must not be empty");let P=y[0],I=0;for(let f=1;f<y.length;++f)y[f]>P&&(P=y[f],I=f);return[P,I]}function d(y){return y>0&&(y&y-1)===0}class 
g{constructor(P){if(this.size=P|0,this.size<=1||!d(this.size))throw new Error("FFT size must be a power of two larger than 1");this._csize=P<<1,this.table=new Float64Array(this.size*2);for(let f=0;f<this.table.length;f+=2){let E=Math.PI*f/this.size;this.table[f]=Math.cos(E),this.table[f+1]=-Math.sin(E)}let I=0;for(let f=1;this.size>f;f<<=1)++I;this._width=I%2===0?I-1:I,this._bitrev=new Int32Array(1<<this._width);for(let f=0;f<this._bitrev.length;++f){this._bitrev[f]=0;for(let E=0;E<this._width;E+=2){let D=this._width-E-2;this._bitrev[f]|=(f>>>E&3)<<D}}}createComplexArray(){return new Float64Array(this._csize)}fromComplexArray(P,I){let f=I||new Array(P.length>>>1);for(let E=0;E<P.length;E+=2)f[E>>>1]=P[E];return f}toComplexArray(P,I){let f=I||this.createComplexArray();for(let E=0;E<f.length;E+=2)f[E]=P[E>>>1],f[E+1]=0;return f}transform(P,I){if(P===I)throw new Error("Input and output buffers must be different");this._transform4(P,I,1)}realTransform(P,I){if(P===I)throw new Error("Input and output buffers must be different");this._realTransform4(P,I,1)}inverseTransform(P,I){if(P===I)throw new Error("Input and output buffers must be different");this._transform4(P,I,-1);for(let f=0;f<P.length;++f)P[f]/=this.size}_transform4(P,I,f){let E=this._csize,O=1<<this._width,U=E/O<<1,W,z,X=this._bitrev;if(U===4)for(W=0,z=0;W<E;W+=U,++z){let q=X[z];this._singleTransform2(I,P,W,q,O)}else for(W=0,z=0;W<E;W+=U,++z){let q=X[z];this._singleTransform4(I,P,W,q,O,f)}let J=this.table;for(O>>=2;O>=2;O>>=2){U=E/O<<1;let q=U>>>2;for(W=0;W<E;W+=U){let re=W+q-1;for(let oe=W,ne=0;oe<re;oe+=2,ne+=O){let 
ye=oe,Y=ye+q,H=Y+q,R=H+q,L=P[ye],ee=P[ye+1],ue=P[Y],ke=P[Y+1],Ie=P[H],Le=P[H+1],rt=P[R],we=P[R+1],A=J[ne],le=f*J[ne+1],ge=ue*A-ke*le,be=ue*le+ke*A,Ae=J[2*ne],ve=f*J[2*ne+1],pe=Ie*Ae-Le*ve,Pe=Ie*ve+Le*Ae,fe=J[3*ne],Te=f*J[3*ne+1],We=rt*fe-we*Te,$e=rt*Te+we*fe,Re=L+pe,Ne=ee+Pe,ot=L-pe,De=ee-Pe,Qe=ge+We,je=be+$e,pt=f*(ge-We),Ke=f*(be-$e);P[ye]=Re+Qe,P[ye+1]=Ne+je,P[Y]=ot+Ke,P[Y+1]=De-pt,P[H]=Re-Qe,P[H+1]=Ne-je,P[R]=ot-Ke,P[R+1]=De+pt}}}}_singleTransform2(P,I,f,E,D){let O=P[E],U=P[E+1],W=P[E+D],z=P[E+D+1];I[f]=O+W,I[f+1]=U+z,I[f+2]=O-W,I[f+3]=U-z}_singleTransform4(P,I,f,E,D,O){let U=D*2,W=D*3,z=P[E],X=P[E+1],J=P[E+D],q=P[E+D+1],re=P[E+U],oe=P[E+U+1],ne=P[E+W],ye=P[E+W+1],Y=z+re,H=X+oe,R=z-re,L=X-oe,ee=J+ne,ue=q+ye,ke=O*(J-ne),Ie=O*(q-ye);I[f]=Y+ee,I[f+1]=H+ue,I[f+2]=R+Ie,I[f+3]=L-ke,I[f+4]=Y-ee,I[f+5]=H-ue,I[f+6]=R-Ie,I[f+7]=L+ke}_realTransform4(P,I,f){let E=this._csize,O=1<<this._width,U=E/O<<1,W,z,X=this._bitrev;if(U===4)for(W=0,z=0;W<E;W+=U,++z){let re=X[z];this._singleRealTransform2(I,P,W,re>>>1,O>>>1)}else for(W=0,z=0;W<E;W+=U,++z){let re=X[z];this._singleRealTransform4(I,P,W,re>>>1,O>>>1,f)}let J=this.table;for(O>>=2;O>=2;O>>=2){U=E/O<<1;let re=U>>>1,oe=re>>>1,ne=oe>>>1;for(W=0;W<E;W+=U)for(let ye=0,Y=0;ye<=ne;ye+=2,Y+=O){let H=W+ye,R=H+oe,L=R+oe,ee=L+oe,ue=P[H],ke=P[H+1],Ie=P[R],Le=P[R+1],rt=P[L],we=P[L+1],A=P[ee],le=P[ee+1],ge=ue,be=ke,Ae=J[Y],ve=f*J[Y+1],pe=Ie*Ae-Le*ve,Pe=Ie*ve+Le*Ae,fe=J[2*Y],Te=f*J[2*Y+1],We=rt*fe-we*Te,$e=rt*Te+we*fe,Re=J[3*Y],Ne=f*J[3*Y+1],ot=A*Re-le*Ne,De=A*Ne+le*Re,Qe=ge+We,je=be+$e,pt=ge-We,Ke=be-$e,bt=pe+ot,At=Pe+De,Lt=f*(pe-ot),fr=f*(Pe-De);if(P[H]=Qe+bt,P[H+1]=je+At,P[R]=pt+fr,P[R+1]=Ke-Lt,ye===0){P[L]=Qe-bt,P[L+1]=je-At;continue}if(ye===ne)continue;let zt=W+oe-ye,yr=W+re-ye;P[zt]=pt-f*fr,P[zt+1]=-Ke-f*Lt,P[yr]=Qe-f*bt,P[yr+1]=-je+f*At}}let q=E>>>1;for(let re=2;re<q;re+=2)P[E-re]=P[re],P[E-re+1]=-P[re+1]}_singleRealTransform2(P,I,f,E,D){let O=P[E],U=P[E+D];I[f]=O+U,I[f+1]=0,I[f+2]=O-U,I[f+3]=0}_singleRealTransform4(P,I,f,E,D,O){let 
U=D*2,W=D*3,z=P[E],X=P[E+D],J=P[E+U],q=P[E+W],re=z+J,oe=z-J,ne=X+q,ye=O*(X-q);I[f]=re+ne,I[f+1]=0,I[f+2]=oe,I[f+3]=-ye,I[f+4]=re-ne,I[f+5]=0,I[f+6]=oe,I[f+7]=ye}}class h{constructor(P){let I=2*(P-1),f=2*(2*P-1),E=2**Math.ceil(Math.log2(f));this.bufferSize=E,this._a=I;let D=new Float64Array(f),O=new Float64Array(E);this._chirpBuffer=new Float64Array(E),this._buffer1=new Float64Array(E),this._buffer2=new Float64Array(E),this._outBuffer1=new Float64Array(E),this._outBuffer2=new Float64Array(E);let U=-2*Math.PI/P,W=Math.cos(U),z=Math.sin(U);for(let X=0;X<f>>1;++X){let J=(X+1-P)**2/2,q=Math.sqrt(W**2+z**2)**J,re=J*Math.atan2(z,W),oe=2*X;D[oe]=q*Math.cos(re),D[oe+1]=q*Math.sin(re),O[oe]=D[oe],O[oe+1]=-D[oe+1]}this._slicedChirpBuffer=D.subarray(I,f),this._f=new g(E>>1),this._f.transform(this._chirpBuffer,O)}_transform(P,I,f){let E=this._buffer1,D=this._buffer2,O=this._outBuffer1,U=this._outBuffer2,W=this._chirpBuffer,z=this._slicedChirpBuffer,X=this._a;if(f)for(let J=0;J<z.length;J+=2){let q=J+1,re=J>>1,oe=I[re];E[J]=oe*z[J],E[q]=oe*z[q]}else for(let J=0;J<z.length;J+=2){let q=J+1;E[J]=I[J]*z[J]-I[q]*z[q],E[q]=I[J]*z[q]+I[q]*z[J]}this._f.transform(O,E);for(let J=0;J<W.length;J+=2){let q=J+1;D[J]=O[J]*W[J]-O[q]*W[q],D[q]=O[J]*W[q]+O[q]*W[J]}this._f.inverseTransform(U,D);for(let J=0;J<U.length;J+=2){let q=U[J+X],re=U[J+X+1],oe=z[J],ne=z[J+1];P[J]=q*oe-re*ne,P[J+1]=q*ne+re*oe}}transform(P,I){this._transform(P,I,!1)}realTransform(P,I){this._transform(P,I,!0)}}class x{constructor(P){this.fft_length=P,this.isPowerOfTwo=d(P),this.isPowerOfTwo?(this.fft=new g(P),this.outputBufferSize=2*P):(this.fft=new h(P),this.outputBufferSize=this.fft.bufferSize)}realTransform(P,I){this.fft.realTransform(P,I)}transform(P,I){this.fft.transform(P,I)}}function F(y,P){if(P%2===0||P<=0)throw new Error("Window size must be a positive odd number");let I=new y.constructor(y.length),f=new y.constructor(P),E=Math.floor(P/2);for(let D=0;D<y.length;++D){let O=0;for(let U=-E;U<=E;++U){let 
W=D+U;W<0?W=Math.abs(W):W>=y.length&&(W=2*(y.length-1)-W),f[O++]=y[W]}f.sort(),I[D]=f[E]}return I}function v(y,P){let I=Math.pow(10,P);return Math.round(y*I)/I}function b(y){let P=Math.round(y);return Math.abs(y)%1===.5?P%2===0?P:P-1:P}function C(y){let P=y.length,I=y[0].length,f=[P+1,I+1],E=Array.from({length:f[0]},()=>Array(f[1]).fill(1/0));E[0][0]=0;let D=Array.from({length:f[0]},()=>Array(f[1]).fill(-1));for(let X=1;X<f[1];++X)for(let J=1;J<f[0];++J){let q=E[J-1][X-1],re=E[J-1][X],oe=E[J][X-1],ne,ye;q<re&&q<oe?(ne=q,ye=0):re<q&&re<oe?(ne=re,ye=1):(ne=oe,ye=2),E[J][X]=y[J-1][X-1]+ne,D[J][X]=ye}for(let X=0;X<f[1];++X)D[0][X]=2;for(let X=0;X<f[0];++X)D[X][0]=1;let O=P,U=I,W=[],z=[];for(;O>0||U>0;)switch(W.push(O-1),z.push(U-1),D[O][U]){case 0:--O,--U;break;case 1:--O;break;case 2:--U;break;default:throw new Error(`Internal error in dynamic time warping. Unexpected trace[${O}, ${U}]. Please file a bug report.`)}return W.reverse(),z.reverse(),[W,z]}}),"./src/utils/tensor.js":((e,r,t)=>{t.r(r),t.d(r,{DataTypeMap:()=>n,Tensor:()=>i,cat:()=>I,full:()=>z,full_like:()=>X,interpolate:()=>_,interpolate_4d:()=>u,layer_norm:()=>b,matmul:()=>d,mean:()=>O,mean_pooling:()=>v,ones:()=>J,ones_like:()=>q,permute:()=>c,quantize_embeddings:()=>Y,rand:()=>ne,randn:()=>ye,rfft:()=>g,slice:()=>F,stack:()=>f,std_mean:()=>D,topk:()=>h,zeros:()=>re,zeros_like:()=>oe});var s=t("./src/utils/maths.js"),o=t("./src/backends/onnx.js"),a=t("./src/ops/registry.js");let n=Object.freeze({float32:Float32Array,float16:typeof Float16Array<"u"?Float16Array:Uint16Array,float64:Float64Array,string:Array,int8:Int8Array,uint8:Uint8Array,int16:Int16Array,uint16:Uint16Array,int32:Int32Array,uint32:Uint32Array,int64:BigInt64Array,uint64:BigUint64Array,bool:Uint8Array,uint4:Uint8Array,int4:Int8Array});class i{get dims(){return this.ort_tensor.dims}set dims(R){this.ort_tensor.dims=R}get type(){return this.ort_tensor.type}get data(){return this.ort_tensor.data}get size(){return this.ort_tensor.size}get 
location(){return this.ort_tensor.location}ort_tensor;/* Accepts either an existing ONNX tensor (detected with o.isONNXTensor) or the arguments (type, data, dims) for a new o.Tensor. Returns a Proxy so that property keys that parse as integers are routed to _getitem; every other get/set goes to the instance. */constructor(...R){return(0,o.isONNXTensor)(R[0])?this.ort_tensor=R[0]:this.ort_tensor=new o.Tensor(R[0],R[1],R[2]),new Proxy(this,{get:(L,ee)=>{if(typeof ee=="string"){let ue=Number(ee);if(Number.isInteger(ue))return L._getitem(ue)}return L[ee]},set:(L,ee,ue)=>L[ee]=ue})}dispose(){this.ort_tensor.dispose()}*[Symbol.iterator](){let[R,...L]=this.dims;if(L.length>0){let ee=L.reduce((ue,ke)=>ue*ke);for(let ue=0;ue<R;++ue)yield this._subarray(ue,ee,L)}else yield*this.data}/* Index along the first dimension after normalising R with P. Returns a sub-tensor over the remaining dims, or a tensor holding the single value when no dims remain. */_getitem(R){let[L,...ee]=this.dims;if(R=P(R,L),ee.length>0){let ue=ee.reduce((ke,Ie)=>ke*Ie);return this._subarray(R,ue,ee)}else return new i(this.type,[this.data[R]],ee)}/* Linear search over the flat data using loose equality; returns -1 when nothing matches. */indexOf(R){let L=this.data;for(let ee=0;ee<L.length;++ee)if(L[ee]==R)return ee;return-1}/* Wraps elements R times L up to (R+1) times L of the flat data as a tensor with dims ee, using subarray when the data has that method and slice otherwise. */_subarray(R,L,ee){let ue=R*L,ke=(R+1)*L,Ie="subarray"in this.data?this.data.subarray(ue,ke):this.data.slice(ue,ke);return new i(this.type,Ie,ee)}item(){let R=this.data;if(R.length!==1)throw new Error(`a Tensor with ${R.length} elements cannot be converted to Scalar`);return R[0]}tolist(){return l(this.data,this.dims)}/* Element-wise helpers. The underscore-suffixed variants mutate this.data in place and return this; the plain variants apply the same operation to a clone. */sigmoid(){return this.clone().sigmoid_()}sigmoid_(){let R=this.data;for(let L=0;L<R.length;++L)R[L]=1/(1+Math.exp(-R[L]));return this}map(R){return this.clone().map_(R)}map_(R){let L=this.data;for(let ee=0;ee<L.length;++ee)L[ee]=R(L[ee],ee,L);return this}mul(R){return this.clone().mul_(R)}mul_(R){let L=this.data;for(let ee=0;ee<L.length;++ee)L[ee]*=R;return this}div(R){return this.clone().div_(R)}div_(R){let L=this.data;for(let ee=0;ee<L.length;++ee)L[ee]/=R;return this}add(R){return this.clone().add_(R)}add_(R){let L=this.data;for(let ee=0;ee<L.length;++ee)L[ee]+=R;return this}sub(R){return this.clone().sub_(R)}sub_(R){let L=this.data;for(let ee=0;ee<L.length;++ee)L[ee]-=R;return this}clone(){return new i(this.type,this.data.slice(),this.dims.slice())}/* slice(...R): one spec per dimension. A missing or null spec keeps the whole axis, a number selects one index and drops the axis from the result dims, and a two-element array gives [start, end] where null means the axis bound. The selection is copied into a new tensor. */slice(...R){let L=[],ee=[];for(let A=0;A<this.dims.length;++A){let 
le=R[A];if(le==null)ee.push([0,this.dims[A]]),L.push(this.dims[A]);else if(typeof le=="number")le=P(le,this.dims[A],A),ee.push([le,le+1]);else if(Array.isArray(le)&&le.length===2){let[ge,be]=le;if(ge=ge===null?0:P(ge,this.dims[A],A,!1),be=be===null?this.dims[A]:P(be,this.dims[A],A,!1),ge>be)throw new Error(`Invalid slice: ${le}`);let Ae=[Math.max(ge,0),Math.min(be,this.dims[A])];ee.push(Ae),L.push(Ae[1]-Ae[0])}else throw new Error(`Invalid slice: ${le}`)}/* Copy step. When every axis after the first is taken whole, the selection is one contiguous range and is copied in bulk; otherwise each output element is located through the strides. */let ue=ee.map(([A,le])=>le-A),ke=ue.reduce((A,le)=>A*le),Ie=this.data,Le=new Ie.constructor(ke),rt=this.stride(),we=!0;for(let A=1;A<ue.length;++A)if(ee[A][0]!==0||ee[A][1]!==this.dims[A]){we=!1;break}if(we){let A=ee[0][0]*rt[0],le=ee[0][1]*rt[0];if(ArrayBuffer.isView(Ie))Le.set(Ie.subarray(A,le));else if(Array.isArray(Ie)){let ge=Ie.slice(A,le);for(let be=0;be<ge.length;++be)Le[be]=ge[be]}else throw new Error("Unsupported data type for slicing")}else for(let A=0;A<ke;++A){let le=0;for(let ge=ue.length-1,be=A;ge>=0;--ge){let Ae=ue[ge];le+=(be%Ae+ee[ge][0])*rt[ge],be=Math.floor(be/Ae)}Le[A]=Ie[le]}return new i(this.type,Le,L)}permute(...R){return c(this,R)}transpose(...R){return this.permute(...R)}/* sum is implemented as norm with p = 1; the accumulator adds the raw values, no absolute value is taken. */sum(R=null,L=!1){return this.norm(1,R,L)}/* norm(R, L, ee): R is the order p (the string fro selects 2, any other string throws), L the dimension and ee the keep-dim flag. Accumulates value to the power p and takes the 1/p root, over all elements when L is null, otherwise along L through the reduction helper E. */norm(R="fro",L=null,ee=!1){if(R==="fro")R=2;else if(typeof R=="string")throw Error(`Unsupported norm: ${R}`);let ue=this.data,ke=(we,A)=>we+A**R;if(L===null){let we=ue.reduce(ke,0)**(1/R);return new i(this.type,[we],[])}let[Ie,Le,rt]=E(ke,this,L,ee);if(R!==1)for(let we=0;we<Le.length;++we)Le[we]=Le[we]**(1/R);return new i(Ie,Le,rt)}/* normalize_(R, L): divides every element, in place, by the order-R norm computed along dimension L. The inner loop maps each flat index to the matching entry of the keep-dim norm tensor. */normalize_(R=2,L=1){L=P(L,this.dims.length);let ee=this.norm(R,L,!0),ue=this.data,ke=ee.data;for(let Ie=0;Ie<ue.length;++Ie){let Le=0;for(let rt=this.dims.length-1,we=Ie,A=1;rt>=0;--rt){let le=this.dims[rt];if(rt!==L){let ge=we%le;Le+=ge*A,A*=this.dims[rt]}we=Math.floor(we/le)}ue[Ie]/=ke[Le]}return this}normalize(R=2,L=1){return this.clone().normalize_(R,L)}stride(){return U(this.dims)}squeeze(R=null){return new 
i(this.type,this.data,C(this.dims,R))}/* squeeze / unsqueeze build a new tensor over the same data object with dims recomputed by C / y; the underscore variants reassign this.dims instead. */squeeze_(R=null){return this.dims=C(this.dims,R),this}unsqueeze(R=null){return new i(this.type,this.data,y(this.dims,R))}unsqueeze_(R=null){return this.dims=y(this.dims,R),this}/* flatten_(R, L): replaces dims R through L (inclusive; a negative L counts from the end) with their product, in place. */flatten_(R=0,L=-1){L=(L+this.dims.length)%this.dims.length;let ee=this.dims.slice(0,R),ue=this.dims.slice(R,L+1),ke=this.dims.slice(L+1);return this.dims=[...ee,ue.reduce((Ie,Le)=>Ie*Le,1),...ke],this}flatten(R=0,L=-1){return this.clone().flatten_(R,L)}/* view(...R): new tensor over the same data with dims R. At most one entry may be -1; it is replaced by the data length divided by the product of the other entries. */view(...R){let L=-1;for(let ue=0;ue<R.length;++ue)if(R[ue]===-1){if(L!==-1)throw new Error("Only one dimension can be inferred");L=ue}let ee=this.data;if(L!==-1){let ue=R.reduce((ke,Ie,Le)=>Le!==L?ke*Ie:ke,1);R[L]=ee.length/ue}return new i(this.type,ee,R)}neg_(){let R=this.data;for(let L=0;L<R.length;++L)R[L]=-R[L];return this}neg(){return this.clone().neg_()}/* gt / lt compare every element with R and return a bool tensor (Uint8Array of 0 and 1) with the same dims. */gt(R){let L=new Uint8Array(this.data.length),ee=this.data;for(let ue=0;ue<ee.length;++ue)L[ue]=ee[ue]>R?1:0;return new i("bool",L,this.dims)}lt(R){let L=new Uint8Array(this.data.length),ee=this.data;for(let ue=0;ue<ee.length;++ue)L[ue]=ee[ue]<R?1:0;return new i("bool",L,this.dims)}clamp_(R,L){let ee=this.data;for(let ue=0;ue<ee.length;++ue)ee[ue]=Math.min(Math.max(ee[ue],R),L);return this}clamp(R,L){return this.clone().clamp_(R,L)}round_(){let R=this.data;for(let L=0;L<R.length;++L)R[L]=Math.round(R[L]);return this}round(){return this.clone().round_()}mean(R=null,L=!1){return O(this,R,L)}/* min / max: with a null dimension the global extreme comes from the maths helpers; otherwise the reduction helper E runs along R seeded with plus or minus Infinity. */min(R=null,L=!1){if(R===null){let Ie=(0,s.min)(this.data)[0];return new i(this.type,[Ie],[])}let[ee,ue,ke]=E((Ie,Le)=>Math.min(Ie,Le),this,R,L,1/0);return new i(ee,ue,ke)}max(R=null,L=!1){if(R===null){let Ie=(0,s.max)(this.data)[0];return new i(this.type,[Ie],[])}let[ee,ue,ke]=E((Ie,Le)=>Math.max(Ie,Le),this,R,L,-1/0);return new i(ee,ue,ke)}/* argmin / argmax support only the global case (a non-null dimension throws) and return the flat index as an int64 scalar tensor. */argmin(R=null,L=!1){if(R!==null)throw new Error("`dim !== null` not yet implemented.");let ee=(0,s.min)(this.data)[1];return new i("int64",[BigInt(ee)],[])}argmax(R=null,L=!1){if(R!==null)throw new Error("`dim !== null` not yet 
implemented.");let ee=(0,s.max)(this.data)[1];return new i("int64",[BigInt(ee)],[])}/* to(R): dtype conversion; returns this when the type already matches and throws for names missing from n. Values leaving int64/uint64 are mapped with Number, values entering them with BigInt, and float sources are floored first. */to(R){if(this.type===R)return this;if(!n.hasOwnProperty(R))throw new Error(`Unsupported type: ${R}`);let L,ee=["int64","uint64"].includes(this.type),ue=["int64","uint64"].includes(R);return ee&&!ue?L=Number:!ee&&ue&&(["float16","float32","float64"].includes(this.type)?L=ke=>BigInt(Math.floor(ke)):L=BigInt),new i(R,n[R].from(this.data,L),this.dims)}}/* l(H, R): regroups the flat data H into nested arrays of shape R, working from the last dimension outwards (called by tolist). Throws when the element count does not match the shape. */function l(H,R){let L=H.length,ee=R.reduce((ke,Ie)=>ke*Ie);if(L!==ee)throw Error(`cannot reshape array of size ${L} into shape (${R})`);let ue=H;for(let ke=R.length-1;ke>=0;ke--)ue=ue.reduce((Ie,Le)=>{let rt=Ie[Ie.length-1];return rt.length<R[ke]?rt.push(Le):Ie.push([Le]),Ie},[[]]);return ue[0]}/* c (exported as permute): reorders the axes of H according to R via s.permute_data. */function c(H,R){let[L,ee]=(0,s.permute_data)(H.data,H.dims,R);return new i(H.type,L,ee)}/* _ (exported as interpolate): resizes the last two dims of H to [R, L] with s.interpolate_data; the third-from-last dim defaults to 1 when absent. */function _(H,[R,L],ee="bilinear",ue=!1){let ke=H.dims.at(-3)??1,Ie=H.dims.at(-2),Le=H.dims.at(-1),rt=(0,s.interpolate_data)(H.data,[ke,Ie,Le],[R,L],ee,ue);return new i(H.type,rt,[ke,R,L])}/* u (exported as interpolate_4d): accepts 4-D input only. size may list 2, 3 or 4 values (missing leading dims are taken from H) and mode selects the nearest, bilinear or bicubic op from TensorOpRegistry. */async function u(H,{size:R=null,mode:L="bilinear"}={}){if(H.dims.length!==4)throw new Error("`interpolate_4d` currently only supports 4D input.");if(!R)throw new Error("`interpolate_4d` requires a `size` argument.");let ee;if(R.length===2)ee=[...H.dims.slice(0,2),...R];else if(R.length===3)ee=[H.dims[0],...R];else if(R.length===4)ee=R;else throw new Error("`size` must be of length 2, 3, or 4.");let ue;if(L==="nearest")ue=await a.TensorOpRegistry.nearest_interpolate_4d;else if(L==="bilinear")ue=await a.TensorOpRegistry.bilinear_interpolate_4d;else if(L==="bicubic")ue=await a.TensorOpRegistry.bicubic_interpolate_4d;else throw new Error(`Unsupported mode: ${L}`);let ke=new i("int64",new BigInt64Array(ee.map(BigInt)),[ee.length]);return await ue({x:H,s:ke})}/* d, g and h (exported as matmul, rfft and topk): thin async wrappers that await the matching TensorOpRegistry op and call it. topk uses the size of the last dimension when k is missing and caps k at that size otherwise. */async function d(H,R){return await(await a.TensorOpRegistry.matmul)({a:H,b:R})}async function g(H,R){return await(await a.TensorOpRegistry.rfft)({x:H,a:R})}async function h(H,R){let L=await a.TensorOpRegistry.top_k;return 
R==null?R=H.dims.at(-1):R=Math.min(R,H.dims.at(-1)),await L({x:H,k:new i("int64",[BigInt(R)],[1])})}/* x: wraps the array H as a 1-D int64 tensor. */let x=H=>new i("int64",H,[H.length]);/* F (exported as slice): runs the TensorOpRegistry slice op on H with R, L, ee and ue passed as int64 tensors under the keys s, e, a and t (presumably starts, ends, axes and steps - confirm against the op). ue defaults to an array of ones. */async function F(H,R,L,ee,ue){return await(await a.TensorOpRegistry.slice)({x:H,s:x(R),e:x(L),a:x(ee),t:x(ue??new Array(ee.length).fill(1))})}/* v (exported as mean_pooling): for a 3-D tensor H, returns a [dims[0], dims[2]] tensor holding the weighted mean over dim 1, with weights read from R (converted with Number) at the same [dim 0, dim 1] position. */function v(H,R){let L=H.data,ee=R.data,ue=[H.dims[0],H.dims[2]],ke=new L.constructor(ue[0]*ue[1]),[Ie,Le,rt]=H.dims,we=0;for(let A=0;A<Ie;++A){let le=A*rt*Le;for(let ge=0;ge<rt;++ge){let be=0,Ae=0,ve=A*Le,pe=le+ge;for(let fe=0;fe<Le;++fe){let Te=Number(ee[ve+fe]);Ae+=Te,be+=L[pe+fe*rt]*Te}let Pe=be/Ae;ke[we++]=Pe}}return new i(H.type,ke,ue)}/* b (exported as layer_norm): 2-D input only. Each element has its row mean subtracted and is divided by (row standard deviation + eps), with both statistics taken from D(H, 1, 0, true). NOTE(review): the normalized_shape check joins its two conditions with a logical AND, so it throws only when both fail - confirm that is intended. */function b(H,R,{eps:L=1e-5}={}){if(H.dims.length!==2)throw new Error("`layer_norm` currently only supports 2D input.");let[ee,ue]=H.dims;if(R.length!==1&&R[0]!==ue)throw new Error("`normalized_shape` must be a 1D array with shape `[input.dims[1]]`.");let[ke,Ie]=D(H,1,0,!0),Le=ke.data,rt=Ie.data,we=H.data,A=new we.constructor(we.length);for(let le=0;le<ee;++le){let ge=le*ue;for(let be=0;be<ue;++be){let Ae=ge+be;A[Ae]=(we[Ae]-rt[le])/(Le[le]+L)}}return new i(H.type,A,H.dims)}/* C(H, R): copy of dims H with size-1 axes removed - all of them when R is null, the axis at index R when R is a number, or the axes whose index appears in the array R. */function C(H,R){return H=H.slice(),R===null?H=H.filter(L=>L!==1):typeof R=="number"?H[R]===1&&H.splice(R,1):Array.isArray(R)&&(H=H.filter((L,ee)=>L!==1||!R.includes(ee))),H}/* y(H, R): copy of dims H with a 1 inserted at position R (R is normalised against length + 1). */function y(H,R){return R=P(R,H.length+1),H=H.slice(),H.splice(R,0,1),H}/* P(H, R, L, ee): normalises index H for a dimension of size R; negative values count from the end. When H is out of range it throws if ee is true (L only labels the dimension in the message), otherwise it returns 0 or R. */function P(H,R,L=null,ee=!0){if(H<-R||H>=R){if(ee)throw new Error(`IndexError: index ${H} is out of bounds for dimension${L===null?"":" "+L} with size ${R}`);return H<-R?0:R}return H<0&&(H=(H%R+R)%R),H}/* I (exported as cat): concatenates the tensors in H along dimension R. Dimension 0 is handled by copying each data block back to back; other dimensions map every source element to its position in the output. The result uses the type and data constructor of the first tensor. */function I(H,R=0){R=P(R,H[0].dims.length);let L=H[0].dims.slice();L[R]=H.reduce((Ie,Le)=>Ie+Le.dims[R],0);let ee=L.reduce((Ie,Le)=>Ie*Le,1),ue=new H[0].data.constructor(ee),ke=H[0].type;if(R===0){let Ie=0;for(let Le of H){let rt=Le.data;ue.set(rt,Ie),Ie+=rt.length}}else{let Ie=0;for(let Le=0;Le<H.length;++Le){let{data:rt,dims:we}=H[Le];for(let A=0;A<rt.length;++A){let le=0;for(let ge=we.length-1,be=A,Ae=1;ge>=0;--ge){let 
ve=we[ge],pe=be%ve;ge===R&&(pe+=Ie),le+=pe*Ae,Ae*=L[ge],be=Math.floor(be/ve)}ue[le]=rt[A]}Ie+=we[R]}}return new i(ke,ue,L)}/* f (exported as stack): unsqueezes every tensor at position R, then concatenates along R. */function f(H,R=0){return I(H.map(L=>L.unsqueeze(R)),R)}/* E(H, R, L, ee, ue): generic reduction of tensor R along dimension L. The callback H receives (accumulator, value, flat input index, output index). ue, when not null, seeds every accumulator. Returns [type, data, dims]; the reduced axis is kept with size 1 only when ee is true. */function E(H,R,L=null,ee=!1,ue=null){let ke=R.data,Ie=R.dims;L=P(L,Ie.length);let Le=Ie.slice();Le[L]=1;let rt=new ke.constructor(ke.length/Ie[L]);ue!==null&&rt.fill(ue);for(let we=0;we<ke.length;++we){let A=0;for(let le=Ie.length-1,ge=we,be=1;le>=0;--le){let Ae=Ie[le];if(le!==L){let ve=ge%Ae;A+=ve*be,be*=Le[le]}ge=Math.floor(ge/Ae)}rt[A]=H(rt[A],ke[we],we,A)}return ee||Le.splice(L,1),[R.type,rt,Le]}/* D (exported as std_mean): returns [std, mean] as tensors, over all elements when R is null or along dimension R otherwise. L is subtracted from the element count in the variance denominator and ee is the keep-dim flag. */function D(H,R=null,L=1,ee=!1){let ue=H.data,ke=H.dims;if(R===null){let be=ue.reduce((Pe,fe)=>Pe+fe,0)/ue.length,Ae=Math.sqrt(ue.reduce((Pe,fe)=>Pe+(fe-be)**2,0)/(ue.length-L)),ve=new i(H.type,[be],[]);return[new i(H.type,[Ae],[]),ve]}R=P(R,ke.length);let Ie=O(H,R,ee),Le=Ie.data,[rt,we,A]=E((ge,be,Ae,ve)=>ge+(be-Le[ve])**2,H,R,ee);for(let ge=0;ge<we.length;++ge)we[ge]=Math.sqrt(we[ge]/(ke[R]-L));return[new i(rt,we,A),Ie]}/* O (exported as mean): mean of all elements when R is null, otherwise the sum along dimension R divided by that dimension size. L is the keep-dim flag. */function O(H,R=null,L=!1){let ee=H.dims,ue=H.data;if(R===null){let rt=ue.reduce((we,A)=>we+A,0);return new i(H.type,[rt/ue.length],[])}R=P(R,ee.length);let[ke,Ie,Le]=E((rt,we)=>rt+we,H,R,L);if(ee[R]!==1)for(let rt=0;rt<Ie.length;++rt)Ie[rt]/=ee[R];return new i(ke,Ie,Le)}/* U(H): strides for dims H, with the last dimension varying fastest. */function U(H){let R=new Array(H.length);for(let L=H.length-1,ee=1;L>=0;--L)R[L]=ee,ee*=H[L];return R}/* W(H, R, L, ee): tensor of dims H and type L whose data is a new ee array filled with R. z, X, J, q, re and oe (exported as full, full_like, ones, ones_like, zeros and zeros_like) build on it. full picks float32, int64 or bool from the JavaScript type of the fill value; ones and zeros always produce int64 tensors. */function W(H,R,L,ee){let ue=H.reduce((ke,Ie)=>ke*Ie,1);return new i(L,new ee(ue).fill(R),H)}function z(H,R){let L,ee;if(typeof R=="number")L="float32",ee=Float32Array;else if(typeof R=="bigint")L="int64",ee=BigInt64Array;else if(typeof R=="boolean")L="bool",ee=Uint8Array;else throw new Error(`Unsupported data type: ${typeof R}`);return W(H,R,L,ee)}function X(H,R){return z(H.dims,R)}function J(H){return W(H,1n,"int64",BigInt64Array)}function q(H){return J(H.dims)}function re(H){return W(H,0n,"int64",BigInt64Array)}function oe(H){return re(H.dims)}/* ne (exported as rand): float32 tensor of dims H filled with Math.random() values. */function ne(H){let R=H.reduce((L,ee)=>L*ee,1);return new 
i("float32",Float32Array.from({length:R},()=>Math.random()),H)}/* ye (exported as randn): float32 tensor of dims H whose values come from sqrt(-2 ln u1) times cos(2 pi u2), with u1 and u2 drawn as 1 - Math.random(). */function ye(H){let R=H.reduce((ee,ue)=>ee*ue,1);function L(){let ee=1-Math.random(),ue=1-Math.random();return Math.sqrt(-2*Math.log(ee))*Math.cos(2*Math.PI*ue)}return new i("float32",Float32Array.from({length:R},()=>L()),H)}/* Y (exported as quantize_embeddings): for a 2-D tensor whose last dimension is a multiple of 8, packs the bit (value > 0) of every 8 consecutive values into one byte, first value in the highest bit. Precision binary yields int8 with 128 subtracted from each byte; ubinary yields uint8. The last dimension shrinks by a factor of 8. */function Y(H,R){if(H.dims.length!==2)throw new Error("The tensor must have 2 dimensions");if(H.dims.at(-1)%8!==0)throw new Error("The last dimension of the tensor must be a multiple of 8");if(!["binary","ubinary"].includes(R))throw new Error("The precision must be either 'binary' or 'ubinary'");let L=R==="binary",ee=L?"int8":"uint8",ue=L?Int8Array:Uint8Array,ke=H.data,Ie=new ue(ke.length/8);for(let Le=0;Le<ke.length;++Le){let rt=ke[Le]>0?1:0,we=Math.floor(Le/8),A=Le%8;Ie[we]|=rt<<7-A,L&&A===0&&(Ie[we]-=128)}return new i(ee,Ie,[H.dims[0],H.dims[1]/8])}}),/* Bundled module for the video utilities; it exports RawVideo (n), RawVideoFrame (a) and load_video (i). */"./src/utils/video.js":((e,r,t)=>{t.r(r),t.d(r,{RawVideo:()=>n,RawVideoFrame:()=>a,load_video:()=>i});var s=t("./src/utils/image.js"),o=t("./src/env.js");/* a (RawVideoFrame): pairs an image with its timestamp. */class a{constructor(c,_){this.image=c,this.timestamp=_}}/* n (RawVideo): frame list plus duration. When the first entry is a RawImage, every entry is wrapped in a frame whose timestamp is (index + 1) / (count + 1) of the duration. width and height come from the first frame; fps is frame count divided by duration. */class n{constructor(c,_){c.length>0&&c[0]instanceof s.RawImage&&(c=c.map((u,d)=>new a(u,(d+1)/(c.length+1)*_))),this.frames=c,this.duration=_}get width(){return this.frames[0].image.width}get height(){return this.frames[0].image.height}get fps(){return this.frames.length/this.duration}}/* i (load_video): browser-only. Loads l (URL string, Blob or HTMLVideoElement) into a freshly created muted video element and samples frames according to num_frames or fps; at least one of the two must be given. */async function i(l,{num_frames:c=null,fps:_=null}={}){if(!o.apis.IS_BROWSER_ENV)throw new Error("`load_video` is currently only supported in browser environments.");if(c==null&&_==null)throw new Error("Either num_frames or fps must be provided.");let u=[],d=document.createElement("video");if(d.crossOrigin="anonymous",d.muted=!0,typeof l=="string")d.src=l;else if(l instanceof Blob)d.src=URL.createObjectURL(l);else if(l instanceof HTMLVideoElement)d.src=l.src;else throw new Error("Invalid URL or video element provided.");/* After the metadata loads, a seekable range whose start equals its end triggers a refetch of the source as a Blob, which is then reloaded through an object URL. */if(await new Promise(C=>d.onloadedmetadata=C),d.seekable.start(0)===d.seekable.end(0)){let y=await(await 
fetch(d.src)).blob();d.src=URL.createObjectURL(y),await new Promise(P=>d.onloadedmetadata=P)}/* Choose the sample timestamps: num_frames spreads them evenly from 0 to the duration (a single frame is taken at the midpoint), otherwise one every 1/fps seconds. NOTE(review): no revokeObjectURL call is visible for the object URLs created in this function. */let g=d.duration,h,x;c!=null?(h=c,x=c===1?0:g/(c-1)):(x=1/_,h=Math.floor(g/x));let F=[];for(let C=0;C<h;++C)F.push(c===1?g/2:C*x);let v=document.createElement("canvas");v.width=d.videoWidth,v.height=d.videoHeight;let b=v.getContext("2d",{willReadFrequently:!0});/* Seek to each timestamp, wait for the seeked event, draw the frame onto the canvas and capture its pixels as a 4-channel RawImage. */for(let C of F){d.currentTime=C,await new Promise(f=>{d.onseeked=f}),b.drawImage(d,0,0,v.width,v.height);let y=b.getImageData(0,0,v.width,v.height),P=new s.RawImage(y.data,v.width,v.height,4),I=new a(P,C);u.push(I)}return d.remove(),new n(u,g)}})},/* I0 caches instantiated modules. Vt(e) returns the cached exports for id e, or creates the record, runs gE[e] to populate it and returns its exports. */I0={};function Vt(e){var r=I0[e];if(r!==void 0)return r.exports;var t=I0[e]={exports:{}};return gE[e](t,t.exports,Vt),t.exports}/* Vt.t(t, s): builds a namespace object for a value, driven by the bit flags in s (bit 1 first resolves t by calling this; bits 8, 4 and 16 can return t unchanged). NOTE(review): this matches the usual bundler helper for wrapping non-ES modules - confirm. */(()=>{var e=Object.getPrototypeOf?t=>Object.getPrototypeOf(t):t=>t.__proto__,r;Vt.t=function(t,s){if(s&1&&(t=this(t)),s&8||typeof t=="object"&&t&&(s&4&&t.__esModule||s&16&&typeof t.then=="function"))return t;var o=Object.create(null);Vt.r(o);var a={};r=r||[null,e({}),e([]),e(e)];for(var n=s&2&&t;typeof n=="object"&&!~r.indexOf(n);n=e(n))Object.getOwnPropertyNames(n).forEach(i=>a[i]=()=>t[i]);return a.default=()=>t,Vt.d(o,a),o}})();/* Vt.d defines each getter in r as an enumerable property on e unless e already owns that key; Vt.o is an own-property check; Vt.r marks an object with __esModule and, where available, the Module toStringTag. */Vt.d=(e,r)=>{for(var t in r)Vt.o(r,t)&&!Vt.o(e,t)&&Object.defineProperty(e,t,{enumerable:!0,get:r[t]})};Vt.o=(e,r)=>Object.prototype.hasOwnProperty.call(e,r);Vt.r=e=>{typeof Symbol<"u"&&Symbol.toStringTag&&Object.defineProperty(e,Symbol.toStringTag,{value:"Module"}),Object.defineProperty(e,"__esModule",{value:!0})};var 
p={};(()=>{Vt.r(p),Vt.d(p,{ASTFeatureExtractor:()=>u.ASTFeatureExtractor,ASTForAudioClassification:()=>t.ASTForAudioClassification,ASTModel:()=>t.ASTModel,ASTPreTrainedModel:()=>t.ASTPreTrainedModel,AlbertForMaskedLM:()=>t.AlbertForMaskedLM,AlbertForQuestionAnswering:()=>t.AlbertForQuestionAnswering,AlbertForSequenceClassification:()=>t.AlbertForSequenceClassification,AlbertModel:()=>t.AlbertModel,AlbertPreTrainedModel:()=>t.AlbertPreTrainedModel,AlbertTokenizer:()=>s.AlbertTokenizer,ArceeForCausalLM:()=>t.ArceeForCausalLM,ArceeModel:()=>t.ArceeModel,ArceePreTrainedModel:()=>t.ArceePreTrainedModel,AudioClassificationPipeline:()=>r.AudioClassificationPipeline,AutoConfig:()=>o.AutoConfig,AutoFeatureExtractor:()=>d.AutoFeatureExtractor,AutoImageProcessor:()=>x.AutoImageProcessor,AutoModel:()=>t.AutoModel,AutoModelForAudioClassification:()=>t.AutoModelForAudioClassification,AutoModelForAudioFrameClassification:()=>t.AutoModelForAudioFrameClassification,AutoModelForAudioTextToText:()=>t.AutoModelForAudioTextToText,AutoModelForCTC:()=>t.AutoModelForCTC,AutoModelForCausalLM:()=>t.AutoModelForCausalLM,AutoModelForDepthEstimation:()=>t.AutoModelForDepthEstimation,AutoModelForDocumentQuestionAnswering:()=>t.AutoModelForDocumentQuestionAnswering,AutoModelForImageClassification:()=>t.AutoModelForImageClassification,AutoModelForImageFeatureExtraction:()=>t.AutoModelForImageFeatureExtraction,AutoModelForImageMatting:()=>t.AutoModelForImageMatting,AutoModelForImageSegmentation:()=>t.AutoModelForImageSegmentation,AutoModelForImageTextToText:()=>t.AutoModelForImageTextToText,AutoModelForImageToImage:()=>t.AutoModelForImageToImage,AutoModelForMaskGeneration:()=>t.AutoModelForMaskGeneration,AutoModelForMaskedLM:()=>t.AutoModelForMaskedLM,AutoModelForNormalEstimation:()=>t.AutoModelForNormalEstimation,AutoModelForObjectDetection:()=>t.AutoModelForObjectDetection,AutoModelForPoseEstimation:()=>t.AutoModelForPoseEstimation,AutoModelForQuestionAnswering:()=>t.AutoModelForQuestionAnswering
,AutoModelForSemanticSegmentation:()=>t.AutoModelForSemanticSegmentation,AutoModelForSeq2SeqLM:()=>t.AutoModelForSeq2SeqLM,AutoModelForSequenceClassification:()=>t.AutoModelForSequenceClassification,AutoModelForSpeechSeq2Seq:()=>t.AutoModelForSpeechSeq2Seq,AutoModelForTextToSpectrogram:()=>t.AutoModelForTextToSpectrogram,AutoModelForTextToWaveform:()=>t.AutoModelForTextToWaveform,AutoModelForTokenClassification:()=>t.AutoModelForTokenClassification,AutoModelForUniversalSegmentation:()=>t.AutoModelForUniversalSegmentation,AutoModelForVision2Seq:()=>t.AutoModelForVision2Seq,AutoModelForXVector:()=>t.AutoModelForXVector,AutoModelForZeroShotObjectDetection:()=>t.AutoModelForZeroShotObjectDetection,AutoProcessor:()=>b.AutoProcessor,AutoTokenizer:()=>s.AutoTokenizer,AutomaticSpeechRecognitionPipeline:()=>r.AutomaticSpeechRecognitionPipeline,BackgroundRemovalPipeline:()=>r.BackgroundRemovalPipeline,BartForConditionalGeneration:()=>t.BartForConditionalGeneration,BartForSequenceClassification:()=>t.BartForSequenceClassification,BartModel:()=>t.BartModel,BartPretrainedModel:()=>t.BartPretrainedModel,BartTokenizer:()=>s.BartTokenizer,BaseModelOutput:()=>t.BaseModelOutput,BaseStreamer:()=>C.BaseStreamer,BeitFeatureExtractor:()=>h.BeitFeatureExtractor,BeitForImageClassification:()=>t.BeitForImageClassification,BeitModel:()=>t.BeitModel,BeitPreTrainedModel:()=>t.BeitPreTrainedModel,BertForMaskedLM:()=>t.BertForMaskedLM,BertForQuestionAnswering:()=>t.BertForQuestionAnswering,BertForSequenceClassification:()=>t.BertForSequenceClassification,BertForTokenClassification:()=>t.BertForTokenClassification,BertModel:()=>t.BertModel,BertPreTrainedModel:()=>t.BertPreTrainedModel,BertTokenizer:()=>s.BertTokenizer,BitImageProcessor:()=>h.BitImageProcessor,BlenderbotForConditionalGeneration:()=>t.BlenderbotForConditionalGeneration,BlenderbotModel:()=>t.BlenderbotModel,BlenderbotPreTrainedModel:()=>t.BlenderbotPreTrainedModel,BlenderbotSmallForConditionalGeneration:()=>t.BlenderbotSmallForCondi
tionalGeneration,BlenderbotSmallModel:()=>t.BlenderbotSmallModel,BlenderbotSmallPreTrainedModel:()=>t.BlenderbotSmallPreTrainedModel,BlenderbotSmallTokenizer:()=>s.BlenderbotSmallTokenizer,BlenderbotTokenizer:()=>s.BlenderbotTokenizer,BloomForCausalLM:()=>t.BloomForCausalLM,BloomModel:()=>t.BloomModel,BloomPreTrainedModel:()=>t.BloomPreTrainedModel,BloomTokenizer:()=>s.BloomTokenizer,CLIPFeatureExtractor:()=>h.CLIPFeatureExtractor,CLIPImageProcessor:()=>h.CLIPImageProcessor,CLIPModel:()=>t.CLIPModel,CLIPPreTrainedModel:()=>t.CLIPPreTrainedModel,CLIPSegForImageSegmentation:()=>t.CLIPSegForImageSegmentation,CLIPSegModel:()=>t.CLIPSegModel,CLIPSegPreTrainedModel:()=>t.CLIPSegPreTrainedModel,CLIPTextModel:()=>t.CLIPTextModel,CLIPTextModelWithProjection:()=>t.CLIPTextModelWithProjection,CLIPTokenizer:()=>s.CLIPTokenizer,CLIPVisionModel:()=>t.CLIPVisionModel,CLIPVisionModelWithProjection:()=>t.CLIPVisionModelWithProjection,CamembertForMaskedLM:()=>t.CamembertForMaskedLM,CamembertForQuestionAnswering:()=>t.CamembertForQuestionAnswering,CamembertForSequenceClassification:()=>t.CamembertForSequenceClassification,CamembertForTokenClassification:()=>t.CamembertForTokenClassification,CamembertModel:()=>t.CamembertModel,CamembertPreTrainedModel:()=>t.CamembertPreTrainedModel,CamembertTokenizer:()=>s.CamembertTokenizer,CausalLMOutput:()=>t.CausalLMOutput,CausalLMOutputWithPast:()=>t.CausalLMOutputWithPast,ChineseCLIPFeatureExtractor:()=>h.ChineseCLIPFeatureExtractor,ChineseCLIPModel:()=>t.ChineseCLIPModel,ChineseCLIPPreTrainedModel:()=>t.ChineseCLIPPreTrainedModel,ClapAudioModelWithProjection:()=>t.ClapAudioModelWithProjection,ClapFeatureExtractor:()=>u.ClapFeatureExtractor,ClapModel:()=>t.ClapModel,ClapPreTrainedModel:()=>t.ClapPreTrainedModel,ClapTextModelWithProjection:()=>t.ClapTextModelWithProjection,ClassifierFreeGuidanceLogitsProcessor:()=>P.ClassifierFreeGuidanceLogitsProcessor,CodeGenForCausalLM:()=>t.CodeGenForCausalLM,CodeGenModel:()=>t.CodeGenModel,CodeGenPreTrainedMo
del:()=>t.CodeGenPreTrainedModel,CodeGenTokenizer:()=>s.CodeGenTokenizer,CodeLlamaTokenizer:()=>s.CodeLlamaTokenizer,CohereForCausalLM:()=>t.CohereForCausalLM,CohereModel:()=>t.CohereModel,CoherePreTrainedModel:()=>t.CoherePreTrainedModel,CohereTokenizer:()=>s.CohereTokenizer,ConvBertForMaskedLM:()=>t.ConvBertForMaskedLM,ConvBertForQuestionAnswering:()=>t.ConvBertForQuestionAnswering,ConvBertForSequenceClassification:()=>t.ConvBertForSequenceClassification,ConvBertForTokenClassification:()=>t.ConvBertForTokenClassification,ConvBertModel:()=>t.ConvBertModel,ConvBertPreTrainedModel:()=>t.ConvBertPreTrainedModel,ConvBertTokenizer:()=>s.ConvBertTokenizer,ConvNextFeatureExtractor:()=>h.ConvNextFeatureExtractor,ConvNextForImageClassification:()=>t.ConvNextForImageClassification,ConvNextImageProcessor:()=>h.ConvNextImageProcessor,ConvNextModel:()=>t.ConvNextModel,ConvNextPreTrainedModel:()=>t.ConvNextPreTrainedModel,ConvNextV2ForImageClassification:()=>t.ConvNextV2ForImageClassification,ConvNextV2Model:()=>t.ConvNextV2Model,ConvNextV2PreTrainedModel:()=>t.ConvNextV2PreTrainedModel,DFineForObjectDetection:()=>t.DFineForObjectDetection,DFineModel:()=>t.DFineModel,DFinePreTrainedModel:()=>t.DFinePreTrainedModel,DINOv3ConvNextModel:()=>t.DINOv3ConvNextModel,DINOv3ConvNextPreTrainedModel:()=>t.DINOv3ConvNextPreTrainedModel,DINOv3ViTImageProcessor:()=>h.DINOv3ViTImageProcessor,DINOv3ViTModel:()=>t.DINOv3ViTModel,DINOv3ViTPreTrainedModel:()=>t.DINOv3ViTPreTrainedModel,DPTFeatureExtractor:()=>h.DPTFeatureExtractor,DPTForDepthEstimation:()=>t.DPTForDepthEstimation,DPTImageProcessor:()=>h.DPTImageProcessor,DPTModel:()=>t.DPTModel,DPTPreTrainedModel:()=>t.DPTPreTrainedModel,DacDecoderModel:()=>t.DacDecoderModel,DacDecoderOutput:()=>t.DacDecoderOutput,DacEncoderModel:()=>t.DacEncoderModel,DacEncoderOutput:()=>t.DacEncoderOutput,DacFeatureExtractor:()=>u.DacFeatureExtractor,DacModel:()=>t.DacModel,DacPreTrainedModel:()=>t.DacPreTrainedModel,DataTypeMap:()=>l.DataTypeMap,DebertaForMaske
dLM:()=>t.DebertaForMaskedLM,DebertaForQuestionAnswering:()=>t.DebertaForQuestionAnswering,DebertaForSequenceClassification:()=>t.DebertaForSequenceClassification,DebertaForTokenClassification:()=>t.DebertaForTokenClassification,DebertaModel:()=>t.DebertaModel,DebertaPreTrainedModel:()=>t.DebertaPreTrainedModel,DebertaTokenizer:()=>s.DebertaTokenizer,DebertaV2ForMaskedLM:()=>t.DebertaV2ForMaskedLM,DebertaV2ForQuestionAnswering:()=>t.DebertaV2ForQuestionAnswering,DebertaV2ForSequenceClassification:()=>t.DebertaV2ForSequenceClassification,DebertaV2ForTokenClassification:()=>t.DebertaV2ForTokenClassification,DebertaV2Model:()=>t.DebertaV2Model,DebertaV2PreTrainedModel:()=>t.DebertaV2PreTrainedModel,DebertaV2Tokenizer:()=>s.DebertaV2Tokenizer,DecisionTransformerModel:()=>t.DecisionTransformerModel,DecisionTransformerPreTrainedModel:()=>t.DecisionTransformerPreTrainedModel,DeiTFeatureExtractor:()=>h.DeiTFeatureExtractor,DeiTForImageClassification:()=>t.DeiTForImageClassification,DeiTImageProcessor:()=>h.DeiTImageProcessor,DeiTModel:()=>t.DeiTModel,DeiTPreTrainedModel:()=>t.DeiTPreTrainedModel,DepthAnythingForDepthEstimation:()=>t.DepthAnythingForDepthEstimation,DepthAnythingPreTrainedModel:()=>t.DepthAnythingPreTrainedModel,DepthEstimationPipeline:()=>r.DepthEstimationPipeline,DepthProForDepthEstimation:()=>t.DepthProForDepthEstimation,DepthProPreTrainedModel:()=>t.DepthProPreTrainedModel,DetrFeatureExtractor:()=>h.DetrFeatureExtractor,DetrForObjectDetection:()=>t.DetrForObjectDetection,DetrForSegmentation:()=>t.DetrForSegmentation,DetrImageProcessor:()=>h.DetrImageProcessor,DetrModel:()=>t.DetrModel,DetrObjectDetectionOutput:()=>t.DetrObjectDetectionOutput,DetrPreTrainedModel:()=>t.DetrPreTrainedModel,DetrSegmentationOutput:()=>t.DetrSegmentationOutput,Dinov2ForImageClassification:()=>t.Dinov2ForImageClassification,Dinov2Model:()=>t.Dinov2Model,Dinov2PreTrainedModel:()=>t.Dinov2PreTrainedModel,Dinov2WithRegistersForImageClassification:()=>t.Dinov2WithRegistersForImageCl
assification,Dinov2WithRegistersModel:()=>t.Dinov2WithRegistersModel,Dinov2WithRegistersPreTrainedModel:()=>t.Dinov2WithRegistersPreTrainedModel,DistilBertForMaskedLM:()=>t.DistilBertForMaskedLM,DistilBertForQuestionAnswering:()=>t.DistilBertForQuestionAnswering,DistilBertForSequenceClassification:()=>t.DistilBertForSequenceClassification,DistilBertForTokenClassification:()=>t.DistilBertForTokenClassification,DistilBertModel:()=>t.DistilBertModel,DistilBertPreTrainedModel:()=>t.DistilBertPreTrainedModel,DistilBertTokenizer:()=>s.DistilBertTokenizer,DocumentQuestionAnsweringPipeline:()=>r.DocumentQuestionAnsweringPipeline,DonutFeatureExtractor:()=>h.DonutFeatureExtractor,DonutImageProcessor:()=>h.DonutImageProcessor,DonutSwinModel:()=>t.DonutSwinModel,DonutSwinPreTrainedModel:()=>t.DonutSwinPreTrainedModel,EdgeTamModel:()=>t.EdgeTamModel,EfficientNetForImageClassification:()=>t.EfficientNetForImageClassification,EfficientNetImageProcessor:()=>h.EfficientNetImageProcessor,EfficientNetModel:()=>t.EfficientNetModel,EfficientNetPreTrainedModel:()=>t.EfficientNetPreTrainedModel,ElectraForMaskedLM:()=>t.ElectraForMaskedLM,ElectraForQuestionAnswering:()=>t.ElectraForQuestionAnswering,ElectraForSequenceClassification:()=>t.ElectraForSequenceClassification,ElectraForTokenClassification:()=>t.ElectraForTokenClassification,ElectraModel:()=>t.ElectraModel,ElectraPreTrainedModel:()=>t.ElectraPreTrainedModel,ElectraTokenizer:()=>s.ElectraTokenizer,EncodecFeatureExtractor:()=>u.EncodecFeatureExtractor,EosTokenCriteria:()=>y.EosTokenCriteria,Ernie4_5ForCausalLM:()=>t.Ernie4_5ForCausalLM,Ernie4_5Model:()=>t.Ernie4_5Model,Ernie4_5PreTrainedModel:()=>t.Ernie4_5PreTrainedModel,EsmForMaskedLM:()=>t.EsmForMaskedLM,EsmForSequenceClassification:()=>t.EsmForSequenceClassification,EsmForTokenClassification:()=>t.EsmForTokenClassification,EsmModel:()=>t.EsmModel,EsmPreTrainedModel:()=>t.EsmPreTrainedModel,EsmTokenizer:()=>s.EsmTokenizer,ExaoneForCausalLM:()=>t.ExaoneForCausalLM,ExaoneModel:()=
>t.ExaoneModel,ExaonePreTrainedModel:()=>t.ExaonePreTrainedModel,FFT:()=>c.FFT,FalconForCausalLM:()=>t.FalconForCausalLM,FalconModel:()=>t.FalconModel,FalconPreTrainedModel:()=>t.FalconPreTrainedModel,FalconTokenizer:()=>s.FalconTokenizer,FastViTForImageClassification:()=>t.FastViTForImageClassification,FastViTModel:()=>t.FastViTModel,FastViTPreTrainedModel:()=>t.FastViTPreTrainedModel,FeatureExtractionPipeline:()=>r.FeatureExtractionPipeline,FeatureExtractor:()=>_.FeatureExtractor,FillMaskPipeline:()=>r.FillMaskPipeline,Florence2ForConditionalGeneration:()=>t.Florence2ForConditionalGeneration,Florence2PreTrainedModel:()=>t.Florence2PreTrainedModel,Florence2Processor:()=>v.Florence2Processor,ForcedBOSTokenLogitsProcessor:()=>P.ForcedBOSTokenLogitsProcessor,ForcedEOSTokenLogitsProcessor:()=>P.ForcedEOSTokenLogitsProcessor,GLPNFeatureExtractor:()=>h.GLPNFeatureExtractor,GLPNForDepthEstimation:()=>t.GLPNForDepthEstimation,GLPNModel:()=>t.GLPNModel,GLPNPreTrainedModel:()=>t.GLPNPreTrainedModel,GPT2LMHeadModel:()=>t.GPT2LMHeadModel,GPT2Model:()=>t.GPT2Model,GPT2PreTrainedModel:()=>t.GPT2PreTrainedModel,GPT2Tokenizer:()=>s.GPT2Tokenizer,GPTBigCodeForCausalLM:()=>t.GPTBigCodeForCausalLM,GPTBigCodeModel:()=>t.GPTBigCodeModel,GPTBigCodePreTrainedModel:()=>t.GPTBigCodePreTrainedModel,GPTJForCausalLM:()=>t.GPTJForCausalLM,GPTJModel:()=>t.GPTJModel,GPTJPreTrainedModel:()=>t.GPTJPreTrainedModel,GPTNeoForCausalLM:()=>t.GPTNeoForCausalLM,GPTNeoModel:()=>t.GPTNeoModel,GPTNeoPreTrainedModel:()=>t.GPTNeoPreTrainedModel,GPTNeoXForCausalLM:()=>t.GPTNeoXForCausalLM,GPTNeoXModel:()=>t.GPTNeoXModel,GPTNeoXPreTrainedModel:()=>t.GPTNeoXPreTrainedModel,GPTNeoXTokenizer:()=>s.GPTNeoXTokenizer,Gemma2ForCausalLM:()=>t.Gemma2ForCausalLM,Gemma2Model:()=>t.Gemma2Model,Gemma2PreTrainedModel:()=>t.Gemma2PreTrainedModel,Gemma3ForCausalLM:()=>t.Gemma3ForCausalLM,Gemma3Model:()=>t.Gemma3Model,Gemma3PreTrainedModel:()=>t.Gemma3PreTrainedModel,Gemma3nAudioFeatureExtractor:()=>u.Gemma3nAudioFeatureExtract
or,Gemma3nForConditionalGeneration:()=>t.Gemma3nForConditionalGeneration,Gemma3nPreTrainedModel:()=>t.Gemma3nPreTrainedModel,Gemma3nProcessor:()=>v.Gemma3nProcessor,GemmaForCausalLM:()=>t.GemmaForCausalLM,GemmaModel:()=>t.GemmaModel,GemmaPreTrainedModel:()=>t.GemmaPreTrainedModel,GemmaTokenizer:()=>s.GemmaTokenizer,GlmForCausalLM:()=>t.GlmForCausalLM,GlmModel:()=>t.GlmModel,GlmPreTrainedModel:()=>t.GlmPreTrainedModel,GraniteForCausalLM:()=>t.GraniteForCausalLM,GraniteModel:()=>t.GraniteModel,GraniteMoeHybridForCausalLM:()=>t.GraniteMoeHybridForCausalLM,GraniteMoeHybridModel:()=>t.GraniteMoeHybridModel,GraniteMoeHybridPreTrainedModel:()=>t.GraniteMoeHybridPreTrainedModel,GranitePreTrainedModel:()=>t.GranitePreTrainedModel,Grok1Tokenizer:()=>s.Grok1Tokenizer,GroundingDinoForObjectDetection:()=>t.GroundingDinoForObjectDetection,GroundingDinoImageProcessor:()=>h.GroundingDinoImageProcessor,GroundingDinoPreTrainedModel:()=>t.GroundingDinoPreTrainedModel,GroundingDinoProcessor:()=>v.GroundingDinoProcessor,GroupViTModel:()=>t.GroupViTModel,GroupViTPreTrainedModel:()=>t.GroupViTPreTrainedModel,HeliumForCausalLM:()=>t.HeliumForCausalLM,HeliumModel:()=>t.HeliumModel,HeliumPreTrainedModel:()=>t.HeliumPreTrainedModel,HerbertTokenizer:()=>s.HerbertTokenizer,HieraForImageClassification:()=>t.HieraForImageClassification,HieraModel:()=>t.HieraModel,HieraPreTrainedModel:()=>t.HieraPreTrainedModel,HubertForCTC:()=>t.HubertForCTC,HubertForSequenceClassification:()=>t.HubertForSequenceClassification,HubertModel:()=>t.HubertModel,HubertPreTrainedModel:()=>t.HubertPreTrainedModel,IJepaForImageClassification:()=>t.IJepaForImageClassification,IJepaModel:()=>t.IJepaModel,IJepaPreTrainedModel:()=>t.IJepaPreTrainedModel,Idefics3ForConditionalGeneration:()=>t.Idefics3ForConditionalGeneration,Idefics3ImageProcessor:()=>h.Idefics3ImageProcessor,Idefics3PreTrainedModel:()=>t.Idefics3PreTrainedModel,Idefics3Processor:()=>v.Idefics3Processor,ImageClassificationPipeline:()=>r.ImageClassificationPipe
line,ImageFeatureExtractionPipeline:()=>r.ImageFeatureExtractionPipeline,ImageFeatureExtractor:()=>u.ImageFeatureExtractor,ImageMattingOutput:()=>t.ImageMattingOutput,ImageProcessor:()=>g.ImageProcessor,ImageSegmentationPipeline:()=>r.ImageSegmentationPipeline,ImageToImagePipeline:()=>r.ImageToImagePipeline,ImageToTextPipeline:()=>r.ImageToTextPipeline,InterruptableStoppingCriteria:()=>y.InterruptableStoppingCriteria,JAISLMHeadModel:()=>t.JAISLMHeadModel,JAISModel:()=>t.JAISModel,JAISPreTrainedModel:()=>t.JAISPreTrainedModel,JinaCLIPImageProcessor:()=>h.JinaCLIPImageProcessor,JinaCLIPModel:()=>t.JinaCLIPModel,JinaCLIPPreTrainedModel:()=>t.JinaCLIPPreTrainedModel,JinaCLIPProcessor:()=>v.JinaCLIPProcessor,JinaCLIPTextModel:()=>t.JinaCLIPTextModel,JinaCLIPVisionModel:()=>t.JinaCLIPVisionModel,Lfm2ForCausalLM:()=>t.Lfm2ForCausalLM,Lfm2Model:()=>t.Lfm2Model,Lfm2PreTrainedModel:()=>t.Lfm2PreTrainedModel,LiteWhisperForConditionalGeneration:()=>t.LiteWhisperForConditionalGeneration,Llama4ForCausalLM:()=>t.Llama4ForCausalLM,Llama4PreTrainedModel:()=>t.Llama4PreTrainedModel,LlamaForCausalLM:()=>t.LlamaForCausalLM,LlamaModel:()=>t.LlamaModel,LlamaPreTrainedModel:()=>t.LlamaPreTrainedModel,LlamaTokenizer:()=>s.LlamaTokenizer,LlavaForConditionalGeneration:()=>t.LlavaForConditionalGeneration,LlavaOnevisionForConditionalGeneration:()=>t.LlavaOnevisionForConditionalGeneration,LlavaOnevisionImageProcessor:()=>h.LlavaOnevisionImageProcessor,LlavaPreTrainedModel:()=>t.LlavaPreTrainedModel,LlavaProcessor:()=>v.LlavaProcessor,LlavaQwen2ForCausalLM:()=>t.LlavaQwen2ForCausalLM,LogitsProcessor:()=>P.LogitsProcessor,LogitsProcessorList:()=>P.LogitsProcessorList,LogitsWarper:()=>P.LogitsWarper,LongT5ForConditionalGeneration:()=>t.LongT5ForConditionalGeneration,LongT5Model:()=>t.LongT5Model,LongT5PreTrainedModel:()=>t.LongT5PreTrainedModel,M2M100ForConditionalGeneration:()=>t.M2M100ForConditionalGeneration,M2M100Model:()=>t.M2M100Model,M2M100PreTrainedModel:()=>t.M2M100PreTrainedModel,M2M100T
okenizer:()=>s.M2M100Tokenizer,MBart50Tokenizer:()=>s.MBart50Tokenizer,MBartForCausalLM:()=>t.MBartForCausalLM,MBartForConditionalGeneration:()=>t.MBartForConditionalGeneration,MBartForSequenceClassification:()=>t.MBartForSequenceClassification,MBartModel:()=>t.MBartModel,MBartPreTrainedModel:()=>t.MBartPreTrainedModel,MBartTokenizer:()=>s.MBartTokenizer,MPNetForMaskedLM:()=>t.MPNetForMaskedLM,MPNetForQuestionAnswering:()=>t.MPNetForQuestionAnswering,MPNetForSequenceClassification:()=>t.MPNetForSequenceClassification,MPNetForTokenClassification:()=>t.MPNetForTokenClassification,MPNetModel:()=>t.MPNetModel,MPNetPreTrainedModel:()=>t.MPNetPreTrainedModel,MPNetTokenizer:()=>s.MPNetTokenizer,MT5ForConditionalGeneration:()=>t.MT5ForConditionalGeneration,MT5Model:()=>t.MT5Model,MT5PreTrainedModel:()=>t.MT5PreTrainedModel,MarianMTModel:()=>t.MarianMTModel,MarianModel:()=>t.MarianModel,MarianPreTrainedModel:()=>t.MarianPreTrainedModel,MarianTokenizer:()=>s.MarianTokenizer,Mask2FormerImageProcessor:()=>h.Mask2FormerImageProcessor,MaskFormerFeatureExtractor:()=>h.MaskFormerFeatureExtractor,MaskFormerForInstanceSegmentation:()=>t.MaskFormerForInstanceSegmentation,MaskFormerImageProcessor:()=>h.MaskFormerImageProcessor,MaskFormerModel:()=>t.MaskFormerModel,MaskFormerPreTrainedModel:()=>t.MaskFormerPreTrainedModel,MaskedLMOutput:()=>t.MaskedLMOutput,MaxLengthCriteria:()=>y.MaxLengthCriteria,Metric3DForDepthEstimation:()=>t.Metric3DForDepthEstimation,Metric3DPreTrainedModel:()=>t.Metric3DPreTrainedModel,Metric3Dv2ForDepthEstimation:()=>t.Metric3Dv2ForDepthEstimation,Metric3Dv2PreTrainedModel:()=>t.Metric3Dv2PreTrainedModel,MgpstrForSceneTextRecognition:()=>t.MgpstrForSceneTextRecognition,MgpstrModelOutput:()=>t.MgpstrModelOutput,MgpstrPreTrainedModel:()=>t.MgpstrPreTrainedModel,MgpstrProcessor:()=>v.MgpstrProcessor,MgpstrTokenizer:()=>s.MgpstrTokenizer,MimiDecoderModel:()=>t.MimiDecoderModel,MimiDecoderOutput:()=>t.MimiDecoderOutput,MimiEncoderModel:()=>t.MimiEncoderModel,MimiEnc
oderOutput:()=>t.MimiEncoderOutput,MimiModel:()=>t.MimiModel,MimiPreTrainedModel:()=>t.MimiPreTrainedModel,MinLengthLogitsProcessor:()=>P.MinLengthLogitsProcessor,MinNewTokensLengthLogitsProcessor:()=>P.MinNewTokensLengthLogitsProcessor,Ministral3ForCausalLM:()=>t.Ministral3ForCausalLM,Ministral3Model:()=>t.Ministral3Model,Ministral3PreTrainedModel:()=>t.Ministral3PreTrainedModel,MinistralForCausalLM:()=>t.MinistralForCausalLM,MinistralModel:()=>t.MinistralModel,MinistralPreTrainedModel:()=>t.MinistralPreTrainedModel,Mistral3ForConditionalGeneration:()=>t.Mistral3ForConditionalGeneration,MistralForCausalLM:()=>t.MistralForCausalLM,MistralModel:()=>t.MistralModel,MistralPreTrainedModel:()=>t.MistralPreTrainedModel,MobileBertForMaskedLM:()=>t.MobileBertForMaskedLM,MobileBertForQuestionAnswering:()=>t.MobileBertForQuestionAnswering,MobileBertForSequenceClassification:()=>t.MobileBertForSequenceClassification,MobileBertModel:()=>t.MobileBertModel,MobileBertPreTrainedModel:()=>t.MobileBertPreTrainedModel,MobileBertTokenizer:()=>s.MobileBertTokenizer,MobileLLMForCausalLM:()=>t.MobileLLMForCausalLM,MobileLLMModel:()=>t.MobileLLMModel,MobileLLMPreTrainedModel:()=>t.MobileLLMPreTrainedModel,MobileNetV1FeatureExtractor:()=>h.MobileNetV1FeatureExtractor,MobileNetV1ForImageClassification:()=>t.MobileNetV1ForImageClassification,MobileNetV1ForSemanticSegmentation:()=>t.MobileNetV1ForSemanticSegmentation,MobileNetV1ImageProcessor:()=>h.MobileNetV1ImageProcessor,MobileNetV1Model:()=>t.MobileNetV1Model,MobileNetV1PreTrainedModel:()=>t.MobileNetV1PreTrainedModel,MobileNetV2FeatureExtractor:()=>h.MobileNetV2FeatureExtractor,MobileNetV2ForImageClassification:()=>t.MobileNetV2ForImageClassification,MobileNetV2ForSemanticSegmentation:()=>t.MobileNetV2ForSemanticSegmentation,MobileNetV2ImageProcessor:()=>h.MobileNetV2ImageProcessor,MobileNetV2Model:()=>t.MobileNetV2Model,MobileNetV2PreTrainedModel:()=>t.MobileNetV2PreTrainedModel,MobileNetV3FeatureExtractor:()=>h.MobileNetV3FeatureExtract
or,MobileNetV3ForImageClassification:()=>t.MobileNetV3ForImageClassification,MobileNetV3ForSemanticSegmentation:()=>t.MobileNetV3ForSemanticSegmentation,MobileNetV3ImageProcessor:()=>h.MobileNetV3ImageProcessor,MobileNetV3Model:()=>t.MobileNetV3Model,MobileNetV3PreTrainedModel:()=>t.MobileNetV3PreTrainedModel,MobileNetV4FeatureExtractor:()=>h.MobileNetV4FeatureExtractor,MobileNetV4ForImageClassification:()=>t.MobileNetV4ForImageClassification,MobileNetV4ForSemanticSegmentation:()=>t.MobileNetV4ForSemanticSegmentation,MobileNetV4ImageProcessor:()=>h.MobileNetV4ImageProcessor,MobileNetV4Model:()=>t.MobileNetV4Model,MobileNetV4PreTrainedModel:()=>t.MobileNetV4PreTrainedModel,MobileViTFeatureExtractor:()=>h.MobileViTFeatureExtractor,MobileViTForImageClassification:()=>t.MobileViTForImageClassification,MobileViTImageProcessor:()=>h.MobileViTImageProcessor,MobileViTModel:()=>t.MobileViTModel,MobileViTPreTrainedModel:()=>t.MobileViTPreTrainedModel,MobileViTV2ForImageClassification:()=>t.MobileViTV2ForImageClassification,MobileViTV2Model:()=>t.MobileViTV2Model,MobileViTV2PreTrainedModel:()=>t.MobileViTV2PreTrainedModel,ModelOutput:()=>t.ModelOutput,ModernBertDecoderForCausalLM:()=>t.ModernBertDecoderForCausalLM,ModernBertDecoderModel:()=>t.ModernBertDecoderModel,ModernBertDecoderPreTrainedModel:()=>t.ModernBertDecoderPreTrainedModel,ModernBertForMaskedLM:()=>t.ModernBertForMaskedLM,ModernBertForSequenceClassification:()=>t.ModernBertForSequenceClassification,ModernBertForTokenClassification:()=>t.ModernBertForTokenClassification,ModernBertModel:()=>t.ModernBertModel,ModernBertPreTrainedModel:()=>t.ModernBertPreTrainedModel,Moondream1ForConditionalGeneration:()=>t.Moondream1ForConditionalGeneration,MoonshineFeatureExtractor:()=>u.MoonshineFeatureExtractor,MoonshineForConditionalGeneration:()=>t.MoonshineForConditionalGeneration,MoonshineModel:()=>t.MoonshineModel,MoonshinePreTrainedModel:()=>t.MoonshinePreTrainedModel,MoonshineProcessor:()=>v.MoonshineProcessor,MptForCausalL
M:()=>t.MptForCausalLM,MptModel:()=>t.MptModel,MptPreTrainedModel:()=>t.MptPreTrainedModel,MultiModalityCausalLM:()=>t.MultiModalityCausalLM,MultiModalityPreTrainedModel:()=>t.MultiModalityPreTrainedModel,MusicgenForCausalLM:()=>t.MusicgenForCausalLM,MusicgenForConditionalGeneration:()=>t.MusicgenForConditionalGeneration,MusicgenModel:()=>t.MusicgenModel,MusicgenPreTrainedModel:()=>t.MusicgenPreTrainedModel,NanoChatForCausalLM:()=>t.NanoChatForCausalLM,NanoChatModel:()=>t.NanoChatModel,NanoChatPreTrainedModel:()=>t.NanoChatPreTrainedModel,NeoBertForMaskedLM:()=>t.NeoBertForMaskedLM,NeoBertForQuestionAnswering:()=>t.NeoBertForQuestionAnswering,NeoBertForSequenceClassification:()=>t.NeoBertForSequenceClassification,NeoBertForTokenClassification:()=>t.NeoBertForTokenClassification,NeoBertModel:()=>t.NeoBertModel,NeoBertPreTrainedModel:()=>t.NeoBertPreTrainedModel,NllbTokenizer:()=>s.NllbTokenizer,NoBadWordsLogitsProcessor:()=>P.NoBadWordsLogitsProcessor,NoRepeatNGramLogitsProcessor:()=>P.NoRepeatNGramLogitsProcessor,NomicBertModel:()=>t.NomicBertModel,NomicBertPreTrainedModel:()=>t.NomicBertPreTrainedModel,NougatImageProcessor:()=>h.NougatImageProcessor,NougatTokenizer:()=>s.NougatTokenizer,OPTForCausalLM:()=>t.OPTForCausalLM,OPTModel:()=>t.OPTModel,OPTPreTrainedModel:()=>t.OPTPreTrainedModel,ObjectDetectionPipeline:()=>r.ObjectDetectionPipeline,Olmo2ForCausalLM:()=>t.Olmo2ForCausalLM,Olmo2Model:()=>t.Olmo2Model,Olmo2PreTrainedModel:()=>t.Olmo2PreTrainedModel,OlmoForCausalLM:()=>t.OlmoForCausalLM,OlmoModel:()=>t.OlmoModel,OlmoPreTrainedModel:()=>t.OlmoPreTrainedModel,OpenELMForCausalLM:()=>t.OpenELMForCausalLM,OpenELMModel:()=>t.OpenELMModel,OpenELMPreTrainedModel:()=>t.OpenELMPreTrainedModel,OwlViTFeatureExtractor:()=>h.OwlViTFeatureExtractor,OwlViTForObjectDetection:()=>t.OwlViTForObjectDetection,OwlViTImageProcessor:()=>h.OwlViTImageProcessor,OwlViTModel:()=>t.OwlViTModel,OwlViTPreTrainedModel:()=>t.OwlViTPreTrainedModel,OwlViTProcessor:()=>v.OwlViTProcessor,Owlv2Fo
rObjectDetection:()=>t.Owlv2ForObjectDetection,Owlv2ImageProcessor:()=>h.Owlv2ImageProcessor,Owlv2Model:()=>t.Owlv2Model,Owlv2PreTrainedModel:()=>t.Owlv2PreTrainedModel,PaliGemmaForConditionalGeneration:()=>t.PaliGemmaForConditionalGeneration,PaliGemmaPreTrainedModel:()=>t.PaliGemmaPreTrainedModel,PaliGemmaProcessor:()=>v.PaliGemmaProcessor,ParakeetFeatureExtractor:()=>u.ParakeetFeatureExtractor,ParakeetForCTC:()=>t.ParakeetForCTC,ParakeetPreTrainedModel:()=>t.ParakeetPreTrainedModel,PatchTSMixerForPrediction:()=>t.PatchTSMixerForPrediction,PatchTSMixerModel:()=>t.PatchTSMixerModel,PatchTSMixerPreTrainedModel:()=>t.PatchTSMixerPreTrainedModel,PatchTSTForPrediction:()=>t.PatchTSTForPrediction,PatchTSTModel:()=>t.PatchTSTModel,PatchTSTPreTrainedModel:()=>t.PatchTSTPreTrainedModel,Phi3ForCausalLM:()=>t.Phi3ForCausalLM,Phi3Model:()=>t.Phi3Model,Phi3PreTrainedModel:()=>t.Phi3PreTrainedModel,Phi3VForCausalLM:()=>t.Phi3VForCausalLM,Phi3VImageProcessor:()=>h.Phi3VImageProcessor,Phi3VPreTrainedModel:()=>t.Phi3VPreTrainedModel,Phi3VProcessor:()=>v.Phi3VProcessor,PhiForCausalLM:()=>t.PhiForCausalLM,PhiModel:()=>t.PhiModel,PhiPreTrainedModel:()=>t.PhiPreTrainedModel,Pipeline:()=>r.Pipeline,PixtralImageProcessor:()=>h.PixtralImageProcessor,PixtralProcessor:()=>v.PixtralProcessor,PreTrainedModel:()=>t.PreTrainedModel,PreTrainedTokenizer:()=>s.PreTrainedTokenizer,PretrainedConfig:()=>o.PretrainedConfig,PretrainedMixin:()=>t.PretrainedMixin,Processor:()=>F.Processor,PvtForImageClassification:()=>t.PvtForImageClassification,PvtImageProcessor:()=>h.PvtImageProcessor,PvtModel:()=>t.PvtModel,PvtPreTrainedModel:()=>t.PvtPreTrainedModel,PyAnnoteFeatureExtractor:()=>u.PyAnnoteFeatureExtractor,PyAnnoteForAudioFrameClassification:()=>t.PyAnnoteForAudioFrameClassification,PyAnnoteModel:()=>t.PyAnnoteModel,PyAnnotePreTrainedModel:()=>t.PyAnnotePreTrainedModel,PyAnnoteProcessor:()=>v.PyAnnoteProcessor,QuestionAnsweringModelOutput:()=>t.QuestionAnsweringModelOutput,QuestionAnsweringPipeline:()=
>r.QuestionAnsweringPipeline,Qwen2ForCausalLM:()=>t.Qwen2ForCausalLM,Qwen2Model:()=>t.Qwen2Model,Qwen2PreTrainedModel:()=>t.Qwen2PreTrainedModel,Qwen2Tokenizer:()=>s.Qwen2Tokenizer,Qwen2VLForConditionalGeneration:()=>t.Qwen2VLForConditionalGeneration,Qwen2VLImageProcessor:()=>h.Qwen2VLImageProcessor,Qwen2VLPreTrainedModel:()=>t.Qwen2VLPreTrainedModel,Qwen2VLProcessor:()=>v.Qwen2VLProcessor,Qwen3ForCausalLM:()=>t.Qwen3ForCausalLM,Qwen3Model:()=>t.Qwen3Model,Qwen3PreTrainedModel:()=>t.Qwen3PreTrainedModel,RFDetrForObjectDetection:()=>t.RFDetrForObjectDetection,RFDetrModel:()=>t.RFDetrModel,RFDetrObjectDetectionOutput:()=>t.RFDetrObjectDetectionOutput,RFDetrPreTrainedModel:()=>t.RFDetrPreTrainedModel,RTDetrForObjectDetection:()=>t.RTDetrForObjectDetection,RTDetrImageProcessor:()=>h.RTDetrImageProcessor,RTDetrModel:()=>t.RTDetrModel,RTDetrObjectDetectionOutput:()=>t.RTDetrObjectDetectionOutput,RTDetrPreTrainedModel:()=>t.RTDetrPreTrainedModel,RTDetrV2ForObjectDetection:()=>t.RTDetrV2ForObjectDetection,RTDetrV2Model:()=>t.RTDetrV2Model,RTDetrV2ObjectDetectionOutput:()=>t.RTDetrV2ObjectDetectionOutput,RTDetrV2PreTrainedModel:()=>t.RTDetrV2PreTrainedModel,RawAudio:()=>a.RawAudio,RawImage:()=>n.RawImage,RawVideo:()=>i.RawVideo,RawVideoFrame:()=>i.RawVideoFrame,RepetitionPenaltyLogitsProcessor:()=>P.RepetitionPenaltyLogitsProcessor,ResNetForImageClassification:()=>t.ResNetForImageClassification,ResNetModel:()=>t.ResNetModel,ResNetPreTrainedModel:()=>t.ResNetPreTrainedModel,RoFormerForMaskedLM:()=>t.RoFormerForMaskedLM,RoFormerForQuestionAnswering:()=>t.RoFormerForQuestionAnswering,RoFormerForSequenceClassification:()=>t.RoFormerForSequenceClassification,RoFormerForTokenClassification:()=>t.RoFormerForTokenClassification,RoFormerModel:()=>t.RoFormerModel,RoFormerPreTrainedModel:()=>t.RoFormerPreTrainedModel,RoFormerTokenizer:()=>s.RoFormerTokenizer,RobertaForMaskedLM:()=>t.RobertaForMaskedLM,RobertaForQuestionAnswering:()=>t.RobertaForQuestionAnswering,RobertaForSequenceClass
ification:()=>t.RobertaForSequenceClassification,RobertaForTokenClassification:()=>t.RobertaForTokenClassification,RobertaModel:()=>t.RobertaModel,RobertaPreTrainedModel:()=>t.RobertaPreTrainedModel,RobertaTokenizer:()=>s.RobertaTokenizer,Sam2ImageProcessor:()=>h.Sam2ImageProcessor,Sam2ImageSegmentationOutput:()=>t.Sam2ImageSegmentationOutput,Sam2Model:()=>t.Sam2Model,Sam2PreTrainedModel:()=>t.Sam2PreTrainedModel,Sam2Processor:()=>v.Sam2Processor,Sam2VideoProcessor:()=>v.Sam2VideoProcessor,Sam3ImageProcessor:()=>h.Sam3ImageProcessor,Sam3TrackerModel:()=>t.Sam3TrackerModel,SamImageProcessor:()=>h.SamImageProcessor,SamImageSegmentationOutput:()=>t.SamImageSegmentationOutput,SamModel:()=>t.SamModel,SamPreTrainedModel:()=>t.SamPreTrainedModel,SamProcessor:()=>v.SamProcessor,SapiensForDepthEstimation:()=>t.SapiensForDepthEstimation,SapiensForNormalEstimation:()=>t.SapiensForNormalEstimation,SapiensForSemanticSegmentation:()=>t.SapiensForSemanticSegmentation,SapiensPreTrainedModel:()=>t.SapiensPreTrainedModel,SeamlessM4TFeatureExtractor:()=>u.SeamlessM4TFeatureExtractor,SegformerFeatureExtractor:()=>h.SegformerFeatureExtractor,SegformerForImageClassification:()=>t.SegformerForImageClassification,SegformerForSemanticSegmentation:()=>t.SegformerForSemanticSegmentation,SegformerImageProcessor:()=>h.SegformerImageProcessor,SegformerModel:()=>t.SegformerModel,SegformerPreTrainedModel:()=>t.SegformerPreTrainedModel,Seq2SeqLMOutput:()=>t.Seq2SeqLMOutput,SequenceClassifierOutput:()=>t.SequenceClassifierOutput,SiglipImageProcessor:()=>h.SiglipImageProcessor,SiglipModel:()=>t.SiglipModel,SiglipPreTrainedModel:()=>t.SiglipPreTrainedModel,SiglipTextModel:()=>t.SiglipTextModel,SiglipTokenizer:()=>s.SiglipTokenizer,SiglipVisionModel:()=>t.SiglipVisionModel,SmolLM3ForCausalLM:()=>t.SmolLM3ForCausalLM,SmolLM3Model:()=>t.SmolLM3Model,SmolLM3PreTrainedModel:()=>t.SmolLM3PreTrainedModel,SmolVLMForConditionalGeneration:()=>t.SmolVLMForConditionalGeneration,SmolVLMImageProcessor:()=>h.SmolVLM
ImageProcessor,SmolVLMProcessor:()=>v.SmolVLMProcessor,SnacDecoderModel:()=>t.SnacDecoderModel,SnacEncoderModel:()=>t.SnacEncoderModel,SnacFeatureExtractor:()=>u.SnacFeatureExtractor,SnacModel:()=>t.SnacModel,SnacPreTrainedModel:()=>t.SnacPreTrainedModel,SpeechT5FeatureExtractor:()=>u.SpeechT5FeatureExtractor,SpeechT5ForSpeechToText:()=>t.SpeechT5ForSpeechToText,SpeechT5ForTextToSpeech:()=>t.SpeechT5ForTextToSpeech,SpeechT5HifiGan:()=>t.SpeechT5HifiGan,SpeechT5Model:()=>t.SpeechT5Model,SpeechT5PreTrainedModel:()=>t.SpeechT5PreTrainedModel,SpeechT5Processor:()=>v.SpeechT5Processor,SpeechT5Tokenizer:()=>s.SpeechT5Tokenizer,SqueezeBertForMaskedLM:()=>t.SqueezeBertForMaskedLM,SqueezeBertForQuestionAnswering:()=>t.SqueezeBertForQuestionAnswering,SqueezeBertForSequenceClassification:()=>t.SqueezeBertForSequenceClassification,SqueezeBertModel:()=>t.SqueezeBertModel,SqueezeBertPreTrainedModel:()=>t.SqueezeBertPreTrainedModel,SqueezeBertTokenizer:()=>s.SqueezeBertTokenizer,StableLmForCausalLM:()=>t.StableLmForCausalLM,StableLmModel:()=>t.StableLmModel,StableLmPreTrainedModel:()=>t.StableLmPreTrainedModel,Starcoder2ForCausalLM:()=>t.Starcoder2ForCausalLM,Starcoder2Model:()=>t.Starcoder2Model,Starcoder2PreTrainedModel:()=>t.Starcoder2PreTrainedModel,StoppingCriteria:()=>y.StoppingCriteria,StoppingCriteriaList:()=>y.StoppingCriteriaList,StyleTextToSpeech2Model:()=>t.StyleTextToSpeech2Model,StyleTextToSpeech2PreTrainedModel:()=>t.StyleTextToSpeech2PreTrainedModel,SummarizationPipeline:()=>r.SummarizationPipeline,SupertonicForConditionalGeneration:()=>t.SupertonicForConditionalGeneration,SupertonicPreTrainedModel:()=>t.SupertonicPreTrainedModel,SuppressTokensAtBeginLogitsProcessor:()=>P.SuppressTokensAtBeginLogitsProcessor,Swin2SRForImageSuperResolution:()=>t.Swin2SRForImageSuperResolution,Swin2SRImageProcessor:()=>h.Swin2SRImageProcessor,Swin2SRModel:()=>t.Swin2SRModel,Swin2SRPreTrainedModel:()=>t.Swin2SRPreTrainedModel,SwinForImageClassification:()=>t.SwinForImageClassification
,SwinForSemanticSegmentation:()=>t.SwinForSemanticSegmentation,SwinModel:()=>t.SwinModel,SwinPreTrainedModel:()=>t.SwinPreTrainedModel,T5ForConditionalGeneration:()=>t.T5ForConditionalGeneration,T5Model:()=>t.T5Model,T5PreTrainedModel:()=>t.T5PreTrainedModel,T5Tokenizer:()=>s.T5Tokenizer,TableTransformerForObjectDetection:()=>t.TableTransformerForObjectDetection,TableTransformerModel:()=>t.TableTransformerModel,TableTransformerObjectDetectionOutput:()=>t.TableTransformerObjectDetectionOutput,TableTransformerPreTrainedModel:()=>t.TableTransformerPreTrainedModel,TemperatureLogitsWarper:()=>P.TemperatureLogitsWarper,Tensor:()=>l.Tensor,Text2TextGenerationPipeline:()=>r.Text2TextGenerationPipeline,TextClassificationPipeline:()=>r.TextClassificationPipeline,TextGenerationPipeline:()=>r.TextGenerationPipeline,TextStreamer:()=>C.TextStreamer,TextToAudioPipeline:()=>r.TextToAudioPipeline,TokenClassificationPipeline:()=>r.TokenClassificationPipeline,TokenClassifierOutput:()=>t.TokenClassifierOutput,TokenizerModel:()=>s.TokenizerModel,TopKLogitsWarper:()=>P.TopKLogitsWarper,TopPLogitsWarper:()=>P.TopPLogitsWarper,TrOCRForCausalLM:()=>t.TrOCRForCausalLM,TrOCRPreTrainedModel:()=>t.TrOCRPreTrainedModel,TranslationPipeline:()=>r.TranslationPipeline,UltravoxModel:()=>t.UltravoxModel,UltravoxPreTrainedModel:()=>t.UltravoxPreTrainedModel,UltravoxProcessor:()=>v.UltravoxProcessor,UniSpeechForCTC:()=>t.UniSpeechForCTC,UniSpeechForSequenceClassification:()=>t.UniSpeechForSequenceClassification,UniSpeechModel:()=>t.UniSpeechModel,UniSpeechPreTrainedModel:()=>t.UniSpeechPreTrainedModel,UniSpeechSatForAudioFrameClassification:()=>t.UniSpeechSatForAudioFrameClassification,UniSpeechSatForCTC:()=>t.UniSpeechSatForCTC,UniSpeechSatForSequenceClassification:()=>t.UniSpeechSatForSequenceClassification,UniSpeechSatModel:()=>t.UniSpeechSatModel,UniSpeechSatPreTrainedModel:()=>t.UniSpeechSatPreTrainedModel,VLChatProcessor:()=>v.VLChatProcessor,VLMImageProcessor:()=>h.VLMImageProcessor,VaultGemmaFor
CausalLM:()=>t.VaultGemmaForCausalLM,VaultGemmaModel:()=>t.VaultGemmaModel,VaultGemmaPreTrainedModel:()=>t.VaultGemmaPreTrainedModel,ViTFeatureExtractor:()=>h.ViTFeatureExtractor,ViTForImageClassification:()=>t.ViTForImageClassification,ViTImageProcessor:()=>h.ViTImageProcessor,ViTMAEModel:()=>t.ViTMAEModel,ViTMAEPreTrainedModel:()=>t.ViTMAEPreTrainedModel,ViTMSNForImageClassification:()=>t.ViTMSNForImageClassification,ViTMSNModel:()=>t.ViTMSNModel,ViTMSNPreTrainedModel:()=>t.ViTMSNPreTrainedModel,ViTModel:()=>t.ViTModel,ViTPreTrainedModel:()=>t.ViTPreTrainedModel,VisionEncoderDecoderModel:()=>t.VisionEncoderDecoderModel,VitMatteForImageMatting:()=>t.VitMatteForImageMatting,VitMatteImageProcessor:()=>h.VitMatteImageProcessor,VitMattePreTrainedModel:()=>t.VitMattePreTrainedModel,VitPoseForPoseEstimation:()=>t.VitPoseForPoseEstimation,VitPoseImageProcessor:()=>h.VitPoseImageProcessor,VitPosePreTrainedModel:()=>t.VitPosePreTrainedModel,VitsModel:()=>t.VitsModel,VitsModelOutput:()=>t.VitsModelOutput,VitsPreTrainedModel:()=>t.VitsPreTrainedModel,VitsTokenizer:()=>s.VitsTokenizer,VoxtralForConditionalGeneration:()=>t.VoxtralForConditionalGeneration,VoxtralProcessor:()=>v.VoxtralProcessor,Wav2Vec2BertForCTC:()=>t.Wav2Vec2BertForCTC,Wav2Vec2BertForSequenceClassification:()=>t.Wav2Vec2BertForSequenceClassification,Wav2Vec2BertModel:()=>t.Wav2Vec2BertModel,Wav2Vec2BertPreTrainedModel:()=>t.Wav2Vec2BertPreTrainedModel,Wav2Vec2CTCTokenizer:()=>s.Wav2Vec2CTCTokenizer,Wav2Vec2FeatureExtractor:()=>u.Wav2Vec2FeatureExtractor,Wav2Vec2ForAudioFrameClassification:()=>t.Wav2Vec2ForAudioFrameClassification,Wav2Vec2ForCTC:()=>t.Wav2Vec2ForCTC,Wav2Vec2ForSequenceClassification:()=>t.Wav2Vec2ForSequenceClassification,Wav2Vec2Model:()=>t.Wav2Vec2Model,Wav2Vec2PreTrainedModel:()=>t.Wav2Vec2PreTrainedModel,Wav2Vec2Processor:()=>v.Wav2Vec2Processor,Wav2Vec2ProcessorWithLM:()=>v.Wav2Vec2ProcessorWithLM,WavLMForAudioFrameClassification:()=>t.WavLMForAudioFrameClassification,WavLMForCTC:()=>t.Wav
LMForCTC,WavLMForSequenceClassification:()=>t.WavLMForSequenceClassification,WavLMForXVector:()=>t.WavLMForXVector,WavLMModel:()=>t.WavLMModel,WavLMPreTrainedModel:()=>t.WavLMPreTrainedModel,WeSpeakerFeatureExtractor:()=>u.WeSpeakerFeatureExtractor,WeSpeakerResNetModel:()=>t.WeSpeakerResNetModel,WeSpeakerResNetPreTrainedModel:()=>t.WeSpeakerResNetPreTrainedModel,WhisperFeatureExtractor:()=>u.WhisperFeatureExtractor,WhisperForConditionalGeneration:()=>t.WhisperForConditionalGeneration,WhisperModel:()=>t.WhisperModel,WhisperPreTrainedModel:()=>t.WhisperPreTrainedModel,WhisperProcessor:()=>v.WhisperProcessor,WhisperTextStreamer:()=>C.WhisperTextStreamer,WhisperTimeStampLogitsProcessor:()=>P.WhisperTimeStampLogitsProcessor,WhisperTokenizer:()=>s.WhisperTokenizer,XLMForQuestionAnswering:()=>t.XLMForQuestionAnswering,XLMForSequenceClassification:()=>t.XLMForSequenceClassification,XLMForTokenClassification:()=>t.XLMForTokenClassification,XLMModel:()=>t.XLMModel,XLMPreTrainedModel:()=>t.XLMPreTrainedModel,XLMRobertaForMaskedLM:()=>t.XLMRobertaForMaskedLM,XLMRobertaForQuestionAnswering:()=>t.XLMRobertaForQuestionAnswering,XLMRobertaForSequenceClassification:()=>t.XLMRobertaForSequenceClassification,XLMRobertaForTokenClassification:()=>t.XLMRobertaForTokenClassification,XLMRobertaModel:()=>t.XLMRobertaModel,XLMRobertaPreTrainedModel:()=>t.XLMRobertaPreTrainedModel,XLMRobertaTokenizer:()=>s.XLMRobertaTokenizer,XLMTokenizer:()=>s.XLMTokenizer,XLMWithLMHeadModel:()=>t.XLMWithLMHeadModel,XVectorOutput:()=>t.XVectorOutput,YolosFeatureExtractor:()=>h.YolosFeatureExtractor,YolosForObjectDetection:()=>t.YolosForObjectDetection,YolosImageProcessor:()=>h.YolosImageProcessor,YolosModel:()=>t.YolosModel,YolosObjectDetectionOutput:()=>t.YolosObjectDetectionOutput,YolosPreTrainedModel:()=>t.YolosPreTrainedModel,ZeroShotAudioClassificationPipeline:()=>r.ZeroShotAudioClassificationPipeline,ZeroShotClassificationPipeline:()=>r.ZeroShotClassificationPipeline,ZeroShotImageClassificationPipeline
:()=>r.ZeroShotImageClassificationPipeline,ZeroShotObjectDetectionPipeline:()=>r.ZeroShotObjectDetectionPipeline,bankers_round:()=>c.bankers_round,cat:()=>l.cat,cos_sim:()=>c.cos_sim,dot:()=>c.dot,dynamic_time_warping:()=>c.dynamic_time_warping,env:()=>e.env,full:()=>l.full,full_like:()=>l.full_like,getCacheShapes:()=>o.getCacheShapes,hamming:()=>a.hamming,hanning:()=>a.hanning,interpolate:()=>l.interpolate,interpolate_4d:()=>l.interpolate_4d,interpolate_data:()=>c.interpolate_data,is_chinese_char:()=>s.is_chinese_char,layer_norm:()=>l.layer_norm,load_image:()=>n.load_image,load_video:()=>i.load_video,log_softmax:()=>c.log_softmax,magnitude:()=>c.magnitude,matmul:()=>l.matmul,max:()=>c.max,mean:()=>l.mean,mean_pooling:()=>l.mean_pooling,medianFilter:()=>c.medianFilter,mel_filter_bank:()=>a.mel_filter_bank,min:()=>c.min,ones:()=>l.ones,ones_like:()=>l.ones_like,permute:()=>l.permute,permute_data:()=>c.permute_data,pipeline:()=>r.pipeline,quantize_embeddings:()=>l.quantize_embeddings,rand:()=>l.rand,randn:()=>l.randn,read_audio:()=>a.read_audio,rfft:()=>l.rfft,round:()=>c.round,slice:()=>l.slice,softmax:()=>c.softmax,spectrogram:()=>a.spectrogram,stack:()=>l.stack,std_mean:()=>l.std_mean,topk:()=>l.topk,window_function:()=>a.window_function,zeros:()=>l.zeros,zeros_like:()=>l.zeros_like});var 
e=Vt("./src/env.js"),r=Vt("./src/pipelines.js"),t=Vt("./src/models.js"),s=Vt("./src/tokenizers.js"),o=Vt("./src/configs.js"),a=Vt("./src/utils/audio.js"),n=Vt("./src/utils/image.js"),i=Vt("./src/utils/video.js"),l=Vt("./src/utils/tensor.js"),c=Vt("./src/utils/maths.js"),_=Vt("./src/base/feature_extraction_utils.js"),u=Vt("./src/models/feature_extractors.js"),d=Vt("./src/models/auto/feature_extraction_auto.js"),g=Vt("./src/base/image_processors_utils.js"),h=Vt("./src/models/image_processors.js"),x=Vt("./src/models/auto/image_processing_auto.js"),F=Vt("./src/base/processing_utils.js"),v=Vt("./src/models/processors.js"),b=Vt("./src/models/auto/processing_auto.js"),C=Vt("./src/generation/streamers.js"),y=Vt("./src/generation/stopping_criteria.js"),P=Vt("./src/generation/logits_process.js")})();var VS=p.ASTFeatureExtractor,WS=p.ASTForAudioClassification,US=p.ASTModel,GS=p.ASTPreTrainedModel,KS=p.AlbertForMaskedLM,HS=p.AlbertForQuestionAnswering,qS=p.AlbertForSequenceClassification,QS=p.AlbertModel,XS=p.AlbertPreTrainedModel,JS=p.AlbertTokenizer,YS=p.ArceeForCausalLM,ZS=p.ArceeModel,eF=p.ArceePreTrainedModel,tF=p.AudioClassificationPipeline,rF=p.AutoConfig,sF=p.AutoFeatureExtractor,oF=p.AutoImageProcessor,aF=p.AutoModel,nF=p.AutoModelForAudioClassification,iF=p.AutoModelForAudioFrameClassification,lF=p.AutoModelForAudioTextToText,cF=p.AutoModelForCTC,dF=p.AutoModelForCausalLM,uF=p.AutoModelForDepthEstimation,_F=p.AutoModelForDocumentQuestionAnswering,pF=p.AutoModelForImageClassification,mF=p.AutoModelForImageFeatureExtraction,hF=p.AutoModelForImageMatting,fF=p.AutoModelForImageSegmentation,gF=p.AutoModelForImageTextToText,MF=p.AutoModelForImageToImage,wF=p.AutoModelForMaskGeneration,bF=p.AutoModelForMaskedLM,vF=p.AutoModelForNormalEstimation,xF=p.AutoModelForObjectDetection,yF=p.AutoModelForPoseEstimation,TF=p.AutoModelForQuestionAnswering,PF=p.AutoModelForSemanticSegmentation,EF=p.AutoModelForSeq2SeqLM,kF=p.AutoModelForSequenceClassification,CF=p.AutoModelForSpeechSeq2Se
q,SF=p.AutoModelForTextToSpectrogram,FF=p.AutoModelForTextToWaveform,IF=p.AutoModelForTokenClassification,AF=p.AutoModelForUniversalSegmentation,$F=p.AutoModelForVision2Seq,DF=p.AutoModelForXVector,OF=p.AutoModelForZeroShotObjectDetection,LF=p.AutoProcessor,BF=p.AutoTokenizer,zF=p.AutomaticSpeechRecognitionPipeline,RF=p.BackgroundRemovalPipeline,NF=p.BartForConditionalGeneration,jF=p.BartForSequenceClassification,VF=p.BartModel,WF=p.BartPretrainedModel,UF=p.BartTokenizer,GF=p.BaseModelOutput,KF=p.BaseStreamer,HF=p.BeitFeatureExtractor,qF=p.BeitForImageClassification,QF=p.BeitModel,XF=p.BeitPreTrainedModel,JF=p.BertForMaskedLM,YF=p.BertForQuestionAnswering,ZF=p.BertForSequenceClassification,eI=p.BertForTokenClassification,tI=p.BertModel,rI=p.BertPreTrainedModel,sI=p.BertTokenizer,oI=p.BitImageProcessor,aI=p.BlenderbotForConditionalGeneration,nI=p.BlenderbotModel,iI=p.BlenderbotPreTrainedModel,lI=p.BlenderbotSmallForConditionalGeneration,cI=p.BlenderbotSmallModel,dI=p.BlenderbotSmallPreTrainedModel,uI=p.BlenderbotSmallTokenizer,_I=p.BlenderbotTokenizer,pI=p.BloomForCausalLM,mI=p.BloomModel,hI=p.BloomPreTrainedModel,fI=p.BloomTokenizer,gI=p.CLIPFeatureExtractor,MI=p.CLIPImageProcessor,wI=p.CLIPModel,bI=p.CLIPPreTrainedModel,vI=p.CLIPSegForImageSegmentation,xI=p.CLIPSegModel,yI=p.CLIPSegPreTrainedModel,TI=p.CLIPTextModel,PI=p.CLIPTextModelWithProjection,EI=p.CLIPTokenizer,kI=p.CLIPVisionModel,CI=p.CLIPVisionModelWithProjection,SI=p.CamembertForMaskedLM,FI=p.CamembertForQuestionAnswering,II=p.CamembertForSequenceClassification,AI=p.CamembertForTokenClassification,$I=p.CamembertModel,DI=p.CamembertPreTrainedModel,OI=p.CamembertTokenizer,LI=p.CausalLMOutput,BI=p.CausalLMOutputWithPast,zI=p.ChineseCLIPFeatureExtractor,RI=p.ChineseCLIPModel,NI=p.ChineseCLIPPreTrainedModel,jI=p.ClapAudioModelWithProjection,VI=p.ClapFeatureExtractor,WI=p.ClapModel,UI=p.ClapPreTrainedModel,GI=p.ClapTextModelWithProjection,KI=p.ClassifierFreeGuidanceLogitsProcessor,HI=p.CodeGenForCausalLM,qI=p.C
odeGenModel,QI=p.CodeGenPreTrainedModel,XI=p.CodeGenTokenizer,JI=p.CodeLlamaTokenizer,YI=p.CohereForCausalLM,ZI=p.CohereModel,eA=p.CoherePreTrainedModel,tA=p.CohereTokenizer,rA=p.ConvBertForMaskedLM,sA=p.ConvBertForQuestionAnswering,oA=p.ConvBertForSequenceClassification,aA=p.ConvBertForTokenClassification,nA=p.ConvBertModel,iA=p.ConvBertPreTrainedModel,lA=p.ConvBertTokenizer,cA=p.ConvNextFeatureExtractor,dA=p.ConvNextForImageClassification,uA=p.ConvNextImageProcessor,_A=p.ConvNextModel,pA=p.ConvNextPreTrainedModel,mA=p.ConvNextV2ForImageClassification,hA=p.ConvNextV2Model,fA=p.ConvNextV2PreTrainedModel,gA=p.DFineForObjectDetection,MA=p.DFineModel,wA=p.DFinePreTrainedModel,bA=p.DINOv3ConvNextModel,vA=p.DINOv3ConvNextPreTrainedModel,xA=p.DINOv3ViTImageProcessor,yA=p.DINOv3ViTModel,TA=p.DINOv3ViTPreTrainedModel,PA=p.DPTFeatureExtractor,EA=p.DPTForDepthEstimation,kA=p.DPTImageProcessor,CA=p.DPTModel,SA=p.DPTPreTrainedModel,FA=p.DacDecoderModel,IA=p.DacDecoderOutput,AA=p.DacEncoderModel,$A=p.DacEncoderOutput,DA=p.DacFeatureExtractor,OA=p.DacModel,LA=p.DacPreTrainedModel,BA=p.DataTypeMap,zA=p.DebertaForMaskedLM,RA=p.DebertaForQuestionAnswering,NA=p.DebertaForSequenceClassification,jA=p.DebertaForTokenClassification,VA=p.DebertaModel,WA=p.DebertaPreTrainedModel,UA=p.DebertaTokenizer,GA=p.DebertaV2ForMaskedLM,KA=p.DebertaV2ForQuestionAnswering,HA=p.DebertaV2ForSequenceClassification,qA=p.DebertaV2ForTokenClassification,QA=p.DebertaV2Model,XA=p.DebertaV2PreTrainedModel,JA=p.DebertaV2Tokenizer,YA=p.DecisionTransformerModel,ZA=p.DecisionTransformerPreTrainedModel,e$=p.DeiTFeatureExtractor,t$=p.DeiTForImageClassification,r$=p.DeiTImageProcessor,s$=p.DeiTModel,o$=p.DeiTPreTrainedModel,a$=p.DepthAnythingForDepthEstimation,n$=p.DepthAnythingPreTrainedModel,i$=p.DepthEstimationPipeline,l$=p.DepthProForDepthEstimation,c$=p.DepthProPreTrainedModel,d$=p.DetrFeatureExtractor,u$=p.DetrForObjectDetection,_$=p.DetrForSegmentation,p$=p.DetrImageProcessor,m$=p.DetrModel,h$=p.DetrObjectDete
ctionOutput,f$=p.DetrPreTrainedModel,g$=p.DetrSegmentationOutput,M$=p.Dinov2ForImageClassification,w$=p.Dinov2Model,b$=p.Dinov2PreTrainedModel,v$=p.Dinov2WithRegistersForImageClassification,x$=p.Dinov2WithRegistersModel,y$=p.Dinov2WithRegistersPreTrainedModel,T$=p.DistilBertForMaskedLM,P$=p.DistilBertForQuestionAnswering,E$=p.DistilBertForSequenceClassification,k$=p.DistilBertForTokenClassification,C$=p.DistilBertModel,S$=p.DistilBertPreTrainedModel,F$=p.DistilBertTokenizer,I$=p.DocumentQuestionAnsweringPipeline,A$=p.DonutFeatureExtractor,$$=p.DonutImageProcessor,D$=p.DonutSwinModel,O$=p.DonutSwinPreTrainedModel,L$=p.EdgeTamModel,B$=p.EfficientNetForImageClassification,z$=p.EfficientNetImageProcessor,R$=p.EfficientNetModel,N$=p.EfficientNetPreTrainedModel,j$=p.ElectraForMaskedLM,V$=p.ElectraForQuestionAnswering,W$=p.ElectraForSequenceClassification,U$=p.ElectraForTokenClassification,G$=p.ElectraModel,K$=p.ElectraPreTrainedModel,H$=p.ElectraTokenizer,q$=p.EncodecFeatureExtractor,Q$=p.EosTokenCriteria,X$=p.Ernie4_5ForCausalLM,J$=p.Ernie4_5Model,Y$=p.Ernie4_5PreTrainedModel,Z$=p.EsmForMaskedLM,eD=p.EsmForSequenceClassification,tD=p.EsmForTokenClassification,rD=p.EsmModel,sD=p.EsmPreTrainedModel,oD=p.EsmTokenizer,aD=p.ExaoneForCausalLM,nD=p.ExaoneModel,iD=p.ExaonePreTrainedModel,lD=p.FFT,cD=p.FalconForCausalLM,dD=p.FalconModel,uD=p.FalconPreTrainedModel,_D=p.FalconTokenizer,pD=p.FastViTForImageClassification,mD=p.FastViTModel,hD=p.FastViTPreTrainedModel,fD=p.FeatureExtractionPipeline,gD=p.FeatureExtractor,MD=p.FillMaskPipeline,wD=p.Florence2ForConditionalGeneration,bD=p.Florence2PreTrainedModel,vD=p.Florence2Processor,xD=p.ForcedBOSTokenLogitsProcessor,yD=p.ForcedEOSTokenLogitsProcessor,TD=p.GLPNFeatureExtractor,PD=p.GLPNForDepthEstimation,ED=p.GLPNModel,kD=p.GLPNPreTrainedModel,CD=p.GPT2LMHeadModel,SD=p.GPT2Model,FD=p.GPT2PreTrainedModel,ID=p.GPT2Tokenizer,AD=p.GPTBigCodeForCausalLM,$D=p.GPTBigCodeModel,DD=p.GPTBigCodePreTrainedModel,OD=p.GPTJForCausalLM,LD=p.GPTJModel
,BD=p.GPTJPreTrainedModel,zD=p.GPTNeoForCausalLM,RD=p.GPTNeoModel,ND=p.GPTNeoPreTrainedModel,jD=p.GPTNeoXForCausalLM,VD=p.GPTNeoXModel,WD=p.GPTNeoXPreTrainedModel,UD=p.GPTNeoXTokenizer,GD=p.Gemma2ForCausalLM,KD=p.Gemma2Model,HD=p.Gemma2PreTrainedModel,qD=p.Gemma3ForCausalLM,QD=p.Gemma3Model,XD=p.Gemma3PreTrainedModel,JD=p.Gemma3nAudioFeatureExtractor,YD=p.Gemma3nForConditionalGeneration,ZD=p.Gemma3nPreTrainedModel,eO=p.Gemma3nProcessor,tO=p.GemmaForCausalLM,rO=p.GemmaModel,sO=p.GemmaPreTrainedModel,oO=p.GemmaTokenizer,aO=p.GlmForCausalLM,nO=p.GlmModel,iO=p.GlmPreTrainedModel,lO=p.GraniteForCausalLM,cO=p.GraniteModel,dO=p.GraniteMoeHybridForCausalLM,uO=p.GraniteMoeHybridModel,_O=p.GraniteMoeHybridPreTrainedModel,pO=p.GranitePreTrainedModel,mO=p.Grok1Tokenizer,hO=p.GroundingDinoForObjectDetection,fO=p.GroundingDinoImageProcessor,gO=p.GroundingDinoPreTrainedModel,MO=p.GroundingDinoProcessor,wO=p.GroupViTModel,bO=p.GroupViTPreTrainedModel,vO=p.HeliumForCausalLM,xO=p.HeliumModel,yO=p.HeliumPreTrainedModel,TO=p.HerbertTokenizer,PO=p.HieraForImageClassification,EO=p.HieraModel,kO=p.HieraPreTrainedModel,CO=p.HubertForCTC,SO=p.HubertForSequenceClassification,FO=p.HubertModel,IO=p.HubertPreTrainedModel,AO=p.IJepaForImageClassification,$O=p.IJepaModel,DO=p.IJepaPreTrainedModel,OO=p.Idefics3ForConditionalGeneration,LO=p.Idefics3ImageProcessor,BO=p.Idefics3PreTrainedModel,zO=p.Idefics3Processor,RO=p.ImageClassificationPipeline,NO=p.ImageFeatureExtractionPipeline,jO=p.ImageFeatureExtractor,VO=p.ImageMattingOutput,WO=p.ImageProcessor,UO=p.ImageSegmentationPipeline,GO=p.ImageToImagePipeline,KO=p.ImageToTextPipeline,HO=p.InterruptableStoppingCriteria,qO=p.JAISLMHeadModel,QO=p.JAISModel,XO=p.JAISPreTrainedModel,JO=p.JinaCLIPImageProcessor,YO=p.JinaCLIPModel,ZO=p.JinaCLIPPreTrainedModel,eL=p.JinaCLIPProcessor,tL=p.JinaCLIPTextModel,rL=p.JinaCLIPVisionModel,sL=p.Lfm2ForCausalLM,oL=p.Lfm2Model,aL=p.Lfm2PreTrainedModel,nL=p.LiteWhisperForConditionalGeneration,iL=p.Llama4ForCausalLM,lL=p.
Llama4PreTrainedModel,cL=p.LlamaForCausalLM,dL=p.LlamaModel,uL=p.LlamaPreTrainedModel,_L=p.LlamaTokenizer,pL=p.LlavaForConditionalGeneration,mL=p.LlavaOnevisionForConditionalGeneration,hL=p.LlavaOnevisionImageProcessor,fL=p.LlavaPreTrainedModel,gL=p.LlavaProcessor,ML=p.LlavaQwen2ForCausalLM,wL=p.LogitsProcessor,bL=p.LogitsProcessorList,vL=p.LogitsWarper,xL=p.LongT5ForConditionalGeneration,yL=p.LongT5Model,TL=p.LongT5PreTrainedModel,PL=p.M2M100ForConditionalGeneration,EL=p.M2M100Model,kL=p.M2M100PreTrainedModel,CL=p.M2M100Tokenizer,SL=p.MBart50Tokenizer,FL=p.MBartForCausalLM,IL=p.MBartForConditionalGeneration,AL=p.MBartForSequenceClassification,$L=p.MBartModel,DL=p.MBartPreTrainedModel,OL=p.MBartTokenizer,LL=p.MPNetForMaskedLM,BL=p.MPNetForQuestionAnswering,zL=p.MPNetForSequenceClassification,RL=p.MPNetForTokenClassification,NL=p.MPNetModel,jL=p.MPNetPreTrainedModel,VL=p.MPNetTokenizer,WL=p.MT5ForConditionalGeneration,UL=p.MT5Model,GL=p.MT5PreTrainedModel,KL=p.MarianMTModel,HL=p.MarianModel,qL=p.MarianPreTrainedModel,QL=p.MarianTokenizer,XL=p.Mask2FormerImageProcessor,JL=p.MaskFormerFeatureExtractor,YL=p.MaskFormerForInstanceSegmentation,ZL=p.MaskFormerImageProcessor,e3=p.MaskFormerModel,t3=p.MaskFormerPreTrainedModel,r3=p.MaskedLMOutput,s3=p.MaxLengthCriteria,o3=p.Metric3DForDepthEstimation,a3=p.Metric3DPreTrainedModel,n3=p.Metric3Dv2ForDepthEstimation,i3=p.Metric3Dv2PreTrainedModel,l3=p.MgpstrForSceneTextRecognition,c3=p.MgpstrModelOutput,d3=p.MgpstrPreTrainedModel,u3=p.MgpstrProcessor,_3=p.MgpstrTokenizer,p3=p.MimiDecoderModel,m3=p.MimiDecoderOutput,h3=p.MimiEncoderModel,f3=p.MimiEncoderOutput,g3=p.MimiModel,M3=p.MimiPreTrainedModel,w3=p.MinLengthLogitsProcessor,b3=p.MinNewTokensLengthLogitsProcessor,v3=p.Ministral3ForCausalLM,x3=p.Ministral3Model,y3=p.Ministral3PreTrainedModel,T3=p.MinistralForCausalLM,P3=p.MinistralModel,E3=p.MinistralPreTrainedModel,k3=p.Mistral3ForConditionalGeneration,C3=p.MistralForCausalLM,S3=p.MistralModel,F3=p.MistralPreTrainedModel,I3=p.
MobileBertForMaskedLM,A3=p.MobileBertForQuestionAnswering,$3=p.MobileBertForSequenceClassification,D3=p.MobileBertModel,O3=p.MobileBertPreTrainedModel,L3=p.MobileBertTokenizer,B3=p.MobileLLMForCausalLM,z3=p.MobileLLMModel,R3=p.MobileLLMPreTrainedModel,N3=p.MobileNetV1FeatureExtractor,j3=p.MobileNetV1ForImageClassification,V3=p.MobileNetV1ForSemanticSegmentation,W3=p.MobileNetV1ImageProcessor,U3=p.MobileNetV1Model,G3=p.MobileNetV1PreTrainedModel,K3=p.MobileNetV2FeatureExtractor,H3=p.MobileNetV2ForImageClassification,q3=p.MobileNetV2ForSemanticSegmentation,Q3=p.MobileNetV2ImageProcessor,X3=p.MobileNetV2Model,J3=p.MobileNetV2PreTrainedModel,Y3=p.MobileNetV3FeatureExtractor,Z3=p.MobileNetV3ForImageClassification,eB=p.MobileNetV3ForSemanticSegmentation,tB=p.MobileNetV3ImageProcessor,rB=p.MobileNetV3Model,sB=p.MobileNetV3PreTrainedModel,oB=p.MobileNetV4FeatureExtractor,aB=p.MobileNetV4ForImageClassification,nB=p.MobileNetV4ForSemanticSegmentation,iB=p.MobileNetV4ImageProcessor,lB=p.MobileNetV4Model,cB=p.MobileNetV4PreTrainedModel,dB=p.MobileViTFeatureExtractor,uB=p.MobileViTForImageClassification,_B=p.MobileViTImageProcessor,pB=p.MobileViTModel,mB=p.MobileViTPreTrainedModel,hB=p.MobileViTV2ForImageClassification,fB=p.MobileViTV2Model,gB=p.MobileViTV2PreTrainedModel,MB=p.ModelOutput,wB=p.ModernBertDecoderForCausalLM,bB=p.ModernBertDecoderModel,vB=p.ModernBertDecoderPreTrainedModel,xB=p.ModernBertForMaskedLM,yB=p.ModernBertForSequenceClassification,TB=p.ModernBertForTokenClassification,PB=p.ModernBertModel,EB=p.ModernBertPreTrainedModel,kB=p.Moondream1ForConditionalGeneration,CB=p.MoonshineFeatureExtractor,SB=p.MoonshineForConditionalGeneration,FB=p.MoonshineModel,IB=p.MoonshinePreTrainedModel,AB=p.MoonshineProcessor,$B=p.MptForCausalLM,DB=p.MptModel,OB=p.MptPreTrainedModel,LB=p.MultiModalityCausalLM,BB=p.MultiModalityPreTrainedModel,zB=p.MusicgenForCausalLM,RB=p.MusicgenForConditionalGeneration,NB=p.MusicgenModel,jB=p.MusicgenPreTrainedModel,VB=p.NanoChatForCausalLM,WB=p.N
anoChatModel,UB=p.NanoChatPreTrainedModel,GB=p.NeoBertForMaskedLM,KB=p.NeoBertForQuestionAnswering,HB=p.NeoBertForSequenceClassification,qB=p.NeoBertForTokenClassification,QB=p.NeoBertModel,XB=p.NeoBertPreTrainedModel,JB=p.NllbTokenizer,YB=p.NoBadWordsLogitsProcessor,ZB=p.NoRepeatNGramLogitsProcessor,ez=p.NomicBertModel,tz=p.NomicBertPreTrainedModel,rz=p.NougatImageProcessor,sz=p.NougatTokenizer,oz=p.OPTForCausalLM,az=p.OPTModel,nz=p.OPTPreTrainedModel,iz=p.ObjectDetectionPipeline,lz=p.Olmo2ForCausalLM,cz=p.Olmo2Model,dz=p.Olmo2PreTrainedModel,uz=p.OlmoForCausalLM,_z=p.OlmoModel,pz=p.OlmoPreTrainedModel,mz=p.OpenELMForCausalLM,hz=p.OpenELMModel,fz=p.OpenELMPreTrainedModel,gz=p.OwlViTFeatureExtractor,Mz=p.OwlViTForObjectDetection,wz=p.OwlViTImageProcessor,bz=p.OwlViTModel,vz=p.OwlViTPreTrainedModel,xz=p.OwlViTProcessor,yz=p.Owlv2ForObjectDetection,Tz=p.Owlv2ImageProcessor,Pz=p.Owlv2Model,Ez=p.Owlv2PreTrainedModel,kz=p.PaliGemmaForConditionalGeneration,Cz=p.PaliGemmaPreTrainedModel,Sz=p.PaliGemmaProcessor,Fz=p.ParakeetFeatureExtractor,Iz=p.ParakeetForCTC,Az=p.ParakeetPreTrainedModel,$z=p.PatchTSMixerForPrediction,Dz=p.PatchTSMixerModel,Oz=p.PatchTSMixerPreTrainedModel,Lz=p.PatchTSTForPrediction,Bz=p.PatchTSTModel,zz=p.PatchTSTPreTrainedModel,Rz=p.Phi3ForCausalLM,Nz=p.Phi3Model,jz=p.Phi3PreTrainedModel,Vz=p.Phi3VForCausalLM,Wz=p.Phi3VImageProcessor,Uz=p.Phi3VPreTrainedModel,Gz=p.Phi3VProcessor,Kz=p.PhiForCausalLM,Hz=p.PhiModel,qz=p.PhiPreTrainedModel,Qz=p.Pipeline,Xz=p.PixtralImageProcessor,Jz=p.PixtralProcessor,Yz=p.PreTrainedModel,Zz=p.PreTrainedTokenizer,eR=p.PretrainedConfig,tR=p.PretrainedMixin,rR=p.Processor,sR=p.PvtForImageClassification,oR=p.PvtImageProcessor,aR=p.PvtModel,nR=p.PvtPreTrainedModel,iR=p.PyAnnoteFeatureExtractor,lR=p.PyAnnoteForAudioFrameClassification,cR=p.PyAnnoteModel,dR=p.PyAnnotePreTrainedModel,uR=p.PyAnnoteProcessor,_R=p.QuestionAnsweringModelOutput,pR=p.QuestionAnsweringPipeline,mR=p.Qwen2ForCausalLM,hR=p.Qwen2Model,fR=p.Qwen2PreTrainedMode
l,gR=p.Qwen2Tokenizer,MR=p.Qwen2VLForConditionalGeneration,wR=p.Qwen2VLImageProcessor,bR=p.Qwen2VLPreTrainedModel,vR=p.Qwen2VLProcessor,xR=p.Qwen3ForCausalLM,yR=p.Qwen3Model,TR=p.Qwen3PreTrainedModel,PR=p.RFDetrForObjectDetection,ER=p.RFDetrModel,kR=p.RFDetrObjectDetectionOutput,CR=p.RFDetrPreTrainedModel,SR=p.RTDetrForObjectDetection,FR=p.RTDetrImageProcessor,IR=p.RTDetrModel,AR=p.RTDetrObjectDetectionOutput,$R=p.RTDetrPreTrainedModel,DR=p.RTDetrV2ForObjectDetection,OR=p.RTDetrV2Model,LR=p.RTDetrV2ObjectDetectionOutput,BR=p.RTDetrV2PreTrainedModel,zR=p.RawAudio,RR=p.RawImage,NR=p.RawVideo,jR=p.RawVideoFrame,VR=p.RepetitionPenaltyLogitsProcessor,WR=p.ResNetForImageClassification,UR=p.ResNetModel,GR=p.ResNetPreTrainedModel,KR=p.RoFormerForMaskedLM,HR=p.RoFormerForQuestionAnswering,qR=p.RoFormerForSequenceClassification,QR=p.RoFormerForTokenClassification,XR=p.RoFormerModel,JR=p.RoFormerPreTrainedModel,YR=p.RoFormerTokenizer,ZR=p.RobertaForMaskedLM,eN=p.RobertaForQuestionAnswering,tN=p.RobertaForSequenceClassification,rN=p.RobertaForTokenClassification,sN=p.RobertaModel,oN=p.RobertaPreTrainedModel,aN=p.RobertaTokenizer,nN=p.Sam2ImageProcessor,iN=p.Sam2ImageSegmentationOutput,lN=p.Sam2Model,cN=p.Sam2PreTrainedModel,dN=p.Sam2Processor,uN=p.Sam2VideoProcessor,_N=p.Sam3ImageProcessor,pN=p.Sam3TrackerModel,mN=p.SamImageProcessor,hN=p.SamImageSegmentationOutput,fN=p.SamModel,gN=p.SamPreTrainedModel,MN=p.SamProcessor,wN=p.SapiensForDepthEstimation,bN=p.SapiensForNormalEstimation,vN=p.SapiensForSemanticSegmentation,xN=p.SapiensPreTrainedModel,yN=p.SeamlessM4TFeatureExtractor,TN=p.SegformerFeatureExtractor,PN=p.SegformerForImageClassification,EN=p.SegformerForSemanticSegmentation,kN=p.SegformerImageProcessor,CN=p.SegformerModel,SN=p.SegformerPreTrainedModel,FN=p.Seq2SeqLMOutput,IN=p.SequenceClassifierOutput,AN=p.SiglipImageProcessor,$N=p.SiglipModel,DN=p.SiglipPreTrainedModel,ON=p.SiglipTextModel,LN=p.SiglipTokenizer,BN=p.SiglipVisionModel,zN=p.SmolLM3ForCausalLM,RN=p.SmolLM3M
odel,NN=p.SmolLM3PreTrainedModel,jN=p.SmolVLMForConditionalGeneration,VN=p.SmolVLMImageProcessor,WN=p.SmolVLMProcessor,UN=p.SnacDecoderModel,GN=p.SnacEncoderModel,KN=p.SnacFeatureExtractor,HN=p.SnacModel,qN=p.SnacPreTrainedModel,QN=p.SpeechT5FeatureExtractor,XN=p.SpeechT5ForSpeechToText,JN=p.SpeechT5ForTextToSpeech,YN=p.SpeechT5HifiGan,ZN=p.SpeechT5Model,ej=p.SpeechT5PreTrainedModel,tj=p.SpeechT5Processor,rj=p.SpeechT5Tokenizer,sj=p.SqueezeBertForMaskedLM,oj=p.SqueezeBertForQuestionAnswering,aj=p.SqueezeBertForSequenceClassification,nj=p.SqueezeBertModel,ij=p.SqueezeBertPreTrainedModel,lj=p.SqueezeBertTokenizer,cj=p.StableLmForCausalLM,dj=p.StableLmModel,uj=p.StableLmPreTrainedModel,_j=p.Starcoder2ForCausalLM,pj=p.Starcoder2Model,mj=p.Starcoder2PreTrainedModel,hj=p.StoppingCriteria,fj=p.StoppingCriteriaList,gj=p.StyleTextToSpeech2Model,Mj=p.StyleTextToSpeech2PreTrainedModel,wj=p.SummarizationPipeline,bj=p.SupertonicForConditionalGeneration,vj=p.SupertonicPreTrainedModel,xj=p.SuppressTokensAtBeginLogitsProcessor,yj=p.Swin2SRForImageSuperResolution,Tj=p.Swin2SRImageProcessor,Pj=p.Swin2SRModel,Ej=p.Swin2SRPreTrainedModel,kj=p.SwinForImageClassification,Cj=p.SwinForSemanticSegmentation,Sj=p.SwinModel,Fj=p.SwinPreTrainedModel,Ij=p.T5ForConditionalGeneration,Aj=p.T5Model,$j=p.T5PreTrainedModel,Dj=p.T5Tokenizer,Oj=p.TableTransformerForObjectDetection,Lj=p.TableTransformerModel,Bj=p.TableTransformerObjectDetectionOutput,zj=p.TableTransformerPreTrainedModel,Rj=p.TemperatureLogitsWarper,Nj=p.Tensor,jj=p.Text2TextGenerationPipeline,Vj=p.TextClassificationPipeline,Wj=p.TextGenerationPipeline,Uj=p.TextStreamer,Gj=p.TextToAudioPipeline,Kj=p.TokenClassificationPipeline,Hj=p.TokenClassifierOutput,qj=p.TokenizerModel,Qj=p.TopKLogitsWarper,Xj=p.TopPLogitsWarper,Jj=p.TrOCRForCausalLM,Yj=p.TrOCRPreTrainedModel,Zj=p.TranslationPipeline,eV=p.UltravoxModel,tV=p.UltravoxPreTrainedModel,rV=p.UltravoxProcessor,sV=p.UniSpeechForCTC,oV=p.UniSpeechForSequenceClassification,aV=p.UniSpeechModel,n
V=p.UniSpeechPreTrainedModel,iV=p.UniSpeechSatForAudioFrameClassification,lV=p.UniSpeechSatForCTC,cV=p.UniSpeechSatForSequenceClassification,dV=p.UniSpeechSatModel,uV=p.UniSpeechSatPreTrainedModel,_V=p.VLChatProcessor,pV=p.VLMImageProcessor,mV=p.VaultGemmaForCausalLM,hV=p.VaultGemmaModel,fV=p.VaultGemmaPreTrainedModel,gV=p.ViTFeatureExtractor,MV=p.ViTForImageClassification,wV=p.ViTImageProcessor,bV=p.ViTMAEModel,vV=p.ViTMAEPreTrainedModel,xV=p.ViTMSNForImageClassification,yV=p.ViTMSNModel,TV=p.ViTMSNPreTrainedModel,PV=p.ViTModel,EV=p.ViTPreTrainedModel,kV=p.VisionEncoderDecoderModel,CV=p.VitMatteForImageMatting,SV=p.VitMatteImageProcessor,FV=p.VitMattePreTrainedModel,IV=p.VitPoseForPoseEstimation,AV=p.VitPoseImageProcessor,$V=p.VitPosePreTrainedModel,DV=p.VitsModel,OV=p.VitsModelOutput,LV=p.VitsPreTrainedModel,BV=p.VitsTokenizer,zV=p.VoxtralForConditionalGeneration,RV=p.VoxtralProcessor,NV=p.Wav2Vec2BertForCTC,jV=p.Wav2Vec2BertForSequenceClassification,VV=p.Wav2Vec2BertModel,WV=p.Wav2Vec2BertPreTrainedModel,UV=p.Wav2Vec2CTCTokenizer,GV=p.Wav2Vec2FeatureExtractor,KV=p.Wav2Vec2ForAudioFrameClassification,HV=p.Wav2Vec2ForCTC,qV=p.Wav2Vec2ForSequenceClassification,QV=p.Wav2Vec2Model,XV=p.Wav2Vec2PreTrainedModel,JV=p.Wav2Vec2Processor,YV=p.Wav2Vec2ProcessorWithLM,ZV=p.WavLMForAudioFrameClassification,e4=p.WavLMForCTC,t4=p.WavLMForSequenceClassification,r4=p.WavLMForXVector,s4=p.WavLMModel,o4=p.WavLMPreTrainedModel,a4=p.WeSpeakerFeatureExtractor,n4=p.WeSpeakerResNetModel,i4=p.WeSpeakerResNetPreTrainedModel,l4=p.WhisperFeatureExtractor,c4=p.WhisperForConditionalGeneration,d4=p.WhisperModel,u4=p.WhisperPreTrainedModel,_4=p.WhisperProcessor,A0=p.WhisperTextStreamer,p4=p.WhisperTimeStampLogitsProcessor,m4=p.WhisperTokenizer,h4=p.XLMForQuestionAnswering,f4=p.XLMForSequenceClassification,g4=p.XLMForTokenClassification,M4=p.XLMModel,w4=p.XLMPreTrainedModel,b4=p.XLMRobertaForMaskedLM,v4=p.XLMRobertaForQuestionAnswering,x4=p.XLMRobertaForSequenceClassification,y4=p.XLMRobertaForTo
kenClassification,T4=p.XLMRobertaModel,P4=p.XLMRobertaPreTrainedModel,E4=p.XLMRobertaTokenizer,k4=p.XLMTokenizer,C4=p.XLMWithLMHeadModel,S4=p.XVectorOutput,F4=p.YolosFeatureExtractor,I4=p.YolosForObjectDetection,A4=p.YolosImageProcessor,$4=p.YolosModel,D4=p.YolosObjectDetectionOutput,O4=p.YolosPreTrainedModel,L4=p.ZeroShotAudioClassificationPipeline,B4=p.ZeroShotClassificationPipeline,z4=p.ZeroShotImageClassificationPipeline,R4=p.ZeroShotObjectDetectionPipeline,N4=p.bankers_round,j4=p.cat,V4=p.cos_sim,W4=p.dot,U4=p.dynamic_time_warping,G4=p.env,K4=p.full,H4=p.full_like,q4=p.getCacheShapes,Q4=p.hamming,X4=p.hanning,J4=p.interpolate,Y4=p.interpolate_4d,Z4=p.interpolate_data,eW=p.is_chinese_char,tW=p.layer_norm,rW=p.load_image,sW=p.load_video,oW=p.log_softmax,aW=p.magnitude,nW=p.matmul,iW=p.max,lW=p.mean,cW=p.mean_pooling,dW=p.medianFilter,uW=p.mel_filter_bank,_W=p.min,pW=p.ones,mW=p.ones_like,hW=p.permute,fW=p.permute_data,$0=p.pipeline,gW=p.quantize_embeddings,MW=p.rand,wW=p.randn,bW=p.read_audio,vW=p.rfft,xW=p.round,yW=p.slice,TW=p.softmax,PW=p.spectrogram,EW=p.stack,kW=p.std_mean,CW=p.topk,SW=p.window_function,FW=p.zeros,IW=p.zeros_like;async function D0(e){let{spec:r,onLoading:t}=e;return await $0(e.task,r.model,{device:r.device,dtype:r.dtype,progress_callback:o=>{t({total:o.total,progress:o.progress})}})}async function O0(e){let{pipe:r,spec:t,request:s,callbacks:o}=e;if(!r.processor.feature_extractor)throw new Error("no feature_extractor");let a=r.processor.feature_extractor?.config.chunk_length/r.model.config.max_source_positions,n=0,i=null,l=0,c=0,_=t.chunkLength-t.strideLength,u=()=>{let x=n*_;return Math.min(x/s.duration,1)},d=r.tokenizer,g=new A0(d,{time_precision:a,token_callback_function:()=>{i??=performance.now(),++l>1&&(c=l/(performance.now()-i)*1e3)},callback_function:x=>{o.onTranscription(x),o.onReport({tokensPerSecond:c,progress:u()})},on_finalize:()=>{i=null,l=0,n++,o.onReport({tokensPerSecond:c,progress:u()})}}),h=await r(new 
Float32Array(s.audio),{top_k:0,do_sample:!1,chunk_length_s:t.chunkLength,stride_length_s:t.strideLength,language:s.language,task:"transcribe",return_timestamps:"word",force_full_sequences:!1,streamer:g});return{text:h.text,chunks:h.chunks}}var L0=ls(),ME=e=>Of(async r=>{L0.resolve({spec:r,pipe:await D0({spec:r,task:"automatic-speech-recognition",onLoading:t=>e.loading(t)})})});await Yf.worker(e=>({prepare:ME(e.host),async transcribe(t){let{pipe:s,spec:o}=await L0.promise;return O0({pipe:s,spec:o,request:t,callbacks:{onReport:a=>e.host.deliverReport(a),onTranscription:a=>e.host.deliverTranscription(a)}})}}));
|
|
2852
2852
|
/*! Bundled license information:
|
|
2853
2853
|
|
|
2854
2854
|
onnxruntime-web/dist/ort.bundle.min.mjs:
|