@huggingface/transformers 4.0.0-next.2 → 4.0.0-next.3
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +2 -2
- package/dist/ort-wasm-simd-threaded.jsep.mjs +23 -23
- package/dist/transformers.js +32 -18
- package/dist/transformers.min.js +18 -18
- package/dist/transformers.node.cjs +23 -9
- package/dist/transformers.node.min.cjs +4 -4
- package/dist/transformers.node.min.mjs +4 -4
- package/dist/transformers.node.mjs +23 -9
- package/dist/transformers.web.js +16 -2
- package/dist/transformers.web.min.js +15 -15
- package/package.json +2 -2
- package/src/env.js +1 -1
- package/src/generation/parameters.js +1 -1
- package/src/generation/streamers.js +21 -0
- package/src/models/modeling_utils.js +1 -1
- package/src/pipelines/automatic-speech-recognition.js +1 -1
- package/src/pipelines/document-question-answering.js +1 -1
- package/src/pipelines/image-to-text.js +2 -2
- package/src/pipelines/summarization.js +1 -1
- package/src/pipelines/text-generation.js +1 -1
- package/src/pipelines/text2text-generation.js +1 -1
- package/src/pipelines/translation.js +1 -1
- package/types/generation/parameters.d.ts +1 -1
- package/types/generation/parameters.d.ts.map +1 -1
- package/types/generation/streamers.d.ts +1 -0
- package/types/generation/streamers.d.ts.map +1 -1
- package/types/models/modeling_utils.d.ts +2 -2
- package/types/models/modeling_utils.d.ts.map +1 -1
- package/types/pipelines/automatic-speech-recognition.d.ts +2 -2
- package/types/pipelines/automatic-speech-recognition.d.ts.map +1 -1
- package/types/pipelines/document-question-answering.d.ts +2 -2
- package/types/pipelines/document-question-answering.d.ts.map +1 -1
- package/types/pipelines/image-to-text.d.ts +4 -4
- package/types/pipelines/image-to-text.d.ts.map +1 -1
- package/types/pipelines/summarization.d.ts +2 -2
- package/types/pipelines/summarization.d.ts.map +1 -1
- package/types/pipelines/text-generation.d.ts +2 -2
- package/types/pipelines/text-generation.d.ts.map +1 -1
- package/types/pipelines/text2text-generation.d.ts +3 -3
- package/types/pipelines/text2text-generation.d.ts.map +1 -1
- package/types/pipelines/translation.d.ts +2 -2
- package/types/pipelines/translation.d.ts.map +1 -1
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
var aS=Object.create;var Zc=Object.defineProperty;var iS=Object.getOwnPropertyDescriptor;var lS=Object.getOwnPropertyNames;var cS=Object.getPrototypeOf,uS=Object.prototype.hasOwnProperty;var cs=(t,e)=>{for(var r in e)Zc(t,r,{get:e[r],enumerable:!0})},wv=(t,e,r,s)=>{if(e&&typeof e=="object"||typeof e=="function")for(let n of lS(e))!uS.call(t,n)&&n!==r&&Zc(t,n,{get:()=>e[n],enumerable:!(s=iS(e,n))||s.enumerable});return t};var Ur=(t,e,r)=>(r=t!=null?aS(cS(t)):{},wv(e||!t||!t.__esModule?Zc(r,"default",{value:t,enumerable:!0}):r,t)),pS=t=>wv(Zc({},"__esModule",{value:!0}),t);var fz={};cs(fz,{ASTFeatureExtractor:()=>Ep,ASTForAudioClassification:()=>pf,ASTModel:()=>uf,ASTPreTrainedModel:()=>Bn,AlbertForMaskedLM:()=>nf,AlbertForQuestionAnswering:()=>sf,AlbertForSequenceClassification:()=>rf,AlbertModel:()=>tf,AlbertPreTrainedModel:()=>Yr,AlbertTokenizer:()=>Pu,ApertusForCausalLM:()=>af,ApertusModel:()=>of,ApertusPreTrainedModel:()=>Rn,ArceeForCausalLM:()=>cf,ArceeModel:()=>lf,ArceePreTrainedModel:()=>Un,AudioClassificationPipeline:()=>kc,AutoConfig:()=>Xr,AutoFeatureExtractor:()=>Ze,AutoImageProcessor:()=>Le,AutoModel:()=>pr,AutoModelForAudioClassification:()=>cc,AutoModelForAudioFrameClassification:()=>sb,AutoModelForAudioTextToText:()=>lb,AutoModelForCTC:()=>lc,AutoModelForCausalLM:()=>tc,AutoModelForDepthEstimation:()=>dc,AutoModelForDocumentQuestionAnswering:()=>uc,AutoModelForImageClassification:()=>oc,AutoModelForImageFeatureExtraction:()=>fc,AutoModelForImageMatting:()=>nb,AutoModelForImageSegmentation:()=>Ba,AutoModelForImageTextToText:()=>ib,AutoModelForImageToImage:()=>pc,AutoModelForMaskGeneration:()=>tb,AutoModelForMaskedLM:()=>rc,AutoModelForNormalEstimation:()=>ob,AutoModelForObjectDetection:()=>ac,AutoModelForPoseEstimation:()=>ab,AutoModelForQuestionAnswering:()=>sc,AutoModelForSemanticSegmentation:()=>Da,AutoModelForSeq2SeqLM:()=>Zs,AutoModelForSequenceClassification:()=>Ua,AutoModelForSpeechSeq2Seq:()=>Jl,AutoModelForTextToSpectrogram:()=>Zl,AutoModelForT
extToWaveform:()=>ec,AutoModelForTokenClassification:()=>Ql,AutoModelForUniversalSegmentation:()=>Fa,AutoModelForVision2Seq:()=>nc,AutoModelForXVector:()=>rb,AutoModelForZeroShotObjectDetection:()=>ic,AutoProcessor:()=>lt,AutoTokenizer:()=>J,AutomaticSpeechRecognitionPipeline:()=>Ac,BackgroundRemovalPipeline:()=>Oc,BartForConditionalGeneration:()=>ff,BartForSequenceClassification:()=>mf,BartModel:()=>df,BartPretrainedModel:()=>Ls,BartTokenizer:()=>zu,BaseStreamer:()=>Vx,BeitFeatureExtractor:()=>Fp,BeitForImageClassification:()=>_f,BeitModel:()=>hf,BeitPreTrainedModel:()=>Dn,BertForMaskedLM:()=>wf,BertForQuestionAnswering:()=>bf,BertForSequenceClassification:()=>xf,BertForTokenClassification:()=>yf,BertModel:()=>gf,BertPreTrainedModel:()=>yr,BertTokenizer:()=>Lu,BitImageProcessor:()=>jp,BlenderbotForConditionalGeneration:()=>kf,BlenderbotModel:()=>vf,BlenderbotPreTrainedModel:()=>Fn,BlenderbotSmallForConditionalGeneration:()=>Af,BlenderbotSmallModel:()=>Ef,BlenderbotSmallPreTrainedModel:()=>jn,BlenderbotSmallTokenizer:()=>Nu,BlenderbotTokenizer:()=>$u,BloomForCausalLM:()=>Tf,BloomModel:()=>Mf,BloomPreTrainedModel:()=>Gn,BloomTokenizer:()=>Ru,CLIPFeatureExtractor:()=>qp,CLIPImageProcessor:()=>wi,CLIPModel:()=>Nf,CLIPPreTrainedModel:()=>er,CLIPSegForImageSegmentation:()=>Df,CLIPSegModel:()=>Bf,CLIPSegPreTrainedModel:()=>Xn,CLIPTextModel:()=>$f,CLIPTextModelWithProjection:()=>Hn,CLIPTokenizer:()=>Bu,CLIPVisionModel:()=>Rf,CLIPVisionModelWithProjection:()=>Uf,CamembertForMaskedLM:()=>Of,CamembertForQuestionAnswering:()=>Pf,CamembertForSequenceClassification:()=>If,CamembertForTokenClassification:()=>Cf,CamembertModel:()=>Sf,CamembertPreTrainedModel:()=>br,CamembertTokenizer:()=>Uu,ChatterboxFeatureExtractor:()=>Ap,ChatterboxModel:()=>qn,ChatterboxPreTrainedModel:()=>Ji,ChatterboxProcessor:()=>$p,ChineseCLIPFeatureExtractor:()=>Gp,ChineseCLIPModel:()=>zf,ChineseCLIPPreTrainedModel:()=>Zi,ClapAudioModelWithProjection:()=>Vn,ClapFeatureExtractor:()=>Mp,ClapModel:()=>Lf,Clap
PreTrainedModel:()=>Ns,ClapTextModelWithProjection:()=>Wn,ClassifierFreeGuidanceLogitsProcessor:()=>qi,CodeGenForCausalLM:()=>jf,CodeGenModel:()=>Ff,CodeGenPreTrainedModel:()=>Kn,CodeGenTokenizer:()=>Fu,CodeLlamaTokenizer:()=>Du,CohereForCausalLM:()=>qf,CohereModel:()=>Gf,CoherePreTrainedModel:()=>Yn,CohereTokenizer:()=>ju,ConvBertForMaskedLM:()=>Vf,ConvBertForQuestionAnswering:()=>Kf,ConvBertForSequenceClassification:()=>Hf,ConvBertForTokenClassification:()=>Xf,ConvBertModel:()=>Wf,ConvBertPreTrainedModel:()=>vr,ConvBertTokenizer:()=>Gu,ConvNextFeatureExtractor:()=>Wp,ConvNextForImageClassification:()=>Qf,ConvNextImageProcessor:()=>xi,ConvNextModel:()=>Yf,ConvNextPreTrainedModel:()=>Qn,ConvNextV2ForImageClassification:()=>Zf,ConvNextV2Model:()=>Jf,ConvNextV2PreTrainedModel:()=>Jn,DFineForObjectDetection:()=>sm,DFineModel:()=>rm,DFinePreTrainedModel:()=>eo,DINOv3ConvNextModel:()=>Tm,DINOv3ConvNextPreTrainedModel:()=>al,DINOv3ViTImageProcessor:()=>Xp,DINOv3ViTModel:()=>Sm,DINOv3ViTPreTrainedModel:()=>il,DPTFeatureExtractor:()=>Yp,DPTForDepthEstimation:()=>$m,DPTImageProcessor:()=>vi,DPTModel:()=>Nm,DPTPreTrainedModel:()=>ao,DacDecoderModel:()=>ro,DacDecoderOutput:()=>tl,DacEncoderModel:()=>to,DacEncoderOutput:()=>el,DacFeatureExtractor:()=>Tn,DacModel:()=>nm,DacPreTrainedModel:()=>$s,DebertaForMaskedLM:()=>am,DebertaForQuestionAnswering:()=>cm,DebertaForSequenceClassification:()=>im,DebertaForTokenClassification:()=>lm,DebertaModel:()=>om,DebertaPreTrainedModel:()=>kr,DebertaTokenizer:()=>Wu,DebertaV2ForMaskedLM:()=>pm,DebertaV2ForQuestionAnswering:()=>mm,DebertaV2ForSequenceClassification:()=>dm,DebertaV2ForTokenClassification:()=>fm,DebertaV2Model:()=>um,DebertaV2PreTrainedModel:()=>Er,DebertaV2Tokenizer:()=>qu,DecisionTransformerModel:()=>hm,DecisionTransformerPreTrainedModel:()=>rl,DeiTFeatureExtractor:()=>Vp,DeiTForImageClassification:()=>gm,DeiTImageProcessor:()=>yi,DeiTModel:()=>_m,DeiTPreTrainedModel:()=>so,DepthAnythingForDepthEstimation:()=>wm,DepthAnything
PreTrainedModel:()=>sl,DepthEstimationPipeline:()=>Nc,DepthProForDepthEstimation:()=>xm,DepthProPreTrainedModel:()=>nl,DetrFeatureExtractor:()=>Hp,DetrForObjectDetection:()=>bm,DetrForSegmentation:()=>vm,DetrImageProcessor:()=>bi,DetrModel:()=>ym,DetrObjectDetectionOutput:()=>Us,DetrPreTrainedModel:()=>Rs,DetrSegmentationOutput:()=>ol,Dinov2ForImageClassification:()=>Em,Dinov2Model:()=>km,Dinov2PreTrainedModel:()=>no,Dinov2WithRegistersForImageClassification:()=>Mm,Dinov2WithRegistersModel:()=>Am,Dinov2WithRegistersPreTrainedModel:()=>oo,DistilBertForMaskedLM:()=>zm,DistilBertForQuestionAnswering:()=>Pm,DistilBertForSequenceClassification:()=>Im,DistilBertForTokenClassification:()=>Cm,DistilBertModel:()=>Om,DistilBertPreTrainedModel:()=>Ar,DistilBertTokenizer:()=>Vu,DocumentQuestionAnsweringPipeline:()=>zc,DonutFeatureExtractor:()=>Kp,DonutImageProcessor:()=>Ms,DonutSwinModel:()=>Lm,DonutSwinPreTrainedModel:()=>ll,EdgeTamModel:()=>xw,EfficientNetForImageClassification:()=>Um,EfficientNetImageProcessor:()=>Qp,EfficientNetModel:()=>Rm,EfficientNetPreTrainedModel:()=>io,ElectraForMaskedLM:()=>Dm,ElectraForQuestionAnswering:()=>Gm,ElectraForSequenceClassification:()=>Fm,ElectraForTokenClassification:()=>jm,ElectraModel:()=>Bm,ElectraPreTrainedModel:()=>Mr,ElectraTokenizer:()=>Hu,EncodecFeatureExtractor:()=>Mn,EosTokenCriteria:()=>Xi,Ernie4_5ForCausalLM:()=>Wm,Ernie4_5Model:()=>qm,Ernie4_5PretrainedModel:()=>lo,EsmForMaskedLM:()=>Hm,EsmForSequenceClassification:()=>Xm,EsmForTokenClassification:()=>Km,EsmModel:()=>Vm,EsmPreTrainedModel:()=>Qr,EsmTokenizer:()=>Xu,ExaoneForCausalLM:()=>Qm,ExaoneModel:()=>Ym,ExaonePreTrainedModel:()=>co,FalconForCausalLM:()=>Zm,FalconH1ForCausalLM:()=>th,FalconH1Model:()=>eh,FalconH1PreTrainedModel:()=>po,FalconModel:()=>Jm,FalconPreTrainedModel:()=>uo,FalconTokenizer:()=>Ku,FastViTForImageClassification:()=>sh,FastViTModel:()=>rh,FastViTPreTrainedModel:()=>fo,FeatureExtractionPipeline:()=>$c,FeatureExtractor:()=>ze,FillMaskPipeline:()=>wc,F
lorence2ForConditionalGeneration:()=>nh,Florence2PreTrainedModel:()=>cl,Florence2Processor:()=>Md,ForcedBOSTokenLogitsProcessor:()=>$i,ForcedEOSTokenLogitsProcessor:()=>Ri,GLPNFeatureExtractor:()=>Jp,GLPNForDepthEstimation:()=>mh,GLPNModel:()=>fh,GLPNPreTrainedModel:()=>xo,GPT2LMHeadModel:()=>Eh,GPT2Model:()=>kh,GPT2PreTrainedModel:()=>Eo,GPT2Tokenizer:()=>Ju,GPTBigCodeForCausalLM:()=>_h,GPTBigCodeModel:()=>hh,GPTBigCodePreTrainedModel:()=>yo,GPTJForCausalLM:()=>Mh,GPTJModel:()=>Ah,GPTJPreTrainedModel:()=>Ao,GPTNeoForCausalLM:()=>wh,GPTNeoModel:()=>gh,GPTNeoPreTrainedModel:()=>bo,GPTNeoXForCausalLM:()=>yh,GPTNeoXModel:()=>xh,GPTNeoXPreTrainedModel:()=>vo,GPTNeoXTokenizer:()=>Qu,Gemma2ForCausalLM:()=>lh,Gemma2Model:()=>ih,Gemma2PreTrainedModel:()=>ho,Gemma3ForCausalLM:()=>uh,Gemma3Model:()=>ch,Gemma3PreTrainedModel:()=>_o,Gemma3nAudioFeatureExtractor:()=>Tp,Gemma3nForConditionalGeneration:()=>go,Gemma3nPreTrainedModel:()=>ul,Gemma3nProcessor:()=>Td,GemmaForCausalLM:()=>ah,GemmaModel:()=>oh,GemmaPreTrainedModel:()=>mo,GemmaTokenizer:()=>Yu,GlmForCausalLM:()=>dh,GlmModel:()=>ph,GlmPreTrainedModel:()=>wo,GptOssForCausalLM:()=>vh,GptOssModel:()=>bh,GptOssPreTrainedModel:()=>ko,GraniteForCausalLM:()=>Sh,GraniteModel:()=>Th,GraniteMoeHybridForCausalLM:()=>Ih,GraniteMoeHybridModel:()=>Oh,GraniteMoeHybridPreTrainedModel:()=>To,GranitePreTrainedModel:()=>Mo,GroundingDinoForObjectDetection:()=>Ch,GroundingDinoImageProcessor:()=>Zp,GroundingDinoPreTrainedModel:()=>pl,GroundingDinoProcessor:()=>Sd,GroupViTModel:()=>Ph,GroupViTPreTrainedModel:()=>dl,HeliumForCausalLM:()=>Lh,HeliumModel:()=>zh,HeliumPreTrainedModel:()=>So,HerbertTokenizer:()=>Zu,HieraForImageClassification:()=>$h,HieraModel:()=>Nh,HieraPreTrainedModel:()=>Oo,HubertForCTC:()=>Gh,HubertForSequenceClassification:()=>qh,HubertModel:()=>jh,HubertPreTrainedModel:()=>Fh,HunYuanDenseV1ForCausalLM:()=>Vh,HunYuanDenseV1Model:()=>Wh,HunYuanDenseV1PreTrainedModel:()=>Io,IJepaForImageClassification:()=>Kh,IJepaModel:()=>Xh,IJe
paPreTrainedModel:()=>Co,Idefics3ForConditionalGeneration:()=>ml,Idefics3ImageProcessor:()=>ki,Idefics3PreTrainedModel:()=>fl,Idefics3Processor:()=>zi,ImageClassificationPipeline:()=>Sc,ImageFeatureExtractionPipeline:()=>Rc,ImageFeatureExtractor:()=>W,ImageProcessor:()=>W,ImageSegmentationPipeline:()=>en,ImageToImagePipeline:()=>Lc,ImageToTextPipeline:()=>Tc,InterruptableStoppingCriteria:()=>V0,JAISLMHeadModel:()=>Qh,JAISModel:()=>Yh,JAISPreTrainedModel:()=>Po,JinaCLIPImageProcessor:()=>td,JinaCLIPModel:()=>Jh,JinaCLIPPreTrainedModel:()=>Bs,JinaCLIPProcessor:()=>Id,JinaCLIPTextModel:()=>zo,JinaCLIPVisionModel:()=>Zh,Lfm2ForCausalLM:()=>t_,Lfm2Model:()=>e_,Lfm2MoeForCausalLM:()=>s_,Lfm2MoeModel:()=>r_,Lfm2MoePreTrainedModel:()=>No,Lfm2PreTrainedModel:()=>Lo,LiteWhisperForConditionalGeneration:()=>Cx,Llama4ForCausalLM:()=>a_,Llama4PreTrainedModel:()=>hl,LlamaForCausalLM:()=>o_,LlamaModel:()=>n_,LlamaPreTrainedModel:()=>$o,LlamaTokenizer:()=>ep,LlavaForConditionalGeneration:()=>Ds,LlavaOnevisionForConditionalGeneration:()=>Ds,LlavaOnevisionImageProcessor:()=>rd,LlavaPreTrainedModel:()=>_l,LlavaProcessor:()=>Cd,LlavaQwen2ForCausalLM:()=>l_,LogitsProcessor:()=>Nt,LogitsProcessorList:()=>Kr,LogitsWarper:()=>Nn,LongT5ForConditionalGeneration:()=>u_,LongT5Model:()=>c_,LongT5PreTrainedModel:()=>Ro,M2M100ForConditionalGeneration:()=>d_,M2M100Model:()=>p_,M2M100PreTrainedModel:()=>Uo,M2M100Tokenizer:()=>tp,MBart50Tokenizer:()=>sp,MBartForCausalLM:()=>y_,MBartForConditionalGeneration:()=>w_,MBartForSequenceClassification:()=>x_,MBartModel:()=>g_,MBartPreTrainedModel:()=>Jr,MBartTokenizer:()=>vn,MPNetForMaskedLM:()=>ng,MPNetForQuestionAnswering:()=>ig,MPNetForSequenceClassification:()=>og,MPNetForTokenClassification:()=>ag,MPNetModel:()=>sg,MPNetPreTrainedModel:()=>Tr,MPNetTokenizer:()=>ap,MT5ForConditionalGeneration:()=>pg,MT5Model:()=>ug,MT5PreTrainedModel:()=>Yo,MarianMTModel:()=>m_,MarianModel:()=>f_,MarianPreTrainedModel:()=>Bo,MarianTokenizer:()=>rp,Mask2FormerImageProcess
or:()=>nd,MaskFormerFeatureExtractor:()=>sd,MaskFormerForInstanceSegmentation:()=>__,MaskFormerImageProcessor:()=>Ts,MaskFormerModel:()=>h_,MaskFormerPreTrainedModel:()=>Do,MaxLengthCriteria:()=>Hi,Metric3DForDepthEstimation:()=>b_,Metric3DPreTrainedModel:()=>gl,Metric3Dv2ForDepthEstimation:()=>v_,Metric3Dv2PreTrainedModel:()=>wl,MgpstrForSceneTextRecognition:()=>k_,MgpstrModelOutput:()=>xl,MgpstrPreTrainedModel:()=>yl,MgpstrProcessor:()=>Pd,MgpstrTokenizer:()=>np,MimiDecoderModel:()=>jo,MimiDecoderOutput:()=>vl,MimiEncoderModel:()=>Fo,MimiEncoderOutput:()=>bl,MimiModel:()=>E_,MimiPreTrainedModel:()=>Fs,MinLengthLogitsProcessor:()=>Fi,MinNewTokensLengthLogitsProcessor:()=>ji,MistralForCausalLM:()=>M_,MistralModel:()=>A_,MistralPreTrainedModel:()=>Go,MobileBertForMaskedLM:()=>S_,MobileBertForQuestionAnswering:()=>I_,MobileBertForSequenceClassification:()=>O_,MobileBertModel:()=>T_,MobileBertPreTrainedModel:()=>Zr,MobileBertTokenizer:()=>op,MobileLLMForCausalLM:()=>P_,MobileLLMModel:()=>C_,MobileLLMPreTrainedModel:()=>qo,MobileNetV1FeatureExtractor:()=>od,MobileNetV1ForImageClassification:()=>L_,MobileNetV1ForSemanticSegmentation:()=>N_,MobileNetV1ImageProcessor:()=>Ei,MobileNetV1Model:()=>z_,MobileNetV1PreTrainedModel:()=>js,MobileNetV2FeatureExtractor:()=>ad,MobileNetV2ForImageClassification:()=>R_,MobileNetV2ForSemanticSegmentation:()=>U_,MobileNetV2ImageProcessor:()=>Ai,MobileNetV2Model:()=>$_,MobileNetV2PreTrainedModel:()=>Gs,MobileNetV3FeatureExtractor:()=>id,MobileNetV3ForImageClassification:()=>D_,MobileNetV3ForSemanticSegmentation:()=>F_,MobileNetV3ImageProcessor:()=>Mi,MobileNetV3Model:()=>B_,MobileNetV3PreTrainedModel:()=>qs,MobileNetV4FeatureExtractor:()=>ld,MobileNetV4ForImageClassification:()=>G_,MobileNetV4ForSemanticSegmentation:()=>q_,MobileNetV4ImageProcessor:()=>Ti,MobileNetV4Model:()=>j_,MobileNetV4PreTrainedModel:()=>Ws,MobileViTFeatureExtractor:()=>cd,MobileViTForImageClassification:()=>V_,MobileViTImageProcessor:()=>Si,MobileViTModel:()=>W_,Mobi
leViTPreTrainedModel:()=>Wo,MobileViTV2ForImageClassification:()=>X_,MobileViTV2Model:()=>H_,MobileViTV2PreTrainedModel:()=>Vo,ModernBertDecoderForCausalLM:()=>eg,ModernBertDecoderModel:()=>Z_,ModernBertDecoderPreTrainedModel:()=>Ho,ModernBertForMaskedLM:()=>Y_,ModernBertForSequenceClassification:()=>Q_,ModernBertForTokenClassification:()=>J_,ModernBertModel:()=>K_,ModernBertPreTrainedModel:()=>es,Moondream1ForConditionalGeneration:()=>i_,MoonshineFeatureExtractor:()=>Sp,MoonshineForConditionalGeneration:()=>rg,MoonshineModel:()=>tg,MoonshinePreTrainedModel:()=>Xo,MoonshineProcessor:()=>zd,MptForCausalLM:()=>cg,MptModel:()=>lg,MptPreTrainedModel:()=>Ko,MultiModalityCausalLM:()=>dg,MultiModalityPreTrainedModel:()=>kl,MusicgenForCausalLM:()=>mg,MusicgenForConditionalGeneration:()=>Jo,MusicgenModel:()=>fg,MusicgenPreTrainedModel:()=>Qo,NanoChatForCausalLM:()=>_g,NanoChatModel:()=>hg,NanoChatPreTrainedModel:()=>Zo,NeoBertForMaskedLM:()=>wg,NeoBertForQuestionAnswering:()=>bg,NeoBertForSequenceClassification:()=>xg,NeoBertForTokenClassification:()=>yg,NeoBertModel:()=>gg,NeoBertPreTrainedModel:()=>Sr,NllbTokenizer:()=>ip,NoBadWordsLogitsProcessor:()=>Gi,NoRepeatNGramLogitsProcessor:()=>Bi,NomicBertModel:()=>vg,NomicBertPreTrainedModel:()=>El,NougatImageProcessor:()=>ud,NougatTokenizer:()=>lp,OPTForCausalLM:()=>Pg,OPTModel:()=>Cg,OPTPreTrainedModel:()=>na,ObjectDetectionPipeline:()=>Cc,Olmo2ForCausalLM:()=>Mg,Olmo2Model:()=>Ag,Olmo2PreTrainedModel:()=>ta,Olmo3ForCausalLM:()=>Sg,Olmo3Model:()=>Tg,Olmo3PreTrainedModel:()=>ra,OlmoForCausalLM:()=>Eg,OlmoModel:()=>kg,OlmoPreTrainedModel:()=>ea,OpenELMForCausalLM:()=>Ig,OpenELMModel:()=>Og,OpenELMPreTrainedModel:()=>sa,OwlViTFeatureExtractor:()=>pd,OwlViTForObjectDetection:()=>$g,OwlViTImageProcessor:()=>Ss,OwlViTModel:()=>Ng,OwlViTPreTrainedModel:()=>aa,OwlViTProcessor:()=>Ld,Owlv2ForObjectDetection:()=>Lg,Owlv2ImageProcessor:()=>dd,Owlv2Model:()=>zg,Owlv2PreTrainedModel:()=>oa,PaliGemmaForConditionalGeneration:()=>Rg,PaliGemma
PreTrainedModel:()=>Al,PaliGemmaProcessor:()=>Nd,ParakeetFeatureExtractor:()=>Op,ParakeetForCTC:()=>Ug,ParakeetPreTrainedModel:()=>Ml,PatchTSMixerForPrediction:()=>Dg,PatchTSMixerModel:()=>Bg,PatchTSMixerPreTrainedModel:()=>ia,PatchTSTForPrediction:()=>jg,PatchTSTModel:()=>Fg,PatchTSTPreTrainedModel:()=>la,Phi3ForCausalLM:()=>Vg,Phi3Model:()=>Wg,Phi3PreTrainedModel:()=>ua,Phi3VForCausalLM:()=>pa,Phi3VImageProcessor:()=>fd,Phi3VPreTrainedModel:()=>Tl,Phi3VProcessor:()=>$d,PhiForCausalLM:()=>qg,PhiModel:()=>Gg,PhiPreTrainedModel:()=>ca,PixtralImageProcessor:()=>md,PixtralProcessor:()=>Rd,PreTrainedModel:()=>y,PreTrainedTokenizer:()=>j,PretrainedConfig:()=>Ni,Processor:()=>ne,PvtForImageClassification:()=>Xg,PvtImageProcessor:()=>hd,PvtModel:()=>Hg,PvtPreTrainedModel:()=>da,PyAnnoteFeatureExtractor:()=>Sn,PyAnnoteForAudioFrameClassification:()=>Yg,PyAnnoteModel:()=>Kg,PyAnnotePreTrainedModel:()=>fa,PyAnnoteProcessor:()=>Ud,QuestionAnsweringPipeline:()=>gc,Qwen2ForCausalLM:()=>Jg,Qwen2Model:()=>Qg,Qwen2PreTrainedModel:()=>ma,Qwen2Tokenizer:()=>cp,Qwen2VLForConditionalGeneration:()=>Zg,Qwen2VLImageProcessor:()=>_d,Qwen2VLPreTrainedModel:()=>Sl,Qwen2VLProcessor:()=>Bd,Qwen3ForCausalLM:()=>tw,Qwen3Model:()=>ew,Qwen3PreTrainedModel:()=>ha,RFDetrForObjectDetection:()=>ow,RFDetrModel:()=>nw,RFDetrObjectDetectionOutput:()=>Ol,RFDetrPreTrainedModel:()=>ga,RTDetrForObjectDetection:()=>tm,RTDetrImageProcessor:()=>gd,RTDetrModel:()=>em,RTDetrObjectDetectionOutput:()=>tr,RTDetrPreTrainedModel:()=>Zn,RTDetrV2ForObjectDetection:()=>gw,RTDetrV2Model:()=>_w,RTDetrV2ObjectDetectionOutput:()=>Il,RTDetrV2PreTrainedModel:()=>wa,RawAudio:()=>An,RawImage:()=>Xe,RawVideo:()=>Uc,RawVideoFrame:()=>ja,RepetitionPenaltyLogitsProcessor:()=>Di,ResNetForImageClassification:()=>sw,ResNetModel:()=>rw,ResNetPreTrainedModel:()=>_a,RoFormerForMaskedLM:()=>dw,RoFormerForQuestionAnswering:()=>hw,RoFormerForSequenceClassification:()=>fw,RoFormerForTokenClassification:()=>mw,RoFormerModel:()=>pw,RoFormerPreT
rainedModel:()=>Ir,RoFormerTokenizer:()=>pp,RobertaForMaskedLM:()=>iw,RobertaForQuestionAnswering:()=>uw,RobertaForSequenceClassification:()=>lw,RobertaForTokenClassification:()=>cw,RobertaModel:()=>aw,RobertaPreTrainedModel:()=>Or,RobertaTokenizer:()=>up,Sam2ImageProcessor:()=>In,Sam2ImageSegmentationOutput:()=>zl,Sam2Model:()=>xa,Sam2PreTrainedModel:()=>Ll,Sam2Processor:()=>Li,Sam2VideoProcessor:()=>Dd,Sam3ImageProcessor:()=>In,Sam3TrackerModel:()=>yw,SamImageProcessor:()=>In,SamImageSegmentationOutput:()=>Cl,SamModel:()=>ww,SamPreTrainedModel:()=>Pl,SamProcessor:()=>zn,SapiensFeatureExtractor:()=>wd,SapiensForDepthEstimation:()=>vw,SapiensForNormalEstimation:()=>kw,SapiensForSemanticSegmentation:()=>bw,SapiensImageProcessor:()=>Oi,SapiensPreTrainedModel:()=>Vs,SeamlessM4TFeatureExtractor:()=>Ip,SegformerFeatureExtractor:()=>xd,SegformerForImageClassification:()=>Aw,SegformerForSemanticSegmentation:()=>Mw,SegformerImageProcessor:()=>Ii,SegformerModel:()=>Ew,SegformerPreTrainedModel:()=>Hs,SiglipImageProcessor:()=>yd,SiglipModel:()=>Tw,SiglipPreTrainedModel:()=>ya,SiglipTextModel:()=>ba,SiglipTokenizer:()=>dp,SiglipVisionModel:()=>Sw,SmolLM3ForCausalLM:()=>Iw,SmolLM3Model:()=>Ow,SmolLM3PreTrainedModel:()=>va,SmolVLMForConditionalGeneration:()=>Hh,SmolVLMImageProcessor:()=>ki,SmolVLMProcessor:()=>zi,SnacDecoderModel:()=>Ea,SnacEncoderModel:()=>ka,SnacFeatureExtractor:()=>Cp,SnacModel:()=>Cw,SnacPreTrainedModel:()=>Xs,SpeechT5FeatureExtractor:()=>Pp,SpeechT5ForSpeechToText:()=>zw,SpeechT5ForTextToSpeech:()=>Lw,SpeechT5HifiGan:()=>Nw,SpeechT5Model:()=>Pw,SpeechT5PreTrainedModel:()=>Ks,SpeechT5Processor:()=>Fd,SpeechT5Tokenizer:()=>fp,SqueezeBertForMaskedLM:()=>Rw,SqueezeBertForQuestionAnswering:()=>Bw,SqueezeBertForSequenceClassification:()=>Uw,SqueezeBertModel:()=>$w,SqueezeBertPreTrainedModel:()=>ts,SqueezeBertTokenizer:()=>mp,StableLmForCausalLM:()=>Fw,StableLmModel:()=>Dw,StableLmPreTrainedModel:()=>Aa,Starcoder2ForCausalLM:()=>Gw,Starcoder2Model:()=>jw,Starcoder2
PreTrainedModel:()=>Ma,StoppingCriteria:()=>Is,StoppingCriteriaList:()=>Vi,StyleTextToSpeech2Model:()=>qw,StyleTextToSpeech2PreTrainedModel:()=>Nl,SummarizationPipeline:()=>xc,SupertonicForConditionalGeneration:()=>Ta,SupertonicPreTrainedModel:()=>$l,SuppressTokensAtBeginLogitsProcessor:()=>Os,Swin2SRForImageSuperResolution:()=>Kw,Swin2SRImageProcessor:()=>bd,Swin2SRModel:()=>Xw,Swin2SRPreTrainedModel:()=>Sa,SwinForImageClassification:()=>Vw,SwinForSemanticSegmentation:()=>Hw,SwinModel:()=>Ww,SwinPreTrainedModel:()=>Ys,T5ForConditionalGeneration:()=>Qw,T5Model:()=>Yw,T5PreTrainedModel:()=>Oa,T5Tokenizer:()=>hp,TableTransformerForObjectDetection:()=>Zw,TableTransformerModel:()=>Jw,TableTransformerObjectDetectionOutput:()=>Rl,TableTransformerPreTrainedModel:()=>Ia,TemperatureLogitsWarper:()=>Wi,Tensor:()=>U,Text2TextGenerationPipeline:()=>Lr,TextClassificationPipeline:()=>hc,TextGenerationPipeline:()=>bc,TextStreamer:()=>Hx,TextToAudioPipeline:()=>Mc,TokenClassificationPipeline:()=>_c,TokenizersBackend:()=>j,TopKLogitsWarper:()=>W0,TopPLogitsWarper:()=>q0,TrOCRForCausalLM:()=>ex,TrOCRPreTrainedModel:()=>Ul,TranslationPipeline:()=>yc,UltravoxModel:()=>Dl,UltravoxPreTrainedModel:()=>Bl,UltravoxProcessor:()=>jd,UniSpeechForCTC:()=>sx,UniSpeechForSequenceClassification:()=>nx,UniSpeechModel:()=>rx,UniSpeechPreTrainedModel:()=>Qs,UniSpeechSatForAudioFrameClassification:()=>lx,UniSpeechSatForCTC:()=>ax,UniSpeechSatForSequenceClassification:()=>ix,UniSpeechSatModel:()=>ox,UniSpeechSatPreTrainedModel:()=>rs,VLChatProcessor:()=>Od,VLMImageProcessor:()=>ed,VaultGemmaForCausalLM:()=>ux,VaultGemmaModel:()=>cx,VaultGemmaPreTrainedModel:()=>Ca,ViTFeatureExtractor:()=>vd,ViTForImageClassification:()=>fx,ViTImageProcessor:()=>Ci,ViTMAEModel:()=>mx,ViTMAEPreTrainedModel:()=>Fl,ViTMSNForImageClassification:()=>_x,ViTMSNModel:()=>hx,ViTMSNPreTrainedModel:()=>za,ViTModel:()=>dx,ViTPreTrainedModel:()=>Pa,VisionEncoderDecoderModel:()=>px,VitMatteForImageMatting:()=>gx,VitMatteImageProcesso
r:()=>kd,VitMattePreTrainedModel:()=>jl,VitPoseForPoseEstimation:()=>wx,VitPoseImageProcessor:()=>Ed,VitPosePreTrainedModel:()=>Gl,VitsModel:()=>xx,VitsModelOutput:()=>ql,VitsPreTrainedModel:()=>Wl,VitsTokenizer:()=>_p,VoxtralForConditionalGeneration:()=>tx,VoxtralProcessor:()=>qd,Wav2Vec2BertForCTC:()=>bx,Wav2Vec2BertForSequenceClassification:()=>vx,Wav2Vec2BertModel:()=>yx,Wav2Vec2BertPreTrainedModel:()=>Js,Wav2Vec2CTCTokenizer:()=>gp,Wav2Vec2FeatureExtractor:()=>zp,Wav2Vec2ForAudioFrameClassification:()=>Dh,Wav2Vec2ForCTC:()=>Uh,Wav2Vec2ForSequenceClassification:()=>Bh,Wav2Vec2Model:()=>Rh,Wav2Vec2PreTrainedModel:()=>Wt,Wav2Vec2Processor:()=>Wd,Wav2Vec2ProcessorWithLM:()=>Vd,WavLMForAudioFrameClassification:()=>Tx,WavLMForCTC:()=>Ex,WavLMForSequenceClassification:()=>Ax,WavLMForXVector:()=>Mx,WavLMModel:()=>kx,WavLMPreTrainedModel:()=>Cr,WeSpeakerFeatureExtractor:()=>Lp,WeSpeakerResNetModel:()=>Sx,WeSpeakerResNetPreTrainedModel:()=>Hl,WhisperFeatureExtractor:()=>Np,WhisperForConditionalGeneration:()=>Xl,WhisperModel:()=>Ix,WhisperPreTrainedModel:()=>La,WhisperProcessor:()=>Hd,WhisperTextStreamer:()=>cb,WhisperTimeStampLogitsProcessor:()=>Ui,WhisperTokenizer:()=>wp,XLMForQuestionAnswering:()=>$x,XLMForSequenceClassification:()=>Lx,XLMForTokenClassification:()=>Nx,XLMModel:()=>Px,XLMPreTrainedModel:()=>Pr,XLMRobertaForMaskedLM:()=>Ux,XLMRobertaForQuestionAnswering:()=>Fx,XLMRobertaForSequenceClassification:()=>Bx,XLMRobertaForTokenClassification:()=>Dx,XLMRobertaModel:()=>Rx,XLMRobertaPreTrainedModel:()=>zr,XLMRobertaTokenizer:()=>xp,XLMTokenizer:()=>yp,XLMWithLMHeadModel:()=>zx,XVectorOutput:()=>Vl,YolosFeatureExtractor:()=>Ad,YolosForObjectDetection:()=>Gx,YolosImageProcessor:()=>Pi,YolosModel:()=>jx,YolosObjectDetectionOutput:()=>Kl,YolosPreTrainedModel:()=>Na,YoutuForCausalLM:()=>Wx,YoutuModel:()=>qx,YoutuPreTrainedModel:()=>$a,ZeroShotAudioClassificationPipeline:()=>Ec,ZeroShotClassificationPipeline:()=>vc,ZeroShotImageClassificationPipeline:()=>Ic,ZeroShotObj
ectDetectionPipeline:()=>Pc,cat:()=>Ee,cos_sim:()=>mk,dot:()=>Cy,env:()=>De,full:()=>Ge,full_like:()=>yn,interpolate:()=>Su,interpolate_4d:()=>Pt,layer_norm:()=>dP,load_image:()=>fA,load_video:()=>s2,log_softmax:()=>pu,matmul:()=>I0,mean:()=>fi,mean_pooling:()=>C0,ones:()=>rt,ones_like:()=>mi,permute:()=>ZE,pipeline:()=>uz,quantize_embeddings:()=>L0,rand:()=>fP,randn:()=>z0,read_audio:()=>kp,rfft:()=>pP,slice:()=>di,softmax:()=>Oe,stack:()=>zt,std_mean:()=>Ou,topk:()=>Gt,zeros:()=>Iu,zeros_like:()=>Cu});module.exports=pS(fz);var yv=Ur(require("fs"),1),us=Ur(require("path"),1),bv=Ur(require("url"),1),yS={},dS="4.0.0-next.2",vv=typeof process<"u",kv=vv&&process?.release?.name==="node",Ha=!Tv(yv.default),Ev=!Tv(us.default),fS=typeof globalThis.Deno<"u",hz=typeof globalThis.Bun<"u",Av=typeof window<"u"&&typeof window.document<"u",Mv=typeof self<"u"&&["DedicatedWorkerGlobalScope","ServiceWorkerGlobalScope","SharedWorkerGlobalScope"].includes(self.constructor?.name),by=typeof self<"u"&&"caches"in self,mS=kv||typeof navigator<"u"&&"gpu"in navigator,hS=typeof navigator<"u"&&"ml"in navigator,_S=()=>{if(typeof navigator>"u")return!1;let t=navigator.userAgent,r=(navigator.vendor||"").indexOf("Apple")>-1,s=!t.match(/CriOS|FxiOS|EdgiOS|OPiOS|mercury|brave/i)&&!t.includes("Chrome")&&!t.includes("Android");return r&&s},gS=_S(),be=Object.freeze({IS_BROWSER_ENV:Av,IS_WEBWORKER_ENV:Mv,IS_WEB_CACHE_AVAILABLE:by,IS_WEBGPU_AVAILABLE:mS,IS_WEBNN_AVAILABLE:hS,IS_SAFARI:gS,IS_PROCESS_AVAILABLE:vv,IS_NODE_ENV:kv,IS_FS_AVAILABLE:Ha,IS_PATH_AVAILABLE:Ev}),vy=Ha&&Ev,eu="./";if(vy){let t=Object(yS).url;t?eu=us.default.dirname(us.default.dirname(bv.default.fileURLToPath(t))):typeof __dirname<"u"&&(eu=us.default.dirname(__dirname))}var 
wS=vy?us.default.join(eu,"/.cache/"):null,xv="/models/",xS=vy?us.default.join(eu,xv):xv,De={version:dS,backends:{onnx:{}},allowRemoteModels:!0,remoteHost:"https://huggingface.co/",remotePathTemplate:"{model}/resolve/{revision}/",allowLocalModels:!(Av||Mv),localModelPath:xS,useFS:Ha,useBrowserCache:by&&!fS,useFSCache:Ha,cacheDir:wS,useCustomCache:!1,customCache:null,useWasmCache:by||Ha,cacheKey:"transformers-cache"};function Tv(t){return Object.keys(t).length===0}var bS=class{constructor(t){this.trie=this._build_trie(t)}_build_trie(t){let e=Object.create(null);for(let r of t){let s=e;for(let n=0;n<r.length;++n){let o=r[n];s=s[o]??=Object.create(null)}s.end=r}return e}split(t){let e=[],r=t.length,s=0,n=0;for(;n<r;){let o=this.trie,a=null,i=n;for(;i<r&&(o=o[t[i]]);)o.end&&(a=o.end),++i;a?(n>s&&e.push(t.slice(s,n)),e.push(a),n+=a.length,s=n):++n}return s<r&&e.push(t.slice(s)),e}},Sv=bS,vS=class{constructor(t){this.content=t.content,this.id=t.id,this.single_word=t.single_word??!1,this.lstrip=t.lstrip??!1,this.rstrip=t.rstrip??!1,this.special=t.special??!1,this.normalized=t.normalized??!this.special}},kS=vS,Nv=(()=>{let t=[...Array.from({length:94},(n,o)=>o+33),...Array.from({length:12},(n,o)=>o+161),...Array.from({length:82},(n,o)=>o+174)],e=t.slice(),r=0;for(let n=0;n<256;++n)t.includes(n)||(t.push(n),e.push(256+r),r+=1);let s=e.map(n=>String.fromCharCode(n));return Object.fromEntries(t.map((n,o)=>[n,s[o]]))})(),ES=t=>Object.fromEntries(Object.entries(t).map(([e,r])=>[r,e])),AS=ES(Nv),Ov=".,!?\u2026\u3002\uFF0C\u3001\u0964\u06D4\u060C",MS=new Map([["(?i:'s|'t|'re|'ve|'m|'ll|'d)","(?:'([sS]|[tT]|[rR][eE]|[vV][eE]|[mM]|[lL][lL]|[dD]))"],["(?i:[sdmt]|ll|ve|re)","(?:[sS]|[dD]|[mM]|[tT]|[lL][lL]|[vV][eE]|[rR][eE])"],["[^\\r\\n\\p{L}\\p{N}]?+","[^\\r\\n\\p{L}\\p{N}]?"],["[^\\s\\p{L}\\p{N}]++","[^\\s\\p{L}\\p{N}]+"],[` ?[^(\\s|[${Ov}])]+`,` ?[^\\s${Ov}]+`]]),tu="\\p{P}\\u0021-\\u002F\\u003A-\\u0040\\u005B-\\u0060\\u007B-\\u007E",Ey=t=>t.replace(/ \./g,".").replace(/ 
\?/g,"?").replace(/ \!/g,"!").replace(/ ,/g,",").replace(/ \' /g,"'").replace(/ n't/g,"n't").replace(/ 'm/g,"'m").replace(/ 's/g,"'s").replace(/ 've/g,"'ve").replace(/ 're/g,"'re"),ru=(t,e=!0)=>{if(t.Regex!==void 0){let r=t.Regex.replace(/\\([#&~])/g,"$1");for(let[s,n]of MS)r=r.replaceAll(s,n);try{return new RegExp(r,"gu")}catch(s){if(!(s instanceof SyntaxError)||!s.message.toLowerCase().includes("invalid property name"))throw s;let n=!1,o=r.replace(/(\\[pP])\{([^}=]+)\}/g,(a,i,l)=>{try{return new RegExp(`\\p{${l}}`,"u"),`${i}{${l}}`}catch{return n=!0,`${i}{Script=${l}}`}});if(!n)throw s;try{return new RegExp(o,"gu")}catch{throw s}}}else if(t.String!==void 0){let r=TS(t.String);return new RegExp(e?r:`(${r})`,"gu")}else return console.warn("Unknown pattern type:",t),null},TS=t=>t.replace(/[.*+?^${}()|[\]\\]/g,"\\$&"),SS=(t,e,r)=>{let s=[],n=0;for(;n<t.length;){if(s.push(t[n]),(e.get(t[n])??r)!==r){++n;continue}for(;++n<t.length&&(e.get(t[n])??r)===r;)e.get(s.at(-1))!==r&&(s[s.length-1]+=t[n])}return s},OS=t=>t>=19968&&t<=40959||t>=13312&&t<=19903||t>=131072&&t<=173791||t>=173824&&t<=177983||t>=177984&&t<=178207||t>=178208&&t<=183983||t>=63744&&t<=64255||t>=194560&&t<=195103,IS=t=>Number.isInteger(t)||typeof t=="bigint",CS=t=>{let e=0;for(let r of t)++e;return e},PS=t=>$v(t.toLowerCase()),Ht=(...t)=>Array.prototype.concat.apply([],t),Ay=t=>new Map(Object.entries(t)),zS=(t,e)=>{let r=[],s=0;for(let n of t.matchAll(e)){let o=n[0];s<n.index&&r.push(t.slice(s,n.index)),o.length>0&&r.push(o),s=n.index+o.length}return s<t.length&&r.push(t.slice(s)),r},$v=t=>t.replace(/\p{M}/gu,""),Iv=(t,e,r=[])=>{if(!t||Array.isArray(t)||typeof t!="object")return`${e} must be a valid object`;for(let s of r)if(!(s in t))return`${e} must contain a "${s}" property`;return null},LS=t=>t.match(/\S+/g)||[],NS=class{constructor(){let t=function(...e){return t._call(...e)};return Object.setPrototypeOf(t,new.target.prototype)}},Xa=NS,$S=class extends 
Xa{constructor(t){super(),this.config=t}_call(t){return this.normalize(t)}},gr=$S,RS=class extends gr{tokenize_chinese_chars(t){let e=[];for(let r=0;r<t.length;++r){let s=t[r],n=s.charCodeAt(0);OS(n)?(e.push(" "),e.push(s),e.push(" ")):e.push(s)}return e.join("")}strip_accents(t){return t.normalize("NFD").replace(/\p{Mn}/gu,"")}is_control(t){switch(t){case" ":case`
|
|
1
|
+
var aS=Object.create;var Zc=Object.defineProperty;var iS=Object.getOwnPropertyDescriptor;var lS=Object.getOwnPropertyNames;var cS=Object.getPrototypeOf,uS=Object.prototype.hasOwnProperty;var cs=(t,e)=>{for(var r in e)Zc(t,r,{get:e[r],enumerable:!0})},wv=(t,e,r,s)=>{if(e&&typeof e=="object"||typeof e=="function")for(let n of lS(e))!uS.call(t,n)&&n!==r&&Zc(t,n,{get:()=>e[n],enumerable:!(s=iS(e,n))||s.enumerable});return t};var Ur=(t,e,r)=>(r=t!=null?aS(cS(t)):{},wv(e||!t||!t.__esModule?Zc(r,"default",{value:t,enumerable:!0}):r,t)),pS=t=>wv(Zc({},"__esModule",{value:!0}),t);var fz={};cs(fz,{ASTFeatureExtractor:()=>Ep,ASTForAudioClassification:()=>pf,ASTModel:()=>uf,ASTPreTrainedModel:()=>Bn,AlbertForMaskedLM:()=>nf,AlbertForQuestionAnswering:()=>sf,AlbertForSequenceClassification:()=>rf,AlbertModel:()=>tf,AlbertPreTrainedModel:()=>Yr,AlbertTokenizer:()=>Pu,ApertusForCausalLM:()=>af,ApertusModel:()=>of,ApertusPreTrainedModel:()=>Rn,ArceeForCausalLM:()=>cf,ArceeModel:()=>lf,ArceePreTrainedModel:()=>Un,AudioClassificationPipeline:()=>kc,AutoConfig:()=>Xr,AutoFeatureExtractor:()=>Ze,AutoImageProcessor:()=>Le,AutoModel:()=>pr,AutoModelForAudioClassification:()=>cc,AutoModelForAudioFrameClassification:()=>sb,AutoModelForAudioTextToText:()=>lb,AutoModelForCTC:()=>lc,AutoModelForCausalLM:()=>tc,AutoModelForDepthEstimation:()=>dc,AutoModelForDocumentQuestionAnswering:()=>uc,AutoModelForImageClassification:()=>oc,AutoModelForImageFeatureExtraction:()=>fc,AutoModelForImageMatting:()=>nb,AutoModelForImageSegmentation:()=>Ba,AutoModelForImageTextToText:()=>ib,AutoModelForImageToImage:()=>pc,AutoModelForMaskGeneration:()=>tb,AutoModelForMaskedLM:()=>rc,AutoModelForNormalEstimation:()=>ob,AutoModelForObjectDetection:()=>ac,AutoModelForPoseEstimation:()=>ab,AutoModelForQuestionAnswering:()=>sc,AutoModelForSemanticSegmentation:()=>Da,AutoModelForSeq2SeqLM:()=>Zs,AutoModelForSequenceClassification:()=>Ua,AutoModelForSpeechSeq2Seq:()=>Jl,AutoModelForTextToSpectrogram:()=>Zl,AutoModelForT
extToWaveform:()=>ec,AutoModelForTokenClassification:()=>Ql,AutoModelForUniversalSegmentation:()=>Fa,AutoModelForVision2Seq:()=>nc,AutoModelForXVector:()=>rb,AutoModelForZeroShotObjectDetection:()=>ic,AutoProcessor:()=>lt,AutoTokenizer:()=>J,AutomaticSpeechRecognitionPipeline:()=>Ac,BackgroundRemovalPipeline:()=>Oc,BartForConditionalGeneration:()=>ff,BartForSequenceClassification:()=>mf,BartModel:()=>df,BartPretrainedModel:()=>Ls,BartTokenizer:()=>zu,BaseStreamer:()=>Vx,BeitFeatureExtractor:()=>Fp,BeitForImageClassification:()=>_f,BeitModel:()=>hf,BeitPreTrainedModel:()=>Dn,BertForMaskedLM:()=>wf,BertForQuestionAnswering:()=>bf,BertForSequenceClassification:()=>xf,BertForTokenClassification:()=>yf,BertModel:()=>gf,BertPreTrainedModel:()=>yr,BertTokenizer:()=>Lu,BitImageProcessor:()=>jp,BlenderbotForConditionalGeneration:()=>kf,BlenderbotModel:()=>vf,BlenderbotPreTrainedModel:()=>Fn,BlenderbotSmallForConditionalGeneration:()=>Af,BlenderbotSmallModel:()=>Ef,BlenderbotSmallPreTrainedModel:()=>jn,BlenderbotSmallTokenizer:()=>Nu,BlenderbotTokenizer:()=>$u,BloomForCausalLM:()=>Tf,BloomModel:()=>Mf,BloomPreTrainedModel:()=>Gn,BloomTokenizer:()=>Ru,CLIPFeatureExtractor:()=>qp,CLIPImageProcessor:()=>wi,CLIPModel:()=>Nf,CLIPPreTrainedModel:()=>er,CLIPSegForImageSegmentation:()=>Df,CLIPSegModel:()=>Bf,CLIPSegPreTrainedModel:()=>Xn,CLIPTextModel:()=>$f,CLIPTextModelWithProjection:()=>Hn,CLIPTokenizer:()=>Bu,CLIPVisionModel:()=>Rf,CLIPVisionModelWithProjection:()=>Uf,CamembertForMaskedLM:()=>Of,CamembertForQuestionAnswering:()=>Pf,CamembertForSequenceClassification:()=>If,CamembertForTokenClassification:()=>Cf,CamembertModel:()=>Sf,CamembertPreTrainedModel:()=>br,CamembertTokenizer:()=>Uu,ChatterboxFeatureExtractor:()=>Ap,ChatterboxModel:()=>qn,ChatterboxPreTrainedModel:()=>Ji,ChatterboxProcessor:()=>$p,ChineseCLIPFeatureExtractor:()=>Gp,ChineseCLIPModel:()=>zf,ChineseCLIPPreTrainedModel:()=>Zi,ClapAudioModelWithProjection:()=>Vn,ClapFeatureExtractor:()=>Mp,ClapModel:()=>Lf,Clap
PreTrainedModel:()=>Ns,ClapTextModelWithProjection:()=>Wn,ClassifierFreeGuidanceLogitsProcessor:()=>qi,CodeGenForCausalLM:()=>jf,CodeGenModel:()=>Ff,CodeGenPreTrainedModel:()=>Kn,CodeGenTokenizer:()=>Fu,CodeLlamaTokenizer:()=>Du,CohereForCausalLM:()=>qf,CohereModel:()=>Gf,CoherePreTrainedModel:()=>Yn,CohereTokenizer:()=>ju,ConvBertForMaskedLM:()=>Vf,ConvBertForQuestionAnswering:()=>Kf,ConvBertForSequenceClassification:()=>Hf,ConvBertForTokenClassification:()=>Xf,ConvBertModel:()=>Wf,ConvBertPreTrainedModel:()=>vr,ConvBertTokenizer:()=>Gu,ConvNextFeatureExtractor:()=>Wp,ConvNextForImageClassification:()=>Qf,ConvNextImageProcessor:()=>xi,ConvNextModel:()=>Yf,ConvNextPreTrainedModel:()=>Qn,ConvNextV2ForImageClassification:()=>Zf,ConvNextV2Model:()=>Jf,ConvNextV2PreTrainedModel:()=>Jn,DFineForObjectDetection:()=>sm,DFineModel:()=>rm,DFinePreTrainedModel:()=>eo,DINOv3ConvNextModel:()=>Tm,DINOv3ConvNextPreTrainedModel:()=>al,DINOv3ViTImageProcessor:()=>Xp,DINOv3ViTModel:()=>Sm,DINOv3ViTPreTrainedModel:()=>il,DPTFeatureExtractor:()=>Yp,DPTForDepthEstimation:()=>$m,DPTImageProcessor:()=>vi,DPTModel:()=>Nm,DPTPreTrainedModel:()=>ao,DacDecoderModel:()=>ro,DacDecoderOutput:()=>tl,DacEncoderModel:()=>to,DacEncoderOutput:()=>el,DacFeatureExtractor:()=>Tn,DacModel:()=>nm,DacPreTrainedModel:()=>$s,DebertaForMaskedLM:()=>am,DebertaForQuestionAnswering:()=>cm,DebertaForSequenceClassification:()=>im,DebertaForTokenClassification:()=>lm,DebertaModel:()=>om,DebertaPreTrainedModel:()=>kr,DebertaTokenizer:()=>Wu,DebertaV2ForMaskedLM:()=>pm,DebertaV2ForQuestionAnswering:()=>mm,DebertaV2ForSequenceClassification:()=>dm,DebertaV2ForTokenClassification:()=>fm,DebertaV2Model:()=>um,DebertaV2PreTrainedModel:()=>Er,DebertaV2Tokenizer:()=>qu,DecisionTransformerModel:()=>hm,DecisionTransformerPreTrainedModel:()=>rl,DeiTFeatureExtractor:()=>Vp,DeiTForImageClassification:()=>gm,DeiTImageProcessor:()=>yi,DeiTModel:()=>_m,DeiTPreTrainedModel:()=>so,DepthAnythingForDepthEstimation:()=>wm,DepthAnything
PreTrainedModel:()=>sl,DepthEstimationPipeline:()=>Nc,DepthProForDepthEstimation:()=>xm,DepthProPreTrainedModel:()=>nl,DetrFeatureExtractor:()=>Hp,DetrForObjectDetection:()=>bm,DetrForSegmentation:()=>vm,DetrImageProcessor:()=>bi,DetrModel:()=>ym,DetrObjectDetectionOutput:()=>Us,DetrPreTrainedModel:()=>Rs,DetrSegmentationOutput:()=>ol,Dinov2ForImageClassification:()=>Em,Dinov2Model:()=>km,Dinov2PreTrainedModel:()=>no,Dinov2WithRegistersForImageClassification:()=>Mm,Dinov2WithRegistersModel:()=>Am,Dinov2WithRegistersPreTrainedModel:()=>oo,DistilBertForMaskedLM:()=>zm,DistilBertForQuestionAnswering:()=>Pm,DistilBertForSequenceClassification:()=>Im,DistilBertForTokenClassification:()=>Cm,DistilBertModel:()=>Om,DistilBertPreTrainedModel:()=>Ar,DistilBertTokenizer:()=>Vu,DocumentQuestionAnsweringPipeline:()=>zc,DonutFeatureExtractor:()=>Kp,DonutImageProcessor:()=>Ms,DonutSwinModel:()=>Lm,DonutSwinPreTrainedModel:()=>ll,EdgeTamModel:()=>xw,EfficientNetForImageClassification:()=>Um,EfficientNetImageProcessor:()=>Qp,EfficientNetModel:()=>Rm,EfficientNetPreTrainedModel:()=>io,ElectraForMaskedLM:()=>Dm,ElectraForQuestionAnswering:()=>Gm,ElectraForSequenceClassification:()=>Fm,ElectraForTokenClassification:()=>jm,ElectraModel:()=>Bm,ElectraPreTrainedModel:()=>Mr,ElectraTokenizer:()=>Hu,EncodecFeatureExtractor:()=>Mn,EosTokenCriteria:()=>Xi,Ernie4_5ForCausalLM:()=>Wm,Ernie4_5Model:()=>qm,Ernie4_5PretrainedModel:()=>lo,EsmForMaskedLM:()=>Hm,EsmForSequenceClassification:()=>Xm,EsmForTokenClassification:()=>Km,EsmModel:()=>Vm,EsmPreTrainedModel:()=>Qr,EsmTokenizer:()=>Xu,ExaoneForCausalLM:()=>Qm,ExaoneModel:()=>Ym,ExaonePreTrainedModel:()=>co,FalconForCausalLM:()=>Zm,FalconH1ForCausalLM:()=>th,FalconH1Model:()=>eh,FalconH1PreTrainedModel:()=>po,FalconModel:()=>Jm,FalconPreTrainedModel:()=>uo,FalconTokenizer:()=>Ku,FastViTForImageClassification:()=>sh,FastViTModel:()=>rh,FastViTPreTrainedModel:()=>fo,FeatureExtractionPipeline:()=>$c,FeatureExtractor:()=>ze,FillMaskPipeline:()=>wc,F
lorence2ForConditionalGeneration:()=>nh,Florence2PreTrainedModel:()=>cl,Florence2Processor:()=>Md,ForcedBOSTokenLogitsProcessor:()=>$i,ForcedEOSTokenLogitsProcessor:()=>Ri,GLPNFeatureExtractor:()=>Jp,GLPNForDepthEstimation:()=>mh,GLPNModel:()=>fh,GLPNPreTrainedModel:()=>xo,GPT2LMHeadModel:()=>Eh,GPT2Model:()=>kh,GPT2PreTrainedModel:()=>Eo,GPT2Tokenizer:()=>Ju,GPTBigCodeForCausalLM:()=>_h,GPTBigCodeModel:()=>hh,GPTBigCodePreTrainedModel:()=>yo,GPTJForCausalLM:()=>Mh,GPTJModel:()=>Ah,GPTJPreTrainedModel:()=>Ao,GPTNeoForCausalLM:()=>wh,GPTNeoModel:()=>gh,GPTNeoPreTrainedModel:()=>bo,GPTNeoXForCausalLM:()=>yh,GPTNeoXModel:()=>xh,GPTNeoXPreTrainedModel:()=>vo,GPTNeoXTokenizer:()=>Qu,Gemma2ForCausalLM:()=>lh,Gemma2Model:()=>ih,Gemma2PreTrainedModel:()=>ho,Gemma3ForCausalLM:()=>uh,Gemma3Model:()=>ch,Gemma3PreTrainedModel:()=>_o,Gemma3nAudioFeatureExtractor:()=>Tp,Gemma3nForConditionalGeneration:()=>go,Gemma3nPreTrainedModel:()=>ul,Gemma3nProcessor:()=>Td,GemmaForCausalLM:()=>ah,GemmaModel:()=>oh,GemmaPreTrainedModel:()=>mo,GemmaTokenizer:()=>Yu,GlmForCausalLM:()=>dh,GlmModel:()=>ph,GlmPreTrainedModel:()=>wo,GptOssForCausalLM:()=>vh,GptOssModel:()=>bh,GptOssPreTrainedModel:()=>ko,GraniteForCausalLM:()=>Sh,GraniteModel:()=>Th,GraniteMoeHybridForCausalLM:()=>Ih,GraniteMoeHybridModel:()=>Oh,GraniteMoeHybridPreTrainedModel:()=>To,GranitePreTrainedModel:()=>Mo,GroundingDinoForObjectDetection:()=>Ch,GroundingDinoImageProcessor:()=>Zp,GroundingDinoPreTrainedModel:()=>pl,GroundingDinoProcessor:()=>Sd,GroupViTModel:()=>Ph,GroupViTPreTrainedModel:()=>dl,HeliumForCausalLM:()=>Lh,HeliumModel:()=>zh,HeliumPreTrainedModel:()=>So,HerbertTokenizer:()=>Zu,HieraForImageClassification:()=>$h,HieraModel:()=>Nh,HieraPreTrainedModel:()=>Oo,HubertForCTC:()=>Gh,HubertForSequenceClassification:()=>qh,HubertModel:()=>jh,HubertPreTrainedModel:()=>Fh,HunYuanDenseV1ForCausalLM:()=>Vh,HunYuanDenseV1Model:()=>Wh,HunYuanDenseV1PreTrainedModel:()=>Io,IJepaForImageClassification:()=>Kh,IJepaModel:()=>Xh,IJe
paPreTrainedModel:()=>Co,Idefics3ForConditionalGeneration:()=>ml,Idefics3ImageProcessor:()=>ki,Idefics3PreTrainedModel:()=>fl,Idefics3Processor:()=>zi,ImageClassificationPipeline:()=>Sc,ImageFeatureExtractionPipeline:()=>Rc,ImageFeatureExtractor:()=>W,ImageProcessor:()=>W,ImageSegmentationPipeline:()=>en,ImageToImagePipeline:()=>Lc,ImageToTextPipeline:()=>Tc,InterruptableStoppingCriteria:()=>V0,JAISLMHeadModel:()=>Qh,JAISModel:()=>Yh,JAISPreTrainedModel:()=>Po,JinaCLIPImageProcessor:()=>td,JinaCLIPModel:()=>Jh,JinaCLIPPreTrainedModel:()=>Bs,JinaCLIPProcessor:()=>Id,JinaCLIPTextModel:()=>zo,JinaCLIPVisionModel:()=>Zh,Lfm2ForCausalLM:()=>t_,Lfm2Model:()=>e_,Lfm2MoeForCausalLM:()=>s_,Lfm2MoeModel:()=>r_,Lfm2MoePreTrainedModel:()=>No,Lfm2PreTrainedModel:()=>Lo,LiteWhisperForConditionalGeneration:()=>Cx,Llama4ForCausalLM:()=>a_,Llama4PreTrainedModel:()=>hl,LlamaForCausalLM:()=>o_,LlamaModel:()=>n_,LlamaPreTrainedModel:()=>$o,LlamaTokenizer:()=>ep,LlavaForConditionalGeneration:()=>Ds,LlavaOnevisionForConditionalGeneration:()=>Ds,LlavaOnevisionImageProcessor:()=>rd,LlavaPreTrainedModel:()=>_l,LlavaProcessor:()=>Cd,LlavaQwen2ForCausalLM:()=>l_,LogitsProcessor:()=>Nt,LogitsProcessorList:()=>Kr,LogitsWarper:()=>Nn,LongT5ForConditionalGeneration:()=>u_,LongT5Model:()=>c_,LongT5PreTrainedModel:()=>Ro,M2M100ForConditionalGeneration:()=>d_,M2M100Model:()=>p_,M2M100PreTrainedModel:()=>Uo,M2M100Tokenizer:()=>tp,MBart50Tokenizer:()=>sp,MBartForCausalLM:()=>y_,MBartForConditionalGeneration:()=>w_,MBartForSequenceClassification:()=>x_,MBartModel:()=>g_,MBartPreTrainedModel:()=>Jr,MBartTokenizer:()=>vn,MPNetForMaskedLM:()=>ng,MPNetForQuestionAnswering:()=>ig,MPNetForSequenceClassification:()=>og,MPNetForTokenClassification:()=>ag,MPNetModel:()=>sg,MPNetPreTrainedModel:()=>Tr,MPNetTokenizer:()=>ap,MT5ForConditionalGeneration:()=>pg,MT5Model:()=>ug,MT5PreTrainedModel:()=>Yo,MarianMTModel:()=>m_,MarianModel:()=>f_,MarianPreTrainedModel:()=>Bo,MarianTokenizer:()=>rp,Mask2FormerImageProcess
or:()=>nd,MaskFormerFeatureExtractor:()=>sd,MaskFormerForInstanceSegmentation:()=>__,MaskFormerImageProcessor:()=>Ts,MaskFormerModel:()=>h_,MaskFormerPreTrainedModel:()=>Do,MaxLengthCriteria:()=>Hi,Metric3DForDepthEstimation:()=>b_,Metric3DPreTrainedModel:()=>gl,Metric3Dv2ForDepthEstimation:()=>v_,Metric3Dv2PreTrainedModel:()=>wl,MgpstrForSceneTextRecognition:()=>k_,MgpstrModelOutput:()=>xl,MgpstrPreTrainedModel:()=>yl,MgpstrProcessor:()=>Pd,MgpstrTokenizer:()=>np,MimiDecoderModel:()=>jo,MimiDecoderOutput:()=>vl,MimiEncoderModel:()=>Fo,MimiEncoderOutput:()=>bl,MimiModel:()=>E_,MimiPreTrainedModel:()=>Fs,MinLengthLogitsProcessor:()=>Fi,MinNewTokensLengthLogitsProcessor:()=>ji,MistralForCausalLM:()=>M_,MistralModel:()=>A_,MistralPreTrainedModel:()=>Go,MobileBertForMaskedLM:()=>S_,MobileBertForQuestionAnswering:()=>I_,MobileBertForSequenceClassification:()=>O_,MobileBertModel:()=>T_,MobileBertPreTrainedModel:()=>Zr,MobileBertTokenizer:()=>op,MobileLLMForCausalLM:()=>P_,MobileLLMModel:()=>C_,MobileLLMPreTrainedModel:()=>qo,MobileNetV1FeatureExtractor:()=>od,MobileNetV1ForImageClassification:()=>L_,MobileNetV1ForSemanticSegmentation:()=>N_,MobileNetV1ImageProcessor:()=>Ei,MobileNetV1Model:()=>z_,MobileNetV1PreTrainedModel:()=>js,MobileNetV2FeatureExtractor:()=>ad,MobileNetV2ForImageClassification:()=>R_,MobileNetV2ForSemanticSegmentation:()=>U_,MobileNetV2ImageProcessor:()=>Ai,MobileNetV2Model:()=>$_,MobileNetV2PreTrainedModel:()=>Gs,MobileNetV3FeatureExtractor:()=>id,MobileNetV3ForImageClassification:()=>D_,MobileNetV3ForSemanticSegmentation:()=>F_,MobileNetV3ImageProcessor:()=>Mi,MobileNetV3Model:()=>B_,MobileNetV3PreTrainedModel:()=>qs,MobileNetV4FeatureExtractor:()=>ld,MobileNetV4ForImageClassification:()=>G_,MobileNetV4ForSemanticSegmentation:()=>q_,MobileNetV4ImageProcessor:()=>Ti,MobileNetV4Model:()=>j_,MobileNetV4PreTrainedModel:()=>Ws,MobileViTFeatureExtractor:()=>cd,MobileViTForImageClassification:()=>V_,MobileViTImageProcessor:()=>Si,MobileViTModel:()=>W_,Mobi
leViTPreTrainedModel:()=>Wo,MobileViTV2ForImageClassification:()=>X_,MobileViTV2Model:()=>H_,MobileViTV2PreTrainedModel:()=>Vo,ModernBertDecoderForCausalLM:()=>eg,ModernBertDecoderModel:()=>Z_,ModernBertDecoderPreTrainedModel:()=>Ho,ModernBertForMaskedLM:()=>Y_,ModernBertForSequenceClassification:()=>Q_,ModernBertForTokenClassification:()=>J_,ModernBertModel:()=>K_,ModernBertPreTrainedModel:()=>es,Moondream1ForConditionalGeneration:()=>i_,MoonshineFeatureExtractor:()=>Sp,MoonshineForConditionalGeneration:()=>rg,MoonshineModel:()=>tg,MoonshinePreTrainedModel:()=>Xo,MoonshineProcessor:()=>zd,MptForCausalLM:()=>cg,MptModel:()=>lg,MptPreTrainedModel:()=>Ko,MultiModalityCausalLM:()=>dg,MultiModalityPreTrainedModel:()=>kl,MusicgenForCausalLM:()=>mg,MusicgenForConditionalGeneration:()=>Jo,MusicgenModel:()=>fg,MusicgenPreTrainedModel:()=>Qo,NanoChatForCausalLM:()=>_g,NanoChatModel:()=>hg,NanoChatPreTrainedModel:()=>Zo,NeoBertForMaskedLM:()=>wg,NeoBertForQuestionAnswering:()=>bg,NeoBertForSequenceClassification:()=>xg,NeoBertForTokenClassification:()=>yg,NeoBertModel:()=>gg,NeoBertPreTrainedModel:()=>Sr,NllbTokenizer:()=>ip,NoBadWordsLogitsProcessor:()=>Gi,NoRepeatNGramLogitsProcessor:()=>Bi,NomicBertModel:()=>vg,NomicBertPreTrainedModel:()=>El,NougatImageProcessor:()=>ud,NougatTokenizer:()=>lp,OPTForCausalLM:()=>Pg,OPTModel:()=>Cg,OPTPreTrainedModel:()=>na,ObjectDetectionPipeline:()=>Cc,Olmo2ForCausalLM:()=>Mg,Olmo2Model:()=>Ag,Olmo2PreTrainedModel:()=>ta,Olmo3ForCausalLM:()=>Sg,Olmo3Model:()=>Tg,Olmo3PreTrainedModel:()=>ra,OlmoForCausalLM:()=>Eg,OlmoModel:()=>kg,OlmoPreTrainedModel:()=>ea,OpenELMForCausalLM:()=>Ig,OpenELMModel:()=>Og,OpenELMPreTrainedModel:()=>sa,OwlViTFeatureExtractor:()=>pd,OwlViTForObjectDetection:()=>$g,OwlViTImageProcessor:()=>Ss,OwlViTModel:()=>Ng,OwlViTPreTrainedModel:()=>aa,OwlViTProcessor:()=>Ld,Owlv2ForObjectDetection:()=>Lg,Owlv2ImageProcessor:()=>dd,Owlv2Model:()=>zg,Owlv2PreTrainedModel:()=>oa,PaliGemmaForConditionalGeneration:()=>Rg,PaliGemma
PreTrainedModel:()=>Al,PaliGemmaProcessor:()=>Nd,ParakeetFeatureExtractor:()=>Op,ParakeetForCTC:()=>Ug,ParakeetPreTrainedModel:()=>Ml,PatchTSMixerForPrediction:()=>Dg,PatchTSMixerModel:()=>Bg,PatchTSMixerPreTrainedModel:()=>ia,PatchTSTForPrediction:()=>jg,PatchTSTModel:()=>Fg,PatchTSTPreTrainedModel:()=>la,Phi3ForCausalLM:()=>Vg,Phi3Model:()=>Wg,Phi3PreTrainedModel:()=>ua,Phi3VForCausalLM:()=>pa,Phi3VImageProcessor:()=>fd,Phi3VPreTrainedModel:()=>Tl,Phi3VProcessor:()=>$d,PhiForCausalLM:()=>qg,PhiModel:()=>Gg,PhiPreTrainedModel:()=>ca,PixtralImageProcessor:()=>md,PixtralProcessor:()=>Rd,PreTrainedModel:()=>y,PreTrainedTokenizer:()=>j,PretrainedConfig:()=>Ni,Processor:()=>ne,PvtForImageClassification:()=>Xg,PvtImageProcessor:()=>hd,PvtModel:()=>Hg,PvtPreTrainedModel:()=>da,PyAnnoteFeatureExtractor:()=>Sn,PyAnnoteForAudioFrameClassification:()=>Yg,PyAnnoteModel:()=>Kg,PyAnnotePreTrainedModel:()=>fa,PyAnnoteProcessor:()=>Ud,QuestionAnsweringPipeline:()=>gc,Qwen2ForCausalLM:()=>Jg,Qwen2Model:()=>Qg,Qwen2PreTrainedModel:()=>ma,Qwen2Tokenizer:()=>cp,Qwen2VLForConditionalGeneration:()=>Zg,Qwen2VLImageProcessor:()=>_d,Qwen2VLPreTrainedModel:()=>Sl,Qwen2VLProcessor:()=>Bd,Qwen3ForCausalLM:()=>tw,Qwen3Model:()=>ew,Qwen3PreTrainedModel:()=>ha,RFDetrForObjectDetection:()=>ow,RFDetrModel:()=>nw,RFDetrObjectDetectionOutput:()=>Ol,RFDetrPreTrainedModel:()=>ga,RTDetrForObjectDetection:()=>tm,RTDetrImageProcessor:()=>gd,RTDetrModel:()=>em,RTDetrObjectDetectionOutput:()=>tr,RTDetrPreTrainedModel:()=>Zn,RTDetrV2ForObjectDetection:()=>gw,RTDetrV2Model:()=>_w,RTDetrV2ObjectDetectionOutput:()=>Il,RTDetrV2PreTrainedModel:()=>wa,RawAudio:()=>An,RawImage:()=>Xe,RawVideo:()=>Uc,RawVideoFrame:()=>ja,RepetitionPenaltyLogitsProcessor:()=>Di,ResNetForImageClassification:()=>sw,ResNetModel:()=>rw,ResNetPreTrainedModel:()=>_a,RoFormerForMaskedLM:()=>dw,RoFormerForQuestionAnswering:()=>hw,RoFormerForSequenceClassification:()=>fw,RoFormerForTokenClassification:()=>mw,RoFormerModel:()=>pw,RoFormerPreT
rainedModel:()=>Ir,RoFormerTokenizer:()=>pp,RobertaForMaskedLM:()=>iw,RobertaForQuestionAnswering:()=>uw,RobertaForSequenceClassification:()=>lw,RobertaForTokenClassification:()=>cw,RobertaModel:()=>aw,RobertaPreTrainedModel:()=>Or,RobertaTokenizer:()=>up,Sam2ImageProcessor:()=>In,Sam2ImageSegmentationOutput:()=>zl,Sam2Model:()=>xa,Sam2PreTrainedModel:()=>Ll,Sam2Processor:()=>Li,Sam2VideoProcessor:()=>Dd,Sam3ImageProcessor:()=>In,Sam3TrackerModel:()=>yw,SamImageProcessor:()=>In,SamImageSegmentationOutput:()=>Cl,SamModel:()=>ww,SamPreTrainedModel:()=>Pl,SamProcessor:()=>zn,SapiensFeatureExtractor:()=>wd,SapiensForDepthEstimation:()=>vw,SapiensForNormalEstimation:()=>kw,SapiensForSemanticSegmentation:()=>bw,SapiensImageProcessor:()=>Oi,SapiensPreTrainedModel:()=>Vs,SeamlessM4TFeatureExtractor:()=>Ip,SegformerFeatureExtractor:()=>xd,SegformerForImageClassification:()=>Aw,SegformerForSemanticSegmentation:()=>Mw,SegformerImageProcessor:()=>Ii,SegformerModel:()=>Ew,SegformerPreTrainedModel:()=>Hs,SiglipImageProcessor:()=>yd,SiglipModel:()=>Tw,SiglipPreTrainedModel:()=>ya,SiglipTextModel:()=>ba,SiglipTokenizer:()=>dp,SiglipVisionModel:()=>Sw,SmolLM3ForCausalLM:()=>Iw,SmolLM3Model:()=>Ow,SmolLM3PreTrainedModel:()=>va,SmolVLMForConditionalGeneration:()=>Hh,SmolVLMImageProcessor:()=>ki,SmolVLMProcessor:()=>zi,SnacDecoderModel:()=>Ea,SnacEncoderModel:()=>ka,SnacFeatureExtractor:()=>Cp,SnacModel:()=>Cw,SnacPreTrainedModel:()=>Xs,SpeechT5FeatureExtractor:()=>Pp,SpeechT5ForSpeechToText:()=>zw,SpeechT5ForTextToSpeech:()=>Lw,SpeechT5HifiGan:()=>Nw,SpeechT5Model:()=>Pw,SpeechT5PreTrainedModel:()=>Ks,SpeechT5Processor:()=>Fd,SpeechT5Tokenizer:()=>fp,SqueezeBertForMaskedLM:()=>Rw,SqueezeBertForQuestionAnswering:()=>Bw,SqueezeBertForSequenceClassification:()=>Uw,SqueezeBertModel:()=>$w,SqueezeBertPreTrainedModel:()=>ts,SqueezeBertTokenizer:()=>mp,StableLmForCausalLM:()=>Fw,StableLmModel:()=>Dw,StableLmPreTrainedModel:()=>Aa,Starcoder2ForCausalLM:()=>Gw,Starcoder2Model:()=>jw,Starcoder2
PreTrainedModel:()=>Ma,StoppingCriteria:()=>Is,StoppingCriteriaList:()=>Vi,StyleTextToSpeech2Model:()=>qw,StyleTextToSpeech2PreTrainedModel:()=>Nl,SummarizationPipeline:()=>xc,SupertonicForConditionalGeneration:()=>Ta,SupertonicPreTrainedModel:()=>$l,SuppressTokensAtBeginLogitsProcessor:()=>Os,Swin2SRForImageSuperResolution:()=>Kw,Swin2SRImageProcessor:()=>bd,Swin2SRModel:()=>Xw,Swin2SRPreTrainedModel:()=>Sa,SwinForImageClassification:()=>Vw,SwinForSemanticSegmentation:()=>Hw,SwinModel:()=>Ww,SwinPreTrainedModel:()=>Ys,T5ForConditionalGeneration:()=>Qw,T5Model:()=>Yw,T5PreTrainedModel:()=>Oa,T5Tokenizer:()=>hp,TableTransformerForObjectDetection:()=>Zw,TableTransformerModel:()=>Jw,TableTransformerObjectDetectionOutput:()=>Rl,TableTransformerPreTrainedModel:()=>Ia,TemperatureLogitsWarper:()=>Wi,Tensor:()=>U,Text2TextGenerationPipeline:()=>Lr,TextClassificationPipeline:()=>hc,TextGenerationPipeline:()=>bc,TextStreamer:()=>Hx,TextToAudioPipeline:()=>Mc,TokenClassificationPipeline:()=>_c,TokenizersBackend:()=>j,TopKLogitsWarper:()=>W0,TopPLogitsWarper:()=>q0,TrOCRForCausalLM:()=>ex,TrOCRPreTrainedModel:()=>Ul,TranslationPipeline:()=>yc,UltravoxModel:()=>Dl,UltravoxPreTrainedModel:()=>Bl,UltravoxProcessor:()=>jd,UniSpeechForCTC:()=>sx,UniSpeechForSequenceClassification:()=>nx,UniSpeechModel:()=>rx,UniSpeechPreTrainedModel:()=>Qs,UniSpeechSatForAudioFrameClassification:()=>lx,UniSpeechSatForCTC:()=>ax,UniSpeechSatForSequenceClassification:()=>ix,UniSpeechSatModel:()=>ox,UniSpeechSatPreTrainedModel:()=>rs,VLChatProcessor:()=>Od,VLMImageProcessor:()=>ed,VaultGemmaForCausalLM:()=>ux,VaultGemmaModel:()=>cx,VaultGemmaPreTrainedModel:()=>Ca,ViTFeatureExtractor:()=>vd,ViTForImageClassification:()=>fx,ViTImageProcessor:()=>Ci,ViTMAEModel:()=>mx,ViTMAEPreTrainedModel:()=>Fl,ViTMSNForImageClassification:()=>_x,ViTMSNModel:()=>hx,ViTMSNPreTrainedModel:()=>za,ViTModel:()=>dx,ViTPreTrainedModel:()=>Pa,VisionEncoderDecoderModel:()=>px,VitMatteForImageMatting:()=>gx,VitMatteImageProcesso
r:()=>kd,VitMattePreTrainedModel:()=>jl,VitPoseForPoseEstimation:()=>wx,VitPoseImageProcessor:()=>Ed,VitPosePreTrainedModel:()=>Gl,VitsModel:()=>xx,VitsModelOutput:()=>ql,VitsPreTrainedModel:()=>Wl,VitsTokenizer:()=>_p,VoxtralForConditionalGeneration:()=>tx,VoxtralProcessor:()=>qd,Wav2Vec2BertForCTC:()=>bx,Wav2Vec2BertForSequenceClassification:()=>vx,Wav2Vec2BertModel:()=>yx,Wav2Vec2BertPreTrainedModel:()=>Js,Wav2Vec2CTCTokenizer:()=>gp,Wav2Vec2FeatureExtractor:()=>zp,Wav2Vec2ForAudioFrameClassification:()=>Dh,Wav2Vec2ForCTC:()=>Uh,Wav2Vec2ForSequenceClassification:()=>Bh,Wav2Vec2Model:()=>Rh,Wav2Vec2PreTrainedModel:()=>Wt,Wav2Vec2Processor:()=>Wd,Wav2Vec2ProcessorWithLM:()=>Vd,WavLMForAudioFrameClassification:()=>Tx,WavLMForCTC:()=>Ex,WavLMForSequenceClassification:()=>Ax,WavLMForXVector:()=>Mx,WavLMModel:()=>kx,WavLMPreTrainedModel:()=>Cr,WeSpeakerFeatureExtractor:()=>Lp,WeSpeakerResNetModel:()=>Sx,WeSpeakerResNetPreTrainedModel:()=>Hl,WhisperFeatureExtractor:()=>Np,WhisperForConditionalGeneration:()=>Xl,WhisperModel:()=>Ix,WhisperPreTrainedModel:()=>La,WhisperProcessor:()=>Hd,WhisperTextStreamer:()=>cb,WhisperTimeStampLogitsProcessor:()=>Ui,WhisperTokenizer:()=>wp,XLMForQuestionAnswering:()=>$x,XLMForSequenceClassification:()=>Lx,XLMForTokenClassification:()=>Nx,XLMModel:()=>Px,XLMPreTrainedModel:()=>Pr,XLMRobertaForMaskedLM:()=>Ux,XLMRobertaForQuestionAnswering:()=>Fx,XLMRobertaForSequenceClassification:()=>Bx,XLMRobertaForTokenClassification:()=>Dx,XLMRobertaModel:()=>Rx,XLMRobertaPreTrainedModel:()=>zr,XLMRobertaTokenizer:()=>xp,XLMTokenizer:()=>yp,XLMWithLMHeadModel:()=>zx,XVectorOutput:()=>Vl,YolosFeatureExtractor:()=>Ad,YolosForObjectDetection:()=>Gx,YolosImageProcessor:()=>Pi,YolosModel:()=>jx,YolosObjectDetectionOutput:()=>Kl,YolosPreTrainedModel:()=>Na,YoutuForCausalLM:()=>Wx,YoutuModel:()=>qx,YoutuPreTrainedModel:()=>$a,ZeroShotAudioClassificationPipeline:()=>Ec,ZeroShotClassificationPipeline:()=>vc,ZeroShotImageClassificationPipeline:()=>Ic,ZeroShotObj
ectDetectionPipeline:()=>Pc,cat:()=>Ee,cos_sim:()=>mk,dot:()=>Cy,env:()=>De,full:()=>Ge,full_like:()=>yn,interpolate:()=>Su,interpolate_4d:()=>Pt,layer_norm:()=>dP,load_image:()=>fA,load_video:()=>s2,log_softmax:()=>pu,matmul:()=>I0,mean:()=>fi,mean_pooling:()=>C0,ones:()=>rt,ones_like:()=>mi,permute:()=>ZE,pipeline:()=>uz,quantize_embeddings:()=>L0,rand:()=>fP,randn:()=>z0,read_audio:()=>kp,rfft:()=>pP,slice:()=>di,softmax:()=>Oe,stack:()=>zt,std_mean:()=>Ou,topk:()=>Gt,zeros:()=>Iu,zeros_like:()=>Cu});module.exports=pS(fz);var yv=Ur(require("fs"),1),us=Ur(require("path"),1),bv=Ur(require("url"),1),yS={},dS="4.0.0-next.3",vv=typeof process<"u",kv=vv&&process?.release?.name==="node",Ha=!Tv(yv.default),Ev=!Tv(us.default),fS=typeof globalThis.Deno<"u",hz=typeof globalThis.Bun<"u",Av=typeof window<"u"&&typeof window.document<"u",Mv=typeof self<"u"&&["DedicatedWorkerGlobalScope","ServiceWorkerGlobalScope","SharedWorkerGlobalScope"].includes(self.constructor?.name),by=typeof self<"u"&&"caches"in self,mS=kv||typeof navigator<"u"&&"gpu"in navigator,hS=typeof navigator<"u"&&"ml"in navigator,_S=()=>{if(typeof navigator>"u")return!1;let t=navigator.userAgent,r=(navigator.vendor||"").indexOf("Apple")>-1,s=!t.match(/CriOS|FxiOS|EdgiOS|OPiOS|mercury|brave/i)&&!t.includes("Chrome")&&!t.includes("Android");return r&&s},gS=_S(),be=Object.freeze({IS_BROWSER_ENV:Av,IS_WEBWORKER_ENV:Mv,IS_WEB_CACHE_AVAILABLE:by,IS_WEBGPU_AVAILABLE:mS,IS_WEBNN_AVAILABLE:hS,IS_SAFARI:gS,IS_PROCESS_AVAILABLE:vv,IS_NODE_ENV:kv,IS_FS_AVAILABLE:Ha,IS_PATH_AVAILABLE:Ev}),vy=Ha&&Ev,eu="./";if(vy){let t=Object(yS).url;t?eu=us.default.dirname(us.default.dirname(bv.default.fileURLToPath(t))):typeof __dirname<"u"&&(eu=us.default.dirname(__dirname))}var 
wS=vy?us.default.join(eu,"/.cache/"):null,xv="/models/",xS=vy?us.default.join(eu,xv):xv,De={version:dS,backends:{onnx:{}},allowRemoteModels:!0,remoteHost:"https://huggingface.co/",remotePathTemplate:"{model}/resolve/{revision}/",allowLocalModels:!(Av||Mv),localModelPath:xS,useFS:Ha,useBrowserCache:by&&!fS,useFSCache:Ha,cacheDir:wS,useCustomCache:!1,customCache:null,useWasmCache:by||Ha,cacheKey:"transformers-cache"};function Tv(t){return Object.keys(t).length===0}var bS=class{constructor(t){this.trie=this._build_trie(t)}_build_trie(t){let e=Object.create(null);for(let r of t){let s=e;for(let n=0;n<r.length;++n){let o=r[n];s=s[o]??=Object.create(null)}s.end=r}return e}split(t){let e=[],r=t.length,s=0,n=0;for(;n<r;){let o=this.trie,a=null,i=n;for(;i<r&&(o=o[t[i]]);)o.end&&(a=o.end),++i;a?(n>s&&e.push(t.slice(s,n)),e.push(a),n+=a.length,s=n):++n}return s<r&&e.push(t.slice(s)),e}},Sv=bS,vS=class{constructor(t){this.content=t.content,this.id=t.id,this.single_word=t.single_word??!1,this.lstrip=t.lstrip??!1,this.rstrip=t.rstrip??!1,this.special=t.special??!1,this.normalized=t.normalized??!this.special}},kS=vS,Nv=(()=>{let t=[...Array.from({length:94},(n,o)=>o+33),...Array.from({length:12},(n,o)=>o+161),...Array.from({length:82},(n,o)=>o+174)],e=t.slice(),r=0;for(let n=0;n<256;++n)t.includes(n)||(t.push(n),e.push(256+r),r+=1);let s=e.map(n=>String.fromCharCode(n));return Object.fromEntries(t.map((n,o)=>[n,s[o]]))})(),ES=t=>Object.fromEntries(Object.entries(t).map(([e,r])=>[r,e])),AS=ES(Nv),Ov=".,!?\u2026\u3002\uFF0C\u3001\u0964\u06D4\u060C",MS=new Map([["(?i:'s|'t|'re|'ve|'m|'ll|'d)","(?:'([sS]|[tT]|[rR][eE]|[vV][eE]|[mM]|[lL][lL]|[dD]))"],["(?i:[sdmt]|ll|ve|re)","(?:[sS]|[dD]|[mM]|[tT]|[lL][lL]|[vV][eE]|[rR][eE])"],["[^\\r\\n\\p{L}\\p{N}]?+","[^\\r\\n\\p{L}\\p{N}]?"],["[^\\s\\p{L}\\p{N}]++","[^\\s\\p{L}\\p{N}]+"],[` ?[^(\\s|[${Ov}])]+`,` ?[^\\s${Ov}]+`]]),tu="\\p{P}\\u0021-\\u002F\\u003A-\\u0040\\u005B-\\u0060\\u007B-\\u007E",Ey=t=>t.replace(/ \./g,".").replace(/ 
\?/g,"?").replace(/ \!/g,"!").replace(/ ,/g,",").replace(/ \' /g,"'").replace(/ n't/g,"n't").replace(/ 'm/g,"'m").replace(/ 's/g,"'s").replace(/ 've/g,"'ve").replace(/ 're/g,"'re"),ru=(t,e=!0)=>{if(t.Regex!==void 0){let r=t.Regex.replace(/\\([#&~])/g,"$1");for(let[s,n]of MS)r=r.replaceAll(s,n);try{return new RegExp(r,"gu")}catch(s){if(!(s instanceof SyntaxError)||!s.message.toLowerCase().includes("invalid property name"))throw s;let n=!1,o=r.replace(/(\\[pP])\{([^}=]+)\}/g,(a,i,l)=>{try{return new RegExp(`\\p{${l}}`,"u"),`${i}{${l}}`}catch{return n=!0,`${i}{Script=${l}}`}});if(!n)throw s;try{return new RegExp(o,"gu")}catch{throw s}}}else if(t.String!==void 0){let r=TS(t.String);return new RegExp(e?r:`(${r})`,"gu")}else return console.warn("Unknown pattern type:",t),null},TS=t=>t.replace(/[.*+?^${}()|[\]\\]/g,"\\$&"),SS=(t,e,r)=>{let s=[],n=0;for(;n<t.length;){if(s.push(t[n]),(e.get(t[n])??r)!==r){++n;continue}for(;++n<t.length&&(e.get(t[n])??r)===r;)e.get(s.at(-1))!==r&&(s[s.length-1]+=t[n])}return s},OS=t=>t>=19968&&t<=40959||t>=13312&&t<=19903||t>=131072&&t<=173791||t>=173824&&t<=177983||t>=177984&&t<=178207||t>=178208&&t<=183983||t>=63744&&t<=64255||t>=194560&&t<=195103,IS=t=>Number.isInteger(t)||typeof t=="bigint",CS=t=>{let e=0;for(let r of t)++e;return e},PS=t=>$v(t.toLowerCase()),Ht=(...t)=>Array.prototype.concat.apply([],t),Ay=t=>new Map(Object.entries(t)),zS=(t,e)=>{let r=[],s=0;for(let n of t.matchAll(e)){let o=n[0];s<n.index&&r.push(t.slice(s,n.index)),o.length>0&&r.push(o),s=n.index+o.length}return s<t.length&&r.push(t.slice(s)),r},$v=t=>t.replace(/\p{M}/gu,""),Iv=(t,e,r=[])=>{if(!t||Array.isArray(t)||typeof t!="object")return`${e} must be a valid object`;for(let s of r)if(!(s in t))return`${e} must contain a "${s}" property`;return null},LS=t=>t.match(/\S+/g)||[],NS=class{constructor(){let t=function(...e){return t._call(...e)};return Object.setPrototypeOf(t,new.target.prototype)}},Xa=NS,$S=class extends 
Xa{constructor(t){super(),this.config=t}_call(t){return this.normalize(t)}},gr=$S,RS=class extends gr{tokenize_chinese_chars(t){let e=[];for(let r=0;r<t.length;++r){let s=t[r],n=s.charCodeAt(0);OS(n)?(e.push(" "),e.push(s),e.push(" ")):e.push(s)}return e.join("")}strip_accents(t){return t.normalize("NFD").replace(/\p{Mn}/gu,"")}is_control(t){switch(t){case" ":case`
|
|
2
2
|
`:case"\r":return!1;default:return/^\p{Cc}|\p{Cf}|\p{Co}|\p{Cs}$/u.test(t)}}clean_text(t){let e=[];for(let r of t){let s=r.charCodeAt(0);s===0||s===65533||this.is_control(r)||(/^\s$/.test(r)?e.push(" "):e.push(r))}return e.join("")}normalize(t){return this.config.clean_text&&(t=this.clean_text(t)),this.config.handle_chinese_chars&&(t=this.tokenize_chinese_chars(t)),this.config.lowercase?(t=t.toLowerCase(),this.config.strip_accents!==!1&&(t=this.strip_accents(t))):this.config.strip_accents&&(t=this.strip_accents(t)),t}},US=RS,BS=class extends gr{constructor(t){super(t),this.charsmap=t.precompiled_charsmap??null}normalize(t){return t=t.replace(/[\u0001-\u0008\u000B\u000E-\u001F\u007F\u008F\u009F]/gm,""),t=t.replace(/[\u0009\u000A\u000C\u000D\u00A0\u1680\u2000-\u200F\u2028\u2029\u202F\u205F\u2581\u3000\uFEFF\uFFFD]/gm," "),t.includes("\uFF5E")?t=t.split("\uFF5E").map(r=>r.normalize("NFKC")).join("\uFF5E"):t=t.normalize("NFKC"),t}},DS=BS,FS=class extends gr{constructor(t){super(t),this.normalizers=(t.normalizers??[]).map(e=>Rv(e))}normalize(t){return this.normalizers.reduce((e,r)=>r?r.normalize(e):e,t)}},jS=FS,GS=class extends gr{normalize(t){let e=ru(this.config.pattern??{});return e===null?t:t.replaceAll(e,this.config.content??"")}},qS=GS,WS=class extends gr{constructor(){super(...arguments),this.form="NFC"}normalize(t){return t=t.normalize(this.form),t}},su=WS,VS=class extends su{constructor(){super(...arguments),this.form="NFC"}},HS=VS,XS=class extends su{constructor(){super(...arguments),this.form="NFD"}},KS=XS,YS=class extends su{constructor(){super(...arguments),this.form="NFKC"}},QS=YS,JS=class extends su{constructor(){super(...arguments),this.form="NFKD"}},ZS=JS,eO=class extends gr{normalize(t){return this.config.strip_left&&this.config.strip_right?t=t.trim():(this.config.strip_left&&(t=t.trimStart()),this.config.strip_right&&(t=t.trimEnd())),t}},tO=eO,rO=class extends gr{normalize(t){return $v(t)}},sO=rO,nO=class extends gr{normalize(t){return 
t.toLowerCase()}},oO=nO,aO=class extends gr{normalize(t){return t=this.config.prepend+t,t}},iO=aO;function lO(t){if(t===null)return null;switch(t.type){case"BertNormalizer":return new US(t);case"Precompiled":return new DS(t);case"Sequence":return new jS(t);case"Replace":return new qS(t);case"NFC":return new HS(t);case"NFD":return new KS(t);case"NFKC":return new QS(t);case"NFKD":return new ZS(t);case"Strip":return new tO(t);case"StripAccents":return new sO(t);case"Lowercase":return new oO(t);case"Prepend":return new iO(t);default:throw new Error(`Unknown Normalizer type: ${t.type}`)}}var Rv=lO,cO=class extends Xa{pre_tokenize(t,e){return(Array.isArray(t)?t.map(r=>this.pre_tokenize_text(r,e)):this.pre_tokenize_text(t,e)).flat()}_call(t,e){return this.pre_tokenize(t,e)}},Xt=cO,uO=class extends Xt{constructor(t){super(),this.config=t,this.add_prefix_space=this.config.add_prefix_space??!1,this.trim_offsets=this.config.trim_offsets??!1,this.use_regex=this.config.use_regex??!0,this.pattern=/'s|'t|'re|'ve|'m|'ll|'d| ?\p{L}+| ?\p{N}+| ?[^\s\p{L}\p{N}]+|\s+(?!\S)|\s+/gu,this.byte_encoder=Nv,this.text_encoder=new TextEncoder}pre_tokenize_text(t,e){return this.add_prefix_space&&!t.startsWith(" ")&&(t=" "+t),(this.use_regex?t.match(this.pattern)||[]:[t]).map(s=>Array.from(this.text_encoder.encode(s),n=>this.byte_encoder[n]).join(""))}},pO=uO,dO=class extends Xt{pre_tokenize_text(t,e){return t.match(/\w+|[^\w\s]+/g)||[]}},fO=dO,mO=class extends Xt{constructor(t){super(),this.replacement=t.replacement??"\u2581",this.str_rep=t.str_rep||this.replacement,this.prepend_scheme=t.prepend_scheme??"always"}pre_tokenize_text(t,e){let{section_index:r=void 0}=e??{},s=t.replaceAll(" ",this.str_rep);return!s.startsWith(this.replacement)&&(this.prepend_scheme==="always"||this.prepend_scheme==="first"&&r===0)&&(s=this.str_rep+s),[s]}},hO=mO,_O=class extends Xt{constructor(t){super(),this.config=t,this.pattern=ru(this.config.pattern??{},this.config.invert??!0)}pre_tokenize_text(t){return 
this.pattern===null?[]:this.config.invert?t.match(this.pattern)||[]:this.config.behavior?.toLowerCase()==="removed"?t.split(this.pattern).filter(e=>e):zS(t,this.pattern)}},gO=_O,wO=class extends Xt{constructor(t){super(),this.config=t,this.pattern=new RegExp(`[^${tu}]+|[${tu}]+`,"gu")}pre_tokenize_text(t){return t.match(this.pattern)||[]}},xO=wO,yO=class extends Xt{constructor(t){super(),this.config=t;let e=`[^\\d]+|\\d${this.config.individual_digits?"":"+"}`;this.pattern=new RegExp(e,"gu")}pre_tokenize_text(t){return t.match(this.pattern)||[]}},bO=yO,vO=class extends Xt{constructor(){super(),this.pattern=new RegExp(`[^\\s${tu}]+|[${tu}]`,"gu")}pre_tokenize_text(t,e){return t.trim().match(this.pattern)||[]}},kO=vO,EO=class extends Xt{constructor(t){super(),this.config=t,this.pattern=ru(this.config.pattern??{}),this.content=this.config.content??""}pre_tokenize_text(t){return this.pattern===null?[t]:[t.replaceAll(this.pattern,this.config.content??"")]}},AO=EO,MO=class extends Xt{constructor(t){super(),this.tokenizers=(t.pretokenizers??[]).map(e=>Uv(e))}pre_tokenize_text(t,e){return this.tokenizers.reduce((r,s)=>s?s.pre_tokenize(r,e):r,[t])}},TO=MO,SO=class extends Xt{pre_tokenize_text(t){return LS(t)}},OO=SO,IO=class extends Xt{constructor(t){super(),this.config=t,this._length=t.length}pre_tokenize_text(t){let e=[];for(let r=0;r<t.length;r+=this._length)e.push(t.slice(r,r+this._length));return e}},CO=IO;function PO(t){if(t===null)return null;switch(t.type){case"BertPreTokenizer":return new kO;case"Sequence":return new TO(t);case"Whitespace":return new fO;case"WhitespaceSplit":return new OO;case"Metaspace":return new hO(t);case"ByteLevel":return new pO(t);case"Split":return new gO(t);case"Punctuation":return new xO(t);case"Digits":return new bO(t);case"Replace":return new AO(t);case"FixedLength":return new CO(t);default:throw new Error(`Unknown PreTokenizer type: ${t.type}`)}}var Uv=PO,zO=class extends 
Xa{constructor(t){super(),this.config=t,this.vocab=[],this.tokens_to_ids=new Map,this.unk_token_id=void 0,this.unk_token=void 0,this.end_of_word_suffix=void 0,this.fuse_unk=this.config.fuse_unk??!1}_call(t){let e=this.encode(t);return this.fuse_unk&&(e=SS(e,this.tokens_to_ids,this.unk_token_id)),e}},nu=zO,LO=class extends nu{constructor(t){super(t),this.max_input_chars_per_word=100,this.tokens_to_ids=Ay(t.vocab),this.unk_token_id=this.tokens_to_ids.get(t.unk_token),this.unk_token=t.unk_token,this.max_input_chars_per_word=t.max_input_chars_per_word??100,this.vocab=new Array(this.tokens_to_ids.size);for(let[e,r]of this.tokens_to_ids)this.vocab[r]=e}encode(t){let e=[];for(let r of t){let s=[...r];if(s.length>this.max_input_chars_per_word){e.push(this.unk_token);continue}let n=!1,o=0,a=[];for(;o<s.length;){let i=s.length,l=null;for(;o<i;){let u=s.slice(o,i).join("");if(o>0&&(u=this.config.continuing_subword_prefix+u),this.tokens_to_ids.has(u)){l=u;break}--i}if(l===null){n=!0;break}a.push(l),o=i}n?e.push(this.unk_token):e.push(...a)}return e}},Cv=LO,Pv=class Bv{constructor(e,r){this.is_leaf=e,this.children=r}static default(){return new Bv(!1,new Map)}},NO=class{constructor(){this.root=Pv.default()}extend(t){for(let e of t)this.push(e)}push(t){let e=this.root;for(let r of t){let s=e.children.get(r);s===void 0&&(s=Pv.default(),e.children.set(r,s)),e=s}e.is_leaf=!0}*common_prefix_search(t){let e=this.root;if(e===void 0)return;let r="";for(let s of t){if(r+=s,e=e.children.get(s),e===void 0)return;e.is_leaf&&(yield r)}}},$O=NO,ky=class Dv{constructor(e,r,s,n,o){this.token_id=e,this.node_id=r,this.pos=s,this.length=n,this.score=o,this.prev=null,this.backtrace_score=0}clone(){let e=new Dv(this.token_id,this.node_id,this.pos,this.length,this.score);return 
e.prev=this.prev,e.backtrace_score=this.backtrace_score,e}},RO=class{constructor(t,e,r){this.chars=Array.from(t),this.len=this.chars.length,this.bos_token_id=e,this.eos_token_id=r,this.nodes=[],this.begin_nodes=Array.from({length:this.len+1},()=>[]),this.end_nodes=Array.from({length:this.len+1},()=>[]);let s=new ky(this.bos_token_id??0,0,0,0,0),n=new ky(this.eos_token_id??0,1,this.len,0,0);this.nodes.push(s.clone()),this.nodes.push(n.clone()),this.begin_nodes[this.len].push(n),this.end_nodes[0].push(s)}insert(t,e,r,s){let n=this.nodes.length,o=new ky(s,n,t,e,r);this.begin_nodes[t].push(o),this.end_nodes[t+e].push(o),this.nodes.push(o)}viterbi(){let t=this.len,e=0;for(;e<=t;){if(this.begin_nodes[e].length==0)return[];for(let a of this.begin_nodes[e]){a.prev=null;let i=0,l=null;for(let u of this.end_nodes[e]){let d=u.backtrace_score+a.score;(l===null||d>i)&&(l=u.clone(),i=d)}if(l!==null)a.prev=l,a.backtrace_score=i;else return[]}++e}let r=[],n=this.begin_nodes[t][0].prev;if(n===null)return[];let o=n.clone();for(;o.prev!==null;)r.push(o.clone()),o=o.clone().prev.clone();return r.reverse(),r}piece(t){return this.chars.slice(t.pos,t.pos+t.length).join("")}tokens(){return this.viterbi().map(e=>this.piece(e))}token_ids(){return this.viterbi().map(e=>e.token_id)}},UO=RO;function BO(t){if(t.length===0)throw new Error("Array must not be empty");let e=t[0],r=0;for(let s=1;s<t.length;++s)t[s]<e&&(e=t[s],r=s);return[e,r]}var DO=class extends nu{constructor(t,e){super(t);let r=t.vocab.length;this.vocab=new Array(r),this.scores=new Array(r);for(let s=0;s<r;++s)[this.vocab[s],this.scores[s]]=t.vocab[s];this.unk_token_id=t.unk_id,this.unk_token=this.vocab[t.unk_id],this.tokens_to_ids=new Map(this.vocab.map((s,n)=>[s,n])),this.bos_token=" 
",this.bos_token_id=this.tokens_to_ids.get(this.bos_token),this.eos_token=e,this.eos_token_id=this.tokens_to_ids.get(this.eos_token),this.unk_token=this.vocab[this.unk_token_id],this.min_score=BO(this.scores)[0],this.unk_score=this.min_score-10,this.scores[this.unk_token_id]=this.unk_score,this.trie=new $O,this.trie.extend(this.vocab),this.fuse_unk=!0}populate_nodes(t){let e=t.chars,r=1,s=0;for(;s<e.length;){let n=!1,o=[],a=e.slice(s).join(""),i=this.trie.common_prefix_search(a);for(let l of i){o.push(l);let u=this.tokens_to_ids.get(l),d=this.scores[u],f=CS(l);t.insert(s,f,d,u),!n&&f===r&&(n=!0)}n||t.insert(s,r,this.unk_score,this.unk_token_id),s+=r}}tokenize(t){let e=new UO(t,this.bos_token_id,this.eos_token_id);return this.populate_nodes(e),e.tokens()}encode(t){let e=[];for(let r of t){let s=this.tokenize(r);e.push(...s)}return e}},zv=DO,FO=class{constructor(t=(r,s)=>r>s,e=1/0){this._heap=[],this._comparator=t,this._max_size=e}get size(){return this._heap.length}is_empty(){return this.size===0}peek(){return this._heap[0]}push(...t){return this.extend(t)}extend(t){for(let e of t)if(this.size<this._max_size)this._heap.push(e),this._sift_up();else{let r=this._smallest();this._comparator(e,this._heap[r])&&(this._heap[r]=e,this._sift_up_from(r))}return this.size}pop(){let t=this.peek(),e=this.size-1;return e>0&&this._swap(0,e),this._heap.pop(),this._sift_down(),t}replace(t){let e=this.peek();return this._heap[0]=t,this._sift_down(),e}_parent(t){return(t+1>>>1)-1}_left(t){return(t<<1)+1}_right(t){return t+1<<1}_greater(t,e){return this._comparator(this._heap[t],this._heap[e])}_swap(t,e){let r=this._heap[t];this._heap[t]=this._heap[e],this._heap[e]=r}_sift_up(){this._sift_up_from(this.size-1)}_sift_up_from(t){for(;t>0&&this._greater(t,this._parent(t));)this._swap(t,this._parent(t)),t=this._parent(t)}_sift_down(){let t=0;for(;this._left(t)<this.size&&this._greater(this._left(t),t)||this._right(t)<this.size&&this._greater(this._right(t),t);){let 
e=this._right(t)<this.size&&this._greater(this._right(t),this._left(t))?this._right(t):this._left(t);this._swap(t,e),t=e}}_smallest(){return 2**Math.floor(Math.log2(this.size))-1}},jO=FO,GO=class{constructor(t){this.capacity=t,this.cache=new Map}get(t){if(!this.cache.has(t))return;let e=this.cache.get(t);return this.cache.delete(t),this.cache.set(t,e),e}put(t,e){this.cache.has(t)&&this.cache.delete(t),this.cache.set(t,e),this.cache.size>this.capacity&&this.cache.delete(this.cache.keys().next().value)}clear(){this.cache.clear()}},qO=GO,WO=class extends nu{constructor(t){super(t),this.tokens_to_ids=Ay(t.vocab),this.unk_token_id=this.tokens_to_ids.get(t.unk_token),this.unk_token=t.unk_token,this.vocab=new Array(this.tokens_to_ids.size);for(let[r,s]of this.tokens_to_ids)this.vocab[s]=r;let e=Array.isArray(t.merges[0]);this.merges=e?t.merges:t.merges.map(r=>r.split(" ",2)),this.bpe_ranks=new Map(this.merges.map((r,s)=>[JSON.stringify(r),s])),this.end_of_word_suffix=t.end_of_word_suffix,this.continuing_subword_suffix=t.continuing_subword_suffix??null,this.byte_fallback=this.config.byte_fallback??!1,this.byte_fallback&&(this.text_encoder=new TextEncoder),this.ignore_merges=this.config.ignore_merges??!1,this.max_length_to_cache=256,this.cache_capacity=1e4,this.cache=new qO(this.cache_capacity)}clear_cache(){this.cache.clear()}bpe(t){if(t.length===0)return[];let e=this.cache.get(t);if(e!==void 0)return e;let r=Array.from(t);this.end_of_word_suffix&&(r[r.length-1]+=this.end_of_word_suffix);let s=[];if(r.length>1){let n=new jO((i,l)=>i.score<l.score),o={token:r[0],bias:0,prev:null,next:null},a=o;for(let i=1;i<r.length;++i){let l={bias:i/r.length,token:r[i],prev:a,next:null};a.next=l,this.add_node(n,a),a=l}for(;!n.is_empty();){let i=n.pop();if(i.deleted||!i.next||i.next.deleted)continue;if(i.deleted=!0,i.next.deleted=!0,i.prev){let u={...i.prev};i.prev.deleted=!0,i.prev=u,u.prev?u.prev.next=u:o=u}let 
l={token:i.token+i.next.token,bias:i.bias,prev:i.prev,next:i.next.next};l.prev?(l.prev.next=l,this.add_node(n,l.prev)):o=l,l.next&&(l.next.prev=l,this.add_node(n,l))}for(let i=o;i!==null;i=i.next)s.push(i.token)}else s=r;if(this.continuing_subword_suffix)for(let n=0;n<s.length-1;++n)s[n]+=this.continuing_subword_suffix;return t.length<this.max_length_to_cache&&this.cache.put(t,s),s}add_node(t,e){let r=this.bpe_ranks.get(JSON.stringify([e.token,e.next.token]));r!==void 0&&(e.score=r+e.bias,t.push(e))}encode(t){let e=[];for(let r of t){if(this.ignore_merges&&this.tokens_to_ids.has(r)){e.push(r);continue}let s=this.bpe(r);for(let n of s)if(this.tokens_to_ids.has(n))e.push(n);else if(this.byte_fallback){let o=Array.from(this.text_encoder.encode(n)).map(a=>`<0x${a.toString(16).toUpperCase().padStart(2,"0")}>`);o.every(a=>this.tokens_to_ids.has(a))?e.push(...o):e.push(this.unk_token)}else e.push(this.unk_token)}return e}},Lv=WO,VO=class extends nu{constructor(t,e){super(t);let r=t.vocab;this.tokens_to_ids=Ay(e.target_lang?r[e.target_lang]:r),this.bos_token=e.bos_token,this.bos_token_id=this.tokens_to_ids.get(this.bos_token),this.eos_token=e.eos_token,this.eos_token_id=this.tokens_to_ids.get(this.eos_token),this.pad_token=e.pad_token,this.pad_token_id=this.tokens_to_ids.get(this.pad_token),this.unk_token=e.unk_token,this.unk_token_id=this.tokens_to_ids.get(this.unk_token),this.vocab=new Array(this.tokens_to_ids.size);for(let[s,n]of this.tokens_to_ids)this.vocab[n]=s}encode(t){return t}},HO=VO;function XO(t,e){switch(t.type){case"WordPiece":return new Cv(t);case"Unigram":return new zv(t,e.eos_token);case"BPE":return new Lv(t);default:if(t.vocab)return Array.isArray(t.vocab)?new zv(t,e.eos_token):Object.hasOwn(t,"continuing_subword_prefix")&&Object.hasOwn(t,"unk_token")?Object.hasOwn(t,"merges")?new Lv(t):new Cv(t):new HO(t,{target_lang:e.target_lang,bos_token:e.bos_token,eos_token:e.eos_token,pad_token:e.pad_token,unk_token:e.unk_token});throw new Error(`Unknown 
TokenizerModel type: ${t?.type}`)}}var KO=XO,YO=class extends Xa{constructor(t){super(),this.config=t}_call(t,...e){return this.post_process(t,...e)}},Ka=YO,QO=class extends Ka{post_process(t,e=null,r=!0){let s=e===null?this.config.single:this.config.pair,n=[],o=[];for(let a of s)"SpecialToken"in a?r&&(n.push(a.SpecialToken.id),o.push(a.SpecialToken.type_id)):"Sequence"in a&&(a.Sequence.id==="A"?(n=Ht(n,t),o=Ht(o,new Array(t.length).fill(a.Sequence.type_id))):a.Sequence.id==="B"&&(n=Ht(n,e),o=Ht(o,new Array(e.length).fill(a.Sequence.type_id))));return{tokens:n,token_type_ids:o}}},JO=QO,ZO=class extends Ka{post_process(t,e=null){return{tokens:t,tokens_pair:e}}},eI=ZO,tI=class extends Ka{constructor(t){super(t),this.sep=t.sep,this.cls=t.cls}post_process(t,e=null,r=!0){r&&(t=Ht([this.cls[0]],t,[this.sep[0]]));let s=new Array(t.length).fill(0);if(e){let n=[],o=r?[this.sep[0]]:[];t=Ht(t,n,e,o),s=Ht(s,new Array(e.length+n.length+o.length).fill(1))}return{tokens:t,token_type_ids:s}}},rI=tI,sI=class extends Ka{constructor(t){super(t),this.sep=t.sep,this.cls=t.cls}post_process(t,e,r=!0){r&&(t=Ht([this.cls[0]],t,[this.sep[0]]));let s=new Array(t.length).fill(0);if(e){let n=r?[this.sep[0]]:[],o=r?[this.sep[0]]:[];t=Ht(t,n,e,o),s=Ht(s,new Array(e.length+n.length+o.length).fill(1))}return{tokens:t,token_type_ids:s}}},nI=sI,oI=class extends Ka{constructor(t){super(t),this.processors=(t.processors??[]).map(e=>Fv(e))}post_process(t,e=null,r=!0){let s={tokens:t,tokens_pair:e};for(let n of this.processors)s=n.post_process(s.tokens,s.tokens_pair,r);return s}},aI=oI;function iI(t){if(t===null)return null;switch(t.type){case"TemplateProcessing":return new JO(t);case"ByteLevel":return new eI(t);case"BertProcessing":return new rI(t);case"RobertaProcessing":return new nI(t);case"Sequence":return new aI(t);default:throw new Error(`Unknown PostProcessor type: ${t.type}`)}}var Fv=iI,lI=class extends 
Xa{constructor(t){super(),this.config=t,this.added_tokens=[],this.end_of_word_suffix=null,this.trim_offsets="trim_offsets"in t?t.trim_offsets:!1}_call(t){return this.decode(t)}decode(t){return this.decode_chain(t).join("")}},Bt=lI,cI=class extends Bt{constructor(t){super(t),this.byte_decoder=AS,this.text_decoder=new TextDecoder("utf-8",{fatal:!1,ignoreBOM:!0}),this.end_of_word_suffix=null}convert_tokens_to_string(t){let e=t.join(""),r=new Uint8Array([...e].map(s=>this.byte_decoder[s]));return this.text_decoder.decode(r)}decode_chain(t){let e=[],r=[];for(let s of t)this.added_tokens.find(n=>n.content===s)!==void 0?(r.length>0&&(e.push(this.convert_tokens_to_string(r)),r=[]),e.push(s)):r.push(s);return r.length>0&&e.push(this.convert_tokens_to_string(r)),e}},uI=cI,pI=class extends Bt{constructor(t){super(t),this.cleanup=t.cleanup}decode_chain(t){return t.map((e,r)=>{if(r!==0){let s=this.config.prefix;s&&e.startsWith(s)?e=e.replace(s,""):e=" "+e}return this.cleanup&&(e=Ey(e)),e})}},dI=pI,fI=class extends Bt{constructor(t){super(t),this.replacement=t.replacement??"\u2581"}decode_chain(t){let e=[];for(let r=0;r<t.length;++r){let s=t[r].replaceAll(this.replacement," ");r==0&&s.startsWith(" ")&&(s=s.substring(1)),e.push(s)}return e}},mI=fI,hI=class extends Bt{constructor(t){super(t),this.suffix=t.suffix??""}decode_chain(t){return t.map((e,r)=>e.replaceAll(this.suffix,r===t.length-1?"":" "))}},_I=hI,gI=class extends Bt{constructor(t){super(t),this.pad_token=t.pad_token??"",this.word_delimiter_token=t.word_delimiter_token??"",this.cleanup=t.cleanup}convert_tokens_to_string(t){if(t.length===0)return"";let e=[t[0]];for(let n=1;n<t.length;++n)t[n]!==e.at(-1)&&e.push(t[n]);let s=e.filter(n=>n!==this.pad_token).join("");return this.cleanup&&(s=Ey(s).replaceAll(this.word_delimiter_token," ").trim()),s}decode_chain(t){return[this.convert_tokens_to_string(t)]}},wI=gI,xI=class extends Bt{constructor(t){super(t),this.decoders=(t.decoders??[]).map(e=>jv(e))}decode_chain(t){return 
this.decoders.reduce((e,r)=>r.decode_chain(e),t)}},yI=xI,bI=class extends Bt{decode_chain(t){let e=ru(this.config.pattern),r=this.config.content??"";return e===null?t:t.map(s=>s.replaceAll(e,r))}},vI=bI,kI=class extends Bt{decode_chain(t){return[t.join("")]}},EI=kI,AI=class extends Bt{constructor(t){super(t),this.content=t.content??"",this.start=t.start??0,this.stop=t.stop??0}decode_chain(t){return t.map(e=>{let r=0;for(let n=0;n<this.start&&e[n]===this.content;++n){r=n+1;continue}let s=e.length;for(let n=0;n<this.stop;++n){let o=e.length-n-1;if(e[o]===this.content){s=o;continue}else break}return e.slice(r,s)})}},MI=AI,TI=class extends Bt{constructor(t){super(t),this.text_decoder=new TextDecoder}decode_chain(t){let e=[],r=[];for(let s of t){let n=null;if(s.length===6&&s.startsWith("<0x")&&s.endsWith(">")){let o=parseInt(s.slice(3,5),16);isNaN(o)||(n=o)}if(n!==null)r.push(n);else{if(r.length>0){let o=this.text_decoder.decode(Uint8Array.from(r));e.push(o),r=[]}e.push(s)}}if(r.length>0){let s=this.text_decoder.decode(Uint8Array.from(r));e.push(s),r=[]}return e}},SI=TI;function OI(t){if(t===null)return null;switch(t.type){case"ByteLevel":return new uI(t);case"WordPiece":return new dI(t);case"Metaspace":return new mI(t);case"BPEDecoder":return new _I(t);case"CTC":return new wI(t);case"Sequence":return new yI(t);case"Replace":return new vI(t);case"Fuse":return new EI(t);case"Strip":return new MI(t);case"ByteFallback":return new SI(t);default:throw new Error(`Unknown Decoder type: ${t.type}`)}}var jv=OI,II=class{constructor(t,e){let r=Iv(t,"Tokenizer",["model","decoder","post_processor","pre_tokenizer","normalizer"]);if(r)throw new Error(r);let s=Iv(e,"Config");if(s)throw new 
Error(s);this.tokenizer=t,this.config=e,this.normalizer=Rv(this.tokenizer.normalizer),this.pre_tokenizer=Uv(this.tokenizer.pre_tokenizer),this.model=KO(this.tokenizer.model,this.config),this.post_processor=Fv(this.tokenizer.post_processor),this.decoder=jv(this.tokenizer.decoder),this.special_tokens=[],this.all_special_ids=[],this.added_tokens=[];let n=[],o=[];this.added_tokens_map=new Map;for(let a of this.tokenizer.added_tokens){let i=new kS(a);if(this.added_tokens.push(i),this.model.tokens_to_ids.set(i.content,i.id),this.model.vocab[i.id]=i.content,i.special&&(this.special_tokens.push(i.content),this.all_special_ids.push(i.id)),this.added_tokens_map.set(i.content,i),i.normalized&&this.normalizer!==null){let l=this.normalizer(i.content);o.push(l),this.added_tokens_map.set(l,i)}else n.push(i.content)}(this.config.additional_special_tokens??[]).forEach(a=>{this.special_tokens.includes(a)||this.special_tokens.push(a)}),this.decoder&&(this.decoder.added_tokens=this.added_tokens,this.decoder.end_of_word_suffix=this.model.end_of_word_suffix),this.splitter_unnormalized=new Sv(n),this.splitter_normalized=new Sv(o),this.remove_space=this.config.remove_space,this.clean_up_tokenization_spaces=this.config.clean_up_tokenization_spaces??!0,this.do_lowercase_and_remove_accent=this.config.do_lowercase_and_remove_accent??!1}encode(t,{text_pair:e=null,add_special_tokens:r=!0,return_token_type_ids:s=null}={}){let{tokens:n,token_type_ids:o}=this.tokenize_helper(t,{text_pair:e,add_special_tokens:r}),a=n.map(l=>this.added_tokens_map.get(l)?.id??this.model.tokens_to_ids.get(l)??this.model.unk_token_id),i={ids:a,tokens:n,attention_mask:new Array(a.length).fill(1)};return s&&o&&(i.token_type_ids=o),i}decode(t,e={}){if(!Array.isArray(t)||t.length===0||!IS(t[0]))throw Error("token_ids must be a non-empty array of integers.");let r=t.map(n=>this.model.vocab[Number(n)]??this.model.unk_token);e.skip_special_tokens&&(r=r.filter(n=>!this.special_tokens.includes(n)));let 
s=this.decoder?this.decoder(r):r.join(" ");return this.decoder&&this.decoder.end_of_word_suffix&&(s=s.replaceAll(this.decoder.end_of_word_suffix," "),e.skip_special_tokens&&(s=s.trim())),(e.clean_up_tokenization_spaces??this.clean_up_tokenization_spaces)&&(s=Ey(s)),s}tokenize(t,{text_pair:e=null,add_special_tokens:r=!1}={}){return this.tokenize_helper(t,{text_pair:e,add_special_tokens:r}).tokens}encode_text(t){if(t===null)return null;let e=this.splitter_unnormalized.split(t);return e.forEach((r,s)=>{let n=this.added_tokens_map.get(r);n&&(n.lstrip&&s>0&&(e[s-1]=e[s-1].trimEnd()),n.rstrip&&s<e.length-1&&(e[s+1]=e[s+1].trimStart()))}),e.flatMap((r,s)=>{if(r.length===0)return[];if(this.added_tokens_map.has(r))return[r];if(this.remove_space===!0&&(r=r.trim().split(/\s+/).join(" ")),this.do_lowercase_and_remove_accent&&(r=PS(r)),this.normalizer!==null&&(r=this.normalizer(r)),r.length===0)return[];let n=this.splitter_normalized.split(r);return n.forEach((o,a)=>{let i=this.added_tokens_map.get(o);i&&(i.lstrip&&a>0&&(n[a-1]=n[a-1].trimEnd()),i.rstrip&&a<n.length-1&&(n[a+1]=n[a+1].trimStart()))}),n.flatMap(o=>{if(o.length===0)return[];if(this.added_tokens_map.has(o))return[o];let a=this.pre_tokenizer!==null?this.pre_tokenizer(o,{section_index:s}):[o];return this.model(a)})})}tokenize_helper(t,{text_pair:e=null,add_special_tokens:r=!0}){let s=this.encode_text(t),n=this.encode_text(e||null);return this.post_processor?this.post_processor(s,n,r):{tokens:Ht(s??[],n??[])}}token_to_id(t){return this.model.tokens_to_ids.get(t)}id_to_token(t){return this.model.vocab[t]}get_added_tokens_decoder(){let t=new Map;for(let e of this.added_tokens)t.set(e.id,e);return t}get_vocab(t=!0){let e=new Map;for(let r=0;r<this.model.vocab.length;++r){let s=this.model.vocab[r];(t||!this.added_tokens_map.has(s))&&e.set(s,r)}return e}},Gv=II;var 
$=Object.freeze({Text:"Text",NumericLiteral:"NumericLiteral",StringLiteral:"StringLiteral",Identifier:"Identifier",Equals:"Equals",OpenParen:"OpenParen",CloseParen:"CloseParen",OpenStatement:"OpenStatement",CloseStatement:"CloseStatement",OpenExpression:"OpenExpression",CloseExpression:"CloseExpression",OpenSquareBracket:"OpenSquareBracket",CloseSquareBracket:"CloseSquareBracket",OpenCurlyBracket:"OpenCurlyBracket",CloseCurlyBracket:"CloseCurlyBracket",Comma:"Comma",Dot:"Dot",Colon:"Colon",Pipe:"Pipe",CallOperator:"CallOperator",AdditiveBinaryOperator:"AdditiveBinaryOperator",MultiplicativeBinaryOperator:"MultiplicativeBinaryOperator",ComparisonBinaryOperator:"ComparisonBinaryOperator",UnaryOperator:"UnaryOperator",Comment:"Comment"}),Dt=class{constructor(t,e){this.value=t,this.type=e}};function qv(t){return/\w/.test(t)}function Ya(t){return/[0-9]/.test(t)}function Wv(t){return/\s/.test(t)}var CI=[["{%",$.OpenStatement],["%}",$.CloseStatement],["{{",$.OpenExpression],["}}",$.CloseExpression],["(",$.OpenParen],[")",$.CloseParen],["{",$.OpenCurlyBracket],["}",$.CloseCurlyBracket],["[",$.OpenSquareBracket],["]",$.CloseSquareBracket],[",",$.Comma],[".",$.Dot],[":",$.Colon],["|",$.Pipe],["<=",$.ComparisonBinaryOperator],[">=",$.ComparisonBinaryOperator],["==",$.ComparisonBinaryOperator],["!=",$.ComparisonBinaryOperator],["<",$.ComparisonBinaryOperator],[">",$.ComparisonBinaryOperator],["+",$.AdditiveBinaryOperator],["-",$.AdditiveBinaryOperator],["~",$.AdditiveBinaryOperator],["*",$.MultiplicativeBinaryOperator],["/",$.MultiplicativeBinaryOperator],["%",$.MultiplicativeBinaryOperator],["=",$.Equals]],PI=new Map([["n",`
|
|
3
3
|
`],["t"," "],["r","\r"],["b","\b"],["f","\f"],["v","\v"],["'","'"],['"','"'],["\\","\\"]]);function zI(t,e={}){return t.endsWith(`
|
|
4
4
|
`)&&(t=t.slice(0,-1)),e.lstrip_blocks&&(t=t.replace(/^[ \t]*({[#%-])/gm,"$1")),e.trim_blocks&&(t=t.replace(/([#%-]})\n/g,"$1")),t.replace(/{%\s*(end)?generation\s*%}/gs,"")}function LI(t,e={}){let r=[],s=zI(t,e),n=0,o=0,a=u=>{let d="";for(;u(s[n]);){if(s[n]==="\\"){if(++n,n>=s.length)throw new SyntaxError("Unexpected end of input");let f=s[n++],m=PI.get(f);if(m===void 0)throw new SyntaxError(`Unexpected escaped character: ${f}`);d+=m;continue}if(d+=s[n++],n>=s.length)throw new SyntaxError("Unexpected end of input")}return d},i=()=>{let u=r.at(-1);u&&u.type===$.Text&&(u.value=u.value.trimEnd(),u.value===""&&r.pop())},l=()=>{for(;n<s.length&&Wv(s[n]);)++n};e:for(;n<s.length;){let u=r.at(-1)?.type;if(u===void 0||u===$.CloseStatement||u===$.CloseExpression||u===$.Comment){let f="";for(;n<s.length&&!(s[n]==="{"&&(s[n+1]==="%"||s[n+1]==="{"||s[n+1]==="#"));)f+=s[n++];if(f.length>0){r.push(new Dt(f,$.Text));continue}}if(s[n]==="{"&&s[n+1]==="#"){n+=2;let f=s[n]==="-";f&&++n;let m="";for(;s[n]!=="#"||s[n+1]!=="}";){if(n+2>=s.length)throw new SyntaxError("Missing end of comment tag");m+=s[n++]}let _=m.endsWith("-");_&&(m=m.slice(0,-1)),f&&i(),r.push(new Dt(m,$.Comment)),n+=2,_&&l();continue}if(s.slice(n,n+3)==="{%-"){i(),r.push(new Dt("{%",$.OpenStatement)),n+=3;continue}if(s.slice(n,n+3)==="{{-"){i(),r.push(new Dt("{{",$.OpenExpression)),o=0,n+=3;continue}if(a(Wv),s.slice(n,n+3)==="-%}"){r.push(new Dt("%}",$.CloseStatement)),n+=3,l();continue}if(s.slice(n,n+3)==="-}}"){r.push(new Dt("}}",$.CloseExpression)),n+=3,l();continue}let d=s[n];if(d==="-"||d==="+"){let f=r.at(-1)?.type;if(f===$.Text||f===void 0)throw new SyntaxError(`Unexpected character: ${d}`);switch(f){case $.Identifier:case $.NumericLiteral:case $.StringLiteral:case $.CloseParen:case $.CloseSquareBracket:break;default:{++n;let m=a(Ya);r.push(new Dt(`${d}${m}`,m.length>0?$.NumericLiteral:$.UnaryOperator));continue}}}for(let[f,m]of CI){if(f==="}}"&&o>0)continue;if(s.slice(n,n+f.length)===f){r.push(new 
Dt(f,m)),m===$.OpenExpression?o=0:m===$.OpenCurlyBracket?++o:m===$.CloseCurlyBracket&&--o,n+=f.length;continue e}}if(d==="'"||d==='"'){++n;let f=a(m=>m!==d);r.push(new Dt(f,$.StringLiteral)),++n;continue}if(Ya(d)){let f=a(Ya);if(s[n]==="."&&Ya(s[n+1])){++n;let m=a(Ya);f=`${f}.${m}`}r.push(new Dt(f,$.NumericLiteral));continue}if(qv(d)){let f=a(qv);r.push(new Dt(f,$.Identifier));continue}throw new SyntaxError(`Unexpected character: ${d}`)}return r}var Yt=class{type="Statement"},NI=class extends Yt{constructor(t){super(),this.body=t}type="Program"},$I=class extends Yt{constructor(t,e,r){super(),this.test=t,this.body=e,this.alternate=r}type="If"},RI=class extends Yt{constructor(t,e,r,s){super(),this.loopvar=t,this.iterable=e,this.body=r,this.defaultBlock=s}type="For"},UI=class extends Yt{type="Break"},BI=class extends Yt{type="Continue"},DI=class extends Yt{constructor(t,e,r){super(),this.assignee=t,this.value=e,this.body=r}type="Set"},FI=class extends Yt{constructor(t,e,r){super(),this.name=t,this.args=e,this.body=r}type="Macro"},jI=class extends Yt{constructor(t){super(),this.value=t}type="Comment"},St=class extends Yt{type="Expression"},GI=class extends St{constructor(t,e,r){super(),this.object=t,this.property=e,this.computed=r}type="MemberExpression"},Vv=class extends St{constructor(t,e){super(),this.callee=t,this.args=e}type="CallExpression"},ln=class extends St{constructor(t){super(),this.value=t}type="Identifier"},cn=class extends St{constructor(t){super(),this.value=t}type="Literal"},qI=class extends cn{type="IntegerLiteral"},WI=class extends cn{type="FloatLiteral"},Hv=class extends cn{type="StringLiteral"},VI=class extends cn{type="ArrayLiteral"},Xv=class extends cn{type="TupleLiteral"},HI=class extends cn{type="ObjectLiteral"},Qa=class extends St{constructor(t,e,r){super(),this.operator=t,this.left=e,this.right=r}type="BinaryExpression"},XI=class extends St{constructor(t,e){super(),this.operand=t,this.filter=e}type="FilterExpression"},KI=class extends 
Yt{constructor(t,e){super(),this.filter=t,this.body=e}type="FilterStatement"},YI=class extends St{constructor(t,e){super(),this.lhs=t,this.test=e}type="SelectExpression"},QI=class extends St{constructor(t,e,r){super(),this.operand=t,this.negate=e,this.test=r}type="TestExpression"},JI=class extends St{constructor(t,e){super(),this.operator=t,this.argument=e}type="UnaryExpression"},ZI=class extends St{constructor(t=void 0,e=void 0,r=void 0){super(),this.start=t,this.stop=e,this.step=r}type="SliceExpression"},eC=class extends St{constructor(t,e){super(),this.key=t,this.value=e}type="KeywordArgumentExpression"},tC=class extends St{constructor(t){super(),this.argument=t}type="SpreadExpression"},rC=class extends Yt{constructor(t,e,r){super(),this.call=t,this.callerArgs=e,this.body=r}type="CallStatement"},sC=class extends St{constructor(t,e,r){super(),this.condition=t,this.trueExpr=e,this.falseExpr=r}type="Ternary"};function nC(t){let e=new NI([]),r=0;function s(S,L){let R=t[r++];if(!R||R.type!==S)throw new Error(`Parser Error: ${L}. 
${R.type} !== ${S}.`);return R}function n(S){if(!l(S))throw new SyntaxError(`Expected ${S}`);++r}function o(){switch(t[r].type){case $.Comment:return new jI(t[r++].value);case $.Text:return u();case $.OpenStatement:return d();case $.OpenExpression:return f();default:throw new SyntaxError(`Unexpected token type: ${t[r].type}`)}}function a(...S){return r+S.length<=t.length&&S.every((L,R)=>L===t[r+R].type)}function i(...S){return t[r]?.type===$.OpenStatement&&t[r+1]?.type===$.Identifier&&S.includes(t[r+1]?.value)}function l(...S){return r+S.length<=t.length&&S.every((L,R)=>t[r+R].type==="Identifier"&&L===t[r+R].value)}function u(){return new Hv(s($.Text,"Expected text token").value)}function d(){if(s($.OpenStatement,"Expected opening statement token"),t[r].type!==$.Identifier)throw new SyntaxError(`Unknown statement, got ${t[r].type}`);let S=t[r].value,L;switch(S){case"set":++r,L=m();break;case"if":++r,L=_(),s($.OpenStatement,"Expected {% token"),n("endif"),s($.CloseStatement,"Expected %} token");break;case"macro":++r,L=w(),s($.OpenStatement,"Expected {% token"),n("endmacro"),s($.CloseStatement,"Expected %} token");break;case"for":++r,L=k(),s($.OpenStatement,"Expected {% token"),n("endfor"),s($.CloseStatement,"Expected %} token");break;case"call":{++r;let R=null;a($.OpenParen)&&(R=V());let te=ie();if(te.type!=="Identifier")throw new SyntaxError("Expected identifier following call statement");let ue=V();s($.CloseStatement,"Expected closing statement token");let Be=[];for(;!i("endcall");)Be.push(o());s($.OpenStatement,"Expected '{%'"),n("endcall"),s($.CloseStatement,"Expected closing statement token");let Pe=new Vv(te,ue);L=new rC(Pe,R,Be);break}case"break":++r,s($.CloseStatement,"Expected closing statement token"),L=new UI;break;case"continue":++r,s($.CloseStatement,"Expected closing statement token"),L=new BI;break;case"filter":{++r;let R=ie();R instanceof ln&&a($.OpenParen)&&(R=X(R)),s($.CloseStatement,"Expected closing statement token");let 
te=[];for(;!i("endfilter");)te.push(o());s($.OpenStatement,"Expected '{%'"),n("endfilter"),s($.CloseStatement,"Expected '%}'"),L=new KI(R,te);break}default:throw new SyntaxError(`Unknown statement type: ${S}`)}return L}function f(){s($.OpenExpression,"Expected opening expression token");let S=E();return s($.CloseExpression,"Expected closing expression token"),S}function m(){let S=x(),L=null,R=[];if(a($.Equals))++r,L=x();else{for(s($.CloseStatement,"Expected %} token");!i("endset");)R.push(o());s($.OpenStatement,"Expected {% token"),n("endset")}return s($.CloseStatement,"Expected closing statement token"),new DI(S,L,R)}function _(){let S=E();s($.CloseStatement,"Expected closing statement token");let L=[],R=[];for(;!i("elif","else","endif");)L.push(o());if(i("elif")){++r,++r;let te=_();R.push(te)}else if(i("else"))for(++r,++r,s($.CloseStatement,"Expected closing statement token");!i("endif");)R.push(o());return new $I(S,L,R)}function w(){let S=ie();if(S.type!=="Identifier")throw new SyntaxError("Expected identifier following macro statement");let L=V();s($.CloseStatement,"Expected closing statement token");let R=[];for(;!i("endmacro");)R.push(o());return new FI(S,L,R)}function x(S=!1){let L=S?ie:E,R=[L()],te=a($.Comma);for(;te&&(++r,R.push(L()),!!a($.Comma)););return te?new Xv(R):R[0]}function k(){let S=x(!0);if(!(S instanceof ln||S instanceof Xv))throw new SyntaxError(`Expected identifier/tuple for the loop variable, got ${S.type} instead`);if(!l("in"))throw new SyntaxError("Expected `in` keyword following loop variable");++r;let L=E();s($.CloseStatement,"Expected closing statement token");let R=[];for(;!i("endfor","else");)R.push(o());let te=[];if(i("else"))for(++r,++r,s($.CloseStatement,"Expected closing statement token");!i("endfor");)te.push(o());return new RI(S,L,R,te)}function E(){return M()}function M(){let S=I();if(l("if")){++r;let L=I();if(l("else")){++r;let R=M();return new sC(L,S,R)}else return new YI(S,L)}return S}function I(){let 
S=T();for(;l("or");){let L=t[r];++r;let R=T();S=new Qa(L,S,R)}return S}function T(){let S=z();for(;l("and");){let L=t[r];++r;let R=z();S=new Qa(L,S,R)}return S}function z(){let S;for(;l("not");){let L=t[r];++r;let R=z();S=new JI(L,R)}return S??C()}function C(){let S=v();for(;;){let L;if(l("not","in"))L=new Dt("not in",$.Identifier),r+=2;else if(l("in"))L=t[r++];else if(a($.ComparisonBinaryOperator))L=t[r++];else break;let R=v();S=new Qa(L,S,R)}return S}function v(){let S=B();for(;a($.AdditiveBinaryOperator);){let L=t[r];++r;let R=B();S=new Qa(L,S,R)}return S}function G(){let S=Y(ie());return a($.OpenParen)?X(S):S}function X(S){let L=new Vv(S,V());return L=Y(L),a($.OpenParen)&&(L=X(L)),L}function V(){s($.OpenParen,"Expected opening parenthesis for arguments list");let S=Q();return s($.CloseParen,"Expected closing parenthesis for arguments list"),S}function Q(){let S=[];for(;!a($.CloseParen);){let L;if(t[r].type===$.MultiplicativeBinaryOperator&&t[r].value==="*"){++r;let R=E();L=new tC(R)}else if(L=E(),a($.Equals)){if(++r,!(L instanceof ln))throw new SyntaxError("Expected identifier for keyword argument");let R=E();L=new eC(L,R)}S.push(L),a($.Comma)&&++r}return S}function K(){let S=[],L=!1;for(;!a($.CloseSquareBracket);)a($.Colon)?(S.push(void 0),++r,L=!0):(S.push(E()),a($.Colon)&&(++r,L=!0));if(S.length===0)throw new SyntaxError("Expected at least one argument for member/slice expression");if(L){if(S.length>3)throw new SyntaxError("Expected 0-3 arguments for slice expression");return new ZI(...S)}return S[0]}function Y(S){for(;a($.Dot)||a($.OpenSquareBracket);){let L=t[r];++r;let R,te=L.type===$.OpenSquareBracket;if(te)R=K(),s($.CloseSquareBracket,"Expected closing square bracket");else if(R=ie(),R.type!=="Identifier")throw new SyntaxError("Expected identifier following dot operator");S=new GI(S,R,te)}return S}function B(){let S=P();for(;a($.MultiplicativeBinaryOperator);){let L=t[r++],R=P();S=new Qa(L,S,R)}return S}function P(){let S=se();for(;l("is");){++r;let 
L=l("not");L&&++r;let R=ie();if(!(R instanceof ln))throw new SyntaxError("Expected identifier for the test");S=new QI(S,L,R)}return S}function se(){let S=G();for(;a($.Pipe);){++r;let L=ie();if(!(L instanceof ln))throw new SyntaxError("Expected identifier for the filter");a($.OpenParen)&&(L=X(L)),S=new XI(S,L)}return S}function ie(){let S=t[r++];switch(S.type){case $.NumericLiteral:{let L=S.value;return L.includes(".")?new WI(Number(L)):new qI(Number(L))}case $.StringLiteral:{let L=S.value;for(;a($.StringLiteral);)L+=t[r++].value;return new Hv(L)}case $.Identifier:return new ln(S.value);case $.OpenParen:{let L=x();return s($.CloseParen,"Expected closing parenthesis, got ${tokens[current].type} instead."),L}case $.OpenSquareBracket:{let L=[];for(;!a($.CloseSquareBracket);)L.push(E()),a($.Comma)&&++r;return++r,new VI(L)}case $.OpenCurlyBracket:{let L=new Map;for(;!a($.CloseCurlyBracket);){let R=E();s($.Colon,"Expected colon between key and value in object literal");let te=E();L.set(R,te),a($.Comma)&&++r}return++r,new HI(L)}default:throw new SyntaxError(`Unexpected token: ${S.type}`)}}for(;r<t.length;)e.body.push(o());return e}function oC(t,e,r=1){if(e===void 0&&(e=t,t=0),r===0)throw new Error("range() step must not be zero");let s=[];if(r>0)for(let n=t;n<e;n+=r)s.push(n);else for(let n=t;n>e;n+=r)s.push(n);return s}function Kv(t,e,r,s=1){let n=Math.sign(s);n>=0?(e=(e??=0)<0?Math.max(t.length+e,0):Math.min(e,t.length),r=(r??=t.length)<0?Math.max(t.length+r,0):Math.min(r,t.length)):(e=(e??=t.length-1)<0?Math.max(t.length+e,-1):Math.min(e,t.length-1),r=(r??=-1)<-1?Math.max(t.length+r,-1):Math.min(r,t.length-1));let o=[];for(let a=e;n*a<n*r;a+=s)o.push(t[a]);return o}function aC(t){return t.replace(/\b\w/g,e=>e.toUpperCase())}function iC(t){return lC(new Date,t)}function lC(t,e){let r=new Intl.DateTimeFormat(void 0,{month:"long"}),s=new Intl.DateTimeFormat(void 0,{month:"short"}),n=o=>o<10?"0"+o:o.toString();return e.replace(/%[YmdbBHM%]/g,o=>{switch(o){case"%Y":return 
t.getFullYear().toString();case"%m":return n(t.getMonth()+1);case"%d":return n(t.getDate());case"%b":return s.format(t);case"%B":return r.format(t);case"%H":return n(t.getHours());case"%M":return n(t.getMinutes());case"%%":return"%";default:return o}})}function cC(t){return t.replace(/[.*+?^${}()|[\]\\]/g,"\\$&")}function uC(t,e,r,s){if(s===0)return t;let n=s==null||s<0?1/0:s,o=e.length===0?new RegExp("(?=)","gu"):new RegExp(cC(e),"gu");return t.replaceAll(o,a=>n>0?(--n,r):a)}var Yv=class extends Error{},Qv=class extends Error{},ar=class{type="RuntimeValue";value;builtins=new Map;constructor(t=void 0){this.value=t}__bool__(){return new le(!!this.value)}toString(){return String(this.value)}},de=class extends ar{type="IntegerValue"},Ke=class extends ar{type="FloatValue";toString(){return this.value%1===0?this.value.toFixed(1):this.value.toString()}},Z=class extends ar{type="StringValue";builtins=new Map([["upper",new je(()=>new Z(this.value.toUpperCase()))],["lower",new je(()=>new Z(this.value.toLowerCase()))],["strip",new je(()=>new Z(this.value.trim()))],["title",new je(()=>new Z(aC(this.value)))],["capitalize",new je(()=>new Z(this.value.charAt(0).toUpperCase()+this.value.slice(1)))],["length",new de(this.value.length)],["rstrip",new je(()=>new Z(this.value.trimEnd()))],["lstrip",new je(()=>new Z(this.value.trimStart()))],["startswith",new je(t=>{if(t.length===0)throw new Error("startswith() requires at least one argument");let e=t[0];if(e instanceof Z)return new le(this.value.startsWith(e.value));if(e instanceof ve){for(let r of e.value){if(!(r instanceof Z))throw new Error("startswith() tuple elements must be strings");if(this.value.startsWith(r.value))return new le(!0)}return new le(!1)}throw new Error("startswith() argument must be a string or tuple of strings")})],["endswith",new je(t=>{if(t.length===0)throw new Error("endswith() requires at least one argument");let e=t[0];if(e instanceof Z)return new le(this.value.endsWith(e.value));if(e instanceof 
ve){for(let r of e.value){if(!(r instanceof Z))throw new Error("endswith() tuple elements must be strings");if(this.value.endsWith(r.value))return new le(!0)}return new le(!1)}throw new Error("endswith() argument must be a string or tuple of strings")})],["split",new je(t=>{let e=t[0]??new We;if(!(e instanceof Z||e instanceof We))throw new Error("sep argument must be a string or null");let r=t[1]??new de(-1);if(!(r instanceof de))throw new Error("maxsplit argument must be a number");let s=[];if(e instanceof We){let n=this.value.trimStart();for(let{0:o,index:a}of n.matchAll(/\S+/g)){if(r.value!==-1&&s.length>=r.value&&a!==void 0){s.push(o+n.slice(a+o.length));break}s.push(o)}}else{if(e.value==="")throw new Error("empty separator");s=this.value.split(e.value),r.value!==-1&&s.length>r.value&&s.push(s.splice(r.value).join(e.value))}return new ve(s.map(n=>new Z(n)))})],["replace",new je(t=>{if(t.length<2)throw new Error("replace() requires at least two arguments");let e=t[0],r=t[1];if(!(e instanceof Z&&r instanceof Z))throw new Error("replace() arguments must be strings");let s;if(t.length>2?t[2].type==="KeywordArgumentsValue"?s=t[2].value.get("count")??new We:s=t[2]:s=new We,!(s instanceof de||s instanceof We))throw new Error("replace() count argument must be a number or null");return new Z(uC(this.value,e.value,r.value,s.value))})]])},le=class extends ar{type="BooleanValue"},pC=/[\x7f-\uffff]/g;function Jv(t){return t.replace(pC,e=>"\\u"+e.charCodeAt(0).toString(16).padStart(4,"0"))}function ds(t,e={},r=0,s=!0){let{indent:n=null,ensureAscii:o=!1,separators:a=null,sortKeys:i=!1}=e,l,u;switch(a?[l,u]=a:n?(l=",",u=": "):(l=", ",u=": "),t.type){case"NullValue":return"null";case"UndefinedValue":return s?"null":"undefined";case"IntegerValue":case"FloatValue":case"BooleanValue":return JSON.stringify(t.value);case"StringValue":{let d=JSON.stringify(t.value);return o&&(d=Jv(d)),d}case"ArrayValue":case"ObjectValue":{let d=n?" ".repeat(n):"",f=`
|
|
@@ -11,8 +11,8 @@ var aS=Object.create;var Zc=Object.defineProperty;var iS=Object.getOwnPropertyDe
|
|
|
11
11
|
${N}
|
|
12
12
|
}`,h=new Function(Object.keys(O),N)(...Object.values(O)),N=`methodCaller<(${b.map(D=>D.name)}) => ${g.name}>`,q2(Object.defineProperty(h,"name",{value:N}))}function K2(c,p){return p>>>=0,(c=$t(c>>>0))==$t(p)}function Y2(c){return(c>>>=0)?(c=Wc(c),Vt(globalThis[c])):Vt(globalThis)}function Q2(c){return c=Wc(c>>>0),Vt(e[c])}function J2(c,p){return p>>>=0,c=$t(c>>>0),p=$t(p),Vt(c[p])}function Z2(c){9<(c>>>=0)&&(as[c+1]+=1)}function jb(c,p,h,g,b){return ny[c>>>0](p>>>0,h>>>0,g>>>0,b>>>0)}function eM(c,p,h,g,b){return jb(c>>>0,p>>>0,h>>>0,g>>>0,b>>>0)}function tM(){return Vt([])}function rM(c){c=$t(c>>>0);for(var p=Array(c.length),h=0;h<c.length;h++)p[h]=c[h];return Vt(p)}function sM(c){return Vt(Wc(c>>>0))}function nM(){return Vt({})}function oM(c){for(var p=$t(c>>>=0);p.length;){var h=p.pop();p.pop()(h)}Jx(c)}function aM(c,p,h){p>>>=0,h>>>=0,c=$t(c>>>0),p=$t(p),h=$t(h),c[p]=h}function iM(c,p){c=wt(c),p>>>=0,c=new Date(1e3*c),(v(),B)[p>>>2>>>0]=c.getUTCSeconds(),(v(),B)[p+4>>>2>>>0]=c.getUTCMinutes(),(v(),B)[p+8>>>2>>>0]=c.getUTCHours(),(v(),B)[p+12>>>2>>>0]=c.getUTCDate(),(v(),B)[p+16>>>2>>>0]=c.getUTCMonth(),(v(),B)[p+20>>>2>>>0]=c.getUTCFullYear()-1900,(v(),B)[p+24>>>2>>>0]=c.getUTCDay(),c=(c.getTime()-Date.UTC(c.getUTCFullYear(),0,1,0,0,0,0))/864e5|0,(v(),B)[p+28>>>2>>>0]=c}var Gb=c=>c%4==0&&(c%100!=0||c%400==0),qb=[0,31,60,91,121,152,182,213,244,274,305,335],Wb=[0,31,59,90,120,151,181,212,243,273,304,334];function lM(c,p){c=wt(c),p>>>=0,c=new Date(1e3*c),(v(),B)[p>>>2>>>0]=c.getSeconds(),(v(),B)[p+4>>>2>>>0]=c.getMinutes(),(v(),B)[p+8>>>2>>>0]=c.getHours(),(v(),B)[p+12>>>2>>>0]=c.getDate(),(v(),B)[p+16>>>2>>>0]=c.getMonth(),(v(),B)[p+20>>>2>>>0]=c.getFullYear()-1900,(v(),B)[p+24>>>2>>>0]=c.getDay();var h=(Gb(c.getFullYear())?qb:Wb)[c.getMonth()]+c.getDate()-1|0;(v(),B)[p+28>>>2>>>0]=h,(v(),B)[p+36>>>2>>>0]=-60*c.getTimezoneOffset(),h=new Date(c.getFullYear(),6,1).getTimezoneOffset();var g=new 
Date(c.getFullYear(),0,1).getTimezoneOffset();c=0|(h!=g&&c.getTimezoneOffset()==Math.min(g,h)),(v(),B)[p+32>>>2>>>0]=c}function cM(c){c>>>=0;var p=new Date((v(),B)[c+20>>>2>>>0]+1900,(v(),B)[c+16>>>2>>>0],(v(),B)[c+12>>>2>>>0],(v(),B)[c+8>>>2>>>0],(v(),B)[c+4>>>2>>>0],(v(),B)[c>>>2>>>0],0),h=(v(),B)[c+32>>>2>>>0],g=p.getTimezoneOffset(),b=new Date(p.getFullYear(),6,1).getTimezoneOffset(),A=new Date(p.getFullYear(),0,1).getTimezoneOffset(),O=Math.min(A,b);return 0>h?(v(),B)[c+32>>>2>>>0]=+(b!=A&&O==g):0<h!=(O==g)&&(b=Math.max(A,b),p.setTime(p.getTime()+6e4*((0<h?O:b)-g))),(v(),B)[c+24>>>2>>>0]=p.getDay(),h=(Gb(p.getFullYear())?qb:Wb)[p.getMonth()]+p.getDate()-1|0,(v(),B)[c+28>>>2>>>0]=h,(v(),B)[c>>>2>>>0]=p.getSeconds(),(v(),B)[c+4>>>2>>>0]=p.getMinutes(),(v(),B)[c+8>>>2>>>0]=p.getHours(),(v(),B)[c+12>>>2>>>0]=p.getDate(),(v(),B)[c+16>>>2>>>0]=p.getMonth(),(v(),B)[c+20>>>2>>>0]=p.getYear(),c=p.getTime(),BigInt(isNaN(c)?-1:c/1e3)}function Vb(c,p,h,g,b,A,O){return n?$e(16,1,c,p,h,g,b,A,O):-52}function Hb(c,p,h,g,b,A){if(n)return $e(17,1,c,p,h,g,b,A)}var qa={},uM=()=>performance.timeOrigin+performance.now();function Xb(c,p){if(n)return $e(18,1,c,p);if(qa[c]&&(clearTimeout(qa[c].id),delete qa[c]),!p)return 0;var h=setTimeout(()=>{delete qa[c],Fc(()=>A1(c,performance.timeOrigin+performance.now()))},p);return qa[c]={id:h,Ne:p},0}function pM(c,p,h,g){c>>>=0,p>>>=0,h>>>=0,g>>>=0;var b=new Date().getFullYear(),A=new Date(b,0,1).getTimezoneOffset();b=new Date(b,6,1).getTimezoneOffset();var O=Math.max(A,b);(v(),P)[c>>>2>>>0]=60*O,(v(),B)[p>>>2>>>0]=+(A!=b),c=(p=N=>{var D=Math.abs(N);return`UTC${0<=N?"-":"+"}${String(Math.floor(D/60)).padStart(2,"0")}${String(D%60).padStart(2,"0")}`})(A),p=p(b),b<A?(fr(c,h,17),fr(p,g,17)):(fr(c,g,17),fr(p,h,17))}var dM=()=>Date.now(),fM=1;function mM(c,p,h){if(h>>>=0,!(0<=c&&3>=c))return 28;if(c===0)c=Date.now();else{if(!fM)return 52;c=performance.timeOrigin+performance.now()}return c=Math.round(1e6*c),(v(),S)[h>>>3>>>0]=BigInt(c),0}var 
oy=[],Kb=(c,p)=>{oy.length=0;for(var h;h=(v(),Q)[c++>>>0];){var g=h!=105;p+=(g&=h!=112)&&p%8?4:0,oy.push(h==112?(v(),P)[p>>>2>>>0]:h==106?(v(),S)[p>>>3>>>0]:h==105?(v(),B)[p>>>2>>>0]:(v(),ie)[p>>>3>>>0]),p+=g?8:4}return oy};function hM(c,p,h){return c>>>=0,p=Kb(p>>>0,h>>>0),yy[c](...p)}function _M(c,p,h){return c>>>=0,p=Kb(p>>>0,h>>>0),yy[c](...p)}var gM=()=>{};function wM(c,p){return T(rn(c>>>0,p>>>0))}var xM=()=>{throw ge+=1,"unwind"};function yM(){return 4294901760}var bM=()=>1,vM=()=>navigator.hardwareConcurrency,is={},Yb=c=>{var p=mr(c)+1,h=an(p);return h&&fr(c,h,p),h},Vc=c=>{var p;return(p=/\bwasm-function\[\d+\]:(0x[0-9a-f]+)/.exec(c))?+p[1]:(p=/:(\d+):\d+(?:\)|$)/.exec(c))?2147483648|+p[1]:0},Qb=c=>{for(var p of c)(c=Vc(p))&&(is[c]=p)};function kM(){var c=Error().stack.toString().split(`
|
|
13
13
|
`);return c[0]=="Error"&&c.shift(),Qb(c),is.Xd=Vc(c[3]),is.re=c,is.Xd}function Hc(c){if(!(c=is[c>>>0]))return 0;var p;if(p=/^\s+at .*\.wasm\.(.*) \(.*\)$/.exec(c))c=p[1];else if(p=/^\s+at (.*) \(.*\)$/.exec(c))c=p[1];else{if(!(p=/^(.+?)@/.exec(c)))return 0;c=p[1]}return Rt(Hc.ae??0),Hc.ae=Yb(c),Hc.ae}function EM(c){c>>>=0;var p=(v(),Q).length;if(c<=p||4294901760<c)return!1;for(var h=1;4>=h;h*=2){var g=p*(1+.2/h);g=Math.min(g,c+100663296);e:{g=(Math.min(4294901760,65536*Math.ceil(Math.max(c,g)/65536))-$r.buffer.byteLength+65535)/65536|0;try{$r.grow(g),ue();var b=1;break e}catch{}b=void 0}if(b)return!0}return!1}function AM(c,p,h){if(c>>>=0,p>>>=0,is.Xd==c)var g=is.re;else(g=Error().stack.toString().split(`
|
|
14
|
-
`))[0]=="Error"&&g.shift(),Qb(g);for(var b=3;g[b]&&Vc(g[b])!=c;)++b;for(c=0;c<h&&g[c+b];++c)(v(),B)[p+4*c>>>2>>>0]=Vc(g[c+b]);return c}var nr=c=>{var p=mr(c)+1,h=Qc(p);return fr(c,h,p),h},ay=[],xt=(c,p)=>{ay[c>>>=0]=p},or=[],Xc=[],nn=(c,p)=>{Xc[c]=new Promise(h=>p.finally(()=>h(c)))},re=c=>{if(c)return ay[c>>>0]},Kc=(c,p,h)=>{(v(),P)[c>>>2>>>0]=p,(v(),P)[c+4>>>2>>>0]=h},Jb=c=>{var p=(v(),P)[c>>>2>>>0];return c=(v(),P)[c+4>>>2>>>0],rn(p,c)},hr=c=>{var p=(v(),P)[c>>>2>>>0];return c=(v(),P)[c+4>>>2>>>0],p?rn(p,c):c===0?"":void 0},MM=c=>{var p=hr(c+4),h=(h=(v(),P)[c+12>>>2>>>0])?re(h):"auto";if(c+=16){var g=re((v(),P)[c+4>>>2>>>0]),b=(v(),P)[c+16>>>2>>>0],A=(v(),P)[c+20>>>2>>>0];if(b){for(var O={},N=0;N<b;++N){var D=A+24*N;O[Jb(D+4)]=(v(),ie)[D+16>>>3>>>0]}b=O}else b=void 0;c={module:g,constants:b,entryPoint:hr(c+8)}}else c=void 0;return{label:p,layout:h,compute:c}},Zb=(c,p)=>{function h(b,A){b=c[b],(v(),B)[p+A>>>2>>>0]=b}function g(b,A){b=c[b],(v(),S)[p+A>>>3>>>0]=BigInt(b)}h("maxTextureDimension1D",4),h("maxTextureDimension2D",8),h("maxTextureDimension3D",12),h("maxTextureArrayLayers",16),h("maxBindGroups",20),h("maxBindGroupsPlusVertexBuffers",24),h("maxBindingsPerBindGroup",28),h("maxDynamicUniformBuffersPerPipelineLayout",32),h("maxDynamicStorageBuffersPerPipelineLayout",36),h("maxSampledTexturesPerShaderStage",40),h("maxSamplersPerShaderStage",44),h("maxStorageBuffersPerShaderStage",48),h("maxStorageTexturesPerShaderStage",52),h("maxUniformBuffersPerShaderStage",56),h("minUniformBufferOffsetAlignment",80),h("minStorageBufferOffsetAlignment",84),g("maxUniformBufferBindingSize",64),g("maxStorageBufferBindingSize",72),h("maxVertexBuffers",88),g("maxBufferSize",96),h("maxVertexAttributes",104),h("maxVertexBufferArrayStride",108),h("maxInterStageShaderVariables",112),h("maxColorAttachments",116),h("maxColorAttachmentBytesPerSample",120),h("maxComputeWorkgroupStorageSize",124),h("maxComputeInvocationsPerWorkgroup",128),h("maxComputeWorkgroupSizeX",132),h("maxComputeWork
groupSizeY",136),h("maxComputeWorkgroupSizeZ",140),h("maxComputeWorkgroupsPerDimension",144),c.Le!==void 0&&h("maxImmediateSize",148)},TM=[,"validation","out-of-memory","internal"],SM=[,"compatibility","core"],e1={1:"core-features-and-limits",2:"depth-clip-control",3:"depth32float-stencil8",4:"texture-compression-bc",5:"texture-compression-bc-sliced-3d",6:"texture-compression-etc2",7:"texture-compression-astc",8:"texture-compression-astc-sliced-3d",9:"timestamp-query",10:"indirect-first-instance",11:"shader-f16",12:"rg11b10ufloat-renderable",13:"bgra8unorm-storage",14:"float32-filterable",15:"float32-blendable",16:"clip-distances",17:"dual-source-blending",18:"subgroups",19:"texture-formats-tier1",20:"texture-formats-tier2",21:"primitive-index",327692:"chromium-experimental-unorm16-texture-formats",327693:"chromium-experimental-snorm16-texture-formats",327732:"chromium-experimental-multi-draw-indirect"},OM=[,"low-power","high-performance"],IM=[,"occlusion","timestamp"],CM={undefined:1,unknown:1,destroyed:2};function PM(c,p,h,g,b,A){p=wt(p),h=wt(h),g>>>=0,b>>>=0,A>>>=0;var O=re(c>>>0);if(c={},A){var N=(v(),P)[A+12>>>2>>>0];if(N){var D=(v(),P)[A+16>>>2>>>0];c.requiredFeatures=Array.from((v(),P).subarray(D>>>2>>>0,D+4*N>>>2>>>0),ee=>e1[ee])}var q=(v(),P)[A+20>>>2>>>0];if(q){let ee=function(Ut,nt,ls=!1){nt=q+nt,(nt=(v(),P)[nt>>>2>>>0])==4294967295||ls&&nt==0||(Re[Ut]=nt)},ct=function(Ut,nt){nt=q+nt;var ls=(v(),P)[nt>>>2>>>0],oS=(v(),P)[nt+4>>>2>>>0];ls==4294967295&&oS==4294967295||(Re[Ut]=4294967296*(v(),P)[nt+4>>>2>>>0]+(v(),P)[nt>>>2>>>0])};var 
fe=ee,me=ct,Re={};ee("maxTextureDimension1D",4),ee("maxTextureDimension2D",8),ee("maxTextureDimension3D",12),ee("maxTextureArrayLayers",16),ee("maxBindGroups",20),ee("maxBindGroupsPlusVertexBuffers",24),ee("maxDynamicUniformBuffersPerPipelineLayout",32),ee("maxDynamicStorageBuffersPerPipelineLayout",36),ee("maxSampledTexturesPerShaderStage",40),ee("maxSamplersPerShaderStage",44),ee("maxStorageBuffersPerShaderStage",48),ee("maxStorageTexturesPerShaderStage",52),ee("maxUniformBuffersPerShaderStage",56),ee("minUniformBufferOffsetAlignment",80),ee("minStorageBufferOffsetAlignment",84),ct("maxUniformBufferBindingSize",64),ct("maxStorageBufferBindingSize",72),ee("maxVertexBuffers",88),ct("maxBufferSize",96),ee("maxVertexAttributes",104),ee("maxVertexBufferArrayStride",108),ee("maxInterStageShaderVariables",112),ee("maxColorAttachments",116),ee("maxColorAttachmentBytesPerSample",120),ee("maxComputeWorkgroupStorageSize",124),ee("maxComputeInvocationsPerWorkgroup",128),ee("maxComputeWorkgroupSizeX",132),ee("maxComputeWorkgroupSizeY",136),ee("maxComputeWorkgroupSizeZ",140),ee("maxComputeWorkgroupsPerDimension",144),ee("maxImmediateSize",148,!0),c.requiredLimits=Re}(N=(v(),P)[A+24>>>2>>>0])&&(N={label:hr(N+4)},c.defaultQueue=N),c.label=hr(A+4)}ge+=1,nn(p,O.requestDevice(c).then(ee=>{--ge,xt(b,ee.queue),xt(g,ee),h&&(ge+=1,nn(h,ee.lost.then(ct=>{--ge,ee.onuncapturederror=()=>{};var Ut=ae(),nt=nr(ct.message);py(h,CM[ct.reason],nt),oe(Ut)}))),ee.onuncapturederror=ct=>{var Ut=5;ct.error instanceof GPUValidationError?Ut=2:ct.error instanceof GPUOutOfMemoryError?Ut=3:ct.error instanceof GPUInternalError&&(Ut=4);var nt=ae();ct=nr(ct.error.message),b1(g,Ut,ct),oe(nt)},"adapterInfo"in ee||(ee.adapterInfo=O.info),my(p,1,g,0)},ee=>{--ge;var ct=ae();ee=nr(ee.message),my(p,3,g,ee),h&&py(h,4,ee),oe(ct)}))}function zM(c){var p=re(c>>>=0),h=or[c];if(h){for(var g=0;g<h.length;++g)h[g]();delete or[c]}p.destroy()}var on=()=>{var c="getMappedRange size=0 no longer means 
WGPU_WHOLE_MAP_SIZE";on.ed||(on.ed={}),on.ed[c]||(on.ed[c]=1,T(c))};function LM(c,p,h){p>>>=0,h>>>=0;var g=re(c>>>=0);h===0&&on(),h==4294967295&&(h=void 0);try{var b=g.getMappedRange(p,h)}catch{return 0}var A=gy(16,b.byteLength);return(v(),Q).set(new Uint8Array(b),A>>>0),or[c].push(()=>Rt(A)),A}function NM(c,p,h){p>>>=0,h>>>=0;var g=re(c>>>=0);h===0&&on(),h==4294967295&&(h=void 0);try{var b=g.getMappedRange(p,h)}catch{return 0}var A=gy(16,b.byteLength);return(v(),Q).fill(0,A,b.byteLength),or[c].push(()=>{new Uint8Array(b).set((v(),Q).subarray(A>>>0,A+b.byteLength>>>0)),Rt(A)}),A}function $M(c,p,h,g,b){c>>>=0,p=wt(p),h=wt(h),b>>>=0;var A=re(c);or[c]=[],b==4294967295&&(b=void 0),ge+=1,nn(p,A.mapAsync(h,g>>>0,b).then(()=>{--ge,dy(p,1,0)},O=>{--ge,ae();var N=nr(O.message);dy(p,O.name==="AbortError"?4:O.name==="OperationError"?3:0,N),delete or[c]}))}function RM(c){var p=re(c>>>=0),h=or[c];if(h){for(var g=0;g<h.length;++g)h[g]();delete or[c],p.unmap()}}function UM(c){delete ay[c>>>0]}function BM(c,p,h){c>>>=0,p>>>=0,h>>>=0;var g=!!(v(),P)[p+32>>>2>>>0];p={label:hr(p+4),usage:(v(),P)[p+16>>>2>>>0],size:4294967296*(v(),P)[p+28>>>2>>>0]+(v(),P)[p+24>>>2>>>0],mappedAtCreation:g},c=re(c);try{var b=c.createBuffer(p)}catch{return!1}return xt(h,b),g&&(or[h]=[]),!0}function DM(c,p,h,g){c>>>=0,p=wt(p),g>>>=0,h=MM(h>>>0),c=re(c),ge+=1,nn(p,c.createComputePipelineAsync(h).then(b=>{--ge,xt(g,b),uy(p,1,g,0)},b=>{--ge;var A=ae(),O=nr(b.message);uy(p,b.reason==="validation"?3:b.reason==="internal"?4:0,g,O),oe(A)}))}function FM(c,p,h){c>>>=0,p>>>=0,h>>>=0;var g=(v(),P)[p>>>2>>>0],b=(v(),P)[g+4>>>2>>>0];p={label:hr(p+4),code:""},b===2&&(p.code=Jb(g+8)),xt(h,re(c).createShaderModule(p))}var jM=c=>{(c=re(c)).onuncapturederror=null,c.destroy()};function GM(c,p){p=wt(p),c=re(c>>>0),ge+=1,nn(p,c.popErrorScope().then(h=>{--ge;var g=5;h?h instanceof GPUValidationError?g=2:h instanceof GPUOutOfMemoryError?g=3:h instanceof GPUInternalError&&(g=4):g=1;var 
b=ae();h=h?nr(h.message):0,fy(p,1,g,h),oe(b)},h=>{--ge;var g=ae();h=nr(h.message),fy(p,1,5,h),oe(g)}))}function qM(c,p,h,g){if(p=wt(p),g>>>=0,h>>>=0){var b=(v(),P)[h+4>>>2>>>0];b={featureLevel:SM[b],powerPreference:OM[(v(),P)[h+8>>>2>>>0]],forceFallbackAdapter:!!(v(),P)[h+12>>>2>>>0]},(h=(v(),P)[h>>>2>>>0])!==0&&(v(),b.Qe=!!(v(),P)[h+8>>>2>>>0])}"gpu"in navigator?(ge+=1,nn(p,navigator.gpu.requestAdapter(b).then(A=>{if(--ge,A)xt(g,A),Wa(p,1,g,0);else{A=ae();var O=nr("WebGPU not available on this browser (requestAdapter returned null)");Wa(p,3,g,O),oe(A)}},A=>{--ge;var O=ae();A=nr(A.message),Wa(p,4,g,A),oe(O)}))):(h=ae(),b=nr("WebGPU not available on this browser (navigator.gpu is not available)"),Wa(p,3,g,b),oe(h))}function WM(c,p,h){return c>>>=0,p>>>=0,h>>>=0,Fb(async()=>{var g=[];if(h){var b=(v(),B)[h>>>2>>>0];g.length=p+1,g[p]=new Promise(N=>setTimeout(N,b,0))}else g.length=p;for(var A=0;A<p;++A){var O=4294967296*(v(),P)[c+8*A+4>>>2>>>0]+(v(),P)[c+8*A>>>2>>>0];if(!(O in Xc))return O;g[A]=Xc[O]}return g=await Promise.race(g),delete Xc[g],g})}var iy,ly={},t1=()=>{if(!iy){var c,p={USER:"web_user",LOGNAME:"web_user",PATH:"/",PWD:"/",HOME:"/home/web_user",LANG:(globalThis.navigator?.language??"C").replace("-","_")+".UTF-8",_:"./this.program"};for(c in ly)ly[c]===void 0?delete p[c]:p[c]=ly[c];var h=[];for(c in p)h.push(`${c}=${p[c]}`);iy=h}return iy};function r1(c,p){if(n)return $e(19,1,c,p);c>>>=0,p>>>=0;var h,g=0,b=0;for(h of t1()){var A=p+g;(v(),P)[c+b>>>2>>>0]=A,g+=fr(h,A,1/0)+1,b+=4}return 0}function s1(c,p){if(n)return $e(20,1,c,p);c>>>=0,p>>>=0;var h=t1();for(var g of((v(),P)[c>>>2>>>0]=h.length,c=0,h))c+=mr(g)+1;return(v(),P)[p>>>2>>>0]=c,0}function n1(c){return n?$e(21,1,c):52}function o1(c,p,h,g){return n?$e(22,1,c,p,h,g):52}function a1(c,p,h,g){return n?$e(23,1,c,p,h,g):70}var VM=[null,[],[]];function i1(c,p,h,g){if(n)return $e(24,1,c,p,h,g);p>>>=0,h>>>=0,g>>>=0;for(var b=0,A=0;A<h;A++){var O=(v(),P)[p>>>2>>>0],N=(v(),P)[p+4>>>2>>>0];p+=8;for(var 
D=0;D<N;D++){var q=c,fe=(v(),Q)[O+D>>>0],me=VM[q];fe===0||fe===10?((q===1?I:T)(bb(me)),me.length=0):me.push(fe)}b+=N}return(v(),P)[g>>>2>>>0]=b,0}function HM(c){return c>>>0}function XM(c,p){return Zb(re(c>>>0).limits,p>>>0),1}function KM(c,p){return re(c>>>0).features.has(e1[p])}function YM(c){return BigInt(re(c>>>0).size)}function QM(c){return BigInt(re(c>>>0).usage)}function JM(c,p){if(c>>>=0,p>>>=0){var h=hr(p+4);h={label:h,timestampWrites:p=(p=(v(),P)[p+12>>>2>>>0])!==0?{querySet:re((v(),P)[p+4>>>2>>>0]),beginningOfPassWriteIndex:(v(),P)[p+8>>>2>>>0],endOfPassWriteIndex:(v(),P)[p+12>>>2>>>0]}:void 0}}return c=re(c),p=_1(0),xt(p,c.beginComputePass(h)),p}function ZM(c,p,h,g,b,A){h=wt(h),b=wt(b),A=wt(A),re(c>>>0).copyBufferToBuffer(re(p>>>0),h,re(g>>>0),b,A)}function eT(c){c=re(c>>>0);var p=m1(0);return xt(p,c.finish()),p}function tT(c,p,h,g,b,A){A=wt(A),re(c>>>0).resolveQuerySet(re(p>>>0),h,g,re(b>>>0),A)}function rT(c,p,h,g){re(c>>>0).dispatchWorkgroups(p,h,g)}function sT(c,p,h){h=wt(h),re(c>>>0).dispatchWorkgroupsIndirect(re(p>>>0),h)}function nT(c){re(c>>>0).end()}function oT(c,p,h,g,b){g>>>=0,b>>>=0,c=re(c>>>0),h=re(h>>>0),g==0?c.setBindGroup(p,h):c.setBindGroup(p,h,(v(),P),b>>>2,g)}function aT(c,p){re(c>>>0).setPipeline(re(p>>>0))}function iT(c,p,h){re(c>>>0).Pe(re(p>>>0),h)}function lT(c,p){c=re(c>>>0);var h=f1(0);return xt(h,c.getBindGroupLayout(p)),h}function cT(c,p){c>>>=0;var h=hr(4+(p>>>=0)),g=re((v(),P)[p+12>>>2>>>0]),b=(v(),P)[p+16>>>2>>>0];p=(v(),P)[p+20>>>2>>>0];for(var A=[],O=0;O<b;++O){var N=A,D=N.push,q=p+40*O,fe=(v(),P)[q+8>>>2>>>0],me=(v(),P)[q+32>>>2>>>0],Re=(v(),P)[q+36>>>2>>>0],ee=(v(),P)[q+4>>>2>>>0];fe?(me=q+24,(me=(v(),P)[me>>>2>>>0]+4294967296*(v(),B)[me+4>>>2>>>0])==-1&&(me=void 0),q={binding:ee,resource:{buffer:re(fe),offset:4294967296*(v(),P)[q+4+16>>>2>>>0]+(v(),P)[q+16>>>2>>>0],size:me}}):q=me?{binding:ee,resource:re(me)}:{binding:ee,resource:re(Re)},D.call(N,q)}return 
h={label:h,layout:g,entries:A},c=re(c),g=d1(0),xt(g,c.createBindGroup(h)),g}function uT(c,p){var h;return c>>>=0,(p>>>=0)&&(h={label:hr(p+4)}),c=re(c),p=h1(0),xt(p,c.createCommandEncoder(h)),p}function pT(c,p){c>>>=0,p>>>=0,p={type:IM[(v(),P)[p+12>>>2>>>0]],count:(v(),P)[p+16>>>2>>>0]},c=re(c);var h=g1(0);return xt(h,c.createQuerySet(p)),h}function dT(c,p){c=re(c>>>0).adapterInfo,p>>>=0,(v(),B)[p+52>>>2>>>0]=c.subgroupMinSize,(v(),B)[p+56>>>2>>>0]=c.subgroupMaxSize;var h=Yb(c.vendor+c.architecture+c.device+c.description),g=mr(c.vendor);return Kc(p+4,h,g),h+=g,g=mr(c.architecture),Kc(p+12,h,g),h+=g,g=mr(c.device),Kc(p+20,h,g),Kc(p+28,h+g,mr(c.description)),(v(),B)[p+36>>>2>>>0]=2,c=c.isFallbackAdapter?3:4,(v(),B)[p+40>>>2>>>0]=c,(v(),B)[p+44>>>2>>>0]=0,(v(),B)[p+48>>>2>>>0]=0,1}var fT={"core-features-and-limits":1,"depth-clip-control":2,"depth32float-stencil8":3,"texture-compression-bc":4,"texture-compression-bc-sliced-3d":5,"texture-compression-etc2":6,"texture-compression-astc":7,"texture-compression-astc-sliced-3d":8,"timestamp-query":9,"indirect-first-instance":10,"shader-f16":11,"rg11b10ufloat-renderable":12,"bgra8unorm-storage":13,"float32-filterable":14,"float32-blendable":15,"clip-distances":16,"dual-source-blending":17,subgroups:18,"texture-formats-tier1":19,"texture-formats-tier2":20,"primitive-index":21,"chromium-experimental-unorm16-texture-formats":327692,"chromium-experimental-snorm16-texture-formats":327693,"chromium-experimental-multi-draw-indirect":327732};function mT(c,p){p>>>=0,c=re(c>>>0);var h=an(4*c.features.size),g=0,b=0;c.features.forEach(A=>{0<=(A=fT[A])&&((v(),B)[h+g>>>2>>>0]=A,g+=4,b++)}),(v(),P)[p+4>>>2>>>0]=h,(v(),P)[p>>>2>>>0]=b}function hT(c,p){return Zb(re(c>>>0).limits,p>>>0),1}function _T(c,p){re(c>>>0).pushErrorScope(TM[p])}function gT(c,p,h){p>>>=0,h>>>=0,c=re(c>>>0),p=Array.from((v(),B).subarray(h>>>2>>>0,h+4*p>>>2>>>0),g=>re(g)),c.submit(p)}function 
wT(c,p,h,g,b){h=wt(h),g>>>=0,b>>>=0,c=re(c>>>0),p=re(p>>>0),g=(v(),Q).subarray(g>>>0,g+b>>>0),c.writeBuffer(p,h,g,0,b)}n||(function(){for(var c=e.numThreads-1;c--;)mb();Me.push(async()=>{var p=(async function(){if(!n)return Promise.all(tt.map(fb))})();xe++,await p,--xe==0&&qe&&(p=qe,qe=null,p())})})(),n||($r=new WebAssembly.Memory({initial:256,maximum:65536,shared:!0}),ue()),e.wasmBinary&&(f=e.wasmBinary),e.stackSave=()=>ae(),e.stackRestore=c=>oe(c),e.stackAlloc=c=>Qc(c),e.setValue=function(c,p,h="i8"){switch(h.endsWith("*")&&(h="*"),h){case"i1":case"i8":(v(),V)[c>>>0]=p;break;case"i16":(v(),K)[c>>>1>>>0]=p;break;case"i32":(v(),B)[c>>>2>>>0]=p;break;case"i64":(v(),S)[c>>>3>>>0]=BigInt(p);break;case"float":(v(),se)[c>>>2>>>0]=p;break;case"double":(v(),ie)[c>>>3>>>0]=p;break;case"*":(v(),P)[c>>>2>>>0]=p;break;default:Pe(`invalid type for setValue: ${h}`)}},e.getValue=function(c,p="i8"){switch(p.endsWith("*")&&(p="*"),p){case"i1":case"i8":return(v(),V)[c>>>0];case"i16":return(v(),K)[c>>>1>>>0];case"i32":return(v(),B)[c>>>2>>>0];case"i64":return(v(),S)[c>>>3>>>0];case"float":return(v(),se)[c>>>2>>>0];case"double":return(v(),ie)[c>>>3>>>0];case"*":return(v(),P)[c>>>2>>>0];default:Pe(`invalid type for getValue: ${p}`)}},e.UTF8ToString=rn,e.stringToUTF8=fr,e.lengthBytesUTF8=mr;var l1,c1,cy,Yc,Rt,an,u1,p1,d1,f1,m1,h1,_1,g1,w1,x1,y1,uy,py,dy,fy,Wa,my,b1,hy,v1,k1,E1,_y,A1,M1,gy,he,Va,T1,oe,Qc,ae,S1,wy,O1,I1,C1,xy,P1,z1,L1,N1,$1,R1,U1,B1,D1,F1,j1,G1,q1,W1,V1,H1,X1,K1,Y1,Q1,J1,Z1,ev,tv,rv,sv,nv,ov,av,iv,lv,cv,uv,pv,dv,fv,mv,hv,_v,gv,_r,xT=[Nr,ns,gb,vb,kb,Eb,Ab,Mb,Tb,Sb,Ob,Ib,Cb,Pb,zb,Lb,Vb,Hb,Xb,r1,s1,n1,o1,a1,i1],yy={1116828:(c,p,h,g,b)=>{if(e===void 0||!e.Zc)return 1;if((c=rn(Number(c>>>0))).startsWith("./")&&(c=c.substring(2)),!(c=e.Zc.get(c)))return 2;if(p=Number(p>>>0),h=Number(h>>>0),g=Number(g>>>0),p+h>c.byteLength)return 3;try{let A=c.subarray(p,p+h);switch(b){case 0:(v(),Q).set(A,g>>>0);break;case 1:e.ie?e.ie(g,A):e.Ke(g,A);break;default:return 4}return 0}catch{return 
4}},1117652:(c,p,h)=>{e.ke(c,(v(),Q).subarray(p>>>0,p+h>>>0))},1117716:()=>e.Ie(),1117758:c=>{e.je(c)},1117795:()=>typeof wasmOffsetConverter<"u"};function yT(){return typeof wasmOffsetConverter<"u"}function bT(c,p,h,g){var b=ae();try{return B1(c,p,h,g)}catch(A){if(oe(b),A!==A+0)throw A;he(1,0)}}function vT(c,p,h){var g=ae();try{return $1(c,p,h)}catch(b){if(oe(g),b!==b+0)throw b;he(1,0)}}function kT(c,p,h){var g=ae();try{C1(c,p,h)}catch(b){if(oe(g),b!==b+0)throw b;he(1,0)}}function ET(c,p){var h=ae();try{return xy(c,p)}catch(g){if(oe(h),g!==g+0)throw g;he(1,0)}}function AT(c){var p=ae();try{P1(c)}catch(h){if(oe(p),h!==h+0)throw h;he(1,0)}}function MT(c,p,h,g,b,A,O){var N=ae();try{return N1(c,p,h,g,b,A,O)}catch(D){if(oe(N),D!==D+0)throw D;he(1,0)}}function TT(c,p){var h=ae();try{D1(c,p)}catch(g){if(oe(h),g!==g+0)throw g;he(1,0)}}function ST(c,p,h,g,b,A){var O=ae();try{z1(c,p,h,g,b,A)}catch(N){if(oe(O),N!==N+0)throw N;he(1,0)}}function OT(c,p,h,g){var b=ae();try{U1(c,p,h,g)}catch(A){if(oe(b),A!==A+0)throw A;he(1,0)}}function IT(c,p,h,g,b,A,O){var N=ae();try{j1(c,p,h,g,b,A,O)}catch(D){if(oe(N),D!==D+0)throw D;he(1,0)}}function CT(c,p,h,g,b,A,O){var N=ae();try{G1(c,p,h,g,b,A,O)}catch(D){if(oe(N),D!==D+0)throw D;he(1,0)}}function PT(c,p,h,g,b,A,O,N){var D=ae();try{Z1(c,p,h,g,b,A,O,N)}catch(q){if(oe(D),q!==q+0)throw q;he(1,0)}}function zT(c,p,h,g,b){var A=ae();try{L1(c,p,h,g,b)}catch(O){if(oe(A),O!==O+0)throw O;he(1,0)}}function LT(c,p,h,g,b){var A=ae();try{return F1(c,p,h,g,b)}catch(O){if(oe(A),O!==O+0)throw O;he(1,0)}}function NT(c,p,h,g,b,A,O,N){var D=ae();try{ev(c,p,h,g,b,A,O,N)}catch(q){if(oe(D),q!==q+0)throw q;he(1,0)}}function $T(c,p,h,g,b,A,O,N,D,q,fe,me){var Re=ae();try{q1(c,p,h,g,b,A,O,N,D,q,fe,me)}catch(ee){if(oe(Re),ee!==ee+0)throw ee;he(1,0)}}function RT(c,p,h,g,b,A){var O=ae();try{return Q1(c,p,h,g,b,A)}catch(N){if(oe(O),N!==N+0)throw N;he(1,0)}}function UT(c,p,h){var g=ae();try{return X1(c,p,h)}catch(b){if(oe(g),b!==b+0)throw b;return he(1,0),0n}}function 
BT(c,p,h,g,b,A,O,N,D){var q=ae();try{R1(c,p,h,g,b,A,O,N,D)}catch(fe){if(oe(q),fe!==fe+0)throw fe;he(1,0)}}function DT(c){var p=ae();try{return V1(c)}catch(h){if(oe(p),h!==h+0)throw h;he(1,0)}}function FT(c,p,h){var g=ae();try{return tv(c,p,h)}catch(b){if(oe(g),b!==b+0)throw b;he(1,0)}}function jT(c,p){var h=ae();try{return fv(c,p)}catch(g){if(oe(h),g!==g+0)throw g;return he(1,0),0n}}function GT(c,p,h,g,b){var A=ae();try{rv(c,p,h,g,b)}catch(O){if(oe(A),O!==O+0)throw O;he(1,0)}}function qT(c){var p=ae();try{return W1(c)}catch(h){if(oe(p),h!==h+0)throw h;return he(1,0),0n}}function WT(c,p,h,g,b,A){var O=ae();try{return ov(c,p,h,g,b,A)}catch(N){if(oe(O),N!==N+0)throw N;he(1,0)}}function VT(c,p,h,g,b,A){var O=ae();try{return av(c,p,h,g,b,A)}catch(N){if(oe(O),N!==N+0)throw N;he(1,0)}}function HT(c,p,h,g,b,A,O,N){var D=ae();try{return J1(c,p,h,g,b,A,O,N)}catch(q){if(oe(D),q!==q+0)throw q;he(1,0)}}function XT(c,p,h,g,b){var A=ae();try{return iv(c,p,h,g,b)}catch(O){if(oe(A),O!==O+0)throw O;return he(1,0),0n}}function KT(c,p,h,g){var b=ae();try{return lv(c,p,h,g)}catch(A){if(oe(b),A!==A+0)throw A;he(1,0)}}function YT(c,p,h,g){var b=ae();try{return cv(c,p,h,g)}catch(A){if(oe(b),A!==A+0)throw A;he(1,0)}}function QT(c,p,h,g,b,A,O,N,D,q,fe,me){var Re=ae();try{return uv(c,p,h,g,b,A,O,N,D,q,fe,me)}catch(ee){if(oe(Re),ee!==ee+0)throw ee;he(1,0)}}function JT(c,p,h,g,b,A,O,N,D,q,fe){var me=ae();try{sv(c,p,h,g,b,A,O,N,D,q,fe)}catch(Re){if(oe(me),Re!==Re+0)throw Re;he(1,0)}}function ZT(c,p,h,g,b,A,O,N,D,q,fe,me,Re,ee,ct,Ut){var nt=ae();try{nv(c,p,h,g,b,A,O,N,D,q,fe,me,Re,ee,ct,Ut)}catch(ls){if(oe(nt),ls!==ls+0)throw ls;he(1,0)}}function eS(c,p,h,g){var b=ae();try{return pv(c,p,h,g)}catch(A){if(oe(b),A!==A+0)throw A;he(1,0)}}function tS(c,p,h,g,b){var A=ae();try{return dv(c,p,h,g,b)}catch(O){if(oe(A),O!==O+0)throw O;he(1,0)}}function rS(c,p,h){var g=ae();try{return H1(c,p,h)}catch(b){if(oe(g),b!==b+0)throw b;he(1,0)}}function sS(c,p,h){var g=ae();try{return 
K1(c,p,h)}catch(b){if(oe(g),b!==b+0)throw b;he(1,0)}}function nS(c,p,h,g){var b=ae();try{Y1(c,p,h,g)}catch(A){if(oe(b),A!==A+0)throw A;he(1,0)}}function Jc(){if(0<xe)qe=Jc;else if(n)w?.(e),Be();else{for(var c=Me;0<c.length;)c.shift()(e);0<xe?qe=Jc:(e.calledRun=!0,z||(Be(),w?.(e)))}}return n||(_r=await Qe(),Jc()),e.PTR_SIZE=4,e.webgpuInit=c=>{let p=new WeakMap,h,g,b=1;e.webgpuRegisterDevice=N=>{if(g!==void 0)throw Error("another WebGPU EP inference session is being created.");if(N){var D=p.get(N);if(!D){let q=((fe,me=0)=>{var Re=y1(me);return me=x1(me,Re),xt(Re,fe.queue),xt(me,fe),me})(N,D=p1(0));D=[b++,D,q],p.set(N,D)}return h=N,g=D[0],D}h=void 0,g=0};let A=new Map;e.webgpuOnCreateSession=N=>{if(g!==void 0){var D=g;if(g=void 0,N){let q=cy(D);A.set(N,q),D===0&&c(h??re(q))}h=void 0}},e.webgpuOnReleaseSession=N=>{A.delete(N)};let O=Symbol("gpuBufferMetadata");e.webgpuRegisterBuffer=(N,D,q)=>{if(q)return N[O]=[q,NaN],q;if(q=N[O])return q[1]++,q[0];if((D=A.get(D))===void 0)throw Error("Invalid session handle passed to webgpuRegisterBuffer");return D=((fe,me=0)=>(fe.mapState!="pending"||Pe(),me=w1(me,fe.mapState=="mapped"?3:1),xt(me,fe),fe.mapState=="mapped"&&(or[me]=[]),me))(N,D),N[O]=[D,1],D},e.webgpuUnregisterBuffer=N=>{let D=N[O];if(!D)throw Error("Buffer is not registered");D[1]--,D[1]===0&&(u1(D[0]),delete N[O])},e.webgpuGetBuffer=N=>re(N),e.webgpuCreateDownloader=(N,D,q)=>{if((q=A.get(q))===void 0)throw Error("Invalid session handle passed to webgpuRegisterBuffer");let fe=re(q),me=16*Math.ceil(Number(D)/16);return async()=>{let Re=fe.createBuffer({size:me,usage:9});try{let ee=fe.createCommandEncoder();return ee.copyBufferToBuffer(N,0,Re,0,me),fe.queue.submit([ee.finish()]),await Re.mapAsync(GPUMapMode.READ),Re.getMappedRange().slice(0,D)}finally{Re.destroy()}}},e.ie=(N,D)=>{var q=D.buffer;let fe=D.byteOffset,me=D.byteLength;if(D=16*Math.ceil(Number(me)/16),N=re(N),!h){var Re=cy(g);h=re(Re)}let 
ee=(Re=h.createBuffer({mappedAtCreation:!0,size:D,usage:6})).getMappedRange();new Uint8Array(ee).set(new Uint8Array(q,fe,me)),Re.unmap(),(q=h.createCommandEncoder()).copyBufferToBuffer(Re,0,N,0,D),h.queue.submit([q.finish()]),Re.destroy()}},e.webnnInit=c=>{let p=c[0];[e.Ie,e.je,e.webnnEnsureTensor,e.ke,e.webnnDownloadTensor,e.He,e.webnnEnableTraceEvent]=c.slice(1),e.webnnReleaseTensorId=e.je,e.webnnUploadTensor=e.ke,e.webnnRegisterMLContext=e.He,e.webnnOnRunStart=h=>p.onRunStart(h),e.webnnOnRunEnd=p.onRunEnd.bind(p),e.webnnOnReleaseSession=h=>{p.onReleaseSession(h)},e.webnnCreateMLTensorDownloader=(h,g)=>p.createMLTensorDownloader(h,g),e.webnnRegisterMLTensor=(h,g,b,A)=>p.registerMLTensor(h,g,b,A),e.webnnCreateMLContext=h=>p.createMLContext(h),e.webnnRegisterMLConstant=(h,g,b,A,O,N)=>p.registerMLConstant(h,g,b,A,O,e.Zc,N),e.webnnRegisterGraphInput=p.registerGraphInput.bind(p),e.webnnIsGraphInput=p.isGraphInput.bind(p),e.webnnRegisterGraphOutput=p.registerGraphOutput.bind(p),e.webnnIsGraphOutput=p.isGraphOutput.bind(p),e.webnnCreateTemporaryTensor=p.createTemporaryTensor.bind(p),e.webnnIsGraphInputOutputTypeSupported=p.isGraphInputOutputTypeSupported.bind(p)},te?e:new Promise((c,p)=>{w=c,x=p})}var hE,vk,KC=ye(()=>{"use strict";hE=bk,vk=globalThis.self?.name?.startsWith("em-pthread"),vk&&bk()}),Ry,Zy,kk,Ot,_E,fu,Ek,Ak,Uy,Mk,By,gE,Dy,wE,l0=ye(()=>{"use strict";i0(),Ry=typeof location>"u"?void 0:location.origin,Zy=Qt.url>"file:"&&Qt.url<"file;",kk=()=>{if(Zy){let t=URL;return new URL(new t("ort.webgpu.bundle.min.mjs",Qt.url).href,Ry).href}return Qt.url},Ot=kk(),_E=()=>{if(Ot&&!Ot.startsWith("blob:"))return Ot.substring(0,Ot.lastIndexOf("/")+1)},fu=(t,e)=>{try{let r=e??Ot;return(r?new URL(t,r):new URL(t)).origin===Ry}catch{return!1}},Ek=(t,e)=>{let r=e??Ot;try{return(r?new URL(t,r):new URL(t)).href}catch{return}},Ak=(t,e)=>`${e??"./"}${t}`,Uy=async t=>{let e=await(await fetch(t,{credentials:"same-origin"})).blob();return URL.createObjectURL(e)},Mk=async t=>(await 
import(t)).default,By=(XC(),xu(dE)).default,gE=async()=>{if(!Ot)throw new Error("Failed to load proxy worker: cannot determine the script source URL.");if(fu(Ot))return[void 0,By()];let t=await Uy(Ot);return[t,By(t)]},Dy=(KC(),xu(mE)).default,wE=async(t,e,r,s)=>{let n=Dy&&!(t||e);if(n)if(Ot)n=fu(Ot);else if(s&&!r)n=!0;else throw new Error("cannot determine the script source URL.");if(n)return[void 0,Dy];{let o="ort-wasm-simd-threaded.asyncify.mjs",a=t??Ek(o,e),i=r&&a&&!fu(a,e),l=i?await Uy(a):a??Ak(o,e);return[i?l:void 0,await Mk(l)]}}}),Fy,mu,si,jy,Tk,Sk,Ok,c0,Ue,ks=ye(()=>{"use strict";l0(),mu=!1,si=!1,jy=!1,Tk=()=>{if(typeof SharedArrayBuffer>"u")return!1;try{return typeof MessageChannel<"u"&&new MessageChannel().port1.postMessage(new SharedArrayBuffer(1)),WebAssembly.validate(new Uint8Array([0,97,115,109,1,0,0,0,1,4,1,96,0,0,3,2,1,0,5,4,1,3,1,1,10,11,1,9,0,65,0,254,16,2,0,26,11]))}catch{return!1}},Sk=()=>{try{return WebAssembly.validate(new Uint8Array([0,97,115,109,1,0,0,0,1,4,1,96,0,0,3,2,1,0,10,30,1,28,0,65,0,253,15,253,12,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,253,186,1,26,11]))}catch{return!1}},Ok=()=>{try{return WebAssembly.validate(new Uint8Array([0,97,115,109,1,0,0,0,1,5,1,96,0,1,123,3,2,1,0,10,19,1,17,0,65,1,253,15,65,2,253,15,65,3,253,15,253,147,2,11]))}catch{return!1}},c0=async t=>{if(mu)return Promise.resolve();if(si)throw new Error("multiple calls to 'initializeWebAssembly()' detected.");if(jy)throw new Error("previous call to 'initializeWebAssembly()' failed.");si=!0;let e=t.initTimeout,r=t.numThreads;if(t.simd!==!1){if(t.simd==="relaxed"){if(!Ok())throw new Error("Relaxed WebAssembly SIMD is not supported in the current environment.")}else if(!Sk())throw new Error("WebAssembly SIMD is not supported in the current environment.")}let s=Tk();r>1&&!s&&(typeof self<"u"&&!self.crossOriginIsolated&&console.warn("env.wasm.numThreads is set to "+r+", but this will not work unless you enable crossOriginIsolated mode. 
See https://web.dev/cross-origin-isolation-guide/ for more info."),console.warn("WebAssembly multi-threading is not supported in the current environment. Falling back to single-threading."),t.numThreads=r=1);let n=t.wasmPaths,o=typeof n=="string"?n:void 0,a=n?.mjs,i=a?.href??a,l=n?.wasm,u=l?.href??l,d=t.wasmBinary,[f,m]=await wE(i,o,r>1,!!d||!!u),_=!1,w=[];if(e>0&&w.push(new Promise(x=>{setTimeout(()=>{_=!0,x()},e)})),w.push(new Promise((x,k)=>{let E={numThreads:r};if(d)E.wasmBinary=d;else if(u||o)E.locateFile=M=>u??o+M;else if(i&&i.indexOf("blob:")!==0)E.locateFile=M=>new URL(M,i).href;else if(f){let M=_E();M&&(E.locateFile=I=>M+I)}m(E).then(M=>{si=!1,mu=!0,Fy=M,x(),f&&URL.revokeObjectURL(f)},M=>{si=!1,jy=!0,k(M)})})),await Promise.race(w),_)throw new Error(`WebAssembly backend initializing failed due to timeout: ${e}ms`)},Ue=()=>{if(mu&&Fy)return Fy;throw new Error("WebAssembly is not initialized yet.")}}),It,bu,Ie,u0=ye(()=>{"use strict";ks(),It=(t,e)=>{let r=Ue(),s=r.lengthBytesUTF8(t)+1,n=r._malloc(s);return r.stringToUTF8(t,n,s),e.push(n),n},bu=(t,e,r,s)=>{if(typeof t=="object"&&t!==null){if(r.has(t))throw new Error("Circular reference in options");r.add(t)}Object.entries(t).forEach(([n,o])=>{let a=e?e+n:n;if(typeof o=="object")bu(o,a+".",r,s);else if(typeof o=="string"||typeof o=="number")s(a,o.toString());else if(typeof o=="boolean")s(a,o?"1":"0");else throw new Error(`Can't handle extra config type: ${typeof o}`)})},Ie=t=>{let e=Ue(),r=e.stackSave();try{let s=e.PTR_SIZE,n=e.stackAlloc(2*s);e._OrtGetLastError(n,n+s);let o=Number(e.getValue(n,s===4?"i32":"i64")),a=e.getValue(n+s,"*"),i=a?e.UTF8ToString(a):"";throw new Error(`${t} ERROR_CODE: ${o}, ERROR_MESSAGE: ${i}`)}finally{e.stackRestore(r)}}}),xE,YC=ye(()=>{"use strict";ks(),u0(),xE=t=>{let e=Ue(),r=0,s=[],n=t||{};try{if(t?.logSeverityLevel===void 0)n.logSeverityLevel=2;else if(typeof t.logSeverityLevel!="number"||!Number.isInteger(t.logSeverityLevel)||t.logSeverityLevel<0||t.logSeverityLevel>4)throw 
new Error(`log severity level is not valid: ${t.logSeverityLevel}`);if(t?.logVerbosityLevel===void 0)n.logVerbosityLevel=0;else if(typeof t.logVerbosityLevel!="number"||!Number.isInteger(t.logVerbosityLevel))throw new Error(`log verbosity level is not valid: ${t.logVerbosityLevel}`);t?.terminate===void 0&&(n.terminate=!1);let o=0;return t?.tag!==void 0&&(o=It(t.tag,s)),r=e._OrtCreateRunOptions(n.logSeverityLevel,n.logVerbosityLevel,!!n.terminate,o),r===0&&Ie("Can't create run options."),t?.extra!==void 0&&bu(t.extra,"",new WeakSet,(a,i)=>{let l=It(a,s),u=It(i,s);e._OrtAddRunConfigEntry(r,l,u)!==0&&Ie(`Can't set a run config entry: ${a} - ${i}.`)}),[r,s]}catch(o){throw r!==0&&e._OrtReleaseRunOptions(r),s.forEach(a=>e._free(a)),o}}}),Ik,Ck,Pk,hu,Dr,zk,yE,QC=ye(()=>{"use strict";ks(),u0(),Ik=t=>{switch(t){case"disabled":return 0;case"basic":return 1;case"extended":return 2;case"layout":return 3;case"all":return 99;default:throw new Error(`unsupported graph optimization level: ${t}`)}},Ck=t=>{switch(t){case"sequential":return 0;case"parallel":return 1;default:throw new Error(`unsupported execution mode: ${t}`)}},Pk=t=>{t.extra||(t.extra={}),t.extra.session||(t.extra.session={});let e=t.extra.session;e.use_ort_model_bytes_directly||(e.use_ort_model_bytes_directly="1"),t.executionProviders&&t.executionProviders.some(r=>(typeof r=="string"?r:r.name)==="webgpu")&&(t.enableMemPattern=!1)},hu=(t,e,r,s)=>{let n=It(e,s),o=It(r,s);Ue()._OrtAddSessionConfigEntry(t,n,o)!==0&&Ie(`Can't set a session config entry: ${e} - ${r}.`)},Dr=(t,e,r,s)=>{let n=It(e,s),o=It(r,s);t.push([n,o])},zk=async(t,e,r)=>{let s=e.executionProviders;for(let n of s){let o=typeof n=="string"?n:n.name,a=[];switch(o){case"webnn":if(o="WEBNN",typeof n!="string"){let f=n?.deviceType;f&&hu(t,"deviceType",f,r)}break;case"webgpu":{o="WebGPU";let f;if(typeof n!="string"){let _=n;if(_.device)if(typeof GPUDevice<"u"&&_.device instanceof GPUDevice)f=_.device;else throw new Error("Invalid GPU device set in WebGPU EP 
options.");let{enableGraphCapture:w}=e;if(typeof w=="boolean"&&w&&Dr(a,"enableGraphCapture","1",r),typeof _.preferredLayout=="string"&&Dr(a,"preferredLayout",_.preferredLayout,r),_.forceCpuNodeNames){let x=Array.isArray(_.forceCpuNodeNames)?_.forceCpuNodeNames:[_.forceCpuNodeNames];Dr(a,"forceCpuNodeNames",x.join(`
|
|
15
|
-
`),r)}_.validationMode&&Dr(a,"validationMode",_.validationMode,r)}let m=Ue().webgpuRegisterDevice(f);if(m){let[_,w,x]=m;Dr(a,"deviceId",_.toString(),r),Dr(a,"webgpuInstance",w.toString(),r),Dr(a,"webgpuDevice",x.toString(),r)}}break;case"wasm":case"cpu":continue;default:throw new Error(`not supported execution provider: ${o}`)}let i=It(o,r),l=a.length,u=0,d=0;if(l>0){u=Ue()._malloc(l*Ue().PTR_SIZE),r.push(u),d=Ue()._malloc(l*Ue().PTR_SIZE),r.push(d);for(let f=0;f<l;f++)Ue().setValue(u+f*Ue().PTR_SIZE,a[f][0],"*"),Ue().setValue(d+f*Ue().PTR_SIZE,a[f][1],"*")}await Ue()._OrtAppendExecutionProvider(t,i,u,d,l)!==0&&Ie(`Can't append execution provider: ${o}.`)}},yE=async t=>{let e=Ue(),r=0,s=[],n=t||{};Pk(n);try{let o=Ik(n.graphOptimizationLevel??"all"),a=Ck(n.executionMode??"sequential"),i=typeof n.logId=="string"?It(n.logId,s):0,l=n.logSeverityLevel??2;if(!Number.isInteger(l)||l<0||l>4)throw new Error(`log severity level is not valid: ${l}`);let u=n.logVerbosityLevel??0;if(!Number.isInteger(u)||u<0||u>4)throw new Error(`log verbosity level is not valid: ${u}`);let d=typeof n.optimizedModelFilePath=="string"?It(n.optimizedModelFilePath,s):0;if(r=e._OrtCreateSessionOptions(o,!!n.enableCpuMemArena,!!n.enableMemPattern,a,!!n.enableProfiling,0,i,l,u,d),r===0&&Ie("Can't create session options."),n.executionProviders&&await zk(r,n,s),n.enableGraphCapture!==void 0){if(typeof n.enableGraphCapture!="boolean")throw new Error(`enableGraphCapture must be a boolean value: ${n.enableGraphCapture}`);hu(r,"enableGraphCapture",n.enableGraphCapture.toString(),s)}if(n.freeDimensionOverrides)for(let[f,m]of Object.entries(n.freeDimensionOverrides)){if(typeof f!="string")throw new Error(`free dimension override name must be a string: ${f}`);if(typeof m!="number"||!Number.isInteger(m)||m<0)throw new Error(`free dimension override value must be a non-negative integer: ${m}`);let _=It(f,s);e._OrtAddFreeDimensionOverride(r,_,m)!==0&&Ie(`Can't set a free dimension override: ${f} - ${m}.`)}return 
n.extra!==void 0&&bu(n.extra,"",new WeakSet,(f,m)=>{hu(r,f,m,s)}),[r,s]}catch(o){throw r!==0&&e._OrtReleaseSessionOptions(r)!==0&&Ie("Can't release session options."),s.forEach(a=>e._free(a)),o}}}),ws,wu,hn,li,vu,p0,d0,e0,_n=ye(()=>{"use strict";ws=t=>{switch(t){case"int8":return 3;case"uint8":return 2;case"bool":return 9;case"int16":return 5;case"uint16":return 4;case"int32":return 6;case"uint32":return 12;case"float16":return 10;case"float32":return 1;case"float64":return 11;case"string":return 8;case"int64":return 7;case"uint64":return 13;case"int4":return 22;case"uint4":return 21;default:throw new Error(`unsupported data type: ${t}`)}},wu=t=>{switch(t){case 3:return"int8";case 2:return"uint8";case 9:return"bool";case 5:return"int16";case 4:return"uint16";case 6:return"int32";case 12:return"uint32";case 10:return"float16";case 1:return"float32";case 11:return"float64";case 8:return"string";case 7:return"int64";case 13:return"uint64";case 22:return"int4";case 21:return"uint4";default:throw new Error(`unsupported data type: ${t}`)}},hn=(t,e)=>{let r=[-1,4,1,1,2,2,4,8,-1,1,2,8,4,8,-1,-1,-1,-1,-1,-1,-1,.5,.5][t],s=typeof e=="number"?e:e.reduce((n,o)=>n*o,1);return r>0?Math.ceil(s*r):void 0},li=t=>{switch(t){case"float16":return typeof Float16Array<"u"&&Float16Array.from?Float16Array:Uint16Array;case"float32":return Float32Array;case"uint8":return Uint8Array;case"int8":return Int8Array;case"uint16":return Uint16Array;case"int16":return Int16Array;case"int32":return Int32Array;case"bool":return Uint8Array;case"float64":return Float64Array;case"uint32":return Uint32Array;case"int64":return BigInt64Array;case"uint64":return BigUint64Array;default:throw new Error(`unsupported type: ${t}`)}},vu=t=>{switch(t){case"verbose":return 0;case"info":return 1;case"warning":return 2;case"error":return 3;case"fatal":return 4;default:throw new Error(`unsupported logging level: 
${t}`)}},p0=t=>t==="float32"||t==="float16"||t==="int32"||t==="int64"||t==="uint32"||t==="uint8"||t==="bool"||t==="uint4"||t==="int4",d0=t=>t==="float32"||t==="float16"||t==="int32"||t==="int64"||t==="uint32"||t==="uint64"||t==="int8"||t==="uint8"||t==="bool"||t==="uint4"||t==="int4",e0=t=>{switch(t){case"none":return 0;case"cpu":return 1;case"cpu-pinned":return 2;case"texture":return 3;case"gpu-buffer":return 4;case"ml-tensor":return 5;default:throw new Error(`unsupported data location: ${t}`)}}}),f0,bE=ye(()=>{"use strict";i0(),f0=async t=>{if(typeof t=="string"){let e=await fetch(t);if(!e.ok)throw new Error(`failed to load external data file: ${t}`);let r=e.headers.get("Content-Length"),s=r?parseInt(r,10):0;if(s<1073741824)return new Uint8Array(await e.arrayBuffer());{if(!e.body)throw new Error(`failed to load external data file: ${t}, no response body.`);let n=e.body.getReader(),o;try{o=new ArrayBuffer(s)}catch(i){if(i instanceof RangeError){let l=Math.ceil(s/65536);o=new WebAssembly.Memory({initial:l,maximum:l}).buffer}else throw i}let a=0;for(;;){let{done:i,value:l}=await n.read();if(i)break;let u=l.byteLength;new Uint8Array(o,a,u).set(l),a+=u}return new Uint8Array(o,0,s)}}else return t instanceof Blob?new Uint8Array(await t.arrayBuffer()):t instanceof Uint8Array?t:new Uint8Array(t)}}),vE,JC=ye(()=>{"use strict";_n(),vE=(t,e)=>new(li(e))(t)}),Lk,Nk,$k,Rk,kE,Uk,_t,EE=ye(()=>{"use strict";_n(),Lk=["V","I","W","E","F"],Nk=(t,e)=>{console.log(`[${Lk[t]},${new Date().toISOString()}]${e}`)},kE=(t,e)=>{$k=t,Rk=e},Uk=(t,e)=>{let r=vu(t),s=vu($k);r>=s&&Nk(r,typeof e=="function"?e():e)},_t=(...t)=>{Rk&&Uk(...t)}}),Gy,t0,qy,Bk,Wy,Dk,Vy,Hy,Xy,Fk,AE,ZC=ye(()=>{"use strict";_n(),EE(),Gy=new Map([["float32",32],["float16",16],["int32",32],["uint32",32],["int64",64],["uint64",64],["int8",8],["uint8",8],["int4",4],["uint4",4]]),t0=(t,e)=>{if(e==="int32")return t;let r=Gy.get(e);if(!r)throw new Error(`WebNN backend does not support data type: ${e}`);let 
s=r/8;if(t.byteLength%s!==0)throw new Error(`Invalid Uint8Array length - must be a multiple of ${s}.`);let n=t.byteLength/s,o=new(li(e))(t.buffer,t.byteOffset,n);switch(e){case"int64":case"uint64":{let a=new Int32Array(n);for(let i=0;i<n;i++){let l=o[i];if(l>2147483647n||l<-2147483648n)throw new Error("Can not convert int64 data to int32 - value out of range.");a[i]=Number(l)}return new Uint8Array(a.buffer)}case"int8":case"uint8":case"uint32":{if(e==="uint32"&&o.some(i=>i>2147483647))throw new Error("Can not convert uint32 data to int32 - value out of range.");let a=Int32Array.from(o,Number);return new Uint8Array(a.buffer)}default:throw new Error(`Unsupported data conversion from ${e} to 'int32'`)}},qy=(t,e)=>{if(e==="int32")return t;if(t.byteLength%4!==0)throw new Error("Invalid Uint8Array length - must be a multiple of 4 (int32).");let r=t.byteLength/4,s=new Int32Array(t.buffer,t.byteOffset,r);switch(e){case"int64":{let n=BigInt64Array.from(s,BigInt);return new Uint8Array(n.buffer)}case"uint64":{if(s.some(o=>o<0))throw new Error("Can not convert int32 data to uin64 - negative value found.");let n=BigUint64Array.from(s,BigInt);return new Uint8Array(n.buffer)}case"int8":{if(s.some(o=>o<-128||o>127))throw new Error("Can not convert int32 data to int8 - value out of range.");let n=Int8Array.from(s,Number);return new Uint8Array(n.buffer)}case"uint8":{if(s.some(n=>n<0||n>255))throw new Error("Can not convert int32 data to uint8 - value out of range.");return Uint8Array.from(s,Number)}case"uint32":{if(s.some(o=>o<0))throw new Error("Can not convert int32 data to uint32 - negative value found.");let n=Uint32Array.from(s,Number);return new Uint8Array(n.buffer)}default:throw new Error(`Unsupported data conversion from 'int32' to ${e}`)}},Bk=1,Wy=()=>Bk++,Dk=new Map([["int8","int32"],["uint8","int32"],["uint32","int32"],["int64","int32"]]),Vy=(t,e)=>{let r=Gy.get(t);if(!r)throw new Error(`WebNN backend does not support data type: ${t}`);return 
e.length>0?Math.ceil(e.reduce((s,n)=>s*n)*r/8):0},Hy=class{constructor(t){this.isDataConverted=!1;let{sessionId:e,context:r,tensor:s,dataType:n,shape:o,fallbackDataType:a}=t;this.sessionId=e,this.mlContext=r,this.mlTensor=s,this.dataType=n,this.tensorShape=o,this.fallbackDataType=a}get tensor(){return this.mlTensor}get type(){return this.dataType}get fallbackType(){return this.fallbackDataType}get shape(){return this.tensorShape}get byteLength(){return Vy(this.dataType,this.tensorShape)}destroy(){_t("verbose",()=>"[WebNN] TensorWrapper.destroy"),this.mlTensor.destroy()}write(t){this.mlContext.writeTensor(this.mlTensor,t)}async read(t){if(this.fallbackDataType){let e=await this.mlContext.readTensor(this.mlTensor),r=qy(new Uint8Array(e),this.dataType);if(t){(t instanceof ArrayBuffer?new Uint8Array(t):new Uint8Array(t.buffer,t.byteOffset,t.byteLength)).set(r);return}else return r.buffer}else return t?this.mlContext.readTensor(this.mlTensor,t):this.mlContext.readTensor(this.mlTensor)}canReuseTensor(t,e,r){return this.mlContext===t&&this.dataType===e&&this.tensorShape.length===r.length&&this.tensorShape.every((s,n)=>s===r[n])}setIsDataConverted(t){this.isDataConverted=t}},Xy=class{constructor(t,e){this.tensorManager=t,this.wrapper=e}get tensorWrapper(){return this.wrapper}releaseTensor(){this.tensorWrapper&&(this.tensorManager.releaseTensor(this.tensorWrapper),this.wrapper=void 0)}async ensureTensor(t,e,r,s){let n=this.tensorManager.getMLContext(t),o=this.tensorManager.getMLOpSupportLimits(t),a;if(!o?.input.dataTypes.includes(e)){if(a=Dk.get(e),!a||o?.input.dataTypes.includes(a))throw new Error(`WebNN backend does not support data type: ${e}`);_t("verbose",()=>`[WebNN] TensorIdTracker.ensureTensor: fallback dataType from ${e} to ${a}`)}if(this.wrapper){if(this.wrapper.canReuseTensor(n,e,r))return this.wrapper.tensor;if(s){if(this.wrapper.byteLength!==Vy(e,r))throw new Error("Unable to copy data to tensor with different size.");this.activeUpload=new Uint8Array(await 
this.wrapper.read())}this.tensorManager.releaseTensor(this.wrapper)}let i=typeof MLTensorUsage>"u"?void 0:MLTensorUsage.READ|MLTensorUsage.WRITE;return this.wrapper=await this.tensorManager.getCachedTensor(t,e,r,i,!0,!0,a),s&&this.activeUpload&&(this.wrapper.write(this.activeUpload),this.activeUpload=void 0),this.wrapper.tensor}upload(t){let e=t;if(this.wrapper){if(this.wrapper.fallbackType)if(this.wrapper.fallbackType==="int32")e=t0(t,this.wrapper.type),this.wrapper.setIsDataConverted(!0);else throw new Error(`Unsupported fallback data type: ${this.wrapper.fallbackType}`);if(t.byteLength===this.wrapper.byteLength){this.wrapper.write(e);return}else _t("verbose",()=>"Data size does not match tensor size. Releasing tensor."),this.releaseTensor()}this.activeUpload?this.activeUpload.set(e):this.activeUpload=new Uint8Array(e)}async download(t){if(this.activeUpload){let e=this.wrapper?.isDataConverted?qy(this.activeUpload,this.wrapper?.type):this.activeUpload;if(t){t instanceof ArrayBuffer?new Uint8Array(t).set(e):new Uint8Array(t.buffer,t.byteOffset,t.byteLength).set(e);return}else return e.buffer}if(!this.wrapper)throw new Error("Tensor has not been created.");return t?this.wrapper.read(t):this.wrapper.read()}},Fk=class{constructor(t){this.backend=t,this.tensorTrackersById=new Map,this.freeTensors=[],this.externalTensors=new Set}getMLContext(t){let e=this.backend.getMLContext(t);if(!e)throw new Error("MLContext not found for session.");return e}getMLOpSupportLimits(t){return this.backend.getMLOpSupportLimits(t)}reserveTensorId(){let t=Wy();return this.tensorTrackersById.set(t,new Xy(this)),t}releaseTensorId(t){let e=this.tensorTrackersById.get(t);e&&(this.tensorTrackersById.delete(t),e.tensorWrapper&&this.releaseTensor(e.tensorWrapper))}async ensureTensor(t,e,r,s,n){_t("verbose",()=>`[WebNN] TensorManager.ensureTensor {tensorId: ${e}, dataType: ${r}, shape: ${s}, copyOld: ${n}}`);let o=this.tensorTrackersById.get(e);if(!o)throw new Error("Tensor not found.");return 
o.ensureTensor(t,r,s,n)}upload(t,e){let r=this.tensorTrackersById.get(t);if(!r)throw new Error("Tensor not found.");r.upload(e)}async download(t,e){_t("verbose",()=>`[WebNN] TensorManager.download {tensorId: ${t}, dstBuffer: ${e?.byteLength}}`);let r=this.tensorTrackersById.get(t);if(!r)throw new Error("Tensor not found.");return r.download(e)}releaseTensorsForSession(t){for(let e of this.freeTensors)e.sessionId===t&&e.destroy();this.freeTensors=this.freeTensors.filter(e=>e.sessionId!==t)}registerTensor(t,e,r,s){let n=this.getMLContext(t),o=Wy(),a=new Hy({sessionId:t,context:n,tensor:e,dataType:r,shape:s});return this.tensorTrackersById.set(o,new Xy(this,a)),this.externalTensors.add(a),o}async getCachedTensor(t,e,r,s,n,o,a){let i=this.getMLContext(t);for(let[u,d]of this.freeTensors.entries())if(d.canReuseTensor(i,e,r)){_t("verbose",()=>`[WebNN] Reusing tensor {dataType: ${e}, ${a?`fallbackDataType: ${a},`:""} shape: ${r}`);let f=this.freeTensors.splice(u,1)[0];return f.sessionId=t,f}_t("verbose",()=>`[WebNN] MLContext.createTensor {dataType: ${e}, ${a?`fallbackDataType: ${a},`:""} shape: ${r}}`);let l=await i.createTensor({dataType:a??e,shape:r,dimensions:r,usage:s,writable:n,readable:o});return new Hy({sessionId:t,context:i,tensor:l,dataType:e,shape:r,fallbackDataType:a})}releaseTensor(t){this.externalTensors.has(t)&&this.externalTensors.delete(t),this.freeTensors.push(t)}},AE=(...t)=>new Fk(...t)}),ME={};ci(ME,{WebNNBackend:()=>TE});var ni,jk,TE,eP=ye(()=>{"use strict";_n(),ks(),JC(),ZC(),EE(),ni=new Map([[1,"float32"],[10,"float16"],[6,"int32"],[12,"uint32"],[7,"int64"],[13,"uint64"],[22,"int4"],[21,"uint4"],[3,"int8"],[2,"uint8"],[9,"uint8"]]),jk=(t,e)=>{if(t===e)return!0;if(t===void 0||e===void 0)return!1;let r=Object.keys(t).sort(),s=Object.keys(e).sort();return r.length===s.length&&r.every((n,o)=>n===s[o]&&t[n]===e[n])},TE=class{constructor(t){this.tensorManager=AE(this),this.mlContextBySessionId=new Map,this.sessionIdsByMLContext=new 
Map,this.mlContextCache=[],this.sessionGraphInputs=new Map,this.sessionGraphOutputs=new Map,this.temporaryGraphInputs=[],this.temporaryGraphOutputs=[],this.temporarySessionTensorIds=new Map,this.mlOpSupportLimitsBySessionId=new Map,kE(t.logLevel,!!t.debug)}get currentSessionId(){if(this.activeSessionId===void 0)throw new Error("No active session");return this.activeSessionId}onRunStart(t){_t("verbose",()=>`[WebNN] onRunStart {sessionId: ${t}}`),this.activeSessionId=t}onRunEnd(t){_t("verbose",()=>`[WebNN] onRunEnd {sessionId: ${t}}`);let e=this.temporarySessionTensorIds.get(t);if(e){for(let r of e)_t("verbose",()=>`[WebNN] releasing temporary tensor {tensorId: ${r}}`),this.tensorManager.releaseTensorId(r);this.temporarySessionTensorIds.delete(t),this.activeSessionId=void 0}}async createMLContext(t){if(t instanceof GPUDevice){let r=this.mlContextCache.findIndex(s=>s.gpuDevice===t);if(r!==-1)return this.mlContextCache[r].mlContext;{let s=await navigator.ml.createContext(t);return this.mlContextCache.push({gpuDevice:t,mlContext:s}),s}}else if(t===void 0){let r=this.mlContextCache.findIndex(s=>s.options===void 0&&s.gpuDevice===void 0);if(r!==-1)return this.mlContextCache[r].mlContext;{let s=await navigator.ml.createContext();return this.mlContextCache.push({mlContext:s}),s}}let e=this.mlContextCache.findIndex(r=>jk(r.options,t));if(e!==-1)return this.mlContextCache[e].mlContext;{let r=await navigator.ml.createContext(t);return this.mlContextCache.push({options:t,mlContext:r}),r}}registerMLContext(t,e){this.mlContextBySessionId.set(t,e);let r=this.sessionIdsByMLContext.get(e);r||(r=new 
Set,this.sessionIdsByMLContext.set(e,r)),r.add(t),this.mlOpSupportLimitsBySessionId.has(t)||this.mlOpSupportLimitsBySessionId.set(t,e.opSupportLimits()),this.temporaryGraphInputs.length>0&&(this.sessionGraphInputs.set(t,this.temporaryGraphInputs),this.temporaryGraphInputs=[]),this.temporaryGraphOutputs.length>0&&(this.sessionGraphOutputs.set(t,this.temporaryGraphOutputs),this.temporaryGraphOutputs=[])}onReleaseSession(t){this.sessionGraphInputs.delete(t),this.sessionGraphOutputs.delete(t);let e=this.mlContextBySessionId.get(t);if(!e)return;this.tensorManager.releaseTensorsForSession(t),this.mlContextBySessionId.delete(t),this.mlOpSupportLimitsBySessionId.delete(t);let r=this.sessionIdsByMLContext.get(e);if(r.delete(t),r.size===0){this.sessionIdsByMLContext.delete(e);let s=this.mlContextCache.findIndex(n=>n.mlContext===e);s!==-1&&this.mlContextCache.splice(s,1)}}getMLContext(t){return this.mlContextBySessionId.get(t)}getMLOpSupportLimits(t){return this.mlOpSupportLimitsBySessionId.get(t)}reserveTensorId(){return this.tensorManager.reserveTensorId()}releaseTensorId(t){_t("verbose",()=>`[WebNN] releaseTensorId {tensorId: ${t}}`),this.tensorManager.releaseTensorId(t)}async ensureTensor(t,e,r,s,n){let o=ni.get(r);if(!o)throw new Error(`Unsupported ONNX data type: ${r}`);return this.tensorManager.ensureTensor(t??this.currentSessionId,e,o,s,n)}async createTemporaryTensor(t,e,r){_t("verbose",()=>`[WebNN] createTemporaryTensor {onnxDataType: ${e}, shape: ${r}}`);let s=ni.get(e);if(!s)throw new Error(`Unsupported ONNX data type: ${e}`);let n=this.tensorManager.reserveTensorId();await this.tensorManager.ensureTensor(t,n,s,r,!1);let o=this.temporarySessionTensorIds.get(t);return o?o.push(n):this.temporarySessionTensorIds.set(t,[n]),n}uploadTensor(t,e){if(!Ue().shouldTransferToMLTensor)throw new Error("Trying to upload to a MLTensor while shouldTransferToMLTensor is false");_t("verbose",()=>`[WebNN] uploadTensor {tensorId: ${t}, data: 
${e.byteLength}}`),this.tensorManager.upload(t,e)}async downloadTensor(t,e){return this.tensorManager.download(t,e)}createMLTensorDownloader(t,e){return async()=>{let r=await this.tensorManager.download(t);return vE(r,e)}}registerMLTensor(t,e,r,s){let n=ni.get(r);if(!n)throw new Error(`Unsupported ONNX data type: ${r}`);let o=this.tensorManager.registerTensor(t,e,n,s);return _t("verbose",()=>`[WebNN] registerMLTensor {tensor: ${e}, dataType: ${n}, dimensions: ${s}} -> {tensorId: ${o}}`),o}registerMLConstant(t,e,r,s,n,o,a=!1){if(!o)throw new Error("External mounted files are not available.");let i=t;t.startsWith("./")&&(i=t.substring(2));let l=o.get(i);if(!l)throw new Error(`File with name ${i} not found in preloaded files.`);if(e+r>l.byteLength)throw new Error("Out of bounds: data offset and length exceed the external file data size.");let u=l.slice(e,e+r).buffer,d;switch(n.dataType){case"float32":d=new Float32Array(u);break;case"float16":d=typeof Float16Array<"u"&&Float16Array.from?new Float16Array(u):new Uint16Array(u);break;case"int32":d=new Int32Array(u);break;case"uint32":d=new Uint32Array(u);break;case"int64":if(a){let f=t0(new Uint8Array(u),"int64");d=new Int32Array(f.buffer),n.dataType="int32"}else d=new BigInt64Array(u);break;case"uint64":d=new BigUint64Array(u);break;case"int8":d=new Int8Array(u);break;case"int4":case"uint4":case"uint8":d=new Uint8Array(u);break;default:throw new Error(`Unsupported data type: ${n.dataType} in creating WebNN Constant from external data.`)}return _t("verbose",()=>`[WebNN] registerMLConstant {dataType: ${n.dataType}, shape: ${n.shape}}} ${a?"(Note: it was int64 data type and registered to int32 as workaround)":""}`),s.constant(n,d)}registerGraphInput(t){this.temporaryGraphInputs.push(t)}registerGraphOutput(t){this.temporaryGraphOutputs.push(t)}isGraphInput(t,e){let r=this.sessionGraphInputs.get(t);return r?r.includes(e):!1}isGraphOutput(t,e){let r=this.sessionGraphOutputs.get(t);return 
r?r.includes(e):!1}isGraphInputOutputTypeSupported(t,e,r=!0){let s=ni.get(ws(e)),n=this.mlOpSupportLimitsBySessionId.get(t);return typeof s>"u"?!1:r?!!n?.input.dataTypes.includes(s):!!n?.output.dataTypes.includes(s)}flush(){}}}),Gk,m0,h0,Fr,qk,Ky,ku,_0,g0,Yy,w0,x0,y0,SE=ye(()=>{"use strict";vs(),YC(),QC(),_n(),ks(),u0(),bE(),Gk=(t,e)=>{Ue()._OrtInit(t,e)!==0&&Ie("Can't initialize onnxruntime.")},m0=async t=>{Gk(t.wasm.numThreads,vu(t.logLevel))},h0=async(t,e)=>{Ue().asyncInit?.();let r=t.webgpu.adapter;if(e==="webgpu"){if(typeof navigator>"u"||!navigator.gpu)throw new Error("WebGPU is not supported in current environment");if(r){if(typeof r.limits!="object"||typeof r.features!="object"||typeof r.requestDevice!="function")throw new Error("Invalid GPU adapter set in `env.webgpu.adapter`. It must be a GPUAdapter object.")}else{let s=t.webgpu.powerPreference;if(s!==void 0&&s!=="low-power"&&s!=="high-performance")throw new Error(`Invalid powerPreference setting: "${s}"`);let n=t.webgpu.forceFallbackAdapter;if(n!==void 0&&typeof n!="boolean")throw new Error(`Invalid forceFallbackAdapter setting: "${n}"`);if(r=await navigator.gpu.requestAdapter({powerPreference:s,forceFallbackAdapter:n}),!r)throw new Error('Failed to get GPU adapter. 
You may need to enable flag "--enable-unsafe-webgpu" if you are using Chrome.')}}if(e==="webnn"&&(typeof navigator>"u"||!navigator.ml))throw new Error("WebNN is not supported in current environment");if(e==="webgpu"&&Ue().webgpuInit(s=>{t.webgpu.device=s}),e==="webnn"){let s=new(eP(),xu(ME)).WebNNBackend(t);Ue().webnnInit([s,()=>s.reserveTensorId(),n=>s.releaseTensorId(n),async(n,o,a,i,l)=>s.ensureTensor(n,o,a,i,l),(n,o)=>{s.uploadTensor(n,o)},async(n,o)=>s.downloadTensor(n,o),(n,o)=>s.registerMLContext(n,o),!!t.trace])}},Fr=new Map,qk=t=>{let e=Ue(),r=e.stackSave();try{let s=e.PTR_SIZE,n=e.stackAlloc(2*s);e._OrtGetInputOutputCount(t,n,n+s)!==0&&Ie("Can't get session input/output count.");let o=s===4?"i32":"i64";return[Number(e.getValue(n,o)),Number(e.getValue(n+s,o))]}finally{e.stackRestore(r)}},Ky=(t,e)=>{let r=Ue(),s=r.stackSave(),n=0;try{let o=r.PTR_SIZE,a=r.stackAlloc(2*o);r._OrtGetInputOutputMetadata(t,e,a,a+o)!==0&&Ie("Can't get session input/output metadata.");let i=Number(r.getValue(a,"*"));n=Number(r.getValue(a+o,"*"));let l=r.HEAP32[n/4];if(l===0)return[i,0];let u=r.HEAPU32[n/4+1],d=[];for(let f=0;f<u;f++){let m=Number(r.getValue(n+8+f*o,"*"));d.push(m!==0?r.UTF8ToString(m):Number(r.getValue(n+8+(f+u)*o,"*")))}return[i,l,d]}finally{r.stackRestore(s),n!==0&&r._OrtFree(n)}},ku=t=>{let e=Ue(),r=e._malloc(t.byteLength);if(r===0)throw new Error(`Can't create a session. 
failed to allocate a buffer of size ${t.byteLength}.`);return e.HEAPU8.set(t,r),[r,t.byteLength]},_0=async(t,e)=>{let r,s,n=Ue();Array.isArray(t)?[r,s]=t:t.buffer===n.HEAPU8.buffer?[r,s]=[t.byteOffset,t.byteLength]:[r,s]=ku(t);let o=0,a=0,i=0,l=[],u=[],d=[];try{if([a,l]=await yE(e),e?.externalData&&n.mountExternalData){let T=[];for(let z of e.externalData){let C=typeof z=="string"?z:z.path;T.push(f0(typeof z=="string"?z:z.data).then(v=>{n.mountExternalData(C,v)}))}await Promise.all(T)}for(let T of e?.executionProviders??[])if((typeof T=="string"?T:T.name)==="webnn"){if(n.shouldTransferToMLTensor=!1,typeof T!="string"){let z=T,C=z?.context,v=z?.gpuDevice,G=z?.deviceType,X=z?.powerPreference;C?n.currentContext=C:v?n.currentContext=await n.webnnCreateMLContext(v):n.currentContext=await n.webnnCreateMLContext({deviceType:G,powerPreference:X})}else n.currentContext=await n.webnnCreateMLContext();break}o=await n._OrtCreateSession(r,s,a),n.webgpuOnCreateSession?.(o),o===0&&Ie("Can't create a session."),n.jsepOnCreateSession?.(),n.currentContext&&(n.webnnRegisterMLContext(o,n.currentContext),n.currentContext=void 0,n.shouldTransferToMLTensor=!0);let[f,m]=qk(o),_=!!e?.enableGraphCapture,w=[],x=[],k=[],E=[],M=[];for(let T=0;T<f;T++){let[z,C,v]=Ky(o,T);z===0&&Ie("Can't get an input name."),u.push(z);let G=n.UTF8ToString(z);w.push(G),k.push(C===0?{name:G,isTensor:!1}:{name:G,isTensor:!0,type:wu(C),shape:v})}for(let T=0;T<m;T++){let[z,C,v]=Ky(o,T+f);z===0&&Ie("Can't get an output name."),d.push(z);let G=n.UTF8ToString(z);x.push(G),E.push(C===0?{name:G,isTensor:!1}:{name:G,isTensor:!0,type:wu(C),shape:v});{if(_&&e?.preferredOutputLocation===void 0){M.push("gpu-buffer");continue}let X=typeof e?.preferredOutputLocation=="string"?e.preferredOutputLocation:e?.preferredOutputLocation?.[G]??"cpu",V=n.webnnIsGraphOutput;if(X==="cpu"&&V&&V(o,G)){M.push("ml-tensor-cpu-output");continue}if(X!=="cpu"&&X!=="cpu-pinned"&&X!=="gpu-buffer"&&X!=="ml-tensor")throw new Error(`Not supported 
/**
 * Release a session and everything registered for it in the `Fr` session table.
 *
 * Order of operations: clear/release the IO binding (if one exists), notify the
 * optional JSEP / WebNN / WebGPU release hooks, free the input and output name
 * pointers, release the native session, then drop the table entry.
 *
 * @param sessionId key of the session in `Fr`.
 * @throws {Error} when `sessionId` is not present in `Fr`.
 */
g0 = (sessionId) => {
  const wasm = Ue();
  const entry = Fr.get(sessionId);
  if (!entry) {
    throw new Error(`cannot release session. invalid session id: ${sessionId}`);
  }

  const [sessionHandle, inputNamePtrs, outputNamePtrs, ioBinding, graphCaptureEnabled] = entry;

  if (ioBinding) {
    // Bound outputs are only cleared here when graph capture is enabled.
    if (graphCaptureEnabled && wasm._OrtClearBoundOutputs(ioBinding.handle) !== 0) {
      Ie("Can't clear bound outputs.");
    }
    if (wasm._OrtReleaseBinding(ioBinding.handle) !== 0) {
      Ie("Can't release IO binding.");
    }
  }

  // Backend hooks are optional; each is only called when present on the module.
  wasm.jsepOnReleaseSession?.(sessionId);
  wasm.webnnOnReleaseSession?.(sessionId);
  wasm.webgpuOnReleaseSession?.(sessionId);

  for (const namePtr of inputNamePtrs) {
    wasm._OrtFree(namePtr);
  }
  for (const namePtr of outputNamePtrs) {
    wasm._OrtFree(namePtr);
  }

  if (wasm._OrtReleaseSession(sessionHandle) !== 0) {
    Ie("Can't release session.");
  }
  Fr.delete(sessionId);
};
M=i.webnnRegisterMLTensor;if(!M)throw new Error('Tensor location "ml-tensor" is not supported without using WebNN.');_=M(s,E,ws(u),d)}else{let E=t[2];if(Array.isArray(E)){w=l*E.length,_=i._malloc(w),r.push(_);for(let M=0;M<E.length;M++){if(typeof E[M]!="string")throw new TypeError(`tensor data at index ${M} is not a string`);i.setValue(_+M*l,It(E[M],r),"*")}}else{let M=i.webnnIsGraphInput,I=i.webnnIsGraphOutput;if(u!=="string"&&M&&I){let T=i.UTF8ToString(n);if(M(s,T)||I(s,T)){let z=ws(u);w=hn(z,d),m="ml-tensor";let C=i.webnnCreateTemporaryTensor,v=i.webnnUploadTensor;if(!C||!v)throw new Error('Tensor location "ml-tensor" is not supported without using WebNN.');let G=await C(s,z,d);v(G,new Uint8Array(E.buffer,E.byteOffset,E.byteLength)),_=G}else w=E.byteLength,_=i._malloc(w),r.push(_),i.HEAPU8.set(new Uint8Array(E.buffer,E.byteOffset,w),_)}else w=E.byteLength,_=i._malloc(w),r.push(_),i.HEAPU8.set(new Uint8Array(E.buffer,E.byteOffset,w),_)}}let x=i.stackSave(),k=i.stackAlloc(4*d.length);try{d.forEach((M,I)=>i.setValue(k+I*l,M,l===4?"i32":"i64"));let E=i._OrtCreateTensor(ws(u),_,w,k,d.length,e0(m));E===0&&Ie(`Can't create tensor for input/output. session=${s}, index=${o}.`),e.push(E)}finally{i.stackRestore(x)}},w0=async(t,e,r,s,n,o)=>{let a=Ue(),i=a.PTR_SIZE,l=Fr.get(t);if(!l)throw new Error(`cannot run inference. 
invalid session id: ${t}`);let u=l[0],d=l[1],f=l[2],m=l[3],_=l[4],w=l[5],x=e.length,k=s.length,E=0,M=[],I=[],T=[],z=[],C=[],v=a.stackSave(),G=a.stackAlloc(x*i),X=a.stackAlloc(x*i),V=a.stackAlloc(k*i),Q=a.stackAlloc(k*i);try{[E,M]=xE(o),Gr("wasm prepareInputOutputTensor");for(let P=0;P<x;P++)await Yy(r[P],I,z,t,d[e[P]],e[P],_);for(let P=0;P<k;P++)await Yy(n[P],T,z,t,f[s[P]],x+s[P],_);qr("wasm prepareInputOutputTensor");for(let P=0;P<x;P++)a.setValue(G+P*i,I[P],"*"),a.setValue(X+P*i,d[e[P]],"*");for(let P=0;P<k;P++)a.setValue(V+P*i,T[P],"*"),a.setValue(Q+P*i,f[s[P]],"*");if(m&&!w){let{handle:P,outputPreferredLocations:se,outputPreferredLocationsEncoded:ie}=m;if(d.length!==x)throw new Error(`input count from feeds (${x}) is expected to be always equal to model's input count (${d.length}).`);Gr("wasm bindInputsOutputs");for(let S=0;S<x;S++){let L=e[S];await a._OrtBindInput(P,d[L],I[S])!==0&&Ie(`Can't bind input[${S}] for session=${t}.`)}for(let S=0;S<k;S++){let L=s[S];n[S]?.[3]?(C.push(T[S]),a._OrtBindOutput(P,f[L],T[S],0)!==0&&Ie(`Can't bind pre-allocated output[${S}] for session=${t}.`)):a._OrtBindOutput(P,f[L],0,ie[L])!==0&&Ie(`Can't bind output[${S}] to ${se[S]} for session=${t}.`)}qr("wasm bindInputsOutputs"),Fr.set(t,[u,d,f,m,_,!0])}a.jsepOnRunStart?.(u),a.webnnOnRunStart?.(u);let K;m?K=await a._OrtRunWithBinding(u,m.handle,k,V,E):K=await a._OrtRun(u,X,G,x,Q,k,V,E),K!==0&&Ie("failed to call OrtRun().");let Y=[],B=[];Gr("wasm ProcessOutputTensor");for(let P=0;P<k;P++){let se=Number(a.getValue(V+P*i,"*"));if(se===T[P]||C.includes(T[P])){Y.push(n[P]),se!==T[P]&&a._OrtReleaseTensor(se)!==0&&Ie("Can't release tensor.");continue}let ie=a.stackSave(),S=a.stackAlloc(4*i),L=!1,R,te=0;try{a._OrtGetTensorData(se,S,S+i,S+2*i,S+3*i)!==0&&Ie(`Can't access output tensor data on index ${P}.`);let ue=i===4?"i32":"i64",Be=Number(a.getValue(S,ue));te=a.getValue(S+i,"*");let Pe=a.getValue(S+i*2,"*"),vt=Number(a.getValue(S+i*3,ue)),Qe=[];for(let 
Me=0;Me<vt;Me++)Qe.push(Number(a.getValue(Pe+Me*i,ue)));a._OrtFree(Pe)!==0&&Ie("Can't free memory for tensor dims.");let et=Qe.reduce((Me,xe)=>Me*xe,1);R=wu(Be);let st=m?.outputPreferredLocations[s[P]];if(R==="string"){if(st==="gpu-buffer"||st==="ml-tensor")throw new Error("String tensor is not supported on GPU.");let Me=[];for(let xe=0;xe<et;xe++){let qe=a.getValue(te+xe*i,"*"),kt=a.getValue(te+(xe+1)*i,"*"),ge=xe===et-1?void 0:kt-qe;Me.push(a.UTF8ToString(qe,ge))}Y.push([R,Qe,Me,"cpu"])}else if(st==="gpu-buffer"&&et>0){let Me=a.webgpuGetBuffer;if(!Me)throw new Error('preferredLocation "gpu-buffer" is not supported without using WebGPU.');let xe=Me(te),qe=hn(Be,et);if(qe===void 0||!p0(R))throw new Error(`Unsupported data type: ${R}`);L=!0;{a.webgpuRegisterBuffer(xe,t,te);let kt=a.webgpuCreateDownloader(xe,qe,t);Y.push([R,Qe,{gpuBuffer:xe,download:async()=>{let ge=await kt();return new(li(R))(ge)},dispose:()=>{a._OrtReleaseTensor(se)!==0&&Ie("Can't release tensor.")}},"gpu-buffer"])}}else if(st==="ml-tensor"&&et>0){let Me=a.webnnEnsureTensor,xe=a.webnnIsGraphInputOutputTypeSupported;if(!Me||!xe)throw new Error('preferredLocation "ml-tensor" is not supported without using WebNN.');if(hn(Be,et)===void 0||!d0(R))throw new Error(`Unsupported data type: ${R}`);if(!xe(t,R,!1))throw new Error(`preferredLocation "ml-tensor" for ${R} output is not supported by current WebNN Context.`);let qe=await Me(t,te,Be,Qe,!1);L=!0,Y.push([R,Qe,{mlTensor:qe,download:a.webnnCreateMLTensorDownloader(te,R),dispose:()=>{a.webnnReleaseTensorId(te),a._OrtReleaseTensor(se)}},"ml-tensor"])}else if(st==="ml-tensor-cpu-output"&&et>0){let Me=a.webnnCreateMLTensorDownloader(te,R)(),xe=Y.length;L=!0,B.push((async()=>{let qe=[xe,await Me];return a.webnnReleaseTensorId(te),a._OrtReleaseTensor(se),qe})()),Y.push([R,Qe,[],"cpu"])}else{let Me=li(R),xe=new Me(et);new 
/**
 * Collect the underlying buffers of serialised tensors so they can be handed
 * to `postMessage` as its transfer list.
 *
 * Each tensor is a tuple whose third element (`tensor[2]`) is the data. Array
 * data (string tensors) has no backing buffer and is skipped; anything else
 * that exposes a `buffer` property contributes that buffer.
 *
 * Buffers are de-duplicated: several tensors may be views over the same
 * ArrayBuffer, and a transfer list that names one buffer twice makes
 * `postMessage` throw a DataCloneError. First-seen order is preserved.
 *
 * @param t iterable of serialised tensor tuples.
 * @returns {ArrayBufferLike[]} unique buffers, in first-seen order.
 */
y0 = (t) => {
  const uniqueBuffers = new Set();
  for (const tensor of t) {
    const data = tensor[2];
    if (!Array.isArray(data) && "buffer" in data) {
      uniqueBuffers.add(data.buffer);
    }
  }
  return [...uniqueBuffers];
};
/**
 * Convert a tensor object into the positional tuple used by the WASM layer:
 * `[type, dims, payload, location]`.
 *
 * The payload depends on where the tensor lives: the raw `data` for "cpu",
 * `{ gpuBuffer }` for "gpu-buffer", `{ mlTensor }` for "ml-tensor".
 *
 * @param tensor object exposing `location`, `type`, `dims` and the field matching its location.
 * @param describe zero-argument callback producing a label for the error message;
 *   only invoked when the location is not recognised.
 * @returns {Array} the four-element tuple described above.
 * @throws {Error} for any other location.
 */
Jy = (tensor, describe) => {
  const where = tensor.location;
  if (where === "cpu") {
    return [tensor.type, tensor.dims, tensor.data, "cpu"];
  }
  if (where === "gpu-buffer") {
    return [tensor.type, tensor.dims, { gpuBuffer: tensor.gpuBuffer }, "gpu-buffer"];
  }
  if (where === "ml-tensor") {
    return [tensor.type, tensor.dims, { mlTensor: tensor.mlTensor }, "ml-tensor"];
  }
  throw new Error(`invalid data location: ${tensor.location} for ${describe()}`);
};
Jt(t[0],t[2],t[1]);case"gpu-buffer":{let e=t[0];if(!p0(e))throw new Error(`not supported data type: ${e} for deserializing GPU tensor`);let{gpuBuffer:r,download:s,dispose:n}=t[2];return Jt.fromGpuBuffer(r,{dataType:e,dims:t[1],download:s,dispose:n})}case"ml-tensor":{let e=t[0];if(!d0(e))throw new Error(`not supported data type: ${e} for deserializing MLTensor tensor`);let{mlTensor:r,download:s,dispose:n}=t[2];return Jt.fromMLTensor(r,{dataType:e,dims:t[1],download:s,dispose:n})}default:throw new Error(`invalid data location: ${t[3]}`)}},RE=class{async fetchModelAndCopyToWasmMemory(t){return CE(await f0(t))}async loadModel(t,e){ys();let r;typeof t=="string"?r=await this.fetchModelAndCopyToWasmMemory(t):r=t,[this.sessionId,this.inputNames,this.outputNames,this.inputMetadata,this.outputMetadata]=await PE(r,e),bs()}async dispose(){return zE(this.sessionId)}async run(t,e,r){ys();let s=[],n=[];Object.entries(t).forEach(f=>{let m=f[0],_=f[1],w=this.inputNames.indexOf(m);if(w===-1)throw new Error(`invalid input '${m}'`);s.push(_),n.push(w)});let o=[],a=[];Object.entries(e).forEach(f=>{let m=f[0],_=f[1],w=this.outputNames.indexOf(m);if(w===-1)throw new Error(`invalid output '${m}'`);o.push(_),a.push(w)});let i=s.map((f,m)=>Jy(f,()=>`input "${this.inputNames[n[m]]}"`)),l=o.map((f,m)=>f?Jy(f,()=>`output "${this.outputNames[a[m]]}"`):null),u=await LE(this.sessionId,n,i,a,l,r),d={};for(let f=0;f<u.length;f++)d[this.outputNames[a[f]]]=o[f]??Vk(u[f]);return bs(),d}startProfiling(){}endProfiling(){NE(this.sessionId)}}}),UE={};ci(UE,{OnnxruntimeWebAssemblyBackend:()=>s0,initializeFlags:()=>r0,wasmBackend:()=>BE});var r0,s0,BE,rP=ye(()=>{"use strict";vs(),$E(),tP(),r0=()=>{(typeof Ve.wasm.initTimeout!="number"||Ve.wasm.initTimeout<0)&&(Ve.wasm.initTimeout=0);let t=Ve.wasm.simd;if(typeof t!="boolean"&&t!==void 0&&t!=="fixed"&&t!=="relaxed"&&(console.warn(`Property "env.wasm.simd" is set to unknown value "${t}". 
/**
 * Load the WASM factory script at `t` through `DE` and expose it as a blob URL.
 *
 * A script served from a blob URL no longer has a meaningful `import.meta.url`,
 * so every occurrence in the source is replaced by a string literal holding
 * the directory part of `t` (everything before the last "/").
 *
 * @param {string} t URL of the factory script.
 * @returns {Promise<string|null>} a `blob:` URL for the patched script, or
 *   `null` when `DE` yields nothing usable or the body cannot be read.
 */
async function jE(t) {
  const response = await DE(t);
  if (!response || typeof response === "string") {
    return null;
  }

  try {
    const source = await response.text();
    const baseUrl = t.split("/").slice(0, -1).join("/");
    // JSON.stringify yields a valid JS string literal even for unusual
    // characters. The function replacer stops `$&`, `$1`, ... sequences in the
    // URL from being treated as replacement patterns.
    const quotedBase = JSON.stringify(baseUrl);
    const patched = source.replace(/import\.meta\.url/g, () => quotedBase);
    const blob = new Blob([patched], { type: "text/javascript" });
    return URL.createObjectURL(blob);
  } catch (error) {
    // Best effort: the caller falls back to its default loading path on null.
    console.warn("Failed to read WASM factory:", error);
    return null;
  }
}
/**
 * Translate a user-facing device name into a list of execution providers.
 *
 * - falsy `t`      -> the default provider list (`A0`)
 * - "auto"         -> every supported device (`jt`, returned as-is)
 * - "gpu"          -> the supported devices that are one of
 *                     webgpu / cuda / dml / webnn-gpu
 * - any other name -> a single-element list holding its mapped provider from
 *                     `aP`, or the name itself when the mapping is nullish
 *
 * @param {string|null} [t=null] requested device.
 * @returns {Array} execution providers for that device.
 * @throws {Error} when `t` is not listed in `jt`.
 */
function HE(t = null) {
  if (!t) {
    return A0;
  }
  if (t === "auto") {
    return jt;
  }
  if (t === "gpu") {
    const gpuDevices = ["webgpu", "cuda", "dml", "webnn-gpu"];
    return jt.filter((device) => gpuDevices.includes(device));
  }
  if (!jt.includes(t)) {
    throw new Error(`Unsupported device: "${t}". Should be one of: ${jt.join(", ")}.`);
  }
  return [aP[t] ?? t];
}
this._nearest_interpolate_4d||(this._nearest_interpolate_4d=Wr([8,10,18,0,58,129,1,10,41,10,1,120,10,0,10,0,10,1,115,18,1,121,34,6,82,101,115,105,122,101,42,18,10,4,109,111,100,101,34,7,110,101,97,114,101,115,116,160,1,3,18,1,114,90,31,10,1,120,18,26,10,24,8,1,18,20,10,3,18,1,98,10,3,18,1,99,10,3,18,1,104,10,3,18,1,119,90,15,10,1,115,18,10,10,8,8,7,18,4,10,2,8,4,98,31,10,1,121,18,26,10,24,8,1,18,20,10,3,18,1,98,10,3,18,1,99,10,3,18,1,104,10,3,18,1,119,66,2,16,21],this.session_options,"y")),this._nearest_interpolate_4d}static get bilinear_interpolate_4d(){return this._bilinear_interpolate_4d||(this._bilinear_interpolate_4d=Wr([8,9,18,0,58,128,1,10,40,10,1,120,10,0,10,0,10,1,115,18,1,121,34,6,82,101,115,105,122,101,42,17,10,4,109,111,100,101,34,6,108,105,110,101,97,114,160,1,3,18,1,114,90,31,10,1,120,18,26,10,24,8,1,18,20,10,3,18,1,98,10,3,18,1,99,10,3,18,1,104,10,3,18,1,119,90,15,10,1,115,18,10,10,8,8,7,18,4,10,2,8,4,98,31,10,1,121,18,26,10,24,8,1,18,20,10,3,18,1,98,10,3,18,1,99,10,3,18,1,104,10,3,18,1,119,66,2,16,20],this.session_options,"y")),this._bilinear_interpolate_4d}static get bicubic_interpolate_4d(){return this._bicubic_interpolate_4d||(this._bicubic_interpolate_4d=Wr([8,9,18,0,58,127,10,39,10,1,120,10,0,10,0,10,1,115,18,1,121,34,6,82,101,115,105,122,101,42,16,10,4,109,111,100,101,34,5,99,117,98,105,99,160,1,3,18,1,114,90,31,10,1,120,18,26,10,24,8,1,18,20,10,3,18,1,98,10,3,18,1,99,10,3,18,1,104,10,3,18,1,119,90,15,10,1,115,18,10,10,8,8,7,18,4,10,2,8,4,98,31,10,1,121,18,26,10,24,8,1,18,20,10,3,18,1,98,10,3,18,1,99,10,3,18,1,104,10,3,18,1,119,66,2,16,20],this.session_options,"y")),this._bicubic_interpolate_4d}static get matmul(){return this._matmul||(this._matmul=Wr([8,9,18,0,58,55,10,17,10,1,97,10,1,98,18,1,99,34,6,77,97,116,77,117,108,18,1,114,90,9,10,1,97,18,4,10,2,8,1,90,9,10,1,98,18,4,10,2,8,1,98,9,10,1,99,18,4,10,2,8,1,66,2,16,20],this.session_options,"c")),this._matmul}static get stft(){return 
this._stft||(this._stft=Wr([8,7,18,0,58,148,1,10,38,10,1,115,10,1,106,10,1,119,10,1,108,18,1,111,34,4,83,84,70,84,42,15,10,8,111,110,101,115,105,100,101,100,24,1,160,1,2,18,1,115,90,26,10,1,115,18,21,10,19,8,1,18,15,10,3,18,1,98,10,3,18,1,115,10,3,18,1,99,90,11,10,1,106,18,6,10,4,8,7,18,0,90,16,10,1,119,18,11,10,9,8,1,18,5,10,3,18,1,119,90,11,10,1,108,18,6,10,4,8,7,18,0,98,31,10,1,111,18,26,10,24,8,1,18,20,10,3,18,1,98,10,3,18,1,102,10,3,18,1,100,10,3,18,1,99,66,2,16,17],this.session_options,"o")),this._stft}static get rfft(){return this._rfft||(this._rfft=Wr([8,9,18,0,58,97,10,33,10,1,120,10,0,10,1,97,18,1,121,34,3,68,70,84,42,15,10,8,111,110,101,115,105,100,101,100,24,1,160,1,2,18,1,100,90,21,10,1,120,18,16,10,14,8,1,18,10,10,3,18,1,115,10,3,18,1,99,90,11,10,1,97,18,6,10,4,8,7,18,0,98,21,10,1,121,18,16,10,14,8,1,18,10,10,3,18,1,115,10,3,18,1,99,66,2,16,20],this.session_options,"y")),this._rfft}static get top_k(){return this._top_k||(this._top_k=Wr([8,10,18,0,58,73,10,18,10,1,120,10,1,107,18,1,118,18,1,105,34,4,84,111,112,75,18,1,116,90,9,10,1,120,18,4,10,2,8,1,90,15,10,1,107,18,10,10,8,8,7,18,4,10,2,8,1,98,9,10,1,118,18,4,10,2,8,1,98,9,10,1,105,18,4,10,2,8,7,66,2,16,21],this.session_options,["v","i"])),this._top_k}static get slice(){return this._slice||(this._slice=Wr([8,7,18,0,58,96,10,25,10,1,120,10,1,115,10,1,101,10,1,97,10,1,116,18,1,121,34,5,83,108,105,99,101,18,1,114,90,9,10,1,120,18,4,10,2,8,1,90,9,10,1,115,18,4,10,2,8,7,90,9,10,1,101,18,4,10,2,8,7,90,9,10,1,97,18,4,10,2,8,7,90,9,10,1,116,18,4,10,2,8,7,98,9,10,1,121,18,4,10,2,8,1,66,2,16,13],this.session_options,"y")),this._slice}};var KE=Object.freeze({auto:"auto",gpu:"gpu",cpu:"cpu",wasm:"wasm",webgpu:"webgpu",cuda:"cuda",dml:"dml",coreml:"coreml",webnn:"webnn","webnn-npu":"webnn-npu","webnn-gpu":"webnn-gpu","webnn-cpu":"webnn-cpu"});var YE=(function(){let t;return async function(){if(t===void 0)if(!be.IS_WEBGPU_AVAILABLE)t=!1;else try{t=(await 
navigator.gpu.requestAdapter()).features.has("shader-f16")}catch{t=!1}return t}})(),mt=Object.freeze({auto:"auto",fp32:"fp32",fp16:"fp16",q8:"q8",int8:"int8",uint8:"uint8",q4:"q4",bnb4:"bnb4",q4f16:"q4f16"}),T0=Object.freeze({[KE.wasm]:mt.q8}),S0=Object.freeze({[mt.fp32]:"",[mt.fp16]:"_fp16",[mt.int8]:"_int8",[mt.uint8]:"_uint8",[mt.q8]:"_quantized",[mt.q4]:"_q4",[mt.q4f16]:"_q4f16",[mt.bnb4]:"_bnb4"}),xn=Object.freeze({float32:Float32Array,float16:typeof Float16Array<"u"?Float16Array:Uint16Array,float64:Float64Array,string:Array,int8:Int8Array,uint8:Uint8Array,int16:Int16Array,uint16:Uint16Array,int32:Int32Array,uint32:Uint32Array,int64:BigInt64Array,uint64:BigUint64Array,bool:Uint8Array,uint4:Uint8Array,int4:Int8Array});var U=class t{get dims(){return this.ort_tensor.dims}set dims(e){this.ort_tensor.dims=e}get type(){return this.ort_tensor.type}get data(){return this.ort_tensor.data}get size(){return this.ort_tensor.size}get location(){return this.ort_tensor.location}ort_tensor;constructor(...e){return Mu(e[0])?this.ort_tensor=e[0]:this.ort_tensor=new M0.Tensor(e[0],e[1],e[2]),new Proxy(this,{get:(r,s)=>{if(typeof s=="string"){let n=Number(s);if(Number.isInteger(n))return r._getitem(n)}return r[s]},set:(r,s,n)=>r[s]=n})}dispose(){this.ort_tensor.dispose()}*[Symbol.iterator](){let[e,...r]=this.dims;if(r.length>0){let s=r.reduce((n,o)=>n*o);for(let n=0;n<e;++n)yield this._subarray(n,s,r)}else yield*this.data}_getitem(e){let[r,...s]=this.dims;if(e=cr(e,r),s.length>0){let n=s.reduce((o,a)=>o*a);return this._subarray(e,n,s)}else return new t(this.type,[this.data[e]],s)}indexOf(e){let r=this.data;for(let s=0;s<r.length;++s)if(r[s]==e)return s;return-1}_subarray(e,r,s){let n=e*r,o=(e+1)*r,a="subarray"in this.data?this.data.subarray(n,o):this.data.slice(n,o);return new t(this.type,a,s)}item(){let e=this.data;if(e.length!==1)throw new Error(`a Tensor with ${e.length} elements cannot be converted to Scalar`);return e[0]}tolist(){return 
uP(this.data,this.dims)}sigmoid(){return this.clone().sigmoid_()}sigmoid_(){let e=this.data;for(let r=0;r<e.length;++r)e[r]=1/(1+Math.exp(-e[r]));return this}map(e){return this.clone().map_(e)}map_(e){let r=this.data;for(let s=0;s<r.length;++s)r[s]=e(r[s],s,r);return this}mul(e){return this.clone().mul_(e)}mul_(e){let r=this.data;for(let s=0;s<r.length;++s)r[s]*=e;return this}div(e){return this.clone().div_(e)}div_(e){let r=this.data;for(let s=0;s<r.length;++s)r[s]/=e;return this}add(e){return this.clone().add_(e)}add_(e){let r=this.data;for(let s=0;s<r.length;++s)r[s]+=e;return this}sub(e){return this.clone().sub_(e)}sub_(e){let r=this.data;for(let s=0;s<r.length;++s)r[s]-=e;return this}clone(){return new t(this.type,this.data.slice(),this.dims.slice())}slice(...e){let r=[],s=[];for(let d=0;d<this.dims.length;++d){let f=e[d];if(f==null)s.push([0,this.dims[d]]),r.push(this.dims[d]);else if(typeof f=="number")f=cr(f,this.dims[d],d),s.push([f,f+1]);else if(Array.isArray(f)&&f.length===2){let[m,_]=f;if(m=m===null?0:cr(m,this.dims[d],d,!1),_=_===null?this.dims[d]:cr(_,this.dims[d],d,!1),m>_)throw new Error(`Invalid slice: ${f}`);let w=[Math.max(m,0),Math.min(_,this.dims[d])];s.push(w),r.push(w[1]-w[0])}else throw new Error(`Invalid slice: ${f}`)}let n=s.map(([d,f])=>f-d),o=n.reduce((d,f)=>d*f),a=this.data,i=new a.constructor(o),l=this.stride(),u=!0;for(let d=1;d<n.length;++d)if(s[d][0]!==0||s[d][1]!==this.dims[d]){u=!1;break}if(u){let d=s[0][0]*l[0],f=s[0][1]*l[0];if(ArrayBuffer.isView(a))i.set(a.subarray(d,f));else if(Array.isArray(a)){let m=a.slice(d,f);for(let _=0;_<m.length;++_)i[_]=m[_]}else throw new Error("Unsupported data type for slicing")}else for(let d=0;d<o;++d){let f=0;for(let m=n.length-1,_=d;m>=0;--m){let w=n[m];f+=(_%w+s[m][0])*l[m],_=Math.floor(_/w)}i[d]=a[f]}return new t(this.type,i,r)}permute(...e){return ZE(this,e)}transpose(...e){return this.permute(...e)}sum(e=null,r=!1){return this.norm(1,e,r)}norm(e="fro",r=null,s=!1){if(e==="fro")e=2;else 
if(typeof e=="string")throw Error(`Unsupported norm: ${e}`);let n=this.data,o=(u,d)=>u+d**e;if(r===null){let u=n.reduce(o,0)**(1/e);return new t(this.type,[u],[])}let[a,i,l]=pi(o,this,r,s);if(e!==1)for(let u=0;u<i.length;++u)i[u]=i[u]**(1/e);return new t(a,i,l)}normalize_(e=2,r=1){r=cr(r,this.dims.length);let s=this.norm(e,r,!0),n=this.data,o=s.data;for(let a=0;a<n.length;++a){let i=0;for(let l=this.dims.length-1,u=a,d=1;l>=0;--l){let f=this.dims[l];if(l!==r){let m=u%f;i+=m*d,d*=this.dims[l]}u=Math.floor(u/f)}n[a]/=o[i]}return this}normalize(e=2,r=1){return this.clone().normalize_(e,r)}stride(){return O0(this.dims)}squeeze(e=null){return new t(this.type,this.data,QE(this.dims,e))}squeeze_(e=null){return this.dims=QE(this.dims,e),this}unsqueeze(e){return new t(this.type,this.data,JE(this.dims,e))}unsqueeze_(e){return this.dims=JE(this.dims,e),this}flatten_(e=0,r=-1){r=(r+this.dims.length)%this.dims.length;let s=this.dims.slice(0,e),n=this.dims.slice(e,r+1),o=this.dims.slice(r+1);return this.dims=[...s,n.reduce((a,i)=>a*i,1),...o],this}flatten(e=0,r=-1){return this.clone().flatten_(e,r)}view(...e){let r=-1;for(let n=0;n<e.length;++n)if(e[n]===-1){if(r!==-1)throw new Error("Only one dimension can be inferred");r=n}let s=this.data;if(r!==-1){let n=e.reduce((o,a,i)=>i!==r?o*a:o,1);e[r]=s.length/n}return new t(this.type,s,e)}neg_(){let e=this.data;for(let r=0;r<e.length;++r)e[r]=-e[r];return this}neg(){return this.clone().neg_()}gt(e){let r=new Uint8Array(this.data.length),s=this.data;for(let n=0;n<s.length;++n)r[n]=s[n]>e?1:0;return new t("bool",r,this.dims)}lt(e){let r=new Uint8Array(this.data.length),s=this.data;for(let n=0;n<s.length;++n)r[n]=s[n]<e?1:0;return new t("bool",r,this.dims)}clamp_(e,r){let s=this.data;for(let n=0;n<s.length;++n)s[n]=Math.min(Math.max(s[n],e),r);return this}clamp(e,r){return this.clone().clamp_(e,r)}round_(){let e=this.data;for(let r=0;r<e.length;++r)e[r]=Math.round(e[r]);return this}round(){return 
/**
 * Reshape a flat array (plain or typed) into nested plain arrays following `e`.
 *
 * Works from the innermost dimension outwards: at each step the current
 * sequence is chunked into groups of `e[axis]` items.
 *
 * An empty shape (`[]`, a 0-d tensor) is valid for a single-element input and
 * yields that element itself. The element product is seeded with 1, because
 * reducing an empty shape without a seed throws a TypeError.
 *
 * @param {ArrayLike<any>} t flat data; must provide `length` and `reduce`.
 * @param {number[]} e target shape.
 * @returns {any} nested arrays of depth `e.length`, or the single element when `e` is empty.
 * @throws {Error} when `t.length` differs from the product of `e`.
 */
function uP(t, e) {
  const totalElements = t.length;
  const expectedElements = e.reduce((product, size) => product * size, 1);
  if (totalElements !== expectedElements) {
    throw Error(`cannot reshape array of size ${totalElements} into shape (${e})`);
  }

  let nested = t;
  for (let axis = e.length - 1; axis >= 0; axis--) {
    nested = nested.reduce(
      (groups, item) => {
        const current = groups[groups.length - 1];
        if (current.length < e[axis]) {
          current.push(item);
        } else {
          groups.push([item]);
        }
        return groups;
      },
      [[]],
    );
  }
  // The outermost pass always leaves exactly one wrapping group.
  return nested[0];
}
/**
 * Normalize each row of a 2D tensor using that row's mean and standard deviation.
 *
 * Each output element is `(x - mean_row) / (std_row + eps)`, where the
 * statistics come from `Ou(t, 1, 0, true)` (std and mean along dim 1 with
 * correction 0, keeping the reduced dimension).
 *
 * @param {{dims: number[], data: any, type: string}} t Input tensor; must be 2D.
 * @param {number[]} e `normalized_shape`; must be exactly `[t.dims[1]]`.
 * @param {{eps?: number}} [options] `eps` is added to the standard deviation
 *   before dividing (default 1e-5).
 * @returns A new tensor with the same type and dims as `t`.
 * @throws {Error} If `t` is not 2D or `e` is not `[t.dims[1]]`.
 */
function dP(t, e, { eps: r = 1e-5 } = {}) {
  if (t.dims.length !== 2) {
    throw new Error("`layer_norm` currently only supports 2D input.");
  }
  const [rowCount, featureCount] = t.dims;

  // Either a wrong rank OR a wrong size makes the shape invalid. The previous
  // `&&` only rejected inputs that were wrong in both respects.
  if (e.length !== 1 || e[0] !== featureCount) {
    throw new Error("`normalized_shape` must be a 1D array with shape `[input.dims[1]]`.");
  }

  const [stdTensor, meanTensor] = Ou(t, 1, 0, true);
  const stdData = stdTensor.data;
  const meanData = meanTensor.data;
  const input = t.data;
  const output = new input.constructor(input.length);

  for (let row = 0; row < rowCount; ++row) {
    const rowStart = row * featureCount;
    for (let col = 0; col < featureCount; ++col) {
      const index = rowStart + col;
      output[index] = (input[index] - meanData[row]) / (stdData[row] + r);
    }
  }
  return new U(t.type, output, t.dims);
}
/**
 * Compute row-major strides for a list of dimensions.
 *
 * The last dimension gets stride 1; every earlier dimension's stride is the
 * product of all dimension sizes to its right.
 *
 * @param {number[]} t Dimension sizes.
 * @returns {number[]} Strides, same length as `t`.
 */
function O0(t) {
  const strides = new Array(t.length);
  let running = 1;
  let axis = t.length;
  while (axis-- > 0) {
    strides[axis] = running;
    running *= t[axis];
  }
  return strides;
}
/**
 * Look up a token string in a config object, trying several keys in order.
 *
 * For each key that is an own property of `t` with a truthy value:
 *  - a string (or any non-object) value is returned as-is;
 *  - an object with `__type === "AddedToken"` yields its `content`;
 *  - any other object is rejected.
 *
 * @param {object} t Config object to read from.
 * @param {...string} e Candidate keys, highest priority first.
 * @returns {*} The first token found, or `null` when none of the keys holds one.
 * @throws {Error} If a key holds an object that is not an `AddedToken`.
 */
function Es(t, ...e) {
  for (const key of e) {
    if (!Object.hasOwn(t, key)) continue;

    const value = t[key];
    if (!value) continue;

    if (typeof value !== "object") return value;
    if (value.__type === "AddedToken") return value.content;

    // Serialize the offending value: interpolating the object directly would
    // always print "[object Object]" and hide what was wrong.
    throw Error(`Unknown token: ${JSON.stringify(value)}`);
  }
  return null;
}
o!="string"||typeof a!="string")throw new Error('Chat template must be a list of objects with "name" and "template" properties');n[o]=a}this.chat_template=n}this._compiled_template_cache=new Map;let s=gP(this._tokenizer);this.all_special_ids=s.map(n=>n.id),this.all_special_tokens=s.map(n=>n.content)}static async from_pretrained(e,{progress_callback:r=null,config:s=null,cache_dir:n=null,local_files_only:o=!1,revision:a="main"}={}){let i=await N0(e,{progress_callback:r,config:s,cache_dir:n,local_files_only:o,revision:a});return new this(...i)}get_vocab(){return this._tokenizer.get_vocab()}get model_max_length(){return this._tokenizerConfig.model_max_length??1/0}get add_eos_token(){return this._tokenizerConfig.add_eos_token}get add_bos_token(){return this._tokenizerConfig.add_bos_token}convert_tokens_to_ids(e){return typeof e=="string"?this._tokenizer.token_to_id(e):e.map(r=>this._tokenizer.token_to_id(r))}_call(e,{text_pair:r=null,add_special_tokens:s=!0,padding:n=!1,truncation:o=null,max_length:a=null,return_tensor:i=!0,return_token_type_ids:l=null}={}){let u=Array.isArray(e),d;if(u){if(e.length===0)throw Error("text array must be non-empty");if(r!==null){if(Array.isArray(r)){if(e.length!==r.length)throw Error("text and text_pair must have the same length")}else throw Error("text_pair must also be an array");d=e.map((m,_)=>this._encode_plus(m,{text_pair:r[_],add_special_tokens:s,return_token_type_ids:l}))}else d=e.map(m=>this._encode_plus(m,{add_special_tokens:s,return_token_type_ids:l}))}else{if(e==null)throw Error("text may not be null or undefined");if(Array.isArray(r))throw Error("When specifying `text_pair`, since `text` is a string, `text_pair` must also be a string (i.e., not an array).");d=[this._encode_plus(e,{text_pair:r,add_special_tokens:s,return_token_type_ids:l})]}if(a===null?a=this.model_max_length:o===null&&(n===!0?(console.warn("`max_length` is ignored when `padding: true` and there is no truncation strategy. 
To pad to max length, use `padding: 'max_length'`."),a=this.model_max_length):n===!1&&(console.warn("Truncation was not explicitly activated but `max_length` is provided a specific value, please use `truncation: true` to explicitly truncate examples to max length."),o=!0)),n===!0&&(a=Math.min(Te(d.map(m=>m.input_ids.length))[0],a??1/0)),a=Math.min(a,this.model_max_length??1/0),n||o)for(let m=0;m<d.length;++m)d[m].input_ids.length!==a&&(d[m].input_ids.length>a?o&&_P(d[m],a):n&&hP(d[m],a,_=>_==="input_ids"?this.pad_token_id:0,this.padding_side));let f={};if(i){if(!(n&&o)&&d.some(_=>{for(let w of Object.keys(_))if(_[w].length!==d[0][w]?.length)return!0;return!1}))throw Error("Unable to create tensor, you should probably activate truncation and/or padding with 'padding=true' and 'truncation=true' to have batched tensors with the same length.");let m=[d.length,d[0].input_ids.length];for(let _ of Object.keys(d[0]))f[_]=new U("int64",BigInt64Array.from(d.flatMap(w=>w[_]).map(BigInt)),m)}else{for(let m of Object.keys(d[0]))f[m]=d.map(_=>_[m]);if(!u)for(let m of Object.keys(f))f[m]=f[m][0]}return f}_encode_text(e){return e===null?null:this._tokenizer.encode(e).tokens}_encode_plus(e,{text_pair:r=null,add_special_tokens:s=!0,return_token_type_ids:n=null}={}){let{ids:o,attention_mask:a,token_type_ids:i}=this._tokenizer.encode(e,{text_pair:r,add_special_tokens:s,return_token_type_ids:n??this.return_token_type_ids});return{input_ids:o,attention_mask:a,...i?{token_type_ids:i}:{}}}tokenize(e,{pair:r=null,add_special_tokens:s=!1}={}){return this._tokenizer.tokenize(e,{text_pair:r,add_special_tokens:s})}encode(e,{text_pair:r=null,add_special_tokens:s=!0,return_token_type_ids:n=null}={}){return this._tokenizer.encode(e,{text_pair:r,add_special_tokens:s,return_token_type_ids:n}).ids}batch_decode(e,r={}){return e instanceof U&&(e=e.tolist()),e.map(s=>this.decode(s,r))}decode(e,r={}){if(e instanceof U&&(e=$0(e)),!Array.isArray(e)||e.length===0||!rk(e[0]))throw Error("token_ids must be a 
/**
 * Prepare tokenizer inputs for a translation request.
 *
 * Validates that the tokenizer exposes `language_codes`, `languageRegex` and
 * `lang_to_token`, checks the requested languages, then:
 *  - when `src_lang` is given, rewrites the first `SpecialToken` entry of the
 *    post-processor's `single` template whose id matches `languageRegex`;
 *  - stores the target-language token id on `s.forced_bos_token_id`;
 *  - returns `t._call(e, r)`.
 *
 * Both the tokenizer's post-processor config and `s` are mutated in place.
 *
 * @param {object} t Tokenizer instance.
 * @param {string|string[]} e Text forwarded to `t._call`.
 * @param {object} r Tokenizer options forwarded to `t._call`.
 * @param {{src_lang?: string, tgt_lang: string}} s Generation options.
 * @returns {*} Whatever `t._call(e, r)` returns.
 * @throws {Error} On a missing tokenizer attribute or an unknown language code.
 */
function bn(t, e, r, s) {
  const hasLanguageCodes = "language_codes" in t && Array.isArray(t.language_codes);
  if (!hasLanguageCodes) {
    throw new Error("Tokenizer must have `language_codes` attribute set and it should be an array of language ids.");
  }
  const hasLanguageRegex = "languageRegex" in t && t.languageRegex instanceof RegExp;
  if (!hasLanguageRegex) {
    throw new Error("Tokenizer must have `languageRegex` attribute set and it should be a regular expression.");
  }
  const hasLangToToken = "lang_to_token" in t && typeof t.lang_to_token == "function";
  if (!hasLangToToken) {
    throw new Error("Tokenizer must have `lang_to_token` attribute set and it should be a function.");
  }

  const sourceLang = s.src_lang;
  const targetLang = s.tgt_lang;

  if (!t.language_codes.includes(targetLang)) {
    throw new Error(`Target language code "${targetLang}" is not valid. Must be one of: {${t.language_codes.join(", ")}}`);
  }

  if (sourceLang !== undefined) {
    if (!t.language_codes.includes(sourceLang)) {
      throw new Error(`Source language code "${sourceLang}" is not valid. Must be one of: {${t.language_codes.join(", ")}}`);
    }
    // Only the first language token in the template is replaced.
    for (const piece of t._tokenizer.post_processor.config.single) {
      const isLanguageToken = "SpecialToken" in piece && t.languageRegex.test(piece.SpecialToken.id);
      if (!isLanguageToken) continue;
      piece.SpecialToken.id = t.lang_to_token(sourceLang);
      break;
    }
  }

  s.forced_bos_token_id = t._tokenizer.token_to_id(t.lang_to_token(targetLang));
  return t._call(e, r);
}
U0={};cs(U0,{AlbertTokenizer:()=>Pu,AutoTokenizer:()=>J,BartTokenizer:()=>zu,BertTokenizer:()=>Lu,BlenderbotSmallTokenizer:()=>Nu,BlenderbotTokenizer:()=>$u,BloomTokenizer:()=>Ru,CLIPTokenizer:()=>Bu,CamembertTokenizer:()=>Uu,CodeGenTokenizer:()=>Fu,CodeLlamaTokenizer:()=>Du,CohereTokenizer:()=>ju,ConvBertTokenizer:()=>Gu,DebertaTokenizer:()=>Wu,DebertaV2Tokenizer:()=>qu,DistilBertTokenizer:()=>Vu,ElectraTokenizer:()=>Hu,EsmTokenizer:()=>Xu,FalconTokenizer:()=>Ku,GPT2Tokenizer:()=>Ju,GPTNeoXTokenizer:()=>Qu,GemmaTokenizer:()=>Yu,HerbertTokenizer:()=>Zu,LlamaTokenizer:()=>ep,M2M100Tokenizer:()=>tp,MBart50Tokenizer:()=>sp,MBartTokenizer:()=>vn,MPNetTokenizer:()=>ap,MarianTokenizer:()=>rp,MgpstrTokenizer:()=>np,MobileBertTokenizer:()=>op,NllbTokenizer:()=>ip,NougatTokenizer:()=>lp,PreTrainedTokenizer:()=>j,Qwen2Tokenizer:()=>cp,RoFormerTokenizer:()=>pp,RobertaTokenizer:()=>up,SiglipTokenizer:()=>dp,SpeechT5Tokenizer:()=>fp,SqueezeBertTokenizer:()=>mp,T5Tokenizer:()=>hp,TokenizersBackend:()=>j,VitsTokenizer:()=>_p,Wav2Vec2CTCTokenizer:()=>gp,WhisperTokenizer:()=>wp,XLMRobertaTokenizer:()=>xp,XLMTokenizer:()=>yp});var Pu=class extends j{return_token_type_ids=!0};var zu=class extends j{};var Lu=class extends j{return_token_type_ids=!0};var Nu=class extends j{};var $u=class extends j{};var Ru=class extends j{};var Uu=class extends j{};var Bu=class extends j{};var Du=class extends j{};var Fu=class extends j{};var ju=class extends j{};var Gu=class extends j{return_token_type_ids=!0};var qu=class extends j{return_token_type_ids=!0};var Wu=class extends j{return_token_type_ids=!0};var Vu=class extends j{};var Hu=class extends j{return_token_type_ids=!0};var Xu=class extends j{};var Ku=class extends j{};var Yu=class extends j{};var Qu=class extends j{};var Ju=class extends j{};var Zu=class extends j{return_token_type_ids=!0};var ep=class extends j{padding_side="left"};var tp=class extends 
/**
 * Tokenizer subclass that understands a leading `>>lang<<` language prefix.
 *
 * On construction it collects every vocabulary key matching the prefix pattern
 * into `supported_language_codes` and emits a console warning about accuracy.
 */
var rp = class extends j {
  /**
   * @param {object} e Tokenizer JSON, forwarded to the base class.
   * @param {object} r Tokenizer config, forwarded to the base class.
   */
  constructor(e, r) {
    super(e, r);

    // Deliberately NOT global: a `/g` regex keeps `lastIndex` between `.test()`
    // calls, which made the filter below reject every other consecutive match.
    // `String.prototype.split` does not depend on the flag.
    this.languageRegex = /^(>>\w+<<)\s*/;

    this.supported_language_codes = Array.from(this.get_vocab().keys()).filter((token) =>
      this.languageRegex.test(token),
    );

    console.warn('WARNING: `MarianTokenizer` is not yet supported by Hugging Face\'s "fast" tokenizers library. Therefore, you may experience slightly inaccurate results.');
  }

  /**
   * Encode text, keeping a leading `>>lang<<` prefix as a single token.
   *
   * @param {string|null} e Text to encode.
   * @returns {string[]|null} Tokens, or `null` when `e` is `null`.
   */
  _encode_text(e) {
    if (e === null) return null;

    // The capture group makes `split` return [before, prefix, after] when the
    // prefix is present, and [text] otherwise.
    const [head, ...rest] = e.trim().split(this.languageRegex);

    if (rest.length === 0) {
      return super._encode_text(head);
    }

    if (rest.length === 2) {
      const [languageToken, text] = rest;
      if (!this.supported_language_codes.includes(languageToken)) {
        console.warn(`Unsupported language code "${languageToken}" detected, which may lead to unexpected behavior. Should be one of: ${JSON.stringify(this.supported_language_codes)}`);
      }
      return dt([languageToken], super._encode_text(text));
    }
  }
};
s=1;s<e.length;s+=2)r+=e[s];return[r]}},_p=class extends j{constructor(e,r){super(e,r),this._tokenizer.decoder=new R0({type:"VitsDecoder"})}};var gp=class extends j{};var eA=[["en","english"],["zh","chinese"],["de","german"],["es","spanish"],["ru","russian"],["ko","korean"],["fr","french"],["ja","japanese"],["pt","portuguese"],["tr","turkish"],["pl","polish"],["ca","catalan"],["nl","dutch"],["ar","arabic"],["sv","swedish"],["it","italian"],["id","indonesian"],["hi","hindi"],["fi","finnish"],["vi","vietnamese"],["he","hebrew"],["uk","ukrainian"],["el","greek"],["ms","malay"],["cs","czech"],["ro","romanian"],["da","danish"],["hu","hungarian"],["ta","tamil"],["no","norwegian"],["th","thai"],["ur","urdu"],["hr","croatian"],["bg","bulgarian"],["lt","lithuanian"],["la","latin"],["mi","maori"],["ml","malayalam"],["cy","welsh"],["sk","slovak"],["te","telugu"],["fa","persian"],["lv","latvian"],["bn","bengali"],["sr","serbian"],["az","azerbaijani"],["sl","slovenian"],["kn","kannada"],["et","estonian"],["mk","macedonian"],["br","breton"],["eu","basque"],["is","icelandic"],["hy","armenian"],["ne","nepali"],["mn","mongolian"],["bs","bosnian"],["kk","kazakh"],["sq","albanian"],["sw","swahili"],["gl","galician"],["mr","marathi"],["pa","punjabi"],["si","sinhala"],["km","khmer"],["sn","shona"],["yo","yoruba"],["so","somali"],["af","afrikaans"],["oc","occitan"],["ka","georgian"],["be","belarusian"],["tg","tajik"],["sd","sindhi"],["gu","gujarati"],["am","amharic"],["yi","yiddish"],["lo","lao"],["uz","uzbek"],["fo","faroese"],["ht","haitian creole"],["ps","pashto"],["tk","turkmen"],["nn","nynorsk"],["mt","maltese"],["sa","sanskrit"],["lb","luxembourgish"],["my","myanmar"],["bo","tibetan"],["tl","tagalog"],["mg","malagasy"],["as","assamese"],["tt","tatar"],["haw","hawaiian"],["ln","lingala"],["ha","hausa"],["ba","bashkir"],["jw","javanese"],["su","sundanese"]],hi=new Map(eA),wP=new 
Map([...eA.map(([t,e])=>[e,t]),["burmese","my"],["valencian","ca"],["flemish","nl"],["haitian","ht"],["letzeburgesch","lb"],["pushto","ps"],["panjabi","pa"],["moldavian","ro"],["moldovan","ro"],["sinhalese","si"],["castilian","es"]]);function tA(t){t=t.toLowerCase();let e=wP.get(t);if(e===void 0){let r=t.match(/^<\|([a-z]{2})\|>$/);if(r&&(t=r[1]),hi.has(t))e=t;else{let n=t.length===2?hi.keys():hi.values();throw new Error(`Language "${t}" is not supported. Must be one of: ${JSON.stringify(Array.from(n))}`)}}return e}var xP="\\p{P}\\u0021-\\u002F\\u003A-\\u0040\\u005B-\\u0060\\u007B-\\u007E",rA=new RegExp(`^[${xP}]+$`,"gu"),wp=class extends j{get timestamp_begin(){return this._tokenizer.token_to_id("<|notimestamps|>")+1}_decode_asr(e,{return_timestamps:r=!1,return_language:s=!1,time_precision:n=null,force_full_sequences:o=!0}={}){if(n===null)throw Error("Must specify time_precision");let a=null,i=r==="word";function l(){return{language:a,timestamp:[null,null],text:""}}let u=[],d=l(),f=0,m=this.timestamp_begin,w=m+1500,x=[],k=[],E=!1,M=null,I=new Set(this.all_special_ids);for(let C of e){let v=C.tokens,G=i?C.token_timestamps:null,X=null,V=m;if("stride"in C){let[Y,B,P]=C.stride;if(f-=B,M=Y-P,B&&(V=B/n+m),P)for(let se=v.length-1;se>=0;--se){let ie=Number(v[se]);if(ie>=m){if(X!==null&&(ie-m)*n<M)break;X=ie}}}let Q=[],K=[];for(let Y=0;Y<v.length;++Y){let B=Number(v[Y]);if(I.has(B)){let P=this.decode([B]),se=hi.get(P.slice(2,-2));if(se!==void 0){if(a!==null&&se!==a&&!r){x.push(Q);let ie=this.findLongestCommonSequence(x)[0],S=this.decode(ie);d.text=S,u.push(d),x=[],Q=[],d=l()}a=d.language=se}}else if(B>=m&&B<=w){let P=(B-m)*n+f,se=ms(P,2);if(X!==null&&B>=X)E=!0;else if(E||x.length>0&&B<V)E=!1;else if(d.timestamp[0]===null)d.timestamp[0]=se;else if(se!==d.timestamp[0]){d.timestamp[1]=se,x.push(Q),i&&k.push(K);let[ie,S]=this.findLongestCommonSequence(x,k),L=this.decode(ie);d.text=L,i&&(d.words=this.collateWordTimestamps(ie,S,a)),u.push(d),x=[],Q=[],k=[],K=[],d=l()}}else 
if(Q.push(B),i){let P=ms(G[Y]+f,2),se;if(Y+1<G.length){se=ms(G[Y+1]+f,2);let ie=this.decode([B]);rA.test(ie)&&(se=ms(Math.min(P+n,se),2))}else se=null;K.push([P,se])}}if("stride"in C){let[Y,B,P]=C.stride;f+=Y-P}Q.length>0?(x.push(Q),i&&k.push(K)):x.every(Y=>Y.length===0)&&(d=l(),x=[],Q=[],k=[],K=[])}if(x.length>0){if(o&&r)throw new Error("Whisper did not predict an ending timestamp, which can happen if audio is cut off in the middle of a word. Also make sure WhisperTimeStampLogitsProcessor was used during generation.");let[C,v]=this.findLongestCommonSequence(x,k),G=this.decode(C);d.text=G,i&&(d.words=this.collateWordTimestamps(C,v,a)),u.push(d)}let T=Object.create(null),z=u.map(C=>C.text).join("");if(r||s){for(let C=0;C<u.length;++C){let v=u[C];r||delete v.timestamp,s||delete v.language}if(i){let C=[];for(let v of u)for(let G of v.words)C.push(G);T={chunks:C}}else T={chunks:u}}return[z,T]}findLongestCommonSequence(e,r=null){let s=e[0],n=s.length,o=[],a=Array.isArray(r)&&r.length>0,i=a?[]:null,l=a?r[0]:null;for(let u=1;u<e.length;++u){let d=e[u],f=0,m=[n,n,0,0],_=d.length;for(let T=1;T<n+_;++T){let z=Math.max(0,n-T),C=Math.min(n,n+_-T),v=s.slice(z,C),G=Math.max(0,T-n),X=Math.min(_,T),V=d.slice(G,X);if(v.length!==V.length)throw new Error("There is a bug within whisper `decode_asr` function, please report it. 
Dropping to prevent bad inference.");let Q;a?Q=v.filter((B,P)=>B===V[P]&&l[z+P]<=r[u][G+P]).length:Q=v.filter((B,P)=>B===V[P]).length;let K=T/1e4,Y=Q/T+K;Q>1&&Y>f&&(f=Y,m=[z,C,G,X])}let[w,x,k,E]=m,M=Math.floor((x+w)/2),I=Math.floor((E+k)/2);o.push(...s.slice(0,M)),s=d.slice(I),n=s.length,a&&(i.push(...l.slice(0,M)),l=r[u].slice(I))}return o.push(...s),a?(i.push(...l),[o,i]):[o,[]]}collateWordTimestamps(e,r,s){let[n,o,a]=this.combineTokensIntoWords(e,s),i=[];for(let l=0;l<n.length;++l){let u=a[l];i.push({text:n[l],timestamp:[r[u.at(0)][0],r[u.at(-1)][1]]})}return i}combineTokensIntoWords(e,r,s=`"'\u201C\xA1\xBF([{-`,n=`"'.\u3002,\uFF0C!\uFF01?\uFF1F:\uFF1A\u201D)]}\u3001`){r=r??"english";let o,a,i;return["chinese","japanese","thai","lao","myanmar"].includes(r)?[o,a,i]=this.splitTokensOnUnicode(e):[o,a,i]=this.splitTokensOnSpaces(e),this.mergePunctuations(o,a,i,s,n)}decode(e,r){let s;return r?.decode_with_timestamps?(e instanceof U&&(e=$0(e)),s=this.decodeWithTimestamps(e,r)):s=super.decode(e,r),s}decodeWithTimestamps(e,r){let s=r?.time_precision??.02,n=this.all_special_ids.at(-1)+1,o=[[]];for(let a of e)if(a=Number(a),a>=n){let i=((a-n)*s).toFixed(2);o.push(`<|${i}|>`),o.push([])}else o[o.length-1].push(a);return o=o.map(a=>typeof a=="string"?a:super.decode(a,r)),o.join("")}splitTokensOnUnicode(e){let r=this.decode(e,{decode_with_timestamps:!0}),s="\uFFFD",n=[],o=[],a=[],i=[],l=[],u=0;for(let d=0;d<e.length;++d){let f=e[d];i.push(f),l.push(d);let m=this.decode(i,{decode_with_timestamps:!0});(!m.includes(s)||r[u+m.indexOf(s)]===s)&&(n.push(m),o.push(i),a.push(l),i=[],l=[],u+=m.length)}return[n,o,a]}splitTokensOnSpaces(e){let[r,s,n]=this.splitTokensOnUnicode(e),o=[],a=[],i=[];for(let l=0;l<r.length;++l){let u=r[l],d=s[l],f=n[l],m=d[0]>=this._tokenizer.token_to_id("<|endoftext|>"),_=u.startsWith(" "),w=u.trim(),x=rA.test(w);if(m||_||x||o.length===0)o.push(u),a.push(d),i.push(f);else{let 
k=o.length-1;o[k]+=u,a[k].push(...d),i[k].push(...f)}}return[o,a,i]}mergePunctuations(e,r,s,n,o){let a=structuredClone(e),i=structuredClone(r),l=structuredClone(s),u=a.length-2,d=a.length-1;for(;u>=0;)a[u].startsWith(" ")&&n.includes(a[u].trim())?(a[d]=a[u]+a[d],i[d]=dt(i[u],i[d]),l[d]=dt(l[u],l[d]),a[u]="",i[u]=[],l[u]=[]):d=u,--u;for(u=0,d=1;d<a.length;)!a[u].endsWith(" ")&&o.includes(a[d])?(a[u]+=a[d],i[u]=dt(i[u],i[d]),l[u]=dt(l[u],l[d]),a[d]="",i[d]=[],l[d]=[]):u=d,++d;return[a.filter(f=>f),i.filter(f=>f.length>0),l.filter(f=>f.length>0)]}};var xp=class extends j{};var yp=class extends j{return_token_type_ids=!0;constructor(e,r){super(e,r),console.warn('WARNING: `XLMTokenizer` is not yet supported by Hugging Face\'s "fast" tokenizers library. Therefore, you may experience slightly inaccurate results.')}};var J=class{static async from_pretrained(e,{progress_callback:r=null,config:s=null,cache_dir:n=null,local_files_only:o=!1,revision:a="main"}={}){let[i,l]=await N0(e,{progress_callback:r,config:s,cache_dir:n,local_files_only:o,revision:a}),u=l.tokenizer_class?.replace(/Fast$/,"")??"PreTrainedTokenizer",d=U0[u];return d||(console.warn(`Unknown tokenizer class "${u}", attempting to construct from base class.`),d=j),new d(i,l)}};var kn="https://github.com/huggingface/transformers.js/issues/new/choose";var _i="preprocessor_config.json",En=_i,sA="processor_config.json",nA="chat_template.jinja";var ne=class extends Je{static classes=["image_processor_class","tokenizer_class","feature_extractor_class"];static uses_processor_config=!1;static uses_chat_template_file=!1;constructor(e,r,s){super(),this.config=e,this.components=r,this.chat_template=s}get image_processor(){return this.components.image_processor}get tokenizer(){return this.components.tokenizer}get feature_extractor(){return this.components.feature_extractor}apply_chat_template(e,r={}){if(!this.tokenizer)throw new Error("Unable to apply chat template without a tokenizer.");return 
/**
 * Guard that audio input is a `Float32Array` or `Float64Array`.
 *
 * @param {*} t Value to validate.
 * @param {string} e Name of the caller, used as the prefix of the error message.
 * @returns {void}
 * @throws {Error} If `t` is neither a `Float32Array` nor a `Float64Array`; the
 *   message reports the constructor name of `t`, or its `typeof` when there is none.
 */
function He(t, e) {
  const isFloatArray = t instanceof Float32Array || t instanceof Float64Array;
  if (isFloatArray) {
    return;
  }
  const received = t?.constructor?.name ?? typeof t;
  throw new Error(`${e} expects input to be a Float32Array or a Float64Array, but got ${received} instead. If using the feature extractor directly, remember to use \`read_audio(url, sampling_rate)\` to obtain the raw audio data of the file/url.`);
}
/**
 * Produce `r` evenly spaced values from `t` to `e`, both endpoints included.
 *
 * @param {number} t First value.
 * @param {number} e Last value.
 * @param {number} r Number of samples.
 * @returns {Float64Array} The samples. A single sample is `[t]`; a count of
 *   zero gives an empty array.
 */
function cA(t, e, r) {
  // With one sample the step would be (e - t) / 0, and the result was [NaN].
  if (r === 1) {
    return Float64Array.of(t);
  }
  const step = (e - t) / (r - 1);
  return Float64Array.from({ length: r }, (_, index) => t + step * index);
}
/**
 * Convert a spectrogram to decibels in place.
 *
 * Each value becomes `e * (log10(max(s, value)) - log10(max(s, r)))`. When
 * `n` is not `null`, the result is then clipped from below at
 * `max(result) - n`.
 *
 * @param {Float32Array|Float64Array|number[]} t Spectrogram values; overwritten.
 * @param {number} e Multiplier applied to the log ratio (the wrappers below
 *   pass 20 and 10).
 * @param {number} r Reference value that maps to 0 dB; must be > 0.
 * @param {number} s Lower bound applied to the values and the reference before
 *   taking the log; must be > 0.
 * @param {number|null} n Dynamic range in dB, or `null` for no clipping; must
 *   be > 0 when given.
 * @returns The same array `t`.
 * @throws {Error} If `r`, `s` or a non-null `n` is not greater than zero.
 */
function pA(t, e, r, s, n) {
  if (r <= 0) {
    throw new Error("reference must be greater than zero");
  }
  if (s <= 0) {
    throw new Error("min_value must be greater than zero");
  }

  const logReference = Math.log10(Math.max(s, r));

  for (let index = 0; index < t.length; ++index) {
    // The reference is subtracted in the log domain. Previously it was
    // subtracted inside the log10 argument, which is only correct when the
    // reference is 1 (log10(1) === 0).
    t[index] = e * (Math.log10(Math.max(s, t[index])) - logReference);
  }

  if (n !== null) {
    if (n <= 0) {
      throw new Error("db_range must be greater than zero");
    }
    const floor = Te(t)[0] - n;
    for (let index = 0; index < t.length; ++index) {
      t[index] = Math.max(t[index], floor);
    }
  }
  return t;
}

/**
 * In-place dB conversion with a multiplier of 20.
 *
 * @param t Spectrogram values; overwritten.
 * @param {number} [e=1] Reference value.
 * @param {number} [r=1e-5] Minimum value.
 * @param {number|null} [s=null] Dynamic range in dB.
 * @returns The same array `t`.
 */
function MP(t, e = 1, r = 1e-5, s = null) {
  return pA(t, 20, e, r, s);
}

/**
 * In-place dB conversion with a multiplier of 10.
 *
 * @param t Spectrogram values; overwritten.
 * @param {number} [e=1] Reference value.
 * @param {number} [r=1e-10] Minimum value.
 * @param {number|null} [s=null] Dynamic range in dB.
 * @returns The same array `t`.
 */
function TP(t, e = 1, r = 1e-10, s = null) {
  return pA(t, 10, e, r, s);
}
Specify `power` to fix this issue.");if(!d)throw new Error("`preemphasis_htk_flavor=false` is not currently supported.");if(a)switch(i){case"reflect":{let L=Math.floor((n-1)/2)+1;t=AP(t,L,L);break}case"constant":{let L=Math.floor(n/2),R=new t.constructor(t.length+2*L);R.set(t,L),t=R;break}default:throw new Error(`pad_mode="${i}" not implemented yet.`)}let G=Math.floor(1+Math.floor((t.length-r)/s));M!==null&&G<M&&(G=M);let X=l?Math.floor(n/2)+1:n,V=G,Q=G;I!==null&&(I>G?T&&(Q=I):Q=V=I);let K=new uu(n),Y=new Float64Array(n),B=new Float64Array(K.outputBufferSize),P=new Float32Array(X*Q);for(let L=0;L<V;++L){let R=L*s,te=Math.min(t.length-R,r);te!==r&&Y.fill(0,0,r);for(let ue=0;ue<te;++ue)Y[ue]=t[R+ue];if(E){let ue=0;for(let Pe=0;Pe<te;++Pe)ue+=Y[Pe];let Be=ue/te;for(let Pe=0;Pe<te;++Pe)Y[Pe]-=Be}if(u!==null){for(let ue=te-1;ue>=1;--ue)Y[ue]-=u*Y[ue-1];Y[0]*=1-u}for(let ue=0;ue<e.length;++ue)Y[ue]*=e[ue];K.realTransform(B,Y);for(let ue=0;ue<X;++ue){let Be=ue<<1;P[ue*Q+L]=B[Be]**2+B[Be+1]**2}}if(o!==null&&o!==2){let L=o/2;for(let R=0;R<P.length;++R)P[R]**=L}let se=f.length,ie=await I0(new U("float32",f.flat(),[se,X]),new U("float32",P,[X,Q]));z&&(ie=ie.transpose(1,0));let S=ie.data;for(let L=0;L<S.length;++L)S[L]=C+Math.max(m,S[L]);if(o!==null&&_!==null){let L=Math.min(S.length,V*se);switch(_){case"log":for(let R=0;R<L;++R)S[R]=Math.log(S[R]);break;case"log10":for(let R=0;R<L;++R)S[R]=Math.log10(S[R]);break;case"dB":if(o===1)MP(S,w,x,k);else if(o===2)TP(S,w,x,k);else throw new Error(`Cannot use log_mel option '${_}' with power ${o}`);break;default:throw new Error(`log_mel must be one of null, 'log', 'log10' or 'dB'. 
/**
 * Encode audio chunks as a WAV `Blob` (44-byte RIFF header followed by the raw samples).
 *
 * The header written here declares format code 3, one channel and 32 bits per sample.
 *
 * @param {Array<Float32Array|ArrayLike<number>>} t Sample chunks, concatenated in order.
 * @param {number} e Sampling rate written into the header.
 * @returns {Blob} Blob of type "audio/wav".
 */
function SP(t, e) {
  // The header advertises 4 bytes per sample, so every chunk is normalised to a
  // Float32Array before its bytes are written.
  const chunks = t.map((chunk) => (chunk instanceof Float32Array ? chunk : Float32Array.from(chunk)));
  const totalSamples = chunks.reduce((count, chunk) => count + chunk.length, 0);
  const dataBytes = totalSamples * 4;

  const header = new ArrayBuffer(44);
  const view = new DataView(header);

  vp(view, 0, "RIFF");
  view.setUint32(4, 36 + dataBytes, true); // remaining file size after this field
  vp(view, 8, "WAVE");
  vp(view, 12, "fmt ");
  view.setUint32(16, 16, true); // size of the fmt chunk
  view.setUint16(20, 3, true); // format code
  view.setUint16(22, 1, true); // channel count
  view.setUint32(24, e, true); // sample rate
  view.setUint32(28, e * 4, true); // bytes per second
  view.setUint16(32, 4, true); // bytes per sample frame
  view.setUint16(34, 32, true); // bits per sample
  vp(view, 36, "data");
  view.setUint32(40, dataBytes, true);

  // Pass the typed-array views themselves, not `chunk.buffer`: a view created with
  // `subarray()` shares a larger backing buffer, and writing the whole buffer would
  // emit samples outside the view and contradict the sizes stored in the header.
  return new Blob([header, ...chunks], { type: "audio/wav" });
}

/**
 * Write the UTF-16 code units of `r` as consecutive bytes into a DataView.
 *
 * @param {DataView} t Destination view.
 * @param {number} e Byte offset of the first character.
 * @param {string} r Text to write (one byte per character).
 */
function vp(t, e, r) {
  for (let i = 0; i < r.length; ++i) {
    t.setUint8(e + i, r.charCodeAt(i));
  }
}
/**
 * Feature extractor that passes raw audio through as a float32 tensor of shape
 * [1, feature_size, samples / feature_size]. It is registered under the name
 * "EncodecFeatureExtractor" (the label handed to `He`).
 */
var Mn = class extends ze {
  /**
   * @param {Float32Array|Float64Array} e Audio samples.
   * @returns {Promise<{input_values: Object}>} Object holding the wrapped tensor.
   * @throws {Error} If the sample count is not divisible by `config.feature_size`.
   */
  async _call(e) {
    // `He` is defined elsewhere; presumably it validates the audio input — confirm.
    He(e, "EncodecFeatureExtractor");

    // Float64 input is narrowed to float32; anything else is used as given.
    const samples = e instanceof Float64Array ? new Float32Array(e) : e;

    const channelCount = this.config.feature_size;
    const leftover = samples.length % channelCount;
    if (leftover !== 0) {
      throw new Error(`The length of the audio data must be a multiple of the number of channels (${channelCount}).`);
    }

    const dims = [1, channelCount, samples.length / channelCount];
    return { input_values: new U("float32", samples, dims) };
  }
};
/**
 * Audio feature extractor registered under the name "Gemma3nAudioFeatureExtractor"
 * (the label handed to `He` in `_call`).
 */
var Tp = class extends ze {
  /**
   * Precompute the mel filter bank and the analysis window from the config.
   * @param {Object} e Configuration forwarded to the base class.
   */
  constructor(e) {
    super(e);
    const {
      fft_length: fftLength,
      feature_size: featureSize,
      min_frequency: minFrequency,
      max_frequency: maxFrequency,
      sampling_rate: samplingRate,
      frame_length: frameLength,
    } = this.config;

    // Frequency-bin count is floor(1 + fft_length / 2).
    const filters = yt(
      Math.floor(1 + fftLength / 2),
      featureSize,
      minFrequency,
      maxFrequency,
      samplingRate,
      null,
      "htk",
      false
    );
    this.mel_filters = filters;
    this.window = Mt(frameLength, "hann");
  }

  /**
   * Run the shared spectrogram routine (`At`) with this extractor's settings.
   * @param {Float32Array|Float64Array} e Waveform.
   * @param {number} r Accepted for signature compatibility; not read by this method.
   * @returns {Promise<Object>} Whatever `At` resolves to (used as a tensor by `_call`).
   */
  async _extract_fbank_features(e, r) {
    const { config } = this;
    const options = {
      fft_length: config.fft_length,
      center: false,
      onesided: true,
      preemphasis: config.preemphasis,
      preemphasis_htk_flavor: config.preemphasis_htk_flavor,
      mel_filters: this.mel_filters,
      log_mel: "log",
      mel_floor: config.mel_floor,
      remove_dc_offset: false,
      transpose: true,
    };
    return At(e, this.window, config.frame_length, config.hop_length, options);
  }

  /**
   * Optionally truncate and pad the waveform, then extract features.
   * @param {Float32Array|Float64Array} e Waveform.
   * @param {Object} [options]
   * @param {number} [options.max_length=480000] Maximum number of samples kept when truncating.
   * @param {boolean} [options.truncation=true] Whether to cut input longer than `max_length`.
   * @param {boolean} [options.padding=true] Whether to pad up to a multiple of `pad_to_multiple_of`.
   * @param {number} [options.pad_to_multiple_of=128] Sample-count granularity for padding.
   * @returns {Promise<{input_features: Object, input_features_mask: Object}>}
   */
  async _call(e, { max_length = 480000, truncation = true, padding = true, pad_to_multiple_of = 128 } = {}) {
    He(e, "Gemma3nAudioFeatureExtractor");

    let waveform = e;
    if (truncation && waveform.length > max_length) {
      waveform = waveform.slice(0, max_length);
    }

    if (padding && waveform.length % pad_to_multiple_of !== 0) {
      const missing = pad_to_multiple_of - (waveform.length % pad_to_multiple_of);
      const padded = new Float64Array(waveform.length + missing);
      padded.set(waveform);
      // A fresh Float64Array is already zero-filled, so only non-zero padding needs a fill.
      if (this.config.padding_value !== 0) {
        padded.fill(this.config.padding_value, waveform.length);
      }
      waveform = padded;
    }

    const features = await this._extract_fbank_features(waveform, this.config.max_length);
    // The mask is sized from the first dimension *before* the batch axis is added.
    const mask = Ge([1, features.dims[0]], true);
    return { input_features: features.unsqueeze_(0), input_features_mask: mask };
  }
};
/**
 * Feature extractor registered under the name "PyAnnoteFeatureExtractor", plus a
 * helper that turns per-frame scores into contiguous segments.
 */
var Sn = class extends ze {
  /**
   * Wrap the waveform in a float32 tensor of shape [1, 1, samples].
   * @param {Float32Array|Float64Array} e Audio samples.
   * @returns {Promise<{input_values: Object}>}
   */
  async _call(e) {
    He(e, "PyAnnoteFeatureExtractor");
    const samples = e instanceof Float64Array ? new Float32Array(e) : e;
    const dims = [1, 1, samples.length];
    return { input_values: new U("float32", samples, dims) };
  }

  /**
   * Map a sample count to a (possibly fractional) frame count using `config.offset` and `config.step`.
   * @param {number} e Number of samples.
   * @returns {number}
   */
  samples_to_frames(e) {
    const shifted = e - this.config.offset;
    return shifted / this.config.step;
  }

  /**
   * Group consecutive frames that share the same top-scoring id into segments.
   *
   * @param {Object} e Object exposing `tolist()`; each top-level entry is a list of per-frame score rows.
   * @param {number} r Number of samples in the original audio.
   * @returns {Array<Array<{id: number, start: number, end: number, confidence: number}>>}
   *   One segment list per top-level entry. `start`/`end` are frame indices scaled by
   *   `r / samples_to_frames(r) / config.sampling_rate`; `confidence` is the mean score
   *   over the segment's frames.
   */
  post_process_speaker_diarization(e, r) {
    const scale = r / this.samples_to_frames(r) / this.config.sampling_rate;
    const output = [];

    for (const frameRows of e.tolist()) {
      const segments = [];
      let activeId = -1;

      for (let frame = 0; frame < frameRows.length; ++frame) {
        // `Oe` and `Te` are defined elsewhere; the pair is destructured as
        // [score, id] (presumably softmax followed by [max, argmax] — confirm).
        const [score, id] = Te(Oe(frameRows[frame]));
        const nextFrame = frame + 1;

        if (id === activeId) {
          // Same id as the previous frame: extend the open segment.
          const open = segments.at(-1);
          open.end = nextFrame;
          open.score += score;
        } else {
          activeId = id;
          segments.push({ id: id, start: frame, end: nextFrame, score: score });
        }
      }

      output.push(
        segments.map((segment) => ({
          id: segment.id,
          start: segment.start * scale,
          end: segment.end * scale,
          confidence: segment.score / (segment.end - segment.start),
        }))
      );
    }
    return output;
  }
};
e=e.map(s=>s*32768),At(e,this.window,400,160,{fft_length:512,power:2,center:!1,preemphasis:.97,mel_filters:this.mel_filters,log_mel:"log",mel_floor:1192092955078125e-22,remove_dc_offset:!0,max_num_frames:r,transpose:!0})}async _call(e,{padding:r=!0,pad_to_multiple_of:s=2,do_normalize_per_mel_bins:n=!0,return_attention_mask:o=!0}={}){He(e,"SeamlessM4TFeatureExtractor");let a=await this._extract_fbank_features(e,this.config.max_length);if(n){let[w,x]=a.dims,k=a.data;for(let E=0;E<x;++E){let M=0;for(let C=0;C<w;++C)M+=k[C*x+E];let I=M/w,T=0;for(let C=0;C<w;++C)T+=(k[C*x+E]-I)**2;T/=w-1;let z=Math.sqrt(T+1e-7);for(let C=0;C<w;++C){let v=C*x+E;k[v]=(k[v]-I)/z}}}let i;if(r){let[w,x]=a.dims,k=a.data,E=w%s;if(E>0){let M=new Float32Array(x*(w+E));M.set(k),M.fill(this.config.padding_value,k.length);let I=w+E;a=new U(a.type,M,[I,x]),o&&(i=new U("int64",new BigInt64Array(I),[1,I]),i.data.fill(1n,0,w))}}let[l,u]=a.dims,d=this.config.stride;if(l%d!==0)throw new Error(`The number of frames (${l}) must be a multiple of the stride (${d}).`);let m=a.view(1,Math.floor(l/d),u*d),_={input_features:m};if(o){let w=m.dims[1],x=new BigInt64Array(w);if(i){let k=i.data;for(let E=1,M=0;E<l;E+=d,++M)x[M]=k[E]}else x.fill(1n);_.attention_mask=new U("int64",x,[1,w])}return _}};var Cp=class extends Tn{};var Pp=class extends ze{};var zp=class extends ze{_zero_mean_unit_var_norm(e){let s=e.reduce((o,a)=>o+a,0)/e.length,n=e.reduce((o,a)=>o+(a-s)**2,0)/e.length;return e.map(o=>(o-s)/Math.sqrt(n+1e-7))}async _call(e){He(e,"Wav2Vec2FeatureExtractor"),e instanceof Float64Array&&(e=new Float32Array(e));let r=e;this.config.do_normalize&&(r=this._zero_mean_unit_var_norm(r));let s=[1,r.length];return{input_values:new U("float32",r,s),attention_mask:new U("int64",new BigInt64Array(r.length).fill(1n),s)}}};var Lp=class extends ze{constructor(e){super(e);let 
r=this.config.sampling_rate,s=yt(257,this.config.num_mel_bins,20,Math.floor(r/2),r,null,"kaldi",!0);this.mel_filters=s,this.window=Mt(400,"hamming",{periodic:!1}),this.min_num_frames=this.config.min_num_frames}async _extract_fbank_features(e){return e=e.map(r=>r*32768),At(e,this.window,400,160,{fft_length:512,power:2,center:!1,preemphasis:.97,mel_filters:this.mel_filters,log_mel:"log",mel_floor:1192092955078125e-22,remove_dc_offset:!0,transpose:!0,min_num_frames:this.min_num_frames})}async _call(e){He(e,"WeSpeakerFeatureExtractor");let r=(await this._extract_fbank_features(e)).unsqueeze_(0);if(this.config.fbank_centering_span===null){let s=r.mean(1).data,n=r.data,[o,a,i]=r.dims;for(let l=0;l<o;++l){let u=l*a*i,d=l*i;for(let f=0;f<a;++f){let m=u+f*i;for(let _=0;_<i;++_)n[m+_]-=s[d+_]}}}return{input_features:r}}};var Np=class extends ze{constructor(e){super(e),this.config.mel_filters??=yt(Math.floor(1+this.config.n_fft/2),this.config.feature_size,0,8e3,this.config.sampling_rate,"slaney","slaney"),this.window=Mt(this.config.n_fft,"hann")}async _extract_fbank_features(e){let r=await At(e,this.window,this.config.n_fft,this.config.hop_length,{power:2,mel_filters:this.config.mel_filters,log_mel:"log10",max_num_frames:Math.min(Math.floor(e.length/this.config.hop_length),this.config.nb_max_frames)}),s=r.data,n=Te(s)[0];for(let o=0;o<s.length;++o)s[o]=(Math.max(s[o],n-8)+4)/4;return r}async _call(e,{max_length:r=null}={}){He(e,"WhisperFeatureExtractor");let s,n=r??this.config.n_samples;return e.length>n?(e.length>this.config.n_samples&&console.warn("Attempting to extract features for audio longer than 30 seconds. 
/**
 * Factory that picks a feature-extractor class from the loaded configuration.
 */
var Ze = class {
  /**
   * Load a configuration via `it` and instantiate the class registered in `gi`
   * under the configuration's `feature_extractor_type`.
   *
   * @param {string} e Identifier forwarded to the loader.
   * @param {Object} [r={}] Options forwarded to the loader.
   * @returns {Promise<Object>} Instance of the matching extractor class.
   * @throws {Error} If no class is registered for the configured type.
   */
  static async from_pretrained(e, r = {}) {
    const config = await it(e, _i, true, r);
    const typeName = config.feature_extractor_type;
    const ExtractorClass = gi[typeName];

    if (ExtractorClass) {
      return new ExtractorClass(config);
    }
    throw new Error(`Unknown feature_extractor_type: '${typeName}'. Please report this at ${kn}.`);
  }
};
supported in browser environments.");let s=e.getContext("2d").getImageData(0,0,e.width,e.height).data;return new t(s,e.width,e.height,4)}static async fromURL(e){let r=await fn(e);if(r.status!==200)throw new Error(`Unable to read image from "${e}" (${r.status} ${r.statusText})`);let s=await r.blob();return this.fromBlob(s)}static async fromBlob(e){if(Zt){let r=await Vr(e),s=As(r.width,r.height).getContext("2d");return s.drawImage(r,0,0),new this(s.getImageData(0,0,r.width,r.height).data,r.width,r.height,4)}else{let r=(0,Rp.default)(await e.arrayBuffer());return await Vr(r)}}static fromTensor(e,r="CHW"){if(e.dims.length!==3)throw new Error(`Tensor should have 3 dimensions, but has ${e.dims.length} dimensions.`);if(r==="CHW")e=e.transpose(1,2,0);else if(r!=="HWC")throw new Error(`Unsupported channel format: ${r}`);if(!(e.data instanceof Uint8ClampedArray||e.data instanceof Uint8Array))throw new Error(`Unsupported tensor type: ${e.type}`);switch(e.dims[2]){case 1:case 2:case 3:case 4:return new t(e.data,e.dims[1],e.dims[0],e.dims[2]);default:throw new Error(`Unsupported number of channels: ${e.dims[2]}`)}}grayscale(){if(this.channels===1)return this;let e=new Uint8ClampedArray(this.width*this.height*1);switch(this.channels){case 3:case 4:for(let r=0,s=0;r<this.data.length;r+=this.channels){let n=this.data[r],o=this.data[r+1],a=this.data[r+2];e[s++]=Math.round(.2989*n+.587*o+.114*a)}break;default:throw new Error(`Conversion failed due to unsupported number of channels: ${this.channels}`)}return this._update(e,this.width,this.height,1)}rgb(){if(this.channels===3)return this;let e=new Uint8ClampedArray(this.width*this.height*3);switch(this.channels){case 1:for(let r=0,s=0;r<this.data.length;++r)e[s++]=this.data[r],e[s++]=this.data[r],e[s++]=this.data[r];break;case 4:for(let r=0,s=0;r<this.data.length;r+=4)e[s++]=this.data[r],e[s++]=this.data[r+1],e[s++]=this.data[r+2];break;default:throw new Error(`Conversion failed due to unsupported number of channels: 
${this.channels}`)}return this._update(e,this.width,this.height,3)}rgba(){if(this.channels===4)return this;let e=new Uint8ClampedArray(this.width*this.height*4);switch(this.channels){case 1:for(let r=0,s=0;r<this.data.length;++r)e[s++]=this.data[r],e[s++]=this.data[r],e[s++]=this.data[r],e[s++]=255;break;case 3:for(let r=0,s=0;r<this.data.length;r+=3)e[s++]=this.data[r],e[s++]=this.data[r+1],e[s++]=this.data[r+2],e[s++]=255;break;default:throw new Error(`Conversion failed due to unsupported number of channels: ${this.channels}`)}return this._update(e,this.width,this.height,4)}putAlpha(e){if(e.width!==this.width||e.height!==this.height)throw new Error(`Expected mask size to be ${this.width}x${this.height}, but got ${e.width}x${e.height}`);if(e.channels!==1)throw new Error(`Expected mask to have 1 channel, but got ${e.channels}`);let r=this.data,s=e.data,n=this.width*this.height;if(this.channels===3){let o=new Uint8ClampedArray(n*4);for(let a=0,i=0,l=0;a<n;++a)o[l++]=r[i++],o[l++]=r[i++],o[l++]=r[i++],o[l++]=s[a];return this._update(o,this.width,this.height,4)}else if(this.channels===4){for(let o=0;o<n;++o)r[4*o+3]=s[o];return this}throw new Error(`Expected image to have 3 or 4 channels, but got ${this.channels}`)}async resize(e,r,{resample:s=2}={}){if(this.width===e&&this.height===r)return this;let n=IP[s]??s,o=Ty(e),a=Ty(r);if(o&&a)return this;if(o?e=r/this.height*this.width:a&&(r=e/this.width*this.height),Zt){let i=this.channels,l=this.toCanvas(),u=As(e,r).getContext("2d");return u.drawImage(l,0,0,e,r),new t(u.getImageData(0,0,e,r).data,e,r,4).convert(i)}else{let i=this.toSharp();switch(n){case"box":case"hamming":(n==="box"||n==="hamming")&&(console.warn(`Resampling method ${n} is not yet supported. 
Using bilinear instead.`),n="bilinear");case"nearest":case"bilinear":case"bicubic":i=i.affine([e/this.width,0,0,r/this.height],{interpolator:n});break;case"lanczos":i=i.resize({width:e,height:r,fit:"fill",kernel:"lanczos3"});break;default:throw new Error(`Resampling method ${n} is not supported.`)}return await Vr(i)}}async pad([e,r,s,n]){if(e=Math.max(e,0),r=Math.max(r,0),s=Math.max(s,0),n=Math.max(n,0),e===0&&r===0&&s===0&&n===0)return this;if(Zt){let o=this.channels,a=this.toCanvas(),i=this.width+e+r,l=this.height+s+n,u=As(i,l).getContext("2d");return u.drawImage(a,0,0,this.width,this.height,e,s,this.width,this.height),new t(u.getImageData(0,0,i,l).data,i,l,4).convert(o)}else{let o=this.toSharp().extend({left:e,right:r,top:s,bottom:n});return await Vr(o)}}async crop([e,r,s,n]){if(e=Math.max(e,0),r=Math.max(r,0),s=Math.min(s,this.width-1),n=Math.min(n,this.height-1),e===0&&r===0&&s===this.width-1&&n===this.height-1)return this;let o=s-e+1,a=n-r+1;if(Zt){let i=this.channels,l=this.toCanvas(),u=As(o,a).getContext("2d");return u.drawImage(l,e,r,o,a,0,0,o,a),new t(u.getImageData(0,0,o,a).data,o,a,4).convert(i)}else{let i=this.toSharp().extract({left:e,top:r,width:o,height:a});return await Vr(i)}}async center_crop(e,r){if(this.width===e&&this.height===r)return this;let s=(this.width-e)/2,n=(this.height-r)/2;if(Zt){let o=this.channels,a=this.toCanvas(),i=As(e,r).getContext("2d"),l=0,u=0,d=0,f=0;return s>=0?l=s:d=-s,n>=0?u=n:f=-n,i.drawImage(a,l,u,e,r,d,f,e,r),new t(i.getImageData(0,0,e,r).data,e,r,4).convert(o)}else{let o=this.toSharp();if(s>=0&&n>=0)o=o.extract({left:Math.floor(s),top:Math.floor(n),width:e,height:r});else if(s<=0&&n<=0){let a=Math.floor(-n),i=Math.floor(-s);o=o.extend({top:a,left:i,right:e-this.width-i,bottom:r-this.height-a})}else{let a=[0,0],i=0;n<0?(a[0]=Math.floor(-n),a[1]=r-this.height-a[0]):i=Math.floor(n);let 
l=[0,0],u=0;s<0?(l[0]=Math.floor(-s),l[1]=e-this.width-l[0]):u=Math.floor(s),o=o.extend({top:a[0],bottom:a[1],left:l[0],right:l[1]}).extract({left:u,top:i,width:e,height:r})}return await Vr(o)}}async toBlob(e="image/png",r=1){if(!Zt)throw new Error("toBlob() is only supported in browser environments.");return await this.toCanvas().convertToBlob({type:e,quality:r})}toTensor(e="CHW"){let r=new U("uint8",new Uint8Array(this.data),[this.height,this.width,this.channels]);if(e!=="HWC")if(e==="CHW")r=r.permute(2,0,1);else throw new Error(`Unsupported channel format: ${e}`);return r}toCanvas(){if(!Zt)throw new Error("toCanvas() is only supported in browser environments.");let e=this.clone().rgba(),r=As(e.width,e.height),s=new dA(e.data,e.width,e.height);return r.getContext("2d").putImageData(s,0,0),r}split(){let{data:e,width:r,height:s,channels:n}=this,o=e.constructor,a=e.length/n,i=Array.from({length:n},()=>new o(a));for(let l=0;l<a;++l){let u=n*l;for(let d=0;d<n;++d)i[d][l]=e[u+d]}return i.map(l=>new t(l,r,s,1))}_update(e,r,s,n=null){return this.data=e,this.width=r,this.height=s,n!==null&&(this.channels=n),this}clone(){return new t(this.data.slice(),this.width,this.height,this.channels)}convert(e){if(this.channels===e)return this;switch(e){case 1:this.grayscale();break;case 3:this.rgb();break;case 4:this.rgba();break;default:throw new Error(`Conversion failed due to unsupported number of channels: ${this.channels}`)}return this}async save(e){if(Zt){if(be.IS_WEBWORKER_ENV)throw new Error("Unable to save an image from a Web Worker.");let r=e.split(".").pop().toLowerCase(),s=CP.get(r)??"image/png",n=await this.toBlob(s);return bp(e,n)}else if(be.IS_FS_AVAILABLE)await this.toSharp().toFile(e);else throw new Error("Unable to save the image because filesystem is disabled in this environment.")}toSharp(){if(Zt)throw new Error("toSharp() is only supported in server-side 
/**
 * Turn per-class score maps into a per-pixel label map for every batch item.
 *
 * @param {Object} t Model output exposing `logits`, indexed as [batch][class].
 * @param {Array<[number, number]>|null} [e=null] Optional per-item output sizes; when given,
 *   each item's score maps are resized (bilinear) to that size first.
 * @returns {Array<{segmentation: Object, labels: number[]}>} For each item, an int32
 *   label map and the ascending list of labels that occur in it.
 * @throws {Error} If `e` is given but its length differs from the batch size.
 */
function Up(t, e = null) {
  const logits = t.logits;
  const batchSize = logits.dims[0];

  if (e !== null && e.length !== batchSize) {
    throw Error("Make sure that you pass in as many target sizes as the batch dimension of the logits");
  }

  const results = [];
  for (let item = 0; item < batchSize; ++item) {
    const targetSize = e !== null ? e[item] : null;

    let scoreMaps = logits[item];
    if (targetSize !== null) {
      scoreMaps = Su(scoreMaps, targetSize, "bilinear", false);
    }

    const [height, width] = targetSize ?? scoreMaps.dims.slice(-2);
    const segmentation = new U("int32", new Int32Array(height * width), [height, width]);

    // Running per-pixel maximum, seeded from class 0. It is a COPY: the previous code
    // updated `scoreMaps[0].data` directly, so if tensor indexing returns a view of the
    // underlying buffer (not visible here — confirm), the caller's logits were
    // overwritten and a second call on the same output produced different labels.
    const best = scoreMaps[0].data.slice();
    const labelMap = segmentation.data;

    for (let cls = 1; cls < scoreMaps.dims[0]; ++cls) {
      const scores = scoreMaps[cls].data;
      for (let pixel = 0; pixel < scores.length; ++pixel) {
        if (scores[pixel] > best[pixel]) {
          best[pixel] = scores[pixel];
          labelMap[pixel] = cls;
        }
      }
    }

    // Collect the labels that actually occur, in ascending order.
    const seen = new Array(scoreMaps.dims[0]);
    for (let pixel = 0; pixel < labelMap.length; ++pixel) {
      const label = labelMap[pixel];
      seen[label] = label;
    }
    const labels = seen.filter((label) => label !== undefined);

    results.push({ segmentation, labels });
  }
  return results;
}
/**
 * Pick output dimensions that are multiples of `r`, roughly keep the aspect
 * ratio, and keep the pixel count within [s, n].
 *
 * @param {number} t Input height.
 * @param {number} e Input width.
 * @param {number} [r=28] Factor both outputs must be a multiple of.
 * @param {number} [s=3136] Minimum pixel count.
 * @param {number} [n=1003520] Maximum pixel count (784 * 1280).
 * @returns {[number, number]} `[height, width]`.
 * @throws {Error} If either side is smaller than `r` or the aspect ratio exceeds 200.
 */
function NP(t, e, r = 28, s = 3136, n = 784 * 1280) {
  if (t < r || e < r) {
    throw new Error(`height:${t} or width:${e} must be larger than factor:${r}`);
  }
  if (Math.max(t, e) / Math.min(t, e) > 200) {
    throw new Error(`absolute aspect ratio must be smaller than 200, got ${Math.max(t, e) / Math.min(t, e)}`);
  }

  // Snap a length to a multiple of the factor using the given rounding function.
  const snap = (length, roundFn) => roundFn(length / r) * r;

  const roundedHeight = snap(t, Math.round);
  const roundedWidth = snap(e, Math.round);
  const roundedArea = roundedHeight * roundedWidth;

  if (roundedArea > n) {
    // Too many pixels: shrink both sides by the same ratio, rounding down.
    const shrink = Math.sqrt((t * e) / n);
    return [snap(t / shrink, Math.floor), snap(e / shrink, Math.floor)];
  }
  if (roundedArea < s) {
    // Too few pixels: grow both sides by the same ratio, rounding up.
    const grow = Math.sqrt(s / (t * e));
    return [snap(t * grow, Math.ceil), snap(e * grow, Math.ceil)];
  }
  return [roundedHeight, roundedWidth];
}
No instance will be fused."),n=new Set);let a=t.class_queries_logits??t.logits,l=(t.masks_queries_logits??t.pred_masks).sigmoid(),[u,d,f]=a.dims;if(f-=1,o!==null&&o.length!==u)throw Error("Make sure that you pass in as many target sizes as the batch dimension of the logits");let m=[];for(let _=0;_<u;++_){let w=o!==null?o[_]:null,x=a[_],k=l[_],[E,M,I]=PP(x,k,e,f);if(I.length===0){let[C,v]=w??k.dims.slice(-2),G=new U("int32",new Int32Array(C*v).fill(-1),[C,v]);m.push({segmentation:G,segments_info:[]});continue}let[T,z]=LP(E,M,I,r,s,n,w);m.push({segmentation:T,segments_info:z})}return m}function Dp(t,e=.5,r=null){throw new Error("`post_process_instance_segmentation` is not yet implemented.")}var W=class extends Je{constructor(e){super(),this.image_mean=e.image_mean??e.mean,this.image_std=e.image_std??e.std,this.resample=e.resample??2,this.do_rescale=e.do_rescale??!0,this.rescale_factor=e.rescale_factor??1/255,this.do_normalize=e.do_normalize,this.do_thumbnail=e.do_thumbnail,this.size=e.size??e.image_size,this.do_resize=e.do_resize??this.size!==void 0,this.size_divisibility=e.size_divisibility??e.size_divisor,this.do_center_crop=e.do_center_crop,this.crop_size=e.crop_size,this.do_convert_rgb=e.do_convert_rgb??!0,this.do_crop_margin=e.do_crop_margin,this.pad_size=e.pad_size,this.do_pad=e.do_pad,this.min_pixels=e.min_pixels,this.max_pixels=e.max_pixels,this.do_pad&&!this.pad_size&&this.size&&this.size.width!==void 0&&this.size.height!==void 0&&(this.pad_size=this.size),this.do_flip_channel_order=e.do_flip_channel_order??!1,this.config=e}async thumbnail(e,r,s=2){let n=e.height,o=e.width,a=r.height,i=r.width,l=Math.min(n,a),u=Math.min(o,i);return l===n&&u===o?e:(n>o?u=Math.floor(o*l/n):o>n&&(l=Math.floor(n*u/o)),await e.resize(u,l,{resample:s}))}async crop_margin(e,r=200){let s=e.clone().grayscale(),n=ti(s.data)[0],a=Te(s.data)[0]-n;if(a===0)return e;let i=r/255,l=s.width,u=s.height,d=0,f=0,m=s.data;for(let _=0;_<s.height;++_){let w=_*s.width;for(let 
x=0;x<s.width;++x)(m[w+x]-n)/a<i&&(l=Math.min(l,x),u=Math.min(u,_),d=Math.max(d,x),f=Math.max(f,_))}return e=await e.crop([l,u,d,f]),e}pad_image(e,r,s,{mode:n="constant",center:o=!1,constant_values:a=0}={}){let[i,l,u]=r,d,f;if(typeof s=="number"?(d=s,f=s):s==="square"?d=f=Math.max(i,l):(d=s.width,f=s.height),d!==l||f!==i){let m=new Float32Array(d*f*u);if(Array.isArray(a))for(let x=0;x<m.length;++x)m[x]=a[x%u];else a!==0&&m.fill(a);let[_,w]=o?[Math.floor((d-l)/2),Math.floor((f-i)/2)]:[0,0];for(let x=0;x<i;++x){let k=(x+w)*d,E=x*l;for(let M=0;M<l;++M){let I=(k+M+_)*u,T=(E+M)*u;for(let z=0;z<u;++z)m[I+z]=e[T+z]}}if(n==="symmetric"){if(o)throw new Error("`center` padding is not supported when `mode` is set to `symmetric`.");let x=i-1,k=l-1;for(let E=0;E<f;++E){let M=E*d,I=un(E,x)*l;for(let T=0;T<d;++T){if(E<i&&T<l)continue;let z=(M+T)*u,C=(I+un(T,k))*u;for(let v=0;v<u;++v)m[z+v]=e[C+v]}}}e=m,r=[f,d,u]}return[e,r]}rescale(e){for(let r=0;r<e.length;++r)e[r]=this.rescale_factor*e[r]}get_resize_output_image_size(e,r){let[s,n]=e.size,o,a;if(this.do_thumbnail){let{height:i,width:l}=r;o=Math.min(i,l)}else Number.isInteger(r)?(o=r,a=this.config.max_size??o):r!==void 0&&(o=r.shortest_edge,a=r.longest_edge);if(o!==void 0||a!==void 0){let i=o===void 0?1:Math.max(o/s,o/n),l=s*i,u=n*i,d=a===void 0?1:Math.min(a/l,a/u),f=Math.floor(Number((l*d).toFixed(2))),m=Math.floor(Number((u*d).toFixed(2)));return this.size_divisibility!==void 0&&([f,m]=D0([f,m],this.size_divisibility)),[f,m]}else if(r!==void 0&&r.width!==void 0&&r.height!==void 0){let i=r.width,l=r.height;if(this.config.keep_aspect_ratio&&this.config.ensure_multiple_of){let u=l/n,d=i/s;Math.abs(1-d)<Math.abs(1-u)?u=d:d=u,l=mA(u*n,this.config.ensure_multiple_of),i=mA(d*s,this.config.ensure_multiple_of)}return[i,l]}else{if(this.size_divisibility!==void 0)return D0([s,n],this.size_divisibility);if(this.min_pixels!==void 0&&this.max_pixels!==void 0){let i=this.config.patch_size*this.config.merge_size;return 
NP(n,s,i,this.min_pixels,this.max_pixels)}else throw new Error(`Could not resize image due to unsupported \`this.size\` option in config: ${JSON.stringify(r)}`)}}async resize(e){let[r,s]=this.get_resize_output_image_size(e,this.size);return await e.resize(r,s,{resample:this.resample})}async preprocess(e,{do_normalize:r=null,do_pad:s=null,do_convert_rgb:n=null,do_convert_grayscale:o=null,do_flip_channel_order:a=null}={}){this.do_crop_margin&&(e=await this.crop_margin(e));let[i,l]=e.size;if(n??this.do_convert_rgb?e=e.rgb():o&&(e=e.grayscale()),this.do_resize&&(e=await this.resize(e)),this.do_thumbnail&&(e=await this.thumbnail(e,this.size,this.resample)),this.do_center_crop){let _,w;Number.isInteger(this.crop_size)?(_=this.crop_size,w=this.crop_size):(_=this.crop_size.width,w=this.crop_size.height),e=await e.center_crop(_,w)}let u=[e.height,e.width],d=Float32Array.from(e.data),f=[e.height,e.width,e.channels];if(this.do_rescale&&this.rescale(d),r??this.do_normalize){let _=this.image_mean;Array.isArray(this.image_mean)||(_=new Array(e.channels).fill(_));let w=this.image_std;if(Array.isArray(this.image_std)||(w=new Array(e.channels).fill(w)),_.length!==e.channels||w.length!==e.channels)throw new Error(`When set to arrays, the length of \`image_mean\` (${_.length}) and \`image_std\` (${w.length}) must match the number of channels in the image (${e.channels}).`);for(let x=0;x<d.length;x+=e.channels)for(let k=0;k<e.channels;++k)d[x+k]=(d[x+k]-_[k])/w[k]}if(s??this.do_pad){if(this.pad_size)[d,f]=this.pad_image(d,[e.height,e.width,e.channels],this.pad_size);else if(this.size_divisibility){let[_,w]=D0([f[1],f[0]],this.size_divisibility);[d,f]=this.pad_image(d,f,{width:_,height:w})}}if(a??this.do_flip_channel_order){if(f[2]!==3)throw new Error("Flipping channel order is only supported for RGB images.");for(let _=0;_<d.length;_+=3){let w=d[_];d[_]=d[_+2],d[_+2]=w}}let m=new U("float32",d,f).permute(2,0,1);return{original_size:[l,i],reshaped_input_size:u,pixel_values:m}}async 
_call(e,...r){Array.isArray(e)||(e=[e]);let s=await Promise.all(e.map(o=>this.preprocess(o)));return{pixel_values:zt(s.map(o=>o.pixel_values),0),original_sizes:s.map(o=>o.original_size),reshaped_input_sizes:s.map(o=>o.reshaped_input_size)}}static async from_pretrained(e,r={}){let s=await it(e,En,!0,r);return new this(s)}};var Cn={};cs(Cn,{BeitFeatureExtractor:()=>Fp,BitImageProcessor:()=>jp,CLIPFeatureExtractor:()=>qp,CLIPImageProcessor:()=>wi,ChineseCLIPFeatureExtractor:()=>Gp,ConvNextFeatureExtractor:()=>Wp,ConvNextImageProcessor:()=>xi,DINOv3ViTImageProcessor:()=>Xp,DPTFeatureExtractor:()=>Yp,DPTImageProcessor:()=>vi,DeiTFeatureExtractor:()=>Vp,DeiTImageProcessor:()=>yi,DetrFeatureExtractor:()=>Hp,DetrImageProcessor:()=>bi,DonutFeatureExtractor:()=>Kp,DonutImageProcessor:()=>Ms,EfficientNetImageProcessor:()=>Qp,GLPNFeatureExtractor:()=>Jp,GroundingDinoImageProcessor:()=>Zp,Idefics3ImageProcessor:()=>ki,ImageFeatureExtractor:()=>W,ImageProcessor:()=>W,JinaCLIPImageProcessor:()=>td,LlavaOnevisionImageProcessor:()=>rd,Mask2FormerImageProcessor:()=>nd,MaskFormerFeatureExtractor:()=>sd,MaskFormerImageProcessor:()=>Ts,MobileNetV1FeatureExtractor:()=>od,MobileNetV1ImageProcessor:()=>Ei,MobileNetV2FeatureExtractor:()=>ad,MobileNetV2ImageProcessor:()=>Ai,MobileNetV3FeatureExtractor:()=>id,MobileNetV3ImageProcessor:()=>Mi,MobileNetV4FeatureExtractor:()=>ld,MobileNetV4ImageProcessor:()=>Ti,MobileViTFeatureExtractor:()=>cd,MobileViTImageProcessor:()=>Si,NougatImageProcessor:()=>ud,OwlViTFeatureExtractor:()=>pd,OwlViTImageProcessor:()=>Ss,Owlv2ImageProcessor:()=>dd,Phi3VImageProcessor:()=>fd,PixtralImageProcessor:()=>md,PvtImageProcessor:()=>hd,Qwen2VLImageProcessor:()=>_d,RTDetrImageProcessor:()=>gd,Sam2ImageProcessor:()=>In,Sam3ImageProcessor:()=>In,SamImageProcessor:()=>In,SapiensFeatureExtractor:()=>wd,SapiensImageProcessor:()=>Oi,SegformerFeatureExtractor:()=>xd,SegformerImageProcessor:()=>Ii,SiglipImageProcessor:()=>yd,SmolVLMImageProcessor:()=>ki,Swin2SRImageProcessor:
()=>bd,VLMImageProcessor:()=>ed,ViTFeatureExtractor:()=>vd,ViTImageProcessor:()=>Ci,VitMatteImageProcessor:()=>kd,VitPoseImageProcessor:()=>Ed,YolosFeatureExtractor:()=>Ad,YolosImageProcessor:()=>Pi});var Fp=class extends W{};var jp=class extends W{};var Gp=class extends W{};var wi=class extends W{},qp=class extends wi{};var xi=class extends W{constructor(e){super(e),this.crop_pct=this.config.crop_pct??224/256}async resize(e){let r=this.size?.shortest_edge;if(r===void 0)throw new Error("Size dictionary must contain 'shortest_edge' key.");if(r<384){let s=Math.floor(r/this.crop_pct),[n,o]=this.get_resize_output_image_size(e,{shortest_edge:s});e=await e.resize(n,o,{resample:this.resample}),e=await e.center_crop(r,r)}else e=await e.resize(r,r,{resample:this.resample});return e}},Wp=class extends xi{};var yi=class extends W{},Vp=class extends yi{};var bi=class extends W{async _call(e){let r=await super._call(e),s=[r.pixel_values.dims[0],64,64],n=Ge(s,1n);return{...r,pixel_mask:n}}post_process_object_detection(...e){return Hr(...e)}post_process_panoptic_segmentation(...e){return Bp(...e)}post_process_instance_segmentation(...e){return Dp(...e)}},Hp=class extends bi{};var Xp=class extends W{};var Ms=class extends W{pad_image(e,r,s,n={}){let[o,a,i]=r,l=this.image_mean;Array.isArray(this.image_mean)||(l=new Array(i).fill(l));let u=this.image_std;Array.isArray(u)||(u=new Array(i).fill(l));let d=l.map((f,m)=>-f/u[m]);return super.pad_image(e,r,s,{center:!0,constant_values:d,...n})}},Kp=class extends Ms{};var vi=class extends W{},Yp=class extends vi{};var Qp=class extends W{constructor(e){super(e),this.include_top=this.config.include_top??!0,this.include_top&&(this.image_std=this.image_std.map(r=>r*r))}};var Jp=class extends W{};var Zp=class extends W{async _call(e){let r=await super._call(e),s=r.pixel_values.dims,n=rt([s[0],s[2],s[3]]);return{...r,pixel_mask:n}}};var ki=class extends 
W{constructor(e){super(e),this.do_image_splitting=e.do_image_splitting??!0,this.max_image_size=e.max_image_size}get_resize_for_vision_encoder(e,r){let[s,n]=e.dims.slice(-2),o=n/s;return n>=s?(n=Math.ceil(n/r)*r,s=Math.floor(n/o),s=Math.ceil(s/r)*r):(s=Math.ceil(s/r)*r,n=Math.floor(s*o),n=Math.ceil(n/r)*r),{height:s,width:n}}async _call(e,{do_image_splitting:r=null,return_row_col_info:s=!1}={}){let n;if(!Array.isArray(e))n=[[e]];else{if(e.length===0||!e[0])throw new Error("No images provided.");Array.isArray(e[0])?n=e:n=[e]}let o=[],a=[],i=[],l=[],u=[];for(let E of n){let M=await Promise.all(E.map(z=>this.preprocess(z)));l.push(...M.map(z=>z.original_size)),u.push(...M.map(z=>z.reshaped_input_size)),M.forEach(z=>z.pixel_values.unsqueeze_(0));let{longest_edge:I}=this.max_image_size,T;if(r??this.do_image_splitting){let z=new Array(M.length),C=new Array(M.length);T=await Promise.all(M.map(async(v,G)=>{let X=this.get_resize_for_vision_encoder(v.pixel_values,I),V=await Pt(v.pixel_values,{size:[X.height,X.width]}),{frames:Q,num_splits_h:K,num_splits_w:Y}=await this.split_image(V,this.max_image_size);return z[G]=K,C[G]=Y,Ee(Q,0)})),a.push(z),i.push(C)}else{let z=[I,I];T=await Promise.all(M.map(C=>Pt(C.pixel_values,{size:z}))),a.push(new Array(M.length).fill(0)),i.push(new Array(M.length).fill(0))}o.push(Ee(T,0))}let d=o.length,[f,m,_,w]=o[0].dims,x,k;if(d===1)x=o[0].unsqueeze_(0),k=Ge([d,f,_,w],!0);else{let E=Math.max(...o.map(T=>T.dims.at(0)));k=Ge([d,E,_,w],!0);let M=k.data,I=E*_*w;for(let T=0;T<d;++T){let z=o[T].dims[0];if(z<E){o[T]=Ee([o[T],Ge([E-z,m,_,w],0)],0);let C=T*I+z*_*w,v=(T+1)*I;M.fill(!1,C,v)}}x=zt(o,0)}return{pixel_values:x,pixel_attention_mask:k,original_sizes:l,reshaped_input_sizes:u,...s?{rows:a,cols:i}:{}}}async split_image(e,{longest_edge:r}){let s=r,n=r,o=[],[a,i]=e.dims.slice(-2),l=0,u=0;if(a>s||i>n){l=Math.ceil(a/s),u=Math.ceil(i/n);let d=Math.ceil(a/l),f=Math.ceil(i/u);for(let w=0;w<l;++w)for(let x=0;x<u;++x){let 
k,E,M,I;w===l-1?(E=a-d,I=a):(E=w*d,I=(w+1)*d),x===u-1?(k=i-f,M=i):(k=x*f,M=(x+1)*f);let C=await di(e,[E,k],[I,M],[2,3]);o.push(C)}let m=s,_=n;(a!==m||i!==_)&&(e=await Pt(e,{size:[m,_]}))}return o.push(e),{frames:o,num_splits_h:l,num_splits_w:u}}};var ed=class extends W{constructor(e){super({do_pad:!0,pad_size:{width:e.image_size,height:e.image_size},...e}),this.constant_values=this.config.background_color.map(r=>r*this.rescale_factor)}pad_image(e,r,s,n){return super.pad_image(e,r,s,{constant_values:this.constant_values,center:!0,...n})}};var td=class extends W{constructor(e){let{resize_mode:r,fill_color:s,interpolation:n,size:o,...a}=e,i=r==="squash"?{width:o,height:o}:r==="shortest"?{shortest_edge:o}:{longest_edge:o},l=n==="bicubic"?3:2;super({...a,size:i,resample:l,do_center_crop:!0,crop_size:o,do_normalize:!0})}};var rd=class extends W{};var Ts=class extends W{post_process_panoptic_segmentation(...e){return Bp(...e)}post_process_instance_segmentation(...e){return Dp(...e)}},sd=class extends Ts{};var nd=class extends Ts{};var Ei=class extends W{},od=class extends Ei{};var Ai=class extends W{},ad=class extends Ai{};var Mi=class extends W{},id=class extends Mi{};var Ti=class extends W{},ld=class extends Ti{};var Si=class extends W{},cd=class extends Si{};var ud=class extends Ms{};var Ss=class extends W{post_process_object_detection(...e){return Hr(...e)}},pd=class extends Ss{};var dd=class extends Ss{};var Lt=336,$P=[2,3],{ceil:j0,floor:On,sqrt:G0}=Math,fd=class extends W{constructor(e){super({...e,do_normalize:!0,do_pad:!0,pad_size:"custom",do_convert_rgb:!0,do_resize:!0}),this._num_crops=e.num_crops}calc_num_image_tokens_from_image_size(e,r){let{num_img_tokens:s}=this.config;return On((On(r/Lt)*On(e/Lt)+1)*s+1+(On(r/Lt)+1)*G0(s))}get_resize_output_image_size(e,r){let s=this._num_crops,[n,o]=e.size,a=n/o,i=1;for(;i*Math.ceil(i/a)<=s;)i+=1;i-=1;let 
l=Math.floor(i*336),u=Math.floor(l/a);return[l,u]}pad_image(e,r,s,n={}){let[o,a]=r,i=Lt*j0(o/Lt),l=Lt*j0(a/Lt),u=[1,1,1].map((d,f)=>(d-this.image_mean[f])/this.image_std[f]);return super.pad_image(e,r,{width:l,height:i},{center:!0,constant_values:u,...n})}async _call(e,{num_crops:r=null}={}){if(this._num_crops=r??=this.config.num_crops,r<4||G0(r)%1!==0)throw new Error("num_crops must be a square number >= 4");Array.isArray(e)||(e=[e]);let s=e.length,n=await Promise.all(e.map(m=>this.preprocess(m))),o=n.map(m=>m.original_size),a=n.map(m=>m.reshaped_input_size),i=[];for(let{pixel_values:m}of n){m.unsqueeze_(0);let[_,w]=m.dims.slice(-2),x=await Pt(m,{size:[Lt,Lt],mode:"bicubic"});if(r>0){let k=[],E=G0(r),M=On(w/E),I=On(_/E);for(let z=0;z<E;++z)for(let C=0;C<E;++C){let v,G,X,V;z===E-1?(G=_-I,V=_):(G=z*I,V=(z+1)*I),C===E-1?(v=w-M,X=w):(v=C*M,X=(C+1)*M);let Y=await di(m,[G,v],[V,X],$P);k.push(Y)}let T=await Pt(Ee(k,0),{size:[Lt,Lt],mode:"bicubic"});i.push(Ee([x,T],0))}else i.push(x)}let l=zt(i,0),u=a.map(m=>m.map(_=>Lt*j0(_/Lt))),d=new U("int64",u.flat(),[s,2]),f=u.map(([m,_])=>this.calc_num_image_tokens_from_image_size(_,m));return{pixel_values:l,original_sizes:o,reshaped_input_sizes:a,image_sizes:d,num_img_tokens:f}}};var md=class extends W{get_resize_output_image_size(e,r){let{longest_edge:s}=r;if(s===void 0)throw new Error("size must contain 'longest_edge'");let[n,o]=e.size,a=Math.max(n,o)/s,i=n,l=o;a>1&&(i=Math.floor(n/a),l=Math.floor(o/a));let{patch_size:u,spatial_merge_size:d}=this.config;if(!d)throw new Error("config must contain 'spatial_merge_size'");let f=u*d,m=Math.floor((i-1)/f)+1,_=Math.floor((l-1)/f)+1;return[m*f,_*f]}};var hd=class extends W{};var _d=class extends W{async _call(e,...r){let{pixel_values:s,original_sizes:n,reshaped_input_sizes:o}=await super._call(e,...r),a=s,{temporal_patch_size:i,merge_size:l,patch_size:u}=this.config;a.dims[0]===1&&(a=Ee(Array.from({length:i},()=>a),0));let 
d=a.dims[0]/i,f=a.dims[1],m=Math.floor(a.dims[2]/u),_=Math.floor(a.dims[3]/u),w=a.view(d,i,f,Math.floor(m/l),l,u,Math.floor(_/l),l,u).permute(0,3,6,4,7,2,1,5,8).view(d*m*_,f*i*u*u),x=new U("int64",[d,m,_],[1,3]);return{pixel_values:w,image_grid_thw:x,original_sizes:n,reshaped_input_sizes:o}}};var gd=class extends W{post_process_object_detection(...e){return Hr(...e)}};var In=class extends W{reshape_input_points(e,r,s,n=!1){e=structuredClone(e);let o=Sy(e);if(o.length===3)n||(o=[1,...o]),e=[e];else if(o.length!==4)throw Error("The input_points must be a 4D tensor of shape `batch_size`, `point_batch_size`, `nb_points_per_image`, `2`.");for(let a=0;a<e.length;++a){let[i,l]=r[a],[u,d]=s[a],f=[d/l,u/i];for(let m=0;m<e[a].length;++m)for(let _=0;_<e[a][m].length;++_)for(let w=0;w<e[a][m][_].length;++w)e[a][m][_][w]*=f[w%2]}return new U("float32",Float32Array.from(e.flat(1/0)),o)}add_input_labels(e,r){let s=Sy(e);if(s.length===2)s=[1,...s],e=[e];else if(s.length!==3)throw Error("The input_points must be a 4D tensor of shape `batch_size`, `point_batch_size`, `nb_points_per_image`, `2`.");if(s.some((n,o)=>n!==r.dims[o]))throw Error(`The first ${s.length} dimensions of 'input_points' and 'input_labels' must be the same.`);return new U("int64",e.flat(1/0).map(BigInt),s)}async _call(e,{input_points:r=null,input_labels:s=null,input_boxes:n=null}={}){let o=await super._call(e);if(r&&(o.input_points=this.reshape_input_points(r,o.original_sizes,o.reshaped_input_sizes)),s){if(!o.input_points)throw Error("`input_points` must be provided if `input_labels` are provided.");o.input_labels=this.add_input_labels(s,o.input_points)}return n&&(o.input_boxes=this.reshape_input_points(n,o.original_sizes,o.reshaped_input_sizes,!0)),o}async post_process_masks(e,r,s,{mask_threshold:n=0,binarize:o=!0,pad_size:a=null}={}){let i=[];a=a??this.pad_size??this.size;let l=[a.height,a.width];for(let u=0;u<r.length;++u){let d=r[u],f=s[u],m=await 
Pt(e[u],{mode:"bilinear",size:l});if(m=m.slice(null,null,[0,f[0]],[0,f[1]]),m=await Pt(m,{mode:"bilinear",size:d}),o){let _=m.data,w=new Uint8Array(_.length);for(let x=0;x<_.length;++x)_[x]>n&&(w[x]=1);m=new U("bool",w,m.dims)}i.push(m)}return i}generate_crop_boxes(e,r,{crop_n_layers:s=0,overlap_ratio:n=512/1500,points_per_crop:o=32,crop_n_points_downscale_factor:a=1}={}){}};var Oi=class extends W{post_process_semantic_segmentation(...e){return Up(...e)}},wd=class extends Oi{};var Ii=class extends W{post_process_semantic_segmentation(...e){return Up(...e)}},xd=class extends Ii{};var yd=class extends W{};var bd=class extends W{pad_image(e,r,s,n={}){let[o,a,i]=r;return super.pad_image(e,r,{width:a+(s-a%s)%s,height:o+(s-o%s)%s},{mode:"symmetric",center:!1,constant_values:-1,...n})}};var Ci=class extends W{},vd=class extends Ci{};var kd=class extends W{async _call(e,r){Array.isArray(e)||(e=[e]),Array.isArray(r)||(r=[r]);let s=await Promise.all(e.map(a=>this.preprocess(a))),n=await Promise.all(r.map(a=>this.preprocess(a,{do_normalize:!1,do_convert_rgb:!1,do_convert_grayscale:!0})));return{pixel_values:zt(s.map((a,i)=>Ee([a.pixel_values,n[i].pixel_values],0)),0),original_sizes:s.map(a=>a.original_size),reshaped_input_sizes:s.map(a=>a.reshaped_input_size)}}};var Ed=class extends W{post_process_pose_estimation(e,r,{threshold:s=null}={}){let n=e.tolist(),[o,a,i,l]=e.dims,u=[];for(let d=0;d<o;++d){let f=n[d],m=r[d],_=[];for(let w=0;w<m.length;++w){let x=m[w],k=[],E=[],M=[],I=x.at(-2)/l,T=x.at(-1)/i;for(let z=0;z<f.length;++z){let[C,v]=[0,0],G=0,X=-1/0,V=f[z];for(let K=0;K<V.length;++K){let Y=V[K];for(let B=0;B<Y.length;++B){let P=Y[B];G+=P,X=Math.max(X,P),C+=(B+.5)*P,v+=K*P}}if(s!=null&&X<s)continue;let Q=[I*C/G,T*v/G];k.push(Q),M.push(z),E.push(X)}_.push({bbox:x,scores:E,labels:M,keypoints:k})}u.push(_)}return u}};var Pi=class extends W{post_process_object_detection(...e){return Hr(...e)}},Ad=class extends Pi{};var Le=class{static async from_pretrained(e,r={}){let s=await 
it(e,En,!0,r),n=s.image_processor_type??s.feature_extractor_type,o=Cn[n?.replace(/Fast$/,"")];return o||(n!==void 0&&console.warn(`Image processor type '${n}' not found, assuming base ImageProcessor. Please report this at ${kn}.`),o=W),new o(s)}};var Md=class extends ne{static tokenizer_class=J;static image_processor_class=Le;constructor(e,r,s){super(e,r,s);let{tasks_answer_post_processing_type:n,task_prompts_without_inputs:o,task_prompts_with_input:a}=this.image_processor.config;this.tasks_answer_post_processing_type=new Map(Object.entries(n??{})),this.task_prompts_without_inputs=new Map(Object.entries(o??{})),this.task_prompts_with_input=new Map(Object.entries(a??{})),this.regexes={quad_boxes:/(.+?)<loc_(\d+)><loc_(\d+)><loc_(\d+)><loc_(\d+)><loc_(\d+)><loc_(\d+)><loc_(\d+)><loc_(\d+)>/gm,bboxes:/([^<]+)?<loc_(\d+)><loc_(\d+)><loc_(\d+)><loc_(\d+)>/gm},this.size_per_bin=1e3}construct_prompts(e){typeof e=="string"&&(e=[e]);let r=[];for(let s of e)if(this.task_prompts_without_inputs.has(s))r.push(this.task_prompts_without_inputs.get(s));else{for(let[n,o]of this.task_prompts_with_input)if(s.includes(n)){r.push(o.replaceAll("{input}",s).replaceAll(n,""));break}r.length!==e.length&&r.push(s)}return r}post_process_generation(e,r,s){let n=this.tasks_answer_post_processing_type.get(r)??"pure_text";e=e.replaceAll("<s>","").replaceAll("</s>","");let o;switch(n){case"pure_text":o=e;break;case"description_with_bboxes":case"bboxes":case"phrase_grounding":case"ocr":let a=n==="ocr"?"quad_boxes":"bboxes",i=e.matchAll(this.regexes[a]),l=[],u=[];for(let[d,f,...m]of i)l.push(f?f.trim():l.at(-1)??""),u.push(m.map((_,w)=>(Number(_)+.5)/this.size_per_bin*s[w%2]));o={labels:l,[a]:u};break;default:throw new Error(`Task "${r}" (of type "${n}") not yet implemented.`)}return{[r]:o}}async _call(e,r=null,s={}){if(!e&&!r)throw new Error("Either text or images must be provided");let n=await this.image_processor(e,s),o=r?this.tokenizer(this.construct_prompts(r),s):{};return{...n,...o}}};var 
Td=class extends ne{static image_processor_class=Le;static feature_extractor_class=Ze;static tokenizer_class=J;static uses_processor_config=!0;static uses_chat_template_file=!0;constructor(e,r,s){super(e,r,s),this.audio_seq_length=this.config.audio_seq_length,this.image_seq_length=this.config.image_seq_length;let{audio_token_id:n,boa_token:o,audio_token:a,eoa_token:i,image_token_id:l,boi_token:u,image_token:d,eoi_token:f}=this.tokenizer.config;this.audio_token_id=n,this.boa_token=o,this.audio_token=a;let m=a.repeat(this.audio_seq_length);this.full_audio_sequence=`
|
|
14
|
+
`))[0]=="Error"&&g.shift(),Qb(g);for(var b=3;g[b]&&Vc(g[b])!=c;)++b;for(c=0;c<h&&g[c+b];++c)(v(),B)[p+4*c>>>2>>>0]=Vc(g[c+b]);return c}var nr=c=>{var p=mr(c)+1,h=Qc(p);return fr(c,h,p),h},ay=[],xt=(c,p)=>{ay[c>>>=0]=p},or=[],Xc=[],nn=(c,p)=>{Xc[c]=new Promise(h=>p.finally(()=>h(c)))},re=c=>{if(c)return ay[c>>>0]},Kc=(c,p,h)=>{(v(),P)[c>>>2>>>0]=p,(v(),P)[c+4>>>2>>>0]=h},Jb=c=>{var p=(v(),P)[c>>>2>>>0];return c=(v(),P)[c+4>>>2>>>0],rn(p,c)},hr=c=>{var p=(v(),P)[c>>>2>>>0];return c=(v(),P)[c+4>>>2>>>0],p?rn(p,c):c===0?"":void 0},MM=c=>{var p=hr(c+4),h=(h=(v(),P)[c+12>>>2>>>0])?re(h):"auto";if(c+=16){var g=re((v(),P)[c+4>>>2>>>0]),b=(v(),P)[c+16>>>2>>>0],A=(v(),P)[c+20>>>2>>>0];if(b){for(var O={},N=0;N<b;++N){var D=A+24*N;O[Jb(D+4)]=(v(),ie)[D+16>>>3>>>0]}b=O}else b=void 0;c={module:g,constants:b,entryPoint:hr(c+8)}}else c=void 0;return{label:p,layout:h,compute:c}},Zb=(c,p)=>{function h(b,A){b=c[b],(v(),B)[p+A>>>2>>>0]=b}function g(b,A){b=c[b],(v(),S)[p+A>>>3>>>0]=BigInt(b)}h("maxTextureDimension1D",4),h("maxTextureDimension2D",8),h("maxTextureDimension3D",12),h("maxTextureArrayLayers",16),h("maxBindGroups",20),h("maxBindGroupsPlusVertexBuffers",24),h("maxBindingsPerBindGroup",28),h("maxDynamicUniformBuffersPerPipelineLayout",32),h("maxDynamicStorageBuffersPerPipelineLayout",36),h("maxSampledTexturesPerShaderStage",40),h("maxSamplersPerShaderStage",44),h("maxStorageBuffersPerShaderStage",48),h("maxStorageTexturesPerShaderStage",52),h("maxUniformBuffersPerShaderStage",56),h("minUniformBufferOffsetAlignment",80),h("minStorageBufferOffsetAlignment",84),g("maxUniformBufferBindingSize",64),g("maxStorageBufferBindingSize",72),h("maxVertexBuffers",88),g("maxBufferSize",96),h("maxVertexAttributes",104),h("maxVertexBufferArrayStride",108),h("maxInterStageShaderVariables",112),h("maxColorAttachments",116),h("maxColorAttachmentBytesPerSample",120),h("maxComputeWorkgroupStorageSize",124),h("maxComputeInvocationsPerWorkgroup",128),h("maxComputeWorkgroupSizeX",132),h("maxComputeWork
groupSizeY",136),h("maxComputeWorkgroupSizeZ",140),h("maxComputeWorkgroupsPerDimension",144),c.Le!==void 0&&h("maxImmediateSize",148)},TM=[,"validation","out-of-memory","internal"],SM=[,"compatibility","core"],e1={1:"core-features-and-limits",2:"depth-clip-control",3:"depth32float-stencil8",4:"texture-compression-bc",5:"texture-compression-bc-sliced-3d",6:"texture-compression-etc2",7:"texture-compression-astc",8:"texture-compression-astc-sliced-3d",9:"timestamp-query",10:"indirect-first-instance",11:"shader-f16",12:"rg11b10ufloat-renderable",13:"bgra8unorm-storage",14:"float32-filterable",15:"float32-blendable",16:"clip-distances",17:"dual-source-blending",18:"subgroups",19:"texture-formats-tier1",20:"texture-formats-tier2",21:"primitive-index",327692:"chromium-experimental-unorm16-texture-formats",327693:"chromium-experimental-snorm16-texture-formats",327732:"chromium-experimental-multi-draw-indirect"},OM=[,"low-power","high-performance"],IM=[,"occlusion","timestamp"],CM={undefined:1,unknown:1,destroyed:2};function PM(c,p,h,g,b,A){p=wt(p),h=wt(h),g>>>=0,b>>>=0,A>>>=0;var O=re(c>>>0);if(c={},A){var N=(v(),P)[A+12>>>2>>>0];if(N){var D=(v(),P)[A+16>>>2>>>0];c.requiredFeatures=Array.from((v(),P).subarray(D>>>2>>>0,D+4*N>>>2>>>0),ee=>e1[ee])}var q=(v(),P)[A+20>>>2>>>0];if(q){let ee=function(Ut,nt,ls=!1){nt=q+nt,(nt=(v(),P)[nt>>>2>>>0])==4294967295||ls&&nt==0||(Re[Ut]=nt)},ct=function(Ut,nt){nt=q+nt;var ls=(v(),P)[nt>>>2>>>0],oS=(v(),P)[nt+4>>>2>>>0];ls==4294967295&&oS==4294967295||(Re[Ut]=4294967296*(v(),P)[nt+4>>>2>>>0]+(v(),P)[nt>>>2>>>0])};var 
fe=ee,me=ct,Re={};ee("maxTextureDimension1D",4),ee("maxTextureDimension2D",8),ee("maxTextureDimension3D",12),ee("maxTextureArrayLayers",16),ee("maxBindGroups",20),ee("maxBindGroupsPlusVertexBuffers",24),ee("maxDynamicUniformBuffersPerPipelineLayout",32),ee("maxDynamicStorageBuffersPerPipelineLayout",36),ee("maxSampledTexturesPerShaderStage",40),ee("maxSamplersPerShaderStage",44),ee("maxStorageBuffersPerShaderStage",48),ee("maxStorageTexturesPerShaderStage",52),ee("maxUniformBuffersPerShaderStage",56),ee("minUniformBufferOffsetAlignment",80),ee("minStorageBufferOffsetAlignment",84),ct("maxUniformBufferBindingSize",64),ct("maxStorageBufferBindingSize",72),ee("maxVertexBuffers",88),ct("maxBufferSize",96),ee("maxVertexAttributes",104),ee("maxVertexBufferArrayStride",108),ee("maxInterStageShaderVariables",112),ee("maxColorAttachments",116),ee("maxColorAttachmentBytesPerSample",120),ee("maxComputeWorkgroupStorageSize",124),ee("maxComputeInvocationsPerWorkgroup",128),ee("maxComputeWorkgroupSizeX",132),ee("maxComputeWorkgroupSizeY",136),ee("maxComputeWorkgroupSizeZ",140),ee("maxComputeWorkgroupsPerDimension",144),ee("maxImmediateSize",148,!0),c.requiredLimits=Re}(N=(v(),P)[A+24>>>2>>>0])&&(N={label:hr(N+4)},c.defaultQueue=N),c.label=hr(A+4)}ge+=1,nn(p,O.requestDevice(c).then(ee=>{--ge,xt(b,ee.queue),xt(g,ee),h&&(ge+=1,nn(h,ee.lost.then(ct=>{--ge,ee.onuncapturederror=()=>{};var Ut=ae(),nt=nr(ct.message);py(h,CM[ct.reason],nt),oe(Ut)}))),ee.onuncapturederror=ct=>{var Ut=5;ct.error instanceof GPUValidationError?Ut=2:ct.error instanceof GPUOutOfMemoryError?Ut=3:ct.error instanceof GPUInternalError&&(Ut=4);var nt=ae();ct=nr(ct.error.message),b1(g,Ut,ct),oe(nt)},"adapterInfo"in ee||(ee.adapterInfo=O.info),my(p,1,g,0)},ee=>{--ge;var ct=ae();ee=nr(ee.message),my(p,3,g,ee),h&&py(h,4,ee),oe(ct)}))}function zM(c){var p=re(c>>>=0),h=or[c];if(h){for(var g=0;g<h.length;++g)h[g]();delete or[c]}p.destroy()}var on=()=>{var c="getMappedRange size=0 no longer means 
WGPU_WHOLE_MAP_SIZE";on.ed||(on.ed={}),on.ed[c]||(on.ed[c]=1,T(c))};function LM(c,p,h){p>>>=0,h>>>=0;var g=re(c>>>=0);h===0&&on(),h==4294967295&&(h=void 0);try{var b=g.getMappedRange(p,h)}catch{return 0}var A=gy(16,b.byteLength);return(v(),Q).set(new Uint8Array(b),A>>>0),or[c].push(()=>Rt(A)),A}function NM(c,p,h){p>>>=0,h>>>=0;var g=re(c>>>=0);h===0&&on(),h==4294967295&&(h=void 0);try{var b=g.getMappedRange(p,h)}catch{return 0}var A=gy(16,b.byteLength);return(v(),Q).fill(0,A,b.byteLength),or[c].push(()=>{new Uint8Array(b).set((v(),Q).subarray(A>>>0,A+b.byteLength>>>0)),Rt(A)}),A}function $M(c,p,h,g,b){c>>>=0,p=wt(p),h=wt(h),b>>>=0;var A=re(c);or[c]=[],b==4294967295&&(b=void 0),ge+=1,nn(p,A.mapAsync(h,g>>>0,b).then(()=>{--ge,dy(p,1,0)},O=>{--ge,ae();var N=nr(O.message);dy(p,O.name==="AbortError"?4:O.name==="OperationError"?3:0,N),delete or[c]}))}function RM(c){var p=re(c>>>=0),h=or[c];if(h){for(var g=0;g<h.length;++g)h[g]();delete or[c],p.unmap()}}function UM(c){delete ay[c>>>0]}function BM(c,p,h){c>>>=0,p>>>=0,h>>>=0;var g=!!(v(),P)[p+32>>>2>>>0];p={label:hr(p+4),usage:(v(),P)[p+16>>>2>>>0],size:4294967296*(v(),P)[p+28>>>2>>>0]+(v(),P)[p+24>>>2>>>0],mappedAtCreation:g},c=re(c);try{var b=c.createBuffer(p)}catch{return!1}return xt(h,b),g&&(or[h]=[]),!0}function DM(c,p,h,g){c>>>=0,p=wt(p),g>>>=0,h=MM(h>>>0),c=re(c),ge+=1,nn(p,c.createComputePipelineAsync(h).then(b=>{--ge,xt(g,b),uy(p,1,g,0)},b=>{--ge;var A=ae(),O=nr(b.message);uy(p,b.reason==="validation"?3:b.reason==="internal"?4:0,g,O),oe(A)}))}function FM(c,p,h){c>>>=0,p>>>=0,h>>>=0;var g=(v(),P)[p>>>2>>>0],b=(v(),P)[g+4>>>2>>>0];p={label:hr(p+4),code:""},b===2&&(p.code=Jb(g+8)),xt(h,re(c).createShaderModule(p))}var jM=c=>{(c=re(c)).onuncapturederror=null,c.destroy()};function GM(c,p){p=wt(p),c=re(c>>>0),ge+=1,nn(p,c.popErrorScope().then(h=>{--ge;var g=5;h?h instanceof GPUValidationError?g=2:h instanceof GPUOutOfMemoryError?g=3:h instanceof GPUInternalError&&(g=4):g=1;var 
b=ae();h=h?nr(h.message):0,fy(p,1,g,h),oe(b)},h=>{--ge;var g=ae();h=nr(h.message),fy(p,1,5,h),oe(g)}))}function qM(c,p,h,g){if(p=wt(p),g>>>=0,h>>>=0){var b=(v(),P)[h+4>>>2>>>0];b={featureLevel:SM[b],powerPreference:OM[(v(),P)[h+8>>>2>>>0]],forceFallbackAdapter:!!(v(),P)[h+12>>>2>>>0]},(h=(v(),P)[h>>>2>>>0])!==0&&(v(),b.Qe=!!(v(),P)[h+8>>>2>>>0])}"gpu"in navigator?(ge+=1,nn(p,navigator.gpu.requestAdapter(b).then(A=>{if(--ge,A)xt(g,A),Wa(p,1,g,0);else{A=ae();var O=nr("WebGPU not available on this browser (requestAdapter returned null)");Wa(p,3,g,O),oe(A)}},A=>{--ge;var O=ae();A=nr(A.message),Wa(p,4,g,A),oe(O)}))):(h=ae(),b=nr("WebGPU not available on this browser (navigator.gpu is not available)"),Wa(p,3,g,b),oe(h))}function WM(c,p,h){return c>>>=0,p>>>=0,h>>>=0,Fb(async()=>{var g=[];if(h){var b=(v(),B)[h>>>2>>>0];g.length=p+1,g[p]=new Promise(N=>setTimeout(N,b,0))}else g.length=p;for(var A=0;A<p;++A){var O=4294967296*(v(),P)[c+8*A+4>>>2>>>0]+(v(),P)[c+8*A>>>2>>>0];if(!(O in Xc))return O;g[A]=Xc[O]}return g=await Promise.race(g),delete Xc[g],g})}var iy,ly={},t1=()=>{if(!iy){var c,p={USER:"web_user",LOGNAME:"web_user",PATH:"/",PWD:"/",HOME:"/home/web_user",LANG:(globalThis.navigator?.language??"C").replace("-","_")+".UTF-8",_:"./this.program"};for(c in ly)ly[c]===void 0?delete p[c]:p[c]=ly[c];var h=[];for(c in p)h.push(`${c}=${p[c]}`);iy=h}return iy};function r1(c,p){if(n)return $e(19,1,c,p);c>>>=0,p>>>=0;var h,g=0,b=0;for(h of t1()){var A=p+g;(v(),P)[c+b>>>2>>>0]=A,g+=fr(h,A,1/0)+1,b+=4}return 0}function s1(c,p){if(n)return $e(20,1,c,p);c>>>=0,p>>>=0;var h=t1();for(var g of((v(),P)[c>>>2>>>0]=h.length,c=0,h))c+=mr(g)+1;return(v(),P)[p>>>2>>>0]=c,0}function n1(c){return n?$e(21,1,c):52}function o1(c,p,h,g){return n?$e(22,1,c,p,h,g):52}function a1(c,p,h,g){return n?$e(23,1,c,p,h,g):70}var VM=[null,[],[]];function i1(c,p,h,g){if(n)return $e(24,1,c,p,h,g);p>>>=0,h>>>=0,g>>>=0;for(var b=0,A=0;A<h;A++){var O=(v(),P)[p>>>2>>>0],N=(v(),P)[p+4>>>2>>>0];p+=8;for(var 
D=0;D<N;D++){var q=c,fe=(v(),Q)[O+D>>>0],me=VM[q];fe===0||fe===10?((q===1?I:T)(bb(me)),me.length=0):me.push(fe)}b+=N}return(v(),P)[g>>>2>>>0]=b,0}function HM(c){return c>>>0}function XM(c,p){return Zb(re(c>>>0).limits,p>>>0),1}function KM(c,p){return re(c>>>0).features.has(e1[p])}function YM(c){return BigInt(re(c>>>0).size)}function QM(c){return BigInt(re(c>>>0).usage)}function JM(c,p){if(c>>>=0,p>>>=0){var h=hr(p+4);h={label:h,timestampWrites:p=(p=(v(),P)[p+12>>>2>>>0])!==0?{querySet:re((v(),P)[p+4>>>2>>>0]),beginningOfPassWriteIndex:(v(),P)[p+8>>>2>>>0],endOfPassWriteIndex:(v(),P)[p+12>>>2>>>0]}:void 0}}return c=re(c),p=_1(0),xt(p,c.beginComputePass(h)),p}function ZM(c,p,h,g,b,A){h=wt(h),b=wt(b),A=wt(A),re(c>>>0).copyBufferToBuffer(re(p>>>0),h,re(g>>>0),b,A)}function eT(c){c=re(c>>>0);var p=m1(0);return xt(p,c.finish()),p}function tT(c,p,h,g,b,A){A=wt(A),re(c>>>0).resolveQuerySet(re(p>>>0),h,g,re(b>>>0),A)}function rT(c,p,h,g){re(c>>>0).dispatchWorkgroups(p,h,g)}function sT(c,p,h){h=wt(h),re(c>>>0).dispatchWorkgroupsIndirect(re(p>>>0),h)}function nT(c){re(c>>>0).end()}function oT(c,p,h,g,b){g>>>=0,b>>>=0,c=re(c>>>0),h=re(h>>>0),g==0?c.setBindGroup(p,h):c.setBindGroup(p,h,(v(),P),b>>>2,g)}function aT(c,p){re(c>>>0).setPipeline(re(p>>>0))}function iT(c,p,h){re(c>>>0).Pe(re(p>>>0),h)}function lT(c,p){c=re(c>>>0);var h=f1(0);return xt(h,c.getBindGroupLayout(p)),h}function cT(c,p){c>>>=0;var h=hr(4+(p>>>=0)),g=re((v(),P)[p+12>>>2>>>0]),b=(v(),P)[p+16>>>2>>>0];p=(v(),P)[p+20>>>2>>>0];for(var A=[],O=0;O<b;++O){var N=A,D=N.push,q=p+40*O,fe=(v(),P)[q+8>>>2>>>0],me=(v(),P)[q+32>>>2>>>0],Re=(v(),P)[q+36>>>2>>>0],ee=(v(),P)[q+4>>>2>>>0];fe?(me=q+24,(me=(v(),P)[me>>>2>>>0]+4294967296*(v(),B)[me+4>>>2>>>0])==-1&&(me=void 0),q={binding:ee,resource:{buffer:re(fe),offset:4294967296*(v(),P)[q+4+16>>>2>>>0]+(v(),P)[q+16>>>2>>>0],size:me}}):q=me?{binding:ee,resource:re(me)}:{binding:ee,resource:re(Re)},D.call(N,q)}return 
h={label:h,layout:g,entries:A},c=re(c),g=d1(0),xt(g,c.createBindGroup(h)),g}function uT(c,p){var h;return c>>>=0,(p>>>=0)&&(h={label:hr(p+4)}),c=re(c),p=h1(0),xt(p,c.createCommandEncoder(h)),p}function pT(c,p){c>>>=0,p>>>=0,p={type:IM[(v(),P)[p+12>>>2>>>0]],count:(v(),P)[p+16>>>2>>>0]},c=re(c);var h=g1(0);return xt(h,c.createQuerySet(p)),h}function dT(c,p){c=re(c>>>0).adapterInfo,p>>>=0,(v(),B)[p+52>>>2>>>0]=c.subgroupMinSize,(v(),B)[p+56>>>2>>>0]=c.subgroupMaxSize;var h=Yb(c.vendor+c.architecture+c.device+c.description),g=mr(c.vendor);return Kc(p+4,h,g),h+=g,g=mr(c.architecture),Kc(p+12,h,g),h+=g,g=mr(c.device),Kc(p+20,h,g),Kc(p+28,h+g,mr(c.description)),(v(),B)[p+36>>>2>>>0]=2,c=c.isFallbackAdapter?3:4,(v(),B)[p+40>>>2>>>0]=c,(v(),B)[p+44>>>2>>>0]=0,(v(),B)[p+48>>>2>>>0]=0,1}var fT={"core-features-and-limits":1,"depth-clip-control":2,"depth32float-stencil8":3,"texture-compression-bc":4,"texture-compression-bc-sliced-3d":5,"texture-compression-etc2":6,"texture-compression-astc":7,"texture-compression-astc-sliced-3d":8,"timestamp-query":9,"indirect-first-instance":10,"shader-f16":11,"rg11b10ufloat-renderable":12,"bgra8unorm-storage":13,"float32-filterable":14,"float32-blendable":15,"clip-distances":16,"dual-source-blending":17,subgroups:18,"texture-formats-tier1":19,"texture-formats-tier2":20,"primitive-index":21,"chromium-experimental-unorm16-texture-formats":327692,"chromium-experimental-snorm16-texture-formats":327693,"chromium-experimental-multi-draw-indirect":327732};function mT(c,p){p>>>=0,c=re(c>>>0);var h=an(4*c.features.size),g=0,b=0;c.features.forEach(A=>{0<=(A=fT[A])&&((v(),B)[h+g>>>2>>>0]=A,g+=4,b++)}),(v(),P)[p+4>>>2>>>0]=h,(v(),P)[p>>>2>>>0]=b}function hT(c,p){return Zb(re(c>>>0).limits,p>>>0),1}function _T(c,p){re(c>>>0).pushErrorScope(TM[p])}function gT(c,p,h){p>>>=0,h>>>=0,c=re(c>>>0),p=Array.from((v(),B).subarray(h>>>2>>>0,h+4*p>>>2>>>0),g=>re(g)),c.submit(p)}function 
wT(c,p,h,g,b){h=wt(h),g>>>=0,b>>>=0,c=re(c>>>0),p=re(p>>>0),g=(v(),Q).subarray(g>>>0,g+b>>>0),c.writeBuffer(p,h,g,0,b)}n||(function(){for(var c=e.numThreads-1;c--;)mb();Me.push(async()=>{var p=(async function(){if(!n)return Promise.all(tt.map(fb))})();xe++,await p,--xe==0&&qe&&(p=qe,qe=null,p())})})(),n||($r=new WebAssembly.Memory({initial:256,maximum:65536,shared:!0}),ue()),e.wasmBinary&&(f=e.wasmBinary),e.stackSave=()=>ae(),e.stackRestore=c=>oe(c),e.stackAlloc=c=>Qc(c),e.setValue=function(c,p,h="i8"){switch(h.endsWith("*")&&(h="*"),h){case"i1":case"i8":(v(),V)[c>>>0]=p;break;case"i16":(v(),K)[c>>>1>>>0]=p;break;case"i32":(v(),B)[c>>>2>>>0]=p;break;case"i64":(v(),S)[c>>>3>>>0]=BigInt(p);break;case"float":(v(),se)[c>>>2>>>0]=p;break;case"double":(v(),ie)[c>>>3>>>0]=p;break;case"*":(v(),P)[c>>>2>>>0]=p;break;default:Pe(`invalid type for setValue: ${h}`)}},e.getValue=function(c,p="i8"){switch(p.endsWith("*")&&(p="*"),p){case"i1":case"i8":return(v(),V)[c>>>0];case"i16":return(v(),K)[c>>>1>>>0];case"i32":return(v(),B)[c>>>2>>>0];case"i64":return(v(),S)[c>>>3>>>0];case"float":return(v(),se)[c>>>2>>>0];case"double":return(v(),ie)[c>>>3>>>0];case"*":return(v(),P)[c>>>2>>>0];default:Pe(`invalid type for getValue: ${p}`)}},e.UTF8ToString=rn,e.stringToUTF8=fr,e.lengthBytesUTF8=mr;var l1,c1,cy,Yc,Rt,an,u1,p1,d1,f1,m1,h1,_1,g1,w1,x1,y1,uy,py,dy,fy,Wa,my,b1,hy,v1,k1,E1,_y,A1,M1,gy,he,Va,T1,oe,Qc,ae,S1,wy,O1,I1,C1,xy,P1,z1,L1,N1,$1,R1,U1,B1,D1,F1,j1,G1,q1,W1,V1,H1,X1,K1,Y1,Q1,J1,Z1,ev,tv,rv,sv,nv,ov,av,iv,lv,cv,uv,pv,dv,fv,mv,hv,_v,gv,_r,xT=[Nr,ns,gb,vb,kb,Eb,Ab,Mb,Tb,Sb,Ob,Ib,Cb,Pb,zb,Lb,Vb,Hb,Xb,r1,s1,n1,o1,a1,i1],yy={1117404:(c,p,h,g,b)=>{if(e===void 0||!e.Zc)return 1;if((c=rn(Number(c>>>0))).startsWith("./")&&(c=c.substring(2)),!(c=e.Zc.get(c)))return 2;if(p=Number(p>>>0),h=Number(h>>>0),g=Number(g>>>0),p+h>c.byteLength)return 3;try{let A=c.subarray(p,p+h);switch(b){case 0:(v(),Q).set(A,g>>>0);break;case 1:e.ie?e.ie(g,A):e.Ke(g,A);break;default:return 4}return 0}catch{return 
4}},1118228:(c,p,h)=>{e.ke(c,(v(),Q).subarray(p>>>0,p+h>>>0))},1118292:()=>e.Ie(),1118334:c=>{e.je(c)},1118371:()=>typeof wasmOffsetConverter<"u"};function yT(){return typeof wasmOffsetConverter<"u"}function bT(c,p,h,g){var b=ae();try{return B1(c,p,h,g)}catch(A){if(oe(b),A!==A+0)throw A;he(1,0)}}function vT(c,p,h){var g=ae();try{return $1(c,p,h)}catch(b){if(oe(g),b!==b+0)throw b;he(1,0)}}function kT(c,p,h){var g=ae();try{C1(c,p,h)}catch(b){if(oe(g),b!==b+0)throw b;he(1,0)}}function ET(c,p){var h=ae();try{return xy(c,p)}catch(g){if(oe(h),g!==g+0)throw g;he(1,0)}}function AT(c){var p=ae();try{P1(c)}catch(h){if(oe(p),h!==h+0)throw h;he(1,0)}}function MT(c,p,h,g,b,A,O){var N=ae();try{return N1(c,p,h,g,b,A,O)}catch(D){if(oe(N),D!==D+0)throw D;he(1,0)}}function TT(c,p){var h=ae();try{D1(c,p)}catch(g){if(oe(h),g!==g+0)throw g;he(1,0)}}function ST(c,p,h,g,b,A){var O=ae();try{z1(c,p,h,g,b,A)}catch(N){if(oe(O),N!==N+0)throw N;he(1,0)}}function OT(c,p,h,g){var b=ae();try{U1(c,p,h,g)}catch(A){if(oe(b),A!==A+0)throw A;he(1,0)}}function IT(c,p,h,g,b,A,O){var N=ae();try{j1(c,p,h,g,b,A,O)}catch(D){if(oe(N),D!==D+0)throw D;he(1,0)}}function CT(c,p,h,g,b,A,O){var N=ae();try{G1(c,p,h,g,b,A,O)}catch(D){if(oe(N),D!==D+0)throw D;he(1,0)}}function PT(c,p,h,g,b,A,O,N){var D=ae();try{Z1(c,p,h,g,b,A,O,N)}catch(q){if(oe(D),q!==q+0)throw q;he(1,0)}}function zT(c,p,h,g,b){var A=ae();try{L1(c,p,h,g,b)}catch(O){if(oe(A),O!==O+0)throw O;he(1,0)}}function LT(c,p,h,g,b){var A=ae();try{return F1(c,p,h,g,b)}catch(O){if(oe(A),O!==O+0)throw O;he(1,0)}}function NT(c,p,h,g,b,A,O,N){var D=ae();try{ev(c,p,h,g,b,A,O,N)}catch(q){if(oe(D),q!==q+0)throw q;he(1,0)}}function $T(c,p,h,g,b,A,O,N,D,q,fe,me){var Re=ae();try{q1(c,p,h,g,b,A,O,N,D,q,fe,me)}catch(ee){if(oe(Re),ee!==ee+0)throw ee;he(1,0)}}function RT(c,p,h,g,b,A){var O=ae();try{return Q1(c,p,h,g,b,A)}catch(N){if(oe(O),N!==N+0)throw N;he(1,0)}}function UT(c,p,h){var g=ae();try{return X1(c,p,h)}catch(b){if(oe(g),b!==b+0)throw b;return he(1,0),0n}}function 
BT(c,p,h,g,b,A,O,N,D){var q=ae();try{R1(c,p,h,g,b,A,O,N,D)}catch(fe){if(oe(q),fe!==fe+0)throw fe;he(1,0)}}function DT(c){var p=ae();try{return V1(c)}catch(h){if(oe(p),h!==h+0)throw h;he(1,0)}}function FT(c,p,h){var g=ae();try{return tv(c,p,h)}catch(b){if(oe(g),b!==b+0)throw b;he(1,0)}}function jT(c,p){var h=ae();try{return fv(c,p)}catch(g){if(oe(h),g!==g+0)throw g;return he(1,0),0n}}function GT(c,p,h,g,b){var A=ae();try{rv(c,p,h,g,b)}catch(O){if(oe(A),O!==O+0)throw O;he(1,0)}}function qT(c){var p=ae();try{return W1(c)}catch(h){if(oe(p),h!==h+0)throw h;return he(1,0),0n}}function WT(c,p,h,g,b,A){var O=ae();try{return ov(c,p,h,g,b,A)}catch(N){if(oe(O),N!==N+0)throw N;he(1,0)}}function VT(c,p,h,g,b,A){var O=ae();try{return av(c,p,h,g,b,A)}catch(N){if(oe(O),N!==N+0)throw N;he(1,0)}}function HT(c,p,h,g,b,A,O,N){var D=ae();try{return J1(c,p,h,g,b,A,O,N)}catch(q){if(oe(D),q!==q+0)throw q;he(1,0)}}function XT(c,p,h,g,b){var A=ae();try{return iv(c,p,h,g,b)}catch(O){if(oe(A),O!==O+0)throw O;return he(1,0),0n}}function KT(c,p,h,g){var b=ae();try{return lv(c,p,h,g)}catch(A){if(oe(b),A!==A+0)throw A;he(1,0)}}function YT(c,p,h,g){var b=ae();try{return cv(c,p,h,g)}catch(A){if(oe(b),A!==A+0)throw A;he(1,0)}}function QT(c,p,h,g,b,A,O,N,D,q,fe,me){var Re=ae();try{return uv(c,p,h,g,b,A,O,N,D,q,fe,me)}catch(ee){if(oe(Re),ee!==ee+0)throw ee;he(1,0)}}function JT(c,p,h,g,b,A,O,N,D,q,fe){var me=ae();try{sv(c,p,h,g,b,A,O,N,D,q,fe)}catch(Re){if(oe(me),Re!==Re+0)throw Re;he(1,0)}}function ZT(c,p,h,g,b,A,O,N,D,q,fe,me,Re,ee,ct,Ut){var nt=ae();try{nv(c,p,h,g,b,A,O,N,D,q,fe,me,Re,ee,ct,Ut)}catch(ls){if(oe(nt),ls!==ls+0)throw ls;he(1,0)}}function eS(c,p,h,g){var b=ae();try{return pv(c,p,h,g)}catch(A){if(oe(b),A!==A+0)throw A;he(1,0)}}function tS(c,p,h,g,b){var A=ae();try{return dv(c,p,h,g,b)}catch(O){if(oe(A),O!==O+0)throw O;he(1,0)}}function rS(c,p,h){var g=ae();try{return H1(c,p,h)}catch(b){if(oe(g),b!==b+0)throw b;he(1,0)}}function sS(c,p,h){var g=ae();try{return 
K1(c,p,h)}catch(b){if(oe(g),b!==b+0)throw b;he(1,0)}}function nS(c,p,h,g){var b=ae();try{Y1(c,p,h,g)}catch(A){if(oe(b),A!==A+0)throw A;he(1,0)}}function Jc(){if(0<xe)qe=Jc;else if(n)w?.(e),Be();else{for(var c=Me;0<c.length;)c.shift()(e);0<xe?qe=Jc:(e.calledRun=!0,z||(Be(),w?.(e)))}}return n||(_r=await Qe(),Jc()),e.PTR_SIZE=4,e.webgpuInit=c=>{let p=new WeakMap,h,g,b=1;e.webgpuRegisterDevice=N=>{if(g!==void 0)throw Error("another WebGPU EP inference session is being created.");if(N){var D=p.get(N);if(!D){let q=((fe,me=0)=>{var Re=y1(me);return me=x1(me,Re),xt(Re,fe.queue),xt(me,fe),me})(N,D=p1(0));D=[b++,D,q],p.set(N,D)}return h=N,g=D[0],D}h=void 0,g=0};let A=new Map;e.webgpuOnCreateSession=N=>{if(g!==void 0){var D=g;if(g=void 0,N){let q=cy(D);A.set(N,q),D===0&&c(h??re(q))}h=void 0}},e.webgpuOnReleaseSession=N=>{A.delete(N)};let O=Symbol("gpuBufferMetadata");e.webgpuRegisterBuffer=(N,D,q)=>{if(q)return N[O]=[q,NaN],q;if(q=N[O])return q[1]++,q[0];if((D=A.get(D))===void 0)throw Error("Invalid session handle passed to webgpuRegisterBuffer");return D=((fe,me=0)=>(fe.mapState!="pending"||Pe(),me=w1(me,fe.mapState=="mapped"?3:1),xt(me,fe),fe.mapState=="mapped"&&(or[me]=[]),me))(N,D),N[O]=[D,1],D},e.webgpuUnregisterBuffer=N=>{let D=N[O];if(!D)throw Error("Buffer is not registered");D[1]--,D[1]===0&&(u1(D[0]),delete N[O])},e.webgpuGetBuffer=N=>re(N),e.webgpuCreateDownloader=(N,D,q)=>{if((q=A.get(q))===void 0)throw Error("Invalid session handle passed to webgpuRegisterBuffer");let fe=re(q),me=16*Math.ceil(Number(D)/16);return async()=>{let Re=fe.createBuffer({size:me,usage:9});try{let ee=fe.createCommandEncoder();return ee.copyBufferToBuffer(N,0,Re,0,me),fe.queue.submit([ee.finish()]),await Re.mapAsync(GPUMapMode.READ),Re.getMappedRange().slice(0,D)}finally{Re.destroy()}}},e.ie=(N,D)=>{var q=D.buffer;let fe=D.byteOffset,me=D.byteLength;if(D=16*Math.ceil(Number(me)/16),N=re(N),!h){var Re=cy(g);h=re(Re)}let 
ee=(Re=h.createBuffer({mappedAtCreation:!0,size:D,usage:6})).getMappedRange();new Uint8Array(ee).set(new Uint8Array(q,fe,me)),Re.unmap(),(q=h.createCommandEncoder()).copyBufferToBuffer(Re,0,N,0,D),h.queue.submit([q.finish()]),Re.destroy()}},e.webnnInit=c=>{let p=c[0];[e.Ie,e.je,e.webnnEnsureTensor,e.ke,e.webnnDownloadTensor,e.He,e.webnnEnableTraceEvent]=c.slice(1),e.webnnReleaseTensorId=e.je,e.webnnUploadTensor=e.ke,e.webnnRegisterMLContext=e.He,e.webnnOnRunStart=h=>p.onRunStart(h),e.webnnOnRunEnd=p.onRunEnd.bind(p),e.webnnOnReleaseSession=h=>{p.onReleaseSession(h)},e.webnnCreateMLTensorDownloader=(h,g)=>p.createMLTensorDownloader(h,g),e.webnnRegisterMLTensor=(h,g,b,A)=>p.registerMLTensor(h,g,b,A),e.webnnCreateMLContext=h=>p.createMLContext(h),e.webnnRegisterMLConstant=(h,g,b,A,O,N)=>p.registerMLConstant(h,g,b,A,O,e.Zc,N),e.webnnRegisterGraphInput=p.registerGraphInput.bind(p),e.webnnIsGraphInput=p.isGraphInput.bind(p),e.webnnRegisterGraphOutput=p.registerGraphOutput.bind(p),e.webnnIsGraphOutput=p.isGraphOutput.bind(p),e.webnnCreateTemporaryTensor=p.createTemporaryTensor.bind(p),e.webnnIsGraphInputOutputTypeSupported=p.isGraphInputOutputTypeSupported.bind(p)},te?e:new Promise((c,p)=>{w=c,x=p})}var hE,vk,KC=ye(()=>{"use strict";hE=bk,vk=globalThis.self?.name?.startsWith("em-pthread"),vk&&bk()}),Ry,Zy,kk,Ot,_E,fu,Ek,Ak,Uy,Mk,By,gE,Dy,wE,l0=ye(()=>{"use strict";i0(),Ry=typeof location>"u"?void 0:location.origin,Zy=Qt.url>"file:"&&Qt.url<"file;",kk=()=>{if(Zy){let t=URL;return new URL(new t("ort.webgpu.bundle.min.mjs",Qt.url).href,Ry).href}return Qt.url},Ot=kk(),_E=()=>{if(Ot&&!Ot.startsWith("blob:"))return Ot.substring(0,Ot.lastIndexOf("/")+1)},fu=(t,e)=>{try{let r=e??Ot;return(r?new URL(t,r):new URL(t)).origin===Ry}catch{return!1}},Ek=(t,e)=>{let r=e??Ot;try{return(r?new URL(t,r):new URL(t)).href}catch{return}},Ak=(t,e)=>`${e??"./"}${t}`,Uy=async t=>{let e=await(await fetch(t,{credentials:"same-origin"})).blob();return URL.createObjectURL(e)},Mk=async t=>(await 
import(t)).default,By=(XC(),xu(dE)).default,gE=async()=>{if(!Ot)throw new Error("Failed to load proxy worker: cannot determine the script source URL.");if(fu(Ot))return[void 0,By()];let t=await Uy(Ot);return[t,By(t)]},Dy=(KC(),xu(mE)).default,wE=async(t,e,r,s)=>{let n=Dy&&!(t||e);if(n)if(Ot)n=fu(Ot);else if(s&&!r)n=!0;else throw new Error("cannot determine the script source URL.");if(n)return[void 0,Dy];{let o="ort-wasm-simd-threaded.asyncify.mjs",a=t??Ek(o,e),i=r&&a&&!fu(a,e),l=i?await Uy(a):a??Ak(o,e);return[i?l:void 0,await Mk(l)]}}}),Fy,mu,si,jy,Tk,Sk,Ok,c0,Ue,ks=ye(()=>{"use strict";l0(),mu=!1,si=!1,jy=!1,Tk=()=>{if(typeof SharedArrayBuffer>"u")return!1;try{return typeof MessageChannel<"u"&&new MessageChannel().port1.postMessage(new SharedArrayBuffer(1)),WebAssembly.validate(new Uint8Array([0,97,115,109,1,0,0,0,1,4,1,96,0,0,3,2,1,0,5,4,1,3,1,1,10,11,1,9,0,65,0,254,16,2,0,26,11]))}catch{return!1}},Sk=()=>{try{return WebAssembly.validate(new Uint8Array([0,97,115,109,1,0,0,0,1,4,1,96,0,0,3,2,1,0,10,30,1,28,0,65,0,253,15,253,12,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,253,186,1,26,11]))}catch{return!1}},Ok=()=>{try{return WebAssembly.validate(new Uint8Array([0,97,115,109,1,0,0,0,1,5,1,96,0,1,123,3,2,1,0,10,19,1,17,0,65,1,253,15,65,2,253,15,65,3,253,15,253,147,2,11]))}catch{return!1}},c0=async t=>{if(mu)return Promise.resolve();if(si)throw new Error("multiple calls to 'initializeWebAssembly()' detected.");if(jy)throw new Error("previous call to 'initializeWebAssembly()' failed.");si=!0;let e=t.initTimeout,r=t.numThreads;if(t.simd!==!1){if(t.simd==="relaxed"){if(!Ok())throw new Error("Relaxed WebAssembly SIMD is not supported in the current environment.")}else if(!Sk())throw new Error("WebAssembly SIMD is not supported in the current environment.")}let s=Tk();r>1&&!s&&(typeof self<"u"&&!self.crossOriginIsolated&&console.warn("env.wasm.numThreads is set to "+r+", but this will not work unless you enable crossOriginIsolated mode. 
See https://web.dev/cross-origin-isolation-guide/ for more info."),console.warn("WebAssembly multi-threading is not supported in the current environment. Falling back to single-threading."),t.numThreads=r=1);let n=t.wasmPaths,o=typeof n=="string"?n:void 0,a=n?.mjs,i=a?.href??a,l=n?.wasm,u=l?.href??l,d=t.wasmBinary,[f,m]=await wE(i,o,r>1,!!d||!!u),_=!1,w=[];if(e>0&&w.push(new Promise(x=>{setTimeout(()=>{_=!0,x()},e)})),w.push(new Promise((x,k)=>{let E={numThreads:r};if(d)E.wasmBinary=d;else if(u||o)E.locateFile=M=>u??o+M;else if(i&&i.indexOf("blob:")!==0)E.locateFile=M=>new URL(M,i).href;else if(f){let M=_E();M&&(E.locateFile=I=>M+I)}m(E).then(M=>{si=!1,mu=!0,Fy=M,x(),f&&URL.revokeObjectURL(f)},M=>{si=!1,jy=!0,k(M)})})),await Promise.race(w),_)throw new Error(`WebAssembly backend initializing failed due to timeout: ${e}ms`)},Ue=()=>{if(mu&&Fy)return Fy;throw new Error("WebAssembly is not initialized yet.")}}),It,bu,Ie,u0=ye(()=>{"use strict";ks(),It=(t,e)=>{let r=Ue(),s=r.lengthBytesUTF8(t)+1,n=r._malloc(s);return r.stringToUTF8(t,n,s),e.push(n),n},bu=(t,e,r,s)=>{if(typeof t=="object"&&t!==null){if(r.has(t))throw new Error("Circular reference in options");r.add(t)}Object.entries(t).forEach(([n,o])=>{let a=e?e+n:n;if(typeof o=="object")bu(o,a+".",r,s);else if(typeof o=="string"||typeof o=="number")s(a,o.toString());else if(typeof o=="boolean")s(a,o?"1":"0");else throw new Error(`Can't handle extra config type: ${typeof o}`)})},Ie=t=>{let e=Ue(),r=e.stackSave();try{let s=e.PTR_SIZE,n=e.stackAlloc(2*s);e._OrtGetLastError(n,n+s);let o=Number(e.getValue(n,s===4?"i32":"i64")),a=e.getValue(n+s,"*"),i=a?e.UTF8ToString(a):"";throw new Error(`${t} ERROR_CODE: ${o}, ERROR_MESSAGE: ${i}`)}finally{e.stackRestore(r)}}}),xE,YC=ye(()=>{"use strict";ks(),u0(),xE=t=>{let e=Ue(),r=0,s=[],n=t||{};try{if(t?.logSeverityLevel===void 0)n.logSeverityLevel=2;else if(typeof t.logSeverityLevel!="number"||!Number.isInteger(t.logSeverityLevel)||t.logSeverityLevel<0||t.logSeverityLevel>4)throw 
new Error(`log severity level is not valid: ${t.logSeverityLevel}`);if(t?.logVerbosityLevel===void 0)n.logVerbosityLevel=0;else if(typeof t.logVerbosityLevel!="number"||!Number.isInteger(t.logVerbosityLevel))throw new Error(`log verbosity level is not valid: ${t.logVerbosityLevel}`);t?.terminate===void 0&&(n.terminate=!1);let o=0;return t?.tag!==void 0&&(o=It(t.tag,s)),r=e._OrtCreateRunOptions(n.logSeverityLevel,n.logVerbosityLevel,!!n.terminate,o),r===0&&Ie("Can't create run options."),t?.extra!==void 0&&bu(t.extra,"",new WeakSet,(a,i)=>{let l=It(a,s),u=It(i,s);e._OrtAddRunConfigEntry(r,l,u)!==0&&Ie(`Can't set a run config entry: ${a} - ${i}.`)}),[r,s]}catch(o){throw r!==0&&e._OrtReleaseRunOptions(r),s.forEach(a=>e._free(a)),o}}}),Ik,Ck,Pk,hu,Dr,zk,yE,QC=ye(()=>{"use strict";ks(),u0(),Ik=t=>{switch(t){case"disabled":return 0;case"basic":return 1;case"extended":return 2;case"layout":return 3;case"all":return 99;default:throw new Error(`unsupported graph optimization level: ${t}`)}},Ck=t=>{switch(t){case"sequential":return 0;case"parallel":return 1;default:throw new Error(`unsupported execution mode: ${t}`)}},Pk=t=>{t.extra||(t.extra={}),t.extra.session||(t.extra.session={});let e=t.extra.session;e.use_ort_model_bytes_directly||(e.use_ort_model_bytes_directly="1"),t.executionProviders&&t.executionProviders.some(r=>(typeof r=="string"?r:r.name)==="webgpu")&&(t.enableMemPattern=!1)},hu=(t,e,r,s)=>{let n=It(e,s),o=It(r,s);Ue()._OrtAddSessionConfigEntry(t,n,o)!==0&&Ie(`Can't set a session config entry: ${e} - ${r}.`)},Dr=(t,e,r,s)=>{let n=It(e,s),o=It(r,s);t.push([n,o])},zk=async(t,e,r)=>{let s=e.executionProviders;for(let n of s){let o=typeof n=="string"?n:n.name,a=[];switch(o){case"webnn":if(o="WEBNN",typeof n!="string"){let f=n?.deviceType;f&&hu(t,"deviceType",f,r)}break;case"webgpu":{o="WebGPU";let f;if(typeof n!="string"){let _=n;if(_.device)if(typeof GPUDevice<"u"&&_.device instanceof GPUDevice)f=_.device;else throw new Error("Invalid GPU device set in WebGPU EP 
options.");let{enableGraphCapture:w}=e;if(typeof w=="boolean"&&w&&Dr(a,"enableGraphCapture","1",r),typeof _.preferredLayout=="string"&&Dr(a,"preferredLayout",_.preferredLayout,r),_.forceCpuNodeNames){let x=Array.isArray(_.forceCpuNodeNames)?_.forceCpuNodeNames:[_.forceCpuNodeNames];Dr(a,"forceCpuNodeNames",x.join(`
|
|
15
|
+
`),r)}_.validationMode&&Dr(a,"validationMode",_.validationMode,r)}let m=Ue().webgpuRegisterDevice(f);if(m){let[_,w,x]=m;Dr(a,"deviceId",_.toString(),r),Dr(a,"webgpuInstance",w.toString(),r),Dr(a,"webgpuDevice",x.toString(),r)}}break;case"wasm":case"cpu":continue;default:throw new Error(`not supported execution provider: ${o}`)}let i=It(o,r),l=a.length,u=0,d=0;if(l>0){u=Ue()._malloc(l*Ue().PTR_SIZE),r.push(u),d=Ue()._malloc(l*Ue().PTR_SIZE),r.push(d);for(let f=0;f<l;f++)Ue().setValue(u+f*Ue().PTR_SIZE,a[f][0],"*"),Ue().setValue(d+f*Ue().PTR_SIZE,a[f][1],"*")}await Ue()._OrtAppendExecutionProvider(t,i,u,d,l)!==0&&Ie(`Can't append execution provider: ${o}.`)}},yE=async t=>{let e=Ue(),r=0,s=[],n=t||{};Pk(n);try{let o=Ik(n.graphOptimizationLevel??"all"),a=Ck(n.executionMode??"sequential"),i=typeof n.logId=="string"?It(n.logId,s):0,l=n.logSeverityLevel??2;if(!Number.isInteger(l)||l<0||l>4)throw new Error(`log severity level is not valid: ${l}`);let u=n.logVerbosityLevel??0;if(!Number.isInteger(u)||u<0||u>4)throw new Error(`log verbosity level is not valid: ${u}`);let d=typeof n.optimizedModelFilePath=="string"?It(n.optimizedModelFilePath,s):0;if(r=e._OrtCreateSessionOptions(o,!!n.enableCpuMemArena,!!n.enableMemPattern,a,!!n.enableProfiling,0,i,l,u,d),r===0&&Ie("Can't create session options."),n.executionProviders&&await zk(r,n,s),n.enableGraphCapture!==void 0){if(typeof n.enableGraphCapture!="boolean")throw new Error(`enableGraphCapture must be a boolean value: ${n.enableGraphCapture}`);hu(r,"enableGraphCapture",n.enableGraphCapture.toString(),s)}if(n.freeDimensionOverrides)for(let[f,m]of Object.entries(n.freeDimensionOverrides)){if(typeof f!="string")throw new Error(`free dimension override name must be a string: ${f}`);if(typeof m!="number"||!Number.isInteger(m)||m<0)throw new Error(`free dimension override value must be a non-negative integer: ${m}`);let _=It(f,s);e._OrtAddFreeDimensionOverride(r,_,m)!==0&&Ie(`Can't set a free dimension override: ${f} - ${m}.`)}return 
n.extra!==void 0&&bu(n.extra,"",new WeakSet,(f,m)=>{hu(r,f,m,s)}),[r,s]}catch(o){throw r!==0&&e._OrtReleaseSessionOptions(r)!==0&&Ie("Can't release session options."),s.forEach(a=>e._free(a)),o}}}),ws,wu,hn,li,vu,p0,d0,e0,_n=ye(()=>{"use strict";ws=t=>{switch(t){case"int8":return 3;case"uint8":return 2;case"bool":return 9;case"int16":return 5;case"uint16":return 4;case"int32":return 6;case"uint32":return 12;case"float16":return 10;case"float32":return 1;case"float64":return 11;case"string":return 8;case"int64":return 7;case"uint64":return 13;case"int4":return 22;case"uint4":return 21;default:throw new Error(`unsupported data type: ${t}`)}},wu=t=>{switch(t){case 3:return"int8";case 2:return"uint8";case 9:return"bool";case 5:return"int16";case 4:return"uint16";case 6:return"int32";case 12:return"uint32";case 10:return"float16";case 1:return"float32";case 11:return"float64";case 8:return"string";case 7:return"int64";case 13:return"uint64";case 22:return"int4";case 21:return"uint4";default:throw new Error(`unsupported data type: ${t}`)}},hn=(t,e)=>{let r=[-1,4,1,1,2,2,4,8,-1,1,2,8,4,8,-1,-1,-1,-1,-1,-1,-1,.5,.5][t],s=typeof e=="number"?e:e.reduce((n,o)=>n*o,1);return r>0?Math.ceil(s*r):void 0},li=t=>{switch(t){case"float16":return typeof Float16Array<"u"&&Float16Array.from?Float16Array:Uint16Array;case"float32":return Float32Array;case"uint8":return Uint8Array;case"int8":return Int8Array;case"uint16":return Uint16Array;case"int16":return Int16Array;case"int32":return Int32Array;case"bool":return Uint8Array;case"float64":return Float64Array;case"uint32":return Uint32Array;case"int64":return BigInt64Array;case"uint64":return BigUint64Array;default:throw new Error(`unsupported type: ${t}`)}},vu=t=>{switch(t){case"verbose":return 0;case"info":return 1;case"warning":return 2;case"error":return 3;case"fatal":return 4;default:throw new Error(`unsupported logging level: 
${t}`)}},p0=t=>t==="float32"||t==="float16"||t==="int32"||t==="int64"||t==="uint32"||t==="uint8"||t==="bool"||t==="uint4"||t==="int4",d0=t=>t==="float32"||t==="float16"||t==="int32"||t==="int64"||t==="uint32"||t==="uint64"||t==="int8"||t==="uint8"||t==="bool"||t==="uint4"||t==="int4",e0=t=>{switch(t){case"none":return 0;case"cpu":return 1;case"cpu-pinned":return 2;case"texture":return 3;case"gpu-buffer":return 4;case"ml-tensor":return 5;default:throw new Error(`unsupported data location: ${t}`)}}}),f0,bE=ye(()=>{"use strict";i0(),f0=async t=>{if(typeof t=="string"){let e=await fetch(t);if(!e.ok)throw new Error(`failed to load external data file: ${t}`);let r=e.headers.get("Content-Length"),s=r?parseInt(r,10):0;if(s<1073741824)return new Uint8Array(await e.arrayBuffer());{if(!e.body)throw new Error(`failed to load external data file: ${t}, no response body.`);let n=e.body.getReader(),o;try{o=new ArrayBuffer(s)}catch(i){if(i instanceof RangeError){let l=Math.ceil(s/65536);o=new WebAssembly.Memory({initial:l,maximum:l}).buffer}else throw i}let a=0;for(;;){let{done:i,value:l}=await n.read();if(i)break;let u=l.byteLength;new Uint8Array(o,a,u).set(l),a+=u}return new Uint8Array(o,0,s)}}else return t instanceof Blob?new Uint8Array(await t.arrayBuffer()):t instanceof Uint8Array?t:new Uint8Array(t)}}),vE,JC=ye(()=>{"use strict";_n(),vE=(t,e)=>new(li(e))(t)}),Lk,Nk,$k,Rk,kE,Uk,_t,EE=ye(()=>{"use strict";_n(),Lk=["V","I","W","E","F"],Nk=(t,e)=>{console.log(`[${Lk[t]},${new Date().toISOString()}]${e}`)},kE=(t,e)=>{$k=t,Rk=e},Uk=(t,e)=>{let r=vu(t),s=vu($k);r>=s&&Nk(r,typeof e=="function"?e():e)},_t=(...t)=>{Rk&&Uk(...t)}}),Gy,t0,qy,Bk,Wy,Dk,Vy,Hy,Xy,Fk,AE,ZC=ye(()=>{"use strict";_n(),EE(),Gy=new Map([["float32",32],["float16",16],["int32",32],["uint32",32],["int64",64],["uint64",64],["int8",8],["uint8",8],["int4",4],["uint4",4]]),t0=(t,e)=>{if(e==="int32")return t;let r=Gy.get(e);if(!r)throw new Error(`WebNN backend does not support data type: ${e}`);let 
s=r/8;if(t.byteLength%s!==0)throw new Error(`Invalid Uint8Array length - must be a multiple of ${s}.`);let n=t.byteLength/s,o=new(li(e))(t.buffer,t.byteOffset,n);switch(e){case"int64":case"uint64":{let a=new Int32Array(n);for(let i=0;i<n;i++){let l=o[i];if(l>2147483647n||l<-2147483648n)throw new Error("Can not convert int64 data to int32 - value out of range.");a[i]=Number(l)}return new Uint8Array(a.buffer)}case"int8":case"uint8":case"uint32":{if(e==="uint32"&&o.some(i=>i>2147483647))throw new Error("Can not convert uint32 data to int32 - value out of range.");let a=Int32Array.from(o,Number);return new Uint8Array(a.buffer)}default:throw new Error(`Unsupported data conversion from ${e} to 'int32'`)}},qy=(t,e)=>{if(e==="int32")return t;if(t.byteLength%4!==0)throw new Error("Invalid Uint8Array length - must be a multiple of 4 (int32).");let r=t.byteLength/4,s=new Int32Array(t.buffer,t.byteOffset,r);switch(e){case"int64":{let n=BigInt64Array.from(s,BigInt);return new Uint8Array(n.buffer)}case"uint64":{if(s.some(o=>o<0))throw new Error("Can not convert int32 data to uin64 - negative value found.");let n=BigUint64Array.from(s,BigInt);return new Uint8Array(n.buffer)}case"int8":{if(s.some(o=>o<-128||o>127))throw new Error("Can not convert int32 data to int8 - value out of range.");let n=Int8Array.from(s,Number);return new Uint8Array(n.buffer)}case"uint8":{if(s.some(n=>n<0||n>255))throw new Error("Can not convert int32 data to uint8 - value out of range.");return Uint8Array.from(s,Number)}case"uint32":{if(s.some(o=>o<0))throw new Error("Can not convert int32 data to uint32 - negative value found.");let n=Uint32Array.from(s,Number);return new Uint8Array(n.buffer)}default:throw new Error(`Unsupported data conversion from 'int32' to ${e}`)}},Bk=1,Wy=()=>Bk++,Dk=new Map([["int8","int32"],["uint8","int32"],["uint32","int32"],["int64","int32"]]),Vy=(t,e)=>{let r=Gy.get(t);if(!r)throw new Error(`WebNN backend does not support data type: ${t}`);return 
e.length>0?Math.ceil(e.reduce((s,n)=>s*n)*r/8):0},Hy=class{constructor(t){this.isDataConverted=!1;let{sessionId:e,context:r,tensor:s,dataType:n,shape:o,fallbackDataType:a}=t;this.sessionId=e,this.mlContext=r,this.mlTensor=s,this.dataType=n,this.tensorShape=o,this.fallbackDataType=a}get tensor(){return this.mlTensor}get type(){return this.dataType}get fallbackType(){return this.fallbackDataType}get shape(){return this.tensorShape}get byteLength(){return Vy(this.dataType,this.tensorShape)}destroy(){_t("verbose",()=>"[WebNN] TensorWrapper.destroy"),this.mlTensor.destroy()}write(t){this.mlContext.writeTensor(this.mlTensor,t)}async read(t){if(this.fallbackDataType){let e=await this.mlContext.readTensor(this.mlTensor),r=qy(new Uint8Array(e),this.dataType);if(t){(t instanceof ArrayBuffer?new Uint8Array(t):new Uint8Array(t.buffer,t.byteOffset,t.byteLength)).set(r);return}else return r.buffer}else return t?this.mlContext.readTensor(this.mlTensor,t):this.mlContext.readTensor(this.mlTensor)}canReuseTensor(t,e,r){return this.mlContext===t&&this.dataType===e&&this.tensorShape.length===r.length&&this.tensorShape.every((s,n)=>s===r[n])}setIsDataConverted(t){this.isDataConverted=t}},Xy=class{constructor(t,e){this.tensorManager=t,this.wrapper=e}get tensorWrapper(){return this.wrapper}releaseTensor(){this.tensorWrapper&&(this.tensorManager.releaseTensor(this.tensorWrapper),this.wrapper=void 0)}async ensureTensor(t,e,r,s){let n=this.tensorManager.getMLContext(t),o=this.tensorManager.getMLOpSupportLimits(t),a;if(!o?.input.dataTypes.includes(e)){if(a=Dk.get(e),!a||o?.input.dataTypes.includes(a))throw new Error(`WebNN backend does not support data type: ${e}`);_t("verbose",()=>`[WebNN] TensorIdTracker.ensureTensor: fallback dataType from ${e} to ${a}`)}if(this.wrapper){if(this.wrapper.canReuseTensor(n,e,r))return this.wrapper.tensor;if(s){if(this.wrapper.byteLength!==Vy(e,r))throw new Error("Unable to copy data to tensor with different size.");this.activeUpload=new Uint8Array(await 
this.wrapper.read())}this.tensorManager.releaseTensor(this.wrapper)}let i=typeof MLTensorUsage>"u"?void 0:MLTensorUsage.READ|MLTensorUsage.WRITE;return this.wrapper=await this.tensorManager.getCachedTensor(t,e,r,i,!0,!0,a),s&&this.activeUpload&&(this.wrapper.write(this.activeUpload),this.activeUpload=void 0),this.wrapper.tensor}upload(t){let e=t;if(this.wrapper){if(this.wrapper.fallbackType)if(this.wrapper.fallbackType==="int32")e=t0(t,this.wrapper.type),this.wrapper.setIsDataConverted(!0);else throw new Error(`Unsupported fallback data type: ${this.wrapper.fallbackType}`);if(t.byteLength===this.wrapper.byteLength){this.wrapper.write(e);return}else _t("verbose",()=>"Data size does not match tensor size. Releasing tensor."),this.releaseTensor()}this.activeUpload?this.activeUpload.set(e):this.activeUpload=new Uint8Array(e)}async download(t){if(this.activeUpload){let e=this.wrapper?.isDataConverted?qy(this.activeUpload,this.wrapper?.type):this.activeUpload;if(t){t instanceof ArrayBuffer?new Uint8Array(t).set(e):new Uint8Array(t.buffer,t.byteOffset,t.byteLength).set(e);return}else return e.buffer}if(!this.wrapper)throw new Error("Tensor has not been created.");return t?this.wrapper.read(t):this.wrapper.read()}},Fk=class{constructor(t){this.backend=t,this.tensorTrackersById=new Map,this.freeTensors=[],this.externalTensors=new Set}getMLContext(t){let e=this.backend.getMLContext(t);if(!e)throw new Error("MLContext not found for session.");return e}getMLOpSupportLimits(t){return this.backend.getMLOpSupportLimits(t)}reserveTensorId(){let t=Wy();return this.tensorTrackersById.set(t,new Xy(this)),t}releaseTensorId(t){let e=this.tensorTrackersById.get(t);e&&(this.tensorTrackersById.delete(t),e.tensorWrapper&&this.releaseTensor(e.tensorWrapper))}async ensureTensor(t,e,r,s,n){_t("verbose",()=>`[WebNN] TensorManager.ensureTensor {tensorId: ${e}, dataType: ${r}, shape: ${s}, copyOld: ${n}}`);let o=this.tensorTrackersById.get(e);if(!o)throw new Error("Tensor not found.");return 
o.ensureTensor(t,r,s,n)}upload(t,e){let r=this.tensorTrackersById.get(t);if(!r)throw new Error("Tensor not found.");r.upload(e)}async download(t,e){_t("verbose",()=>`[WebNN] TensorManager.download {tensorId: ${t}, dstBuffer: ${e?.byteLength}}`);let r=this.tensorTrackersById.get(t);if(!r)throw new Error("Tensor not found.");return r.download(e)}releaseTensorsForSession(t){for(let e of this.freeTensors)e.sessionId===t&&e.destroy();this.freeTensors=this.freeTensors.filter(e=>e.sessionId!==t)}registerTensor(t,e,r,s){let n=this.getMLContext(t),o=Wy(),a=new Hy({sessionId:t,context:n,tensor:e,dataType:r,shape:s});return this.tensorTrackersById.set(o,new Xy(this,a)),this.externalTensors.add(a),o}async getCachedTensor(t,e,r,s,n,o,a){let i=this.getMLContext(t);for(let[u,d]of this.freeTensors.entries())if(d.canReuseTensor(i,e,r)){_t("verbose",()=>`[WebNN] Reusing tensor {dataType: ${e}, ${a?`fallbackDataType: ${a},`:""} shape: ${r}`);let f=this.freeTensors.splice(u,1)[0];return f.sessionId=t,f}_t("verbose",()=>`[WebNN] MLContext.createTensor {dataType: ${e}, ${a?`fallbackDataType: ${a},`:""} shape: ${r}}`);let l=await i.createTensor({dataType:a??e,shape:r,dimensions:r,usage:s,writable:n,readable:o});return new Hy({sessionId:t,context:i,tensor:l,dataType:e,shape:r,fallbackDataType:a})}releaseTensor(t){this.externalTensors.has(t)&&this.externalTensors.delete(t),this.freeTensors.push(t)}},AE=(...t)=>new Fk(...t)}),ME={};ci(ME,{WebNNBackend:()=>TE});var ni,jk,TE,eP=ye(()=>{"use strict";_n(),ks(),JC(),ZC(),EE(),ni=new Map([[1,"float32"],[10,"float16"],[6,"int32"],[12,"uint32"],[7,"int64"],[13,"uint64"],[22,"int4"],[21,"uint4"],[3,"int8"],[2,"uint8"],[9,"uint8"]]),jk=(t,e)=>{if(t===e)return!0;if(t===void 0||e===void 0)return!1;let r=Object.keys(t).sort(),s=Object.keys(e).sort();return r.length===s.length&&r.every((n,o)=>n===s[o]&&t[n]===e[n])},TE=class{constructor(t){this.tensorManager=AE(this),this.mlContextBySessionId=new Map,this.sessionIdsByMLContext=new 
Map,this.mlContextCache=[],this.sessionGraphInputs=new Map,this.sessionGraphOutputs=new Map,this.temporaryGraphInputs=[],this.temporaryGraphOutputs=[],this.temporarySessionTensorIds=new Map,this.mlOpSupportLimitsBySessionId=new Map,kE(t.logLevel,!!t.debug)}get currentSessionId(){if(this.activeSessionId===void 0)throw new Error("No active session");return this.activeSessionId}onRunStart(t){_t("verbose",()=>`[WebNN] onRunStart {sessionId: ${t}}`),this.activeSessionId=t}onRunEnd(t){_t("verbose",()=>`[WebNN] onRunEnd {sessionId: ${t}}`);let e=this.temporarySessionTensorIds.get(t);if(e){for(let r of e)_t("verbose",()=>`[WebNN] releasing temporary tensor {tensorId: ${r}}`),this.tensorManager.releaseTensorId(r);this.temporarySessionTensorIds.delete(t),this.activeSessionId=void 0}}async createMLContext(t){if(t instanceof GPUDevice){let r=this.mlContextCache.findIndex(s=>s.gpuDevice===t);if(r!==-1)return this.mlContextCache[r].mlContext;{let s=await navigator.ml.createContext(t);return this.mlContextCache.push({gpuDevice:t,mlContext:s}),s}}else if(t===void 0){let r=this.mlContextCache.findIndex(s=>s.options===void 0&&s.gpuDevice===void 0);if(r!==-1)return this.mlContextCache[r].mlContext;{let s=await navigator.ml.createContext();return this.mlContextCache.push({mlContext:s}),s}}let e=this.mlContextCache.findIndex(r=>jk(r.options,t));if(e!==-1)return this.mlContextCache[e].mlContext;{let r=await navigator.ml.createContext(t);return this.mlContextCache.push({options:t,mlContext:r}),r}}registerMLContext(t,e){this.mlContextBySessionId.set(t,e);let r=this.sessionIdsByMLContext.get(e);r||(r=new 
Set,this.sessionIdsByMLContext.set(e,r)),r.add(t),this.mlOpSupportLimitsBySessionId.has(t)||this.mlOpSupportLimitsBySessionId.set(t,e.opSupportLimits()),this.temporaryGraphInputs.length>0&&(this.sessionGraphInputs.set(t,this.temporaryGraphInputs),this.temporaryGraphInputs=[]),this.temporaryGraphOutputs.length>0&&(this.sessionGraphOutputs.set(t,this.temporaryGraphOutputs),this.temporaryGraphOutputs=[])}onReleaseSession(t){this.sessionGraphInputs.delete(t),this.sessionGraphOutputs.delete(t);let e=this.mlContextBySessionId.get(t);if(!e)return;this.tensorManager.releaseTensorsForSession(t),this.mlContextBySessionId.delete(t),this.mlOpSupportLimitsBySessionId.delete(t);let r=this.sessionIdsByMLContext.get(e);if(r.delete(t),r.size===0){this.sessionIdsByMLContext.delete(e);let s=this.mlContextCache.findIndex(n=>n.mlContext===e);s!==-1&&this.mlContextCache.splice(s,1)}}getMLContext(t){return this.mlContextBySessionId.get(t)}getMLOpSupportLimits(t){return this.mlOpSupportLimitsBySessionId.get(t)}reserveTensorId(){return this.tensorManager.reserveTensorId()}releaseTensorId(t){_t("verbose",()=>`[WebNN] releaseTensorId {tensorId: ${t}}`),this.tensorManager.releaseTensorId(t)}async ensureTensor(t,e,r,s,n){let o=ni.get(r);if(!o)throw new Error(`Unsupported ONNX data type: ${r}`);return this.tensorManager.ensureTensor(t??this.currentSessionId,e,o,s,n)}async createTemporaryTensor(t,e,r){_t("verbose",()=>`[WebNN] createTemporaryTensor {onnxDataType: ${e}, shape: ${r}}`);let s=ni.get(e);if(!s)throw new Error(`Unsupported ONNX data type: ${e}`);let n=this.tensorManager.reserveTensorId();await this.tensorManager.ensureTensor(t,n,s,r,!1);let o=this.temporarySessionTensorIds.get(t);return o?o.push(n):this.temporarySessionTensorIds.set(t,[n]),n}uploadTensor(t,e){if(!Ue().shouldTransferToMLTensor)throw new Error("Trying to upload to a MLTensor while shouldTransferToMLTensor is false");_t("verbose",()=>`[WebNN] uploadTensor {tensorId: ${t}, data: 
${e.byteLength}}`),this.tensorManager.upload(t,e)}async downloadTensor(t,e){return this.tensorManager.download(t,e)}createMLTensorDownloader(t,e){return async()=>{let r=await this.tensorManager.download(t);return vE(r,e)}}registerMLTensor(t,e,r,s){let n=ni.get(r);if(!n)throw new Error(`Unsupported ONNX data type: ${r}`);let o=this.tensorManager.registerTensor(t,e,n,s);return _t("verbose",()=>`[WebNN] registerMLTensor {tensor: ${e}, dataType: ${n}, dimensions: ${s}} -> {tensorId: ${o}}`),o}registerMLConstant(t,e,r,s,n,o,a=!1){if(!o)throw new Error("External mounted files are not available.");let i=t;t.startsWith("./")&&(i=t.substring(2));let l=o.get(i);if(!l)throw new Error(`File with name ${i} not found in preloaded files.`);if(e+r>l.byteLength)throw new Error("Out of bounds: data offset and length exceed the external file data size.");let u=l.slice(e,e+r).buffer,d;switch(n.dataType){case"float32":d=new Float32Array(u);break;case"float16":d=typeof Float16Array<"u"&&Float16Array.from?new Float16Array(u):new Uint16Array(u);break;case"int32":d=new Int32Array(u);break;case"uint32":d=new Uint32Array(u);break;case"int64":if(a){let f=t0(new Uint8Array(u),"int64");d=new Int32Array(f.buffer),n.dataType="int32"}else d=new BigInt64Array(u);break;case"uint64":d=new BigUint64Array(u);break;case"int8":d=new Int8Array(u);break;case"int4":case"uint4":case"uint8":d=new Uint8Array(u);break;default:throw new Error(`Unsupported data type: ${n.dataType} in creating WebNN Constant from external data.`)}return _t("verbose",()=>`[WebNN] registerMLConstant {dataType: ${n.dataType}, shape: ${n.shape}}} ${a?"(Note: it was int64 data type and registered to int32 as workaround)":""}`),s.constant(n,d)}registerGraphInput(t){this.temporaryGraphInputs.push(t)}registerGraphOutput(t){this.temporaryGraphOutputs.push(t)}isGraphInput(t,e){let r=this.sessionGraphInputs.get(t);return r?r.includes(e):!1}isGraphOutput(t,e){let r=this.sessionGraphOutputs.get(t);return 
r?r.includes(e):!1}isGraphInputOutputTypeSupported(t,e,r=!0){let s=ni.get(ws(e)),n=this.mlOpSupportLimitsBySessionId.get(t);return typeof s>"u"?!1:r?!!n?.input.dataTypes.includes(s):!!n?.output.dataTypes.includes(s)}flush(){}}}),Gk,m0,h0,Fr,qk,Ky,ku,_0,g0,Yy,w0,x0,y0,SE=ye(()=>{"use strict";vs(),YC(),QC(),_n(),ks(),u0(),bE(),Gk=(t,e)=>{Ue()._OrtInit(t,e)!==0&&Ie("Can't initialize onnxruntime.")},m0=async t=>{Gk(t.wasm.numThreads,vu(t.logLevel))},h0=async(t,e)=>{Ue().asyncInit?.();let r=t.webgpu.adapter;if(e==="webgpu"){if(typeof navigator>"u"||!navigator.gpu)throw new Error("WebGPU is not supported in current environment");if(r){if(typeof r.limits!="object"||typeof r.features!="object"||typeof r.requestDevice!="function")throw new Error("Invalid GPU adapter set in `env.webgpu.adapter`. It must be a GPUAdapter object.")}else{let s=t.webgpu.powerPreference;if(s!==void 0&&s!=="low-power"&&s!=="high-performance")throw new Error(`Invalid powerPreference setting: "${s}"`);let n=t.webgpu.forceFallbackAdapter;if(n!==void 0&&typeof n!="boolean")throw new Error(`Invalid forceFallbackAdapter setting: "${n}"`);if(r=await navigator.gpu.requestAdapter({powerPreference:s,forceFallbackAdapter:n}),!r)throw new Error('Failed to get GPU adapter. 
You may need to enable flag "--enable-unsafe-webgpu" if you are using Chrome.')}}if(e==="webnn"&&(typeof navigator>"u"||!navigator.ml))throw new Error("WebNN is not supported in current environment");if(e==="webgpu"&&Ue().webgpuInit(s=>{t.webgpu.device=s}),e==="webnn"){let s=new(eP(),xu(ME)).WebNNBackend(t);Ue().webnnInit([s,()=>s.reserveTensorId(),n=>s.releaseTensorId(n),async(n,o,a,i,l)=>s.ensureTensor(n,o,a,i,l),(n,o)=>{s.uploadTensor(n,o)},async(n,o)=>s.downloadTensor(n,o),(n,o)=>s.registerMLContext(n,o),!!t.trace])}},Fr=new Map,qk=t=>{let e=Ue(),r=e.stackSave();try{let s=e.PTR_SIZE,n=e.stackAlloc(2*s);e._OrtGetInputOutputCount(t,n,n+s)!==0&&Ie("Can't get session input/output count.");let o=s===4?"i32":"i64";return[Number(e.getValue(n,o)),Number(e.getValue(n+s,o))]}finally{e.stackRestore(r)}},Ky=(t,e)=>{let r=Ue(),s=r.stackSave(),n=0;try{let o=r.PTR_SIZE,a=r.stackAlloc(2*o);r._OrtGetInputOutputMetadata(t,e,a,a+o)!==0&&Ie("Can't get session input/output metadata.");let i=Number(r.getValue(a,"*"));n=Number(r.getValue(a+o,"*"));let l=r.HEAP32[n/4];if(l===0)return[i,0];let u=r.HEAPU32[n/4+1],d=[];for(let f=0;f<u;f++){let m=Number(r.getValue(n+8+f*o,"*"));d.push(m!==0?r.UTF8ToString(m):Number(r.getValue(n+8+(f+u)*o,"*")))}return[i,l,d]}finally{r.stackRestore(s),n!==0&&r._OrtFree(n)}},ku=t=>{let e=Ue(),r=e._malloc(t.byteLength);if(r===0)throw new Error(`Can't create a session. 
failed to allocate a buffer of size ${t.byteLength}.`);return e.HEAPU8.set(t,r),[r,t.byteLength]},_0=async(t,e)=>{let r,s,n=Ue();Array.isArray(t)?[r,s]=t:t.buffer===n.HEAPU8.buffer?[r,s]=[t.byteOffset,t.byteLength]:[r,s]=ku(t);let o=0,a=0,i=0,l=[],u=[],d=[];try{if([a,l]=await yE(e),e?.externalData&&n.mountExternalData){let T=[];for(let z of e.externalData){let C=typeof z=="string"?z:z.path;T.push(f0(typeof z=="string"?z:z.data).then(v=>{n.mountExternalData(C,v)}))}await Promise.all(T)}for(let T of e?.executionProviders??[])if((typeof T=="string"?T:T.name)==="webnn"){if(n.shouldTransferToMLTensor=!1,typeof T!="string"){let z=T,C=z?.context,v=z?.gpuDevice,G=z?.deviceType,X=z?.powerPreference;C?n.currentContext=C:v?n.currentContext=await n.webnnCreateMLContext(v):n.currentContext=await n.webnnCreateMLContext({deviceType:G,powerPreference:X})}else n.currentContext=await n.webnnCreateMLContext();break}o=await n._OrtCreateSession(r,s,a),n.webgpuOnCreateSession?.(o),o===0&&Ie("Can't create a session."),n.jsepOnCreateSession?.(),n.currentContext&&(n.webnnRegisterMLContext(o,n.currentContext),n.currentContext=void 0,n.shouldTransferToMLTensor=!0);let[f,m]=qk(o),_=!!e?.enableGraphCapture,w=[],x=[],k=[],E=[],M=[];for(let T=0;T<f;T++){let[z,C,v]=Ky(o,T);z===0&&Ie("Can't get an input name."),u.push(z);let G=n.UTF8ToString(z);w.push(G),k.push(C===0?{name:G,isTensor:!1}:{name:G,isTensor:!0,type:wu(C),shape:v})}for(let T=0;T<m;T++){let[z,C,v]=Ky(o,T+f);z===0&&Ie("Can't get an output name."),d.push(z);let G=n.UTF8ToString(z);x.push(G),E.push(C===0?{name:G,isTensor:!1}:{name:G,isTensor:!0,type:wu(C),shape:v});{if(_&&e?.preferredOutputLocation===void 0){M.push("gpu-buffer");continue}let X=typeof e?.preferredOutputLocation=="string"?e.preferredOutputLocation:e?.preferredOutputLocation?.[G]??"cpu",V=n.webnnIsGraphOutput;if(X==="cpu"&&V&&V(o,G)){M.push("ml-tensor-cpu-output");continue}if(X!=="cpu"&&X!=="cpu-pinned"&&X!=="gpu-buffer"&&X!=="ml-tensor")throw new Error(`Not supported 
preferred output location: ${X}.`);if(_&&X!=="gpu-buffer")throw new Error(`Not supported preferred output location: ${X}. Only 'gpu-buffer' location is supported when enableGraphCapture is true.`);M.push(X)}}let I=null;return M.some(T=>T==="gpu-buffer"||T==="ml-tensor"||T==="ml-tensor-cpu-output")&&(i=n._OrtCreateBinding(o),i===0&&Ie("Can't create IO binding."),I={handle:i,outputPreferredLocations:M,outputPreferredLocationsEncoded:M.map(T=>T==="ml-tensor-cpu-output"?"ml-tensor":T).map(T=>e0(T))}),Fr.set(o,[o,u,d,I,_,!1]),[o,w,x,k,E]}catch(f){throw u.forEach(m=>n._OrtFree(m)),d.forEach(m=>n._OrtFree(m)),i!==0&&n._OrtReleaseBinding(i)!==0&&Ie("Can't release IO binding."),o!==0&&n._OrtReleaseSession(o)!==0&&Ie("Can't release session."),f}finally{n._free(r),a!==0&&n._OrtReleaseSessionOptions(a)!==0&&Ie("Can't release session options."),l.forEach(f=>n._free(f)),n.unmountExternalData?.()}},g0=t=>{let e=Ue(),r=Fr.get(t);if(!r)throw new Error(`cannot release session. invalid session id: ${t}`);let[s,n,o,a,i]=r;a&&(i&&e._OrtClearBoundOutputs(a.handle)!==0&&Ie("Can't clear bound outputs."),e._OrtReleaseBinding(a.handle)!==0&&Ie("Can't release IO binding.")),e.jsepOnReleaseSession?.(t),e.webnnOnReleaseSession?.(t),e.webgpuOnReleaseSession?.(t),n.forEach(l=>e._OrtFree(l)),o.forEach(l=>e._OrtFree(l)),e._OrtReleaseSession(s)!==0&&Ie("Can't release session."),Fr.delete(t)},Yy=async(t,e,r,s,n,o,a=!1)=>{if(!t){e.push(0);return}let i=Ue(),l=i.PTR_SIZE,u=t[0],d=t[1],f=t[3],m=f,_,w;if(u==="string"&&(f==="gpu-buffer"||f==="ml-tensor"))throw new Error("String tensor is not supported on GPU.");if(a&&f!=="gpu-buffer")throw new Error(`External buffer must be provided for input/output index ${o} when enableGraphCapture is true.`);if(f==="gpu-buffer"){let E=t[2].gpuBuffer;w=hn(ws(u),d);{let M=i.webgpuRegisterBuffer;if(!M)throw new Error('Tensor location "gpu-buffer" is not supported without using WebGPU.');_=M(E,s)}}else if(f==="ml-tensor"){let E=t[2].mlTensor;w=hn(ws(u),d);let 
M=i.webnnRegisterMLTensor;if(!M)throw new Error('Tensor location "ml-tensor" is not supported without using WebNN.');_=M(s,E,ws(u),d)}else{let E=t[2];if(Array.isArray(E)){w=l*E.length,_=i._malloc(w),r.push(_);for(let M=0;M<E.length;M++){if(typeof E[M]!="string")throw new TypeError(`tensor data at index ${M} is not a string`);i.setValue(_+M*l,It(E[M],r),"*")}}else{let M=i.webnnIsGraphInput,I=i.webnnIsGraphOutput;if(u!=="string"&&M&&I){let T=i.UTF8ToString(n);if(M(s,T)||I(s,T)){let z=ws(u);w=hn(z,d),m="ml-tensor";let C=i.webnnCreateTemporaryTensor,v=i.webnnUploadTensor;if(!C||!v)throw new Error('Tensor location "ml-tensor" is not supported without using WebNN.');let G=await C(s,z,d);v(G,new Uint8Array(E.buffer,E.byteOffset,E.byteLength)),_=G}else w=E.byteLength,_=i._malloc(w),r.push(_),i.HEAPU8.set(new Uint8Array(E.buffer,E.byteOffset,w),_)}else w=E.byteLength,_=i._malloc(w),r.push(_),i.HEAPU8.set(new Uint8Array(E.buffer,E.byteOffset,w),_)}}let x=i.stackSave(),k=i.stackAlloc(4*d.length);try{d.forEach((M,I)=>i.setValue(k+I*l,M,l===4?"i32":"i64"));let E=i._OrtCreateTensor(ws(u),_,w,k,d.length,e0(m));E===0&&Ie(`Can't create tensor for input/output. session=${s}, index=${o}.`),e.push(E)}finally{i.stackRestore(x)}},w0=async(t,e,r,s,n,o)=>{let a=Ue(),i=a.PTR_SIZE,l=Fr.get(t);if(!l)throw new Error(`cannot run inference. 
invalid session id: ${t}`);let u=l[0],d=l[1],f=l[2],m=l[3],_=l[4],w=l[5],x=e.length,k=s.length,E=0,M=[],I=[],T=[],z=[],C=[],v=a.stackSave(),G=a.stackAlloc(x*i),X=a.stackAlloc(x*i),V=a.stackAlloc(k*i),Q=a.stackAlloc(k*i);try{[E,M]=xE(o),Gr("wasm prepareInputOutputTensor");for(let P=0;P<x;P++)await Yy(r[P],I,z,t,d[e[P]],e[P],_);for(let P=0;P<k;P++)await Yy(n[P],T,z,t,f[s[P]],x+s[P],_);qr("wasm prepareInputOutputTensor");for(let P=0;P<x;P++)a.setValue(G+P*i,I[P],"*"),a.setValue(X+P*i,d[e[P]],"*");for(let P=0;P<k;P++)a.setValue(V+P*i,T[P],"*"),a.setValue(Q+P*i,f[s[P]],"*");if(m&&!w){let{handle:P,outputPreferredLocations:se,outputPreferredLocationsEncoded:ie}=m;if(d.length!==x)throw new Error(`input count from feeds (${x}) is expected to be always equal to model's input count (${d.length}).`);Gr("wasm bindInputsOutputs");for(let S=0;S<x;S++){let L=e[S];await a._OrtBindInput(P,d[L],I[S])!==0&&Ie(`Can't bind input[${S}] for session=${t}.`)}for(let S=0;S<k;S++){let L=s[S];n[S]?.[3]?(C.push(T[S]),a._OrtBindOutput(P,f[L],T[S],0)!==0&&Ie(`Can't bind pre-allocated output[${S}] for session=${t}.`)):a._OrtBindOutput(P,f[L],0,ie[L])!==0&&Ie(`Can't bind output[${S}] to ${se[S]} for session=${t}.`)}qr("wasm bindInputsOutputs"),Fr.set(t,[u,d,f,m,_,!0])}a.jsepOnRunStart?.(u),a.webnnOnRunStart?.(u);let K;m?K=await a._OrtRunWithBinding(u,m.handle,k,V,E):K=await a._OrtRun(u,X,G,x,Q,k,V,E),K!==0&&Ie("failed to call OrtRun().");let Y=[],B=[];Gr("wasm ProcessOutputTensor");for(let P=0;P<k;P++){let se=Number(a.getValue(V+P*i,"*"));if(se===T[P]||C.includes(T[P])){Y.push(n[P]),se!==T[P]&&a._OrtReleaseTensor(se)!==0&&Ie("Can't release tensor.");continue}let ie=a.stackSave(),S=a.stackAlloc(4*i),L=!1,R,te=0;try{a._OrtGetTensorData(se,S,S+i,S+2*i,S+3*i)!==0&&Ie(`Can't access output tensor data on index ${P}.`);let ue=i===4?"i32":"i64",Be=Number(a.getValue(S,ue));te=a.getValue(S+i,"*");let Pe=a.getValue(S+i*2,"*"),vt=Number(a.getValue(S+i*3,ue)),Qe=[];for(let 
Me=0;Me<vt;Me++)Qe.push(Number(a.getValue(Pe+Me*i,ue)));a._OrtFree(Pe)!==0&&Ie("Can't free memory for tensor dims.");let et=Qe.reduce((Me,xe)=>Me*xe,1);R=wu(Be);let st=m?.outputPreferredLocations[s[P]];if(R==="string"){if(st==="gpu-buffer"||st==="ml-tensor")throw new Error("String tensor is not supported on GPU.");let Me=[];for(let xe=0;xe<et;xe++){let qe=a.getValue(te+xe*i,"*"),kt=a.getValue(te+(xe+1)*i,"*"),ge=xe===et-1?void 0:kt-qe;Me.push(a.UTF8ToString(qe,ge))}Y.push([R,Qe,Me,"cpu"])}else if(st==="gpu-buffer"&&et>0){let Me=a.webgpuGetBuffer;if(!Me)throw new Error('preferredLocation "gpu-buffer" is not supported without using WebGPU.');let xe=Me(te),qe=hn(Be,et);if(qe===void 0||!p0(R))throw new Error(`Unsupported data type: ${R}`);L=!0;{a.webgpuRegisterBuffer(xe,t,te);let kt=a.webgpuCreateDownloader(xe,qe,t);Y.push([R,Qe,{gpuBuffer:xe,download:async()=>{let ge=await kt();return new(li(R))(ge)},dispose:()=>{a._OrtReleaseTensor(se)!==0&&Ie("Can't release tensor.")}},"gpu-buffer"])}}else if(st==="ml-tensor"&&et>0){let Me=a.webnnEnsureTensor,xe=a.webnnIsGraphInputOutputTypeSupported;if(!Me||!xe)throw new Error('preferredLocation "ml-tensor" is not supported without using WebNN.');if(hn(Be,et)===void 0||!d0(R))throw new Error(`Unsupported data type: ${R}`);if(!xe(t,R,!1))throw new Error(`preferredLocation "ml-tensor" for ${R} output is not supported by current WebNN Context.`);let qe=await Me(t,te,Be,Qe,!1);L=!0,Y.push([R,Qe,{mlTensor:qe,download:a.webnnCreateMLTensorDownloader(te,R),dispose:()=>{a.webnnReleaseTensorId(te),a._OrtReleaseTensor(se)}},"ml-tensor"])}else if(st==="ml-tensor-cpu-output"&&et>0){let Me=a.webnnCreateMLTensorDownloader(te,R)(),xe=Y.length;L=!0,B.push((async()=>{let qe=[xe,await Me];return a.webnnReleaseTensorId(te),a._OrtReleaseTensor(se),qe})()),Y.push([R,Qe,[],"cpu"])}else{let Me=li(R),xe=new Me(et);new 
Uint8Array(xe.buffer,xe.byteOffset,xe.byteLength).set(a.HEAPU8.subarray(te,te+xe.byteLength)),Y.push([R,Qe,xe,"cpu"])}}finally{a.stackRestore(ie),R==="string"&&te&&a._free(te),L||a._OrtReleaseTensor(se)}}m&&!_&&(a._OrtClearBoundOutputs(m.handle)!==0&&Ie("Can't clear bound outputs."),Fr.set(t,[u,d,f,m,_,!1]));for(let[P,se]of await Promise.all(B))Y[P][2]=se;return qr("wasm ProcessOutputTensor"),Y}finally{a.webnnOnRunEnd?.(u),a.stackRestore(v),r.forEach(K=>{K&&K[3]==="gpu-buffer"&&a.webgpuUnregisterBuffer(K[2].gpuBuffer)}),n.forEach(K=>{K&&K[3]==="gpu-buffer"&&a.webgpuUnregisterBuffer(K[2].gpuBuffer)}),I.forEach(K=>a._OrtReleaseTensor(K)),T.forEach(K=>a._OrtReleaseTensor(K)),z.forEach(K=>a._free(K)),E!==0&&a._OrtReleaseRunOptions(E),M.forEach(K=>a._free(K))}},x0=t=>{let e=Ue(),r=Fr.get(t);if(!r)throw new Error("invalid session id");let s=r[0],n=e._OrtEndProfiling(s);n===0&&Ie("Can't get an profile file name."),e._OrtFree(n)},y0=t=>{let e=[];for(let r of t){let s=r[2];!Array.isArray(s)&&"buffer"in s&&e.push(s.buffer)}return e}}),jr,Ft,mn,oi,ai,_u,Qy,gu,hs,_s,Wk,OE,IE,CE,PE,zE,LE,NE,$E=ye(()=>{"use strict";vs(),SE(),ks(),l0(),jr=()=>!!Ve.wasm.proxy&&typeof document<"u",mn=!1,oi=!1,ai=!1,gu=new Map,hs=(t,e)=>{let r=gu.get(t);r?r.push(e):gu.set(t,[e])},_s=()=>{if(mn||!oi||ai||!Ft)throw new Error("worker not ready")},Wk=t=>{switch(t.data.type){case"init-wasm":mn=!1,t.data.err?(ai=!0,Qy[1](t.data.err)):(oi=!0,Qy[0]()),_u&&(URL.revokeObjectURL(_u),_u=void 0);break;case"init-ep":case"copy-from":case"create":case"release":case"run":case"end-profiling":{let e=gu.get(t.data.type);t.data.err?e.shift()[1](t.data.err):e.shift()[0](t.data.out);break}default:}},OE=async()=>{if(!oi){if(mn)throw new Error("multiple calls to 'initWasm()' detected.");if(ai)throw new Error("previous call to 'initWasm()' failed.");if(mn=!0,jr())return new Promise((t,e)=>{Ft?.terminate(),gE().then(([r,s])=>{try{Ft=s,Ft.onerror=o=>e(o),Ft.onmessage=Wk,Qy=[t,e];let 
n={type:"init-wasm",in:Ve};!n.in.wasm.wasmPaths&&(r||Zy)&&(n.in.wasm.wasmPaths={wasm:new URL("ort-wasm-simd-threaded.asyncify.wasm",Qt.url).href}),Ft.postMessage(n),_u=r}catch(n){e(n)}},e)});try{await c0(Ve.wasm),await m0(Ve),oi=!0}catch(t){throw ai=!0,t}finally{mn=!1}}},IE=async t=>{if(jr())return _s(),new Promise((e,r)=>{hs("init-ep",[e,r]);let s={type:"init-ep",in:{epName:t,env:Ve}};Ft.postMessage(s)});await h0(Ve,t)},CE=async t=>jr()?(_s(),new Promise((e,r)=>{hs("copy-from",[e,r]);let s={type:"copy-from",in:{buffer:t}};Ft.postMessage(s,[t.buffer])})):ku(t),PE=async(t,e)=>{if(jr()){if(e?.preferredOutputLocation)throw new Error('session option "preferredOutputLocation" is not supported for proxy.');return _s(),new Promise((r,s)=>{hs("create",[r,s]);let n={type:"create",in:{model:t,options:{...e}}},o=[];t instanceof Uint8Array&&o.push(t.buffer),Ft.postMessage(n,o)})}else return _0(t,e)},zE=async t=>{if(jr())return _s(),new Promise((e,r)=>{hs("release",[e,r]);let s={type:"release",in:t};Ft.postMessage(s)});g0(t)},LE=async(t,e,r,s,n,o)=>{if(jr()){if(r.some(a=>a[3]!=="cpu"))throw new Error("input tensor on GPU is not supported for proxy.");if(n.some(a=>a))throw new Error("pre-allocated output tensor is not supported for proxy.");return _s(),new Promise((a,i)=>{hs("run",[a,i]);let l=r,u={type:"run",in:{sessionId:t,inputIndices:e,inputs:l,outputIndices:s,options:o}};Ft.postMessage(u,y0(l))})}else return w0(t,e,r,s,n,o)},NE=async t=>{if(jr())return _s(),new Promise((e,r)=>{hs("end-profiling",[e,r]);let s={type:"end-profiling",in:t};Ft.postMessage(s)});x0(t)}}),Jy,Vk,RE,tP=ye(()=>{"use strict";vs(),$E(),_n(),i0(),bE(),Jy=(t,e)=>{switch(t.location){case"cpu":return[t.type,t.dims,t.data,"cpu"];case"gpu-buffer":return[t.type,t.dims,{gpuBuffer:t.gpuBuffer},"gpu-buffer"];case"ml-tensor":return[t.type,t.dims,{mlTensor:t.mlTensor},"ml-tensor"];default:throw new Error(`invalid data location: ${t.location} for ${e()}`)}},Vk=t=>{switch(t[3]){case"cpu":return new 
Jt(t[0],t[2],t[1]);case"gpu-buffer":{let e=t[0];if(!p0(e))throw new Error(`not supported data type: ${e} for deserializing GPU tensor`);let{gpuBuffer:r,download:s,dispose:n}=t[2];return Jt.fromGpuBuffer(r,{dataType:e,dims:t[1],download:s,dispose:n})}case"ml-tensor":{let e=t[0];if(!d0(e))throw new Error(`not supported data type: ${e} for deserializing MLTensor tensor`);let{mlTensor:r,download:s,dispose:n}=t[2];return Jt.fromMLTensor(r,{dataType:e,dims:t[1],download:s,dispose:n})}default:throw new Error(`invalid data location: ${t[3]}`)}},RE=class{async fetchModelAndCopyToWasmMemory(t){return CE(await f0(t))}async loadModel(t,e){ys();let r;typeof t=="string"?r=await this.fetchModelAndCopyToWasmMemory(t):r=t,[this.sessionId,this.inputNames,this.outputNames,this.inputMetadata,this.outputMetadata]=await PE(r,e),bs()}async dispose(){return zE(this.sessionId)}async run(t,e,r){ys();let s=[],n=[];Object.entries(t).forEach(f=>{let m=f[0],_=f[1],w=this.inputNames.indexOf(m);if(w===-1)throw new Error(`invalid input '${m}'`);s.push(_),n.push(w)});let o=[],a=[];Object.entries(e).forEach(f=>{let m=f[0],_=f[1],w=this.outputNames.indexOf(m);if(w===-1)throw new Error(`invalid output '${m}'`);o.push(_),a.push(w)});let i=s.map((f,m)=>Jy(f,()=>`input "${this.inputNames[n[m]]}"`)),l=o.map((f,m)=>f?Jy(f,()=>`output "${this.outputNames[a[m]]}"`):null),u=await LE(this.sessionId,n,i,a,l,r),d={};for(let f=0;f<u.length;f++)d[this.outputNames[a[f]]]=o[f]??Vk(u[f]);return bs(),d}startProfiling(){}endProfiling(){NE(this.sessionId)}}}),UE={};ci(UE,{OnnxruntimeWebAssemblyBackend:()=>s0,initializeFlags:()=>r0,wasmBackend:()=>BE});var r0,s0,BE,rP=ye(()=>{"use strict";vs(),$E(),tP(),r0=()=>{(typeof Ve.wasm.initTimeout!="number"||Ve.wasm.initTimeout<0)&&(Ve.wasm.initTimeout=0);let t=Ve.wasm.simd;if(typeof t!="boolean"&&t!==void 0&&t!=="fixed"&&t!=="relaxed"&&(console.warn(`Property "env.wasm.simd" is set to unknown value "${t}". 
Reset it to \`false\` and ignore SIMD feature checking.`),Ve.wasm.simd=!1),typeof Ve.wasm.proxy!="boolean"&&(Ve.wasm.proxy=!1),typeof Ve.wasm.trace!="boolean"&&(Ve.wasm.trace=!1),typeof Ve.wasm.numThreads!="number"||!Number.isInteger(Ve.wasm.numThreads)||Ve.wasm.numThreads<=0)if(typeof self<"u"&&!self.crossOriginIsolated)Ve.wasm.numThreads=1;else{let e=typeof navigator>"u"?zC("node:os").cpus().length:navigator.hardwareConcurrency;Ve.wasm.numThreads=Math.min(4,Math.ceil((e||1)/2))}},s0=class{async init(t){r0(),await OE(),await IE(t)}async createInferenceSessionHandler(t,e){let r=new RE;return await r.loadModel(t,e),r}},BE=new s0});vs();vs();vs();var sP="1.25.0-dev.20260212-1a71a5f46e",nP=pE;{let t=(rP(),xu(UE)).wasmBackend;xs("webgpu",t,5),xs("webnn",t,5),xs("cpu",t,10),xs("wasm",t,10)}Object.defineProperty(Ve.versions,"web",{value:sP,enumerable:!0});var v0={};async function DE(t){let e=t.split("/").pop(),r;try{if(r=await lu(),r){let n=await r.match(t);if(n)return n}}catch(n){console.warn(`Failed to load ${e} from cache:`,n)}let s=await fetch(t);if(!s.ok)throw new Error(`Failed to fetch ${e}: ${s.status} ${s.statusText}`);if(r)try{await r.put(t,s.clone())}catch(n){console.warn(`Failed to cache ${e}:`,n)}return s}async function FE(t){let e=await DE(t);if(!e||typeof e=="string")return null;try{return await e.arrayBuffer()}catch(r){return console.warn("Failed to read WASM binary:",r),null}}async function jE(t){let e=await DE(t);if(!e||typeof e=="string")return null;try{let r=await e.text(),s=t.split("/").slice(0,-1).join("/");r=r.replace(/import\.meta\.url/g,`"${s}"`);let n=new Blob([r],{type:"text/javascript"});return URL.createObjectURL(n)}catch(r){return console.warn("Failed to read WASM binary:",r),null}}function k0(t){return dn(t,["blob:"])}function E0(t){let e;if(typeof location<"u"&&location.href)e=location.href;else if(typeof v0<"u"&&v0.url)e=v0.url;else return t;return new URL(t,e).href}var 
M0=require("onnxruntime-common"),aP=Object.freeze({auto:null,gpu:null,cpu:"cpu",wasm:"wasm",webgpu:"webgpu",cuda:"cuda",dml:"dml",coreml:"coreml",webnn:{name:"webnn",deviceType:"cpu"},"webnn-npu":{name:"webnn",deviceType:"npu"},"webnn-gpu":{name:"webnn",deviceType:"gpu"},"webnn-cpu":{name:"webnn",deviceType:"cpu"}}),iP=["verbose","info","warning","error","fatal"],VE=4,jt=[],A0,wn,GE=Symbol.for("onnxruntime");if(GE in globalThis)wn=globalThis[GE];else if(be.IS_NODE_ENV){switch(wn=oP,process.platform){case"win32":jt.push("dml");break;case"linux":process.arch==="x64"&&jt.push("cuda");break;case"darwin":jt.push("coreml");break}jt.push("webgpu"),jt.push("cpu"),A0=["cpu"]}else wn=b0,be.IS_WEBNN_AVAILABLE&&jt.push("webnn-npu","webnn-gpu","webnn-cpu","webnn"),be.IS_WEBGPU_AVAILABLE&&jt.push("webgpu"),jt.push("wasm"),A0=["wasm"];var lP=wn.InferenceSession;function HE(t=null){if(!t)return A0;switch(t){case"auto":return jt;case"gpu":return jt.filter(e=>["webgpu","cuda","dml","webnn-gpu"].includes(e))}if(jt.includes(t))return[aP[t]??t];throw new Error(`Unsupported device: "${t}". 
Should be one of: ${jt.join(", ")}.`)}var XE=be.IS_BROWSER_ENV||be.IS_WEBWORKER_ENV,qE=Promise.resolve(),gn=null;async function cP(){return gn||(De.useWasmCache&&typeof ft?.wasm?.wasmPaths=="object"&&ft?.wasm?.wasmPaths?.wasm&&ft?.wasm?.wasmPaths?.mjs?(gn=(async()=>{let e=ft.wasm.wasmPaths;await Promise.all([e.wasm&&!k0(e.wasm)?(async()=>{try{let r=await FE(E0(e.wasm));r&&(ft.wasm.wasmBinary=r)}catch(r){console.warn("Failed to pre-load WASM binary:",r)}})():Promise.resolve(),e.mjs&&!k0(e.mjs)?(async()=>{try{let r=await jE(E0(e.mjs));r&&(ft.wasm.wasmPaths.mjs=r)}catch(r){console.warn("Failed to pre-load WASM factory:",r)}})():Promise.resolve()])})(),gn):(gn=Promise.resolve(),gn))}async function Eu(t,e,r){await cP();let s=()=>lP.create(t,{logSeverityLevel:VE,...e}),n=await(XE?qE=qE.then(s):s());return n.config=r,n}var WE=Promise.resolve();async function Au(t,e){let r=()=>t.run(e);return await(XE?WE=WE.then(r):r())}function Mu(t){return t instanceof wn.Tensor}var ft=wn?.env;ft.logLevel=iP[VE];if(ft?.wasm){if(!(typeof ServiceWorkerGlobalScope<"u"&&self instanceof ServiceWorkerGlobalScope)&&ft.versions?.web&&!ft.wasm.wasmPaths){let t=`https://cdn.jsdelivr.net/npm/onnxruntime-web@${ft.versions.web}/dist/`;ft.wasm.wasmPaths=be.IS_SAFARI?{mjs:`${t}ort-wasm-simd-threaded.mjs`,wasm:`${t}ort-wasm-simd-threaded.wasm`}:{mjs:`${t}ort-wasm-simd-threaded.asyncify.mjs`,wasm:`${t}ort-wasm-simd-threaded.asyncify.wasm`}}ft.wasm.proxy=!1}ft?.webgpu&&(ft.webgpu.powerPreference="high-performance");function ui(){return ft?.wasm?.proxy}De.backends.onnx=ft;var Wr=async(t,e,r)=>{let s=await Eu(new Uint8Array(t),e);return(async n=>{let o=ui(),a=Object.fromEntries(Object.entries(n).map(([l,u])=>[l,(o?u.clone():u).ort_tensor])),i=await Au(s,a);return Array.isArray(r)?r.map(l=>new U(i[l])):new U(i[r])})},lr=class{static session_options={};static get nearest_interpolate_4d(){return 
this._nearest_interpolate_4d||(this._nearest_interpolate_4d=Wr([8,10,18,0,58,129,1,10,41,10,1,120,10,0,10,0,10,1,115,18,1,121,34,6,82,101,115,105,122,101,42,18,10,4,109,111,100,101,34,7,110,101,97,114,101,115,116,160,1,3,18,1,114,90,31,10,1,120,18,26,10,24,8,1,18,20,10,3,18,1,98,10,3,18,1,99,10,3,18,1,104,10,3,18,1,119,90,15,10,1,115,18,10,10,8,8,7,18,4,10,2,8,4,98,31,10,1,121,18,26,10,24,8,1,18,20,10,3,18,1,98,10,3,18,1,99,10,3,18,1,104,10,3,18,1,119,66,2,16,21],this.session_options,"y")),this._nearest_interpolate_4d}static get bilinear_interpolate_4d(){return this._bilinear_interpolate_4d||(this._bilinear_interpolate_4d=Wr([8,9,18,0,58,128,1,10,40,10,1,120,10,0,10,0,10,1,115,18,1,121,34,6,82,101,115,105,122,101,42,17,10,4,109,111,100,101,34,6,108,105,110,101,97,114,160,1,3,18,1,114,90,31,10,1,120,18,26,10,24,8,1,18,20,10,3,18,1,98,10,3,18,1,99,10,3,18,1,104,10,3,18,1,119,90,15,10,1,115,18,10,10,8,8,7,18,4,10,2,8,4,98,31,10,1,121,18,26,10,24,8,1,18,20,10,3,18,1,98,10,3,18,1,99,10,3,18,1,104,10,3,18,1,119,66,2,16,20],this.session_options,"y")),this._bilinear_interpolate_4d}static get bicubic_interpolate_4d(){return this._bicubic_interpolate_4d||(this._bicubic_interpolate_4d=Wr([8,9,18,0,58,127,10,39,10,1,120,10,0,10,0,10,1,115,18,1,121,34,6,82,101,115,105,122,101,42,16,10,4,109,111,100,101,34,5,99,117,98,105,99,160,1,3,18,1,114,90,31,10,1,120,18,26,10,24,8,1,18,20,10,3,18,1,98,10,3,18,1,99,10,3,18,1,104,10,3,18,1,119,90,15,10,1,115,18,10,10,8,8,7,18,4,10,2,8,4,98,31,10,1,121,18,26,10,24,8,1,18,20,10,3,18,1,98,10,3,18,1,99,10,3,18,1,104,10,3,18,1,119,66,2,16,20],this.session_options,"y")),this._bicubic_interpolate_4d}static get matmul(){return this._matmul||(this._matmul=Wr([8,9,18,0,58,55,10,17,10,1,97,10,1,98,18,1,99,34,6,77,97,116,77,117,108,18,1,114,90,9,10,1,97,18,4,10,2,8,1,90,9,10,1,98,18,4,10,2,8,1,98,9,10,1,99,18,4,10,2,8,1,66,2,16,20],this.session_options,"c")),this._matmul}static get stft(){return 
this._stft||(this._stft=Wr([8,7,18,0,58,148,1,10,38,10,1,115,10,1,106,10,1,119,10,1,108,18,1,111,34,4,83,84,70,84,42,15,10,8,111,110,101,115,105,100,101,100,24,1,160,1,2,18,1,115,90,26,10,1,115,18,21,10,19,8,1,18,15,10,3,18,1,98,10,3,18,1,115,10,3,18,1,99,90,11,10,1,106,18,6,10,4,8,7,18,0,90,16,10,1,119,18,11,10,9,8,1,18,5,10,3,18,1,119,90,11,10,1,108,18,6,10,4,8,7,18,0,98,31,10,1,111,18,26,10,24,8,1,18,20,10,3,18,1,98,10,3,18,1,102,10,3,18,1,100,10,3,18,1,99,66,2,16,17],this.session_options,"o")),this._stft}static get rfft(){return this._rfft||(this._rfft=Wr([8,9,18,0,58,97,10,33,10,1,120,10,0,10,1,97,18,1,121,34,3,68,70,84,42,15,10,8,111,110,101,115,105,100,101,100,24,1,160,1,2,18,1,100,90,21,10,1,120,18,16,10,14,8,1,18,10,10,3,18,1,115,10,3,18,1,99,90,11,10,1,97,18,6,10,4,8,7,18,0,98,21,10,1,121,18,16,10,14,8,1,18,10,10,3,18,1,115,10,3,18,1,99,66,2,16,20],this.session_options,"y")),this._rfft}static get top_k(){return this._top_k||(this._top_k=Wr([8,10,18,0,58,73,10,18,10,1,120,10,1,107,18,1,118,18,1,105,34,4,84,111,112,75,18,1,116,90,9,10,1,120,18,4,10,2,8,1,90,15,10,1,107,18,10,10,8,8,7,18,4,10,2,8,1,98,9,10,1,118,18,4,10,2,8,1,98,9,10,1,105,18,4,10,2,8,7,66,2,16,21],this.session_options,["v","i"])),this._top_k}static get slice(){return this._slice||(this._slice=Wr([8,7,18,0,58,96,10,25,10,1,120,10,1,115,10,1,101,10,1,97,10,1,116,18,1,121,34,5,83,108,105,99,101,18,1,114,90,9,10,1,120,18,4,10,2,8,1,90,9,10,1,115,18,4,10,2,8,7,90,9,10,1,101,18,4,10,2,8,7,90,9,10,1,97,18,4,10,2,8,7,90,9,10,1,116,18,4,10,2,8,7,98,9,10,1,121,18,4,10,2,8,1,66,2,16,13],this.session_options,"y")),this._slice}};var KE=Object.freeze({auto:"auto",gpu:"gpu",cpu:"cpu",wasm:"wasm",webgpu:"webgpu",cuda:"cuda",dml:"dml",coreml:"coreml",webnn:"webnn","webnn-npu":"webnn-npu","webnn-gpu":"webnn-gpu","webnn-cpu":"webnn-cpu"});var YE=(function(){let t;return async function(){if(t===void 0)if(!be.IS_WEBGPU_AVAILABLE)t=!1;else try{t=(await 
navigator.gpu.requestAdapter()).features.has("shader-f16")}catch{t=!1}return t}})(),mt=Object.freeze({auto:"auto",fp32:"fp32",fp16:"fp16",q8:"q8",int8:"int8",uint8:"uint8",q4:"q4",bnb4:"bnb4",q4f16:"q4f16"}),T0=Object.freeze({[KE.wasm]:mt.q8}),S0=Object.freeze({[mt.fp32]:"",[mt.fp16]:"_fp16",[mt.int8]:"_int8",[mt.uint8]:"_uint8",[mt.q8]:"_quantized",[mt.q4]:"_q4",[mt.q4f16]:"_q4f16",[mt.bnb4]:"_bnb4"}),xn=Object.freeze({float32:Float32Array,float16:typeof Float16Array<"u"?Float16Array:Uint16Array,float64:Float64Array,string:Array,int8:Int8Array,uint8:Uint8Array,int16:Int16Array,uint16:Uint16Array,int32:Int32Array,uint32:Uint32Array,int64:BigInt64Array,uint64:BigUint64Array,bool:Uint8Array,uint4:Uint8Array,int4:Int8Array});var U=class t{get dims(){return this.ort_tensor.dims}set dims(e){this.ort_tensor.dims=e}get type(){return this.ort_tensor.type}get data(){return this.ort_tensor.data}get size(){return this.ort_tensor.size}get location(){return this.ort_tensor.location}ort_tensor;constructor(...e){return Mu(e[0])?this.ort_tensor=e[0]:this.ort_tensor=new M0.Tensor(e[0],e[1],e[2]),new Proxy(this,{get:(r,s)=>{if(typeof s=="string"){let n=Number(s);if(Number.isInteger(n))return r._getitem(n)}return r[s]},set:(r,s,n)=>r[s]=n})}dispose(){this.ort_tensor.dispose()}*[Symbol.iterator](){let[e,...r]=this.dims;if(r.length>0){let s=r.reduce((n,o)=>n*o);for(let n=0;n<e;++n)yield this._subarray(n,s,r)}else yield*this.data}_getitem(e){let[r,...s]=this.dims;if(e=cr(e,r),s.length>0){let n=s.reduce((o,a)=>o*a);return this._subarray(e,n,s)}else return new t(this.type,[this.data[e]],s)}indexOf(e){let r=this.data;for(let s=0;s<r.length;++s)if(r[s]==e)return s;return-1}_subarray(e,r,s){let n=e*r,o=(e+1)*r,a="subarray"in this.data?this.data.subarray(n,o):this.data.slice(n,o);return new t(this.type,a,s)}item(){let e=this.data;if(e.length!==1)throw new Error(`a Tensor with ${e.length} elements cannot be converted to Scalar`);return e[0]}tolist(){return 
uP(this.data,this.dims)}sigmoid(){return this.clone().sigmoid_()}sigmoid_(){let e=this.data;for(let r=0;r<e.length;++r)e[r]=1/(1+Math.exp(-e[r]));return this}map(e){return this.clone().map_(e)}map_(e){let r=this.data;for(let s=0;s<r.length;++s)r[s]=e(r[s],s,r);return this}mul(e){return this.clone().mul_(e)}mul_(e){let r=this.data;for(let s=0;s<r.length;++s)r[s]*=e;return this}div(e){return this.clone().div_(e)}div_(e){let r=this.data;for(let s=0;s<r.length;++s)r[s]/=e;return this}add(e){return this.clone().add_(e)}add_(e){let r=this.data;for(let s=0;s<r.length;++s)r[s]+=e;return this}sub(e){return this.clone().sub_(e)}sub_(e){let r=this.data;for(let s=0;s<r.length;++s)r[s]-=e;return this}clone(){return new t(this.type,this.data.slice(),this.dims.slice())}slice(...e){let r=[],s=[];for(let d=0;d<this.dims.length;++d){let f=e[d];if(f==null)s.push([0,this.dims[d]]),r.push(this.dims[d]);else if(typeof f=="number")f=cr(f,this.dims[d],d),s.push([f,f+1]);else if(Array.isArray(f)&&f.length===2){let[m,_]=f;if(m=m===null?0:cr(m,this.dims[d],d,!1),_=_===null?this.dims[d]:cr(_,this.dims[d],d,!1),m>_)throw new Error(`Invalid slice: ${f}`);let w=[Math.max(m,0),Math.min(_,this.dims[d])];s.push(w),r.push(w[1]-w[0])}else throw new Error(`Invalid slice: ${f}`)}let n=s.map(([d,f])=>f-d),o=n.reduce((d,f)=>d*f),a=this.data,i=new a.constructor(o),l=this.stride(),u=!0;for(let d=1;d<n.length;++d)if(s[d][0]!==0||s[d][1]!==this.dims[d]){u=!1;break}if(u){let d=s[0][0]*l[0],f=s[0][1]*l[0];if(ArrayBuffer.isView(a))i.set(a.subarray(d,f));else if(Array.isArray(a)){let m=a.slice(d,f);for(let _=0;_<m.length;++_)i[_]=m[_]}else throw new Error("Unsupported data type for slicing")}else for(let d=0;d<o;++d){let f=0;for(let m=n.length-1,_=d;m>=0;--m){let w=n[m];f+=(_%w+s[m][0])*l[m],_=Math.floor(_/w)}i[d]=a[f]}return new t(this.type,i,r)}permute(...e){return ZE(this,e)}transpose(...e){return this.permute(...e)}sum(e=null,r=!1){return this.norm(1,e,r)}norm(e="fro",r=null,s=!1){if(e==="fro")e=2;else 
if(typeof e=="string")throw Error(`Unsupported norm: ${e}`);let n=this.data,o=(u,d)=>u+d**e;if(r===null){let u=n.reduce(o,0)**(1/e);return new t(this.type,[u],[])}let[a,i,l]=pi(o,this,r,s);if(e!==1)for(let u=0;u<i.length;++u)i[u]=i[u]**(1/e);return new t(a,i,l)}normalize_(e=2,r=1){r=cr(r,this.dims.length);let s=this.norm(e,r,!0),n=this.data,o=s.data;for(let a=0;a<n.length;++a){let i=0;for(let l=this.dims.length-1,u=a,d=1;l>=0;--l){let f=this.dims[l];if(l!==r){let m=u%f;i+=m*d,d*=this.dims[l]}u=Math.floor(u/f)}n[a]/=o[i]}return this}normalize(e=2,r=1){return this.clone().normalize_(e,r)}stride(){return O0(this.dims)}squeeze(e=null){return new t(this.type,this.data,QE(this.dims,e))}squeeze_(e=null){return this.dims=QE(this.dims,e),this}unsqueeze(e){return new t(this.type,this.data,JE(this.dims,e))}unsqueeze_(e){return this.dims=JE(this.dims,e),this}flatten_(e=0,r=-1){r=(r+this.dims.length)%this.dims.length;let s=this.dims.slice(0,e),n=this.dims.slice(e,r+1),o=this.dims.slice(r+1);return this.dims=[...s,n.reduce((a,i)=>a*i,1),...o],this}flatten(e=0,r=-1){return this.clone().flatten_(e,r)}view(...e){let r=-1;for(let n=0;n<e.length;++n)if(e[n]===-1){if(r!==-1)throw new Error("Only one dimension can be inferred");r=n}let s=this.data;if(r!==-1){let n=e.reduce((o,a,i)=>i!==r?o*a:o,1);e[r]=s.length/n}return new t(this.type,s,e)}neg_(){let e=this.data;for(let r=0;r<e.length;++r)e[r]=-e[r];return this}neg(){return this.clone().neg_()}gt(e){let r=new Uint8Array(this.data.length),s=this.data;for(let n=0;n<s.length;++n)r[n]=s[n]>e?1:0;return new t("bool",r,this.dims)}lt(e){let r=new Uint8Array(this.data.length),s=this.data;for(let n=0;n<s.length;++n)r[n]=s[n]<e?1:0;return new t("bool",r,this.dims)}clamp_(e,r){let s=this.data;for(let n=0;n<s.length;++n)s[n]=Math.min(Math.max(s[n],e),r);return this}clamp(e,r){return this.clone().clamp_(e,r)}round_(){let e=this.data;for(let r=0;r<e.length;++r)e[r]=Math.round(e[r]);return this}round(){return 
this.clone().round_()}mean(e=null,r=!1){return fi(this,e,r)}min(e=null,r=!1){if(e===null){let a=ti(this.data)[0];return new t(this.type,[a],[])}let[s,n,o]=pi((a,i)=>Math.min(a,i),this,e,r,1/0);return new t(s,n,o)}max(e=null,r=!1){if(e===null){let a=Te(this.data)[0];return new t(this.type,[a],[])}let[s,n,o]=pi((a,i)=>Math.max(a,i),this,e,r,-1/0);return new t(s,n,o)}argmin(e=null,r=!1){if(e!==null)throw new Error("`dim !== null` not yet implemented.");let s=ti(this.data)[1];return new t("int64",[BigInt(s)],[])}argmax(e=null,r=!1){if(e!==null)throw new Error("`dim !== null` not yet implemented.");let s=Te(this.data)[1];return new t("int64",[BigInt(s)],[])}repeat(...e){if(e.length<this.dims.length)throw new Error(`Number of dimensions of repeat dims (${e.length}) cannot be smaller than number of dimensions of tensor (${this.dims.length})`);if(e.every(d=>d===1)){if(e.length===this.dims.length)return this.clone();let d=e.length-this.dims.length,f=Array(d).fill(1).concat(this.dims);return new t(this.type,this.data.slice(),f)}let r=e.length-this.dims.length,s=Array(r).fill(1).concat(this.dims),n=s.map((d,f)=>d*e[f]),o=n.reduce((d,f)=>d*f,1),a=this.data,i=new a.constructor(o),l=O0(s),u=O0(n);for(let d=0;d<o;++d){let f=d,m=0;for(let _=0;_<n.length;++_){let w=Math.floor(f/u[_]);f=f%u[_];let x=w%s[_];m+=x*l[_]}i[d]=a[m]}return new t(this.type,i,n)}tile(...e){if(e.length<this.dims.length){let r=this.dims.length-e.length;e=Array(r).fill(1).concat(e)}return this.repeat(...e)}to(e){if(this.type===e)return this;if(!xn.hasOwnProperty(e))throw new Error(`Unsupported type: ${e}`);let r,s=["int64","uint64"].includes(this.type),n=["int64","uint64"].includes(e);if(s&&!n)r=Number;else if(!s&&n)["float16","float32","float64"].includes(this.type)?r=o=>BigInt(Math.floor(o)):r=BigInt;else if(this.type==="float16"&&e=="float32"&&this.data instanceof Uint16Array)return new t(e,xk(this.data),this.dims);return new t(e,xn[e].from(this.data,r),this.dims)}};function uP(t,e){let 
r=t.length,s=e.reduce((o,a)=>o*a);if(r!==s)throw Error(`cannot reshape array of size ${r} into shape (${e})`);let n=t;for(let o=e.length-1;o>=0;o--)n=n.reduce((a,i)=>{let l=a[a.length-1];return l.length<e[o]?l.push(i):a.push([i]),a},[[]]);return n[0]}function ZE(t,e){let[r,s]=fk(t.data,t.dims,e);return new U(t.type,r,s)}function Su(t,[e,r],s="bilinear",n=!1){let o=t.dims.at(-3)??1,a=t.dims.at(-2),i=t.dims.at(-1),l=dk(t.data,[o,a,i],[e,r],s,n);return new U(t.type,l,[o,e,r])}async function Pt(t,{size:e=null,mode:r="bilinear"}={}){if(t.dims.length!==4)throw new Error("`interpolate_4d` currently only supports 4D input.");if(!e)throw new Error("`interpolate_4d` requires a `size` argument.");let s;if(e.length===2)s=[...t.dims.slice(0,2),...e];else if(e.length===3)s=[t.dims[0],...e];else if(e.length===4)s=e;else throw new Error("`size` must be of length 2, 3, or 4.");let n;if(r==="nearest")n=await lr.nearest_interpolate_4d;else if(r==="bilinear")n=await lr.bilinear_interpolate_4d;else if(r==="bicubic")n=await lr.bicubic_interpolate_4d;else throw new Error(`Unsupported mode: ${r}`);let o=new U("int64",new BigInt64Array(s.map(BigInt)),[s.length]);return await n({x:t,s:o})}async function I0(t,e){return await(await lr.matmul)({a:t,b:e})}async function pP(t,e){return await(await lr.rfft)({x:t,a:e})}async function Gt(t,e){let r=await lr.top_k;return e==null?e=t.dims.at(-1):e=Math.min(e,t.dims.at(-1)),await r({x:t,k:new U("int64",[BigInt(e)],[1])})}var Tu=t=>new U("int64",t,[t.length]);async function di(t,e,r,s,n){return await(await lr.slice)({x:t,s:Tu(e),e:Tu(r),a:Tu(s),t:Tu(n??new Array(s.length).fill(1))})}function C0(t,e){let r=t.data,s=e.data,n=[t.dims[0],t.dims[2]],o=new r.constructor(n[0]*n[1]),[a,i,l]=t.dims,u=0;for(let d=0;d<a;++d){let f=d*l*i;for(let m=0;m<l;++m){let _=0,w=0,x=d*i,k=f+m;for(let M=0;M<i;++M){let I=Number(s[x+M]);w+=I,_+=r[k+M*l]*I}let E=_/w;o[u++]=E}}return new U(t.type,o,n)}function dP(t,e,{eps:r=1e-5}={}){if(t.dims.length!==2)throw new 
/**
 * Compute the dimensions that remain after squeezing size-1 axes.
 *
 * @param {number[]} t Input dimensions (never mutated; a copy is returned).
 * @param {number|number[]|null} e Axis or axes to squeeze. `null` squeezes every
 *   size-1 axis. Negative values count from the end (`-1` is the last axis).
 * @returns {number[]} The squeezed dimensions.
 */
function QE(t, e) {
  const dims = t.slice();
  const rank = dims.length;
  // Map an in-range negative axis to its positive index. Out-of-range values
  // are passed through unchanged so they stay a silent no-op.
  const normalize = (axis) => (axis < 0 && axis >= -rank ? axis + rank : axis);

  if (e === null) {
    return dims.filter((size) => size !== 1);
  }
  if (typeof e === "number") {
    const axis = normalize(e);
    if (dims[axis] === 1) {
      dims.splice(axis, 1);
    }
    return dims;
  }
  if (Array.isArray(e)) {
    const axes = new Set(e.map(normalize));
    return dims.filter((size, index) => size !== 1 || !axes.has(index));
  }
  // Any other `dim` value (e.g. undefined) leaves the shape untouched.
  return dims;
}
/**
 * Convert a list of dimensions into row-major strides (in elements).
 *
 * @param {number[]} t Dimensions, outermost first.
 * @returns {number[]} Strides, where the last axis has stride 1.
 */
function O0(t) {
  const strides = new Array(t.length);
  let running = 1;
  let axis = t.length;
  // Walk from the innermost axis outwards, accumulating the product of the
  // dimensions already visited.
  while (axis-- > 0) {
    strides[axis] = running;
    running *= t[axis];
  }
  return strides;
}
/**
 * Look up the first usable special token among the given config keys.
 *
 * Keys are tried in order. A key is skipped when it is not an own property of
 * the config or when its value is falsy.
 *
 * @param {Object} t Tokenizer config object.
 * @param {...string} e Candidate keys, in priority order.
 * @returns {string|null} The token string (the `content` of an `AddedToken`
 *   object, or the raw value for non-objects), or `null` if no key matched.
 * @throws {Error} If a value is an object that is not tagged `__type: "AddedToken"`.
 */
function Es(t, ...e) {
  for (const key of e) {
    const item = Object.hasOwn(t, key) ? t[key] : undefined;
    if (!item) {
      continue;
    }
    if (typeof item !== "object") {
      return item;
    }
    if (item.__type === "AddedToken") {
      return item.content;
    }
    throw Error(`Unknown token: ${item}`);
  }
  return null;
}
o!="string"||typeof a!="string")throw new Error('Chat template must be a list of objects with "name" and "template" properties');n[o]=a}this.chat_template=n}this._compiled_template_cache=new Map;let s=gP(this._tokenizer);this.all_special_ids=s.map(n=>n.id),this.all_special_tokens=s.map(n=>n.content)}static async from_pretrained(e,{progress_callback:r=null,config:s=null,cache_dir:n=null,local_files_only:o=!1,revision:a="main"}={}){let i=await N0(e,{progress_callback:r,config:s,cache_dir:n,local_files_only:o,revision:a});return new this(...i)}get_vocab(){return this._tokenizer.get_vocab()}get model_max_length(){return this._tokenizerConfig.model_max_length??1/0}get add_eos_token(){return this._tokenizerConfig.add_eos_token}get add_bos_token(){return this._tokenizerConfig.add_bos_token}convert_tokens_to_ids(e){return typeof e=="string"?this._tokenizer.token_to_id(e):e.map(r=>this._tokenizer.token_to_id(r))}_call(e,{text_pair:r=null,add_special_tokens:s=!0,padding:n=!1,truncation:o=null,max_length:a=null,return_tensor:i=!0,return_token_type_ids:l=null}={}){let u=Array.isArray(e),d;if(u){if(e.length===0)throw Error("text array must be non-empty");if(r!==null){if(Array.isArray(r)){if(e.length!==r.length)throw Error("text and text_pair must have the same length")}else throw Error("text_pair must also be an array");d=e.map((m,_)=>this._encode_plus(m,{text_pair:r[_],add_special_tokens:s,return_token_type_ids:l}))}else d=e.map(m=>this._encode_plus(m,{add_special_tokens:s,return_token_type_ids:l}))}else{if(e==null)throw Error("text may not be null or undefined");if(Array.isArray(r))throw Error("When specifying `text_pair`, since `text` is a string, `text_pair` must also be a string (i.e., not an array).");d=[this._encode_plus(e,{text_pair:r,add_special_tokens:s,return_token_type_ids:l})]}if(a===null?a=this.model_max_length:o===null&&(n===!0?(console.warn("`max_length` is ignored when `padding: true` and there is no truncation strategy. 
To pad to max length, use `padding: 'max_length'`."),a=this.model_max_length):n===!1&&(console.warn("Truncation was not explicitly activated but `max_length` is provided a specific value, please use `truncation: true` to explicitly truncate examples to max length."),o=!0)),n===!0&&(a=Math.min(Te(d.map(m=>m.input_ids.length))[0],a??1/0)),a=Math.min(a,this.model_max_length??1/0),n||o)for(let m=0;m<d.length;++m)d[m].input_ids.length!==a&&(d[m].input_ids.length>a?o&&_P(d[m],a):n&&hP(d[m],a,_=>_==="input_ids"?this.pad_token_id:0,this.padding_side));let f={};if(i){if(!(n&&o)&&d.some(_=>{for(let w of Object.keys(_))if(_[w].length!==d[0][w]?.length)return!0;return!1}))throw Error("Unable to create tensor, you should probably activate truncation and/or padding with 'padding=true' and 'truncation=true' to have batched tensors with the same length.");let m=[d.length,d[0].input_ids.length];for(let _ of Object.keys(d[0]))f[_]=new U("int64",BigInt64Array.from(d.flatMap(w=>w[_]).map(BigInt)),m)}else{for(let m of Object.keys(d[0]))f[m]=d.map(_=>_[m]);if(!u)for(let m of Object.keys(f))f[m]=f[m][0]}return f}_encode_text(e){return e===null?null:this._tokenizer.encode(e).tokens}_encode_plus(e,{text_pair:r=null,add_special_tokens:s=!0,return_token_type_ids:n=null}={}){let{ids:o,attention_mask:a,token_type_ids:i}=this._tokenizer.encode(e,{text_pair:r,add_special_tokens:s,return_token_type_ids:n??this.return_token_type_ids});return{input_ids:o,attention_mask:a,...i?{token_type_ids:i}:{}}}tokenize(e,{pair:r=null,add_special_tokens:s=!1}={}){return this._tokenizer.tokenize(e,{text_pair:r,add_special_tokens:s})}encode(e,{text_pair:r=null,add_special_tokens:s=!0,return_token_type_ids:n=null}={}){return this._tokenizer.encode(e,{text_pair:r,add_special_tokens:s,return_token_type_ids:n}).ids}batch_decode(e,r={}){return e instanceof U&&(e=e.tolist()),e.map(s=>this.decode(s,r))}decode(e,r={}){if(e instanceof U&&(e=$0(e)),!Array.isArray(e)||e.length===0||!rk(e[0]))throw Error("token_ids must be a 
/**
 * Prepare translation inputs for a multilingual tokenizer.
 *
 * Validates that the tokenizer exposes the language helpers, optionally rewrites
 * the first language special token of the post-processor's `single` template to
 * the source language, stores the target language's token id on the generation
 * options as `forced_bos_token_id`, and finally tokenizes the text.
 *
 * @param {Object} t Tokenizer exposing `language_codes`, `languageRegex`, `lang_to_token`, `_tokenizer` and `_call`.
 * @param {string|string[]} e Raw text(s) to tokenize.
 * @param {Object} r Options forwarded to `t._call`.
 * @param {Object} s Generation options; reads `src_lang`/`tgt_lang`, and is mutated (`forced_bos_token_id`).
 * @returns {*} Whatever `t._call(e, r)` returns.
 * @throws {Error} If the tokenizer lacks a required attribute or a language code is not supported.
 */
function bn(t, e, r, s) {
  if (!("language_codes" in t && Array.isArray(t.language_codes))) {
    throw new Error("Tokenizer must have `language_codes` attribute set and it should be an array of language ids.");
  }
  if (!("languageRegex" in t && t.languageRegex instanceof RegExp)) {
    throw new Error("Tokenizer must have `languageRegex` attribute set and it should be a regular expression.");
  }
  if (!("lang_to_token" in t && typeof t.lang_to_token == "function")) {
    throw new Error("Tokenizer must have `lang_to_token` attribute set and it should be a function.");
  }

  const { src_lang: sourceLang, tgt_lang: targetLang } = s;

  if (!t.language_codes.includes(targetLang)) {
    throw new Error(`Target language code "${targetLang}" is not valid. Must be one of: {${t.language_codes.join(", ")}}`);
  }

  if (sourceLang !== undefined) {
    if (!t.language_codes.includes(sourceLang)) {
      throw new Error(`Source language code "${sourceLang}" is not valid. Must be one of: {${t.language_codes.join(", ")}}`);
    }
    // Only the first language token in the template is replaced.
    const languageEntry = t._tokenizer.post_processor.config.single.find(
      (entry) => "SpecialToken" in entry && t.languageRegex.test(entry.SpecialToken.id),
    );
    if (languageEntry) {
      languageEntry.SpecialToken.id = t.lang_to_token(sourceLang);
    }
  }

  // Generation must start with the target language token.
  s.forced_bos_token_id = t._tokenizer.token_to_id(t.lang_to_token(targetLang));
  return t._call(e, r);
}
U0={};cs(U0,{AlbertTokenizer:()=>Pu,AutoTokenizer:()=>J,BartTokenizer:()=>zu,BertTokenizer:()=>Lu,BlenderbotSmallTokenizer:()=>Nu,BlenderbotTokenizer:()=>$u,BloomTokenizer:()=>Ru,CLIPTokenizer:()=>Bu,CamembertTokenizer:()=>Uu,CodeGenTokenizer:()=>Fu,CodeLlamaTokenizer:()=>Du,CohereTokenizer:()=>ju,ConvBertTokenizer:()=>Gu,DebertaTokenizer:()=>Wu,DebertaV2Tokenizer:()=>qu,DistilBertTokenizer:()=>Vu,ElectraTokenizer:()=>Hu,EsmTokenizer:()=>Xu,FalconTokenizer:()=>Ku,GPT2Tokenizer:()=>Ju,GPTNeoXTokenizer:()=>Qu,GemmaTokenizer:()=>Yu,HerbertTokenizer:()=>Zu,LlamaTokenizer:()=>ep,M2M100Tokenizer:()=>tp,MBart50Tokenizer:()=>sp,MBartTokenizer:()=>vn,MPNetTokenizer:()=>ap,MarianTokenizer:()=>rp,MgpstrTokenizer:()=>np,MobileBertTokenizer:()=>op,NllbTokenizer:()=>ip,NougatTokenizer:()=>lp,PreTrainedTokenizer:()=>j,Qwen2Tokenizer:()=>cp,RoFormerTokenizer:()=>pp,RobertaTokenizer:()=>up,SiglipTokenizer:()=>dp,SpeechT5Tokenizer:()=>fp,SqueezeBertTokenizer:()=>mp,T5Tokenizer:()=>hp,TokenizersBackend:()=>j,VitsTokenizer:()=>_p,Wav2Vec2CTCTokenizer:()=>gp,WhisperTokenizer:()=>wp,XLMRobertaTokenizer:()=>xp,XLMTokenizer:()=>yp});var Pu=class extends j{return_token_type_ids=!0};var zu=class extends j{};var Lu=class extends j{return_token_type_ids=!0};var Nu=class extends j{};var $u=class extends j{};var Ru=class extends j{};var Uu=class extends j{};var Bu=class extends j{};var Du=class extends j{};var Fu=class extends j{};var ju=class extends j{};var Gu=class extends j{return_token_type_ids=!0};var qu=class extends j{return_token_type_ids=!0};var Wu=class extends j{return_token_type_ids=!0};var Vu=class extends j{};var Hu=class extends j{return_token_type_ids=!0};var Xu=class extends j{};var Ku=class extends j{};var Yu=class extends j{};var Qu=class extends j{};var Ju=class extends j{};var Zu=class extends j{return_token_type_ids=!0};var ep=class extends j{padding_side="left"};var tp=class extends 
/**
 * Marian tokenizer. Input text may start with a `>>lang<<` language token,
 * which is split off and kept as its own leading token.
 */
var rp = class extends j {
  /**
   * @param {Object} e Tokenizer JSON, passed to the base class.
   * @param {Object} r Tokenizer config, passed to the base class.
   */
  constructor(e, r) {
    super(e, r);

    // Deliberately NOT global: a `g` regex keeps `lastIndex` between `.test()`
    // calls, which made the vocabulary filter below drop every second
    // consecutive language token. `String.prototype.split` behaves the same
    // with or without the flag.
    this.languageRegex = /^(>>\w+<<)\s*/;

    this.supported_language_codes = Array.from(this.get_vocab().keys()).filter(
      (token) => this.languageRegex.test(token),
    );

    console.warn('WARNING: `MarianTokenizer` is not yet supported by Hugging Face\'s "fast" tokenizers library. Therefore, you may experience slightly inaccurate results.');
  }

  /**
   * Encode text, keeping a leading `>>lang<<` token intact.
   *
   * @param {string|null} e Text to encode.
   * @returns {string[]|null} Tokens, or `null` when `e` is `null`.
   */
  _encode_text(e) {
    if (e === null) {
      return null;
    }

    // With one capture group anchored at the start, `split` yields either
    // [text] (no language token) or ["", ">>lang<<", rest].
    const [head, ...rest] = e.trim().split(this.languageRegex);

    if (rest.length === 0) {
      return super._encode_text(head);
    }

    if (rest.length === 2) {
      const [language, text] = rest;
      if (!this.supported_language_codes.includes(language)) {
        console.warn(`Unsupported language code "${language}" detected, which may lead to unexpected behavior. Should be one of: ${JSON.stringify(this.supported_language_codes)}`);
      }
      return dt([language], super._encode_text(text));
    }
  }
};
s=1;s<e.length;s+=2)r+=e[s];return[r]}},_p=class extends j{constructor(e,r){super(e,r),this._tokenizer.decoder=new R0({type:"VitsDecoder"})}};var gp=class extends j{};var eA=[["en","english"],["zh","chinese"],["de","german"],["es","spanish"],["ru","russian"],["ko","korean"],["fr","french"],["ja","japanese"],["pt","portuguese"],["tr","turkish"],["pl","polish"],["ca","catalan"],["nl","dutch"],["ar","arabic"],["sv","swedish"],["it","italian"],["id","indonesian"],["hi","hindi"],["fi","finnish"],["vi","vietnamese"],["he","hebrew"],["uk","ukrainian"],["el","greek"],["ms","malay"],["cs","czech"],["ro","romanian"],["da","danish"],["hu","hungarian"],["ta","tamil"],["no","norwegian"],["th","thai"],["ur","urdu"],["hr","croatian"],["bg","bulgarian"],["lt","lithuanian"],["la","latin"],["mi","maori"],["ml","malayalam"],["cy","welsh"],["sk","slovak"],["te","telugu"],["fa","persian"],["lv","latvian"],["bn","bengali"],["sr","serbian"],["az","azerbaijani"],["sl","slovenian"],["kn","kannada"],["et","estonian"],["mk","macedonian"],["br","breton"],["eu","basque"],["is","icelandic"],["hy","armenian"],["ne","nepali"],["mn","mongolian"],["bs","bosnian"],["kk","kazakh"],["sq","albanian"],["sw","swahili"],["gl","galician"],["mr","marathi"],["pa","punjabi"],["si","sinhala"],["km","khmer"],["sn","shona"],["yo","yoruba"],["so","somali"],["af","afrikaans"],["oc","occitan"],["ka","georgian"],["be","belarusian"],["tg","tajik"],["sd","sindhi"],["gu","gujarati"],["am","amharic"],["yi","yiddish"],["lo","lao"],["uz","uzbek"],["fo","faroese"],["ht","haitian creole"],["ps","pashto"],["tk","turkmen"],["nn","nynorsk"],["mt","maltese"],["sa","sanskrit"],["lb","luxembourgish"],["my","myanmar"],["bo","tibetan"],["tl","tagalog"],["mg","malagasy"],["as","assamese"],["tt","tatar"],["haw","hawaiian"],["ln","lingala"],["ha","hausa"],["ba","bashkir"],["jw","javanese"],["su","sundanese"]],hi=new Map(eA),wP=new 
// Character-class body covering Unicode punctuation (\p{P}) plus the ASCII
// symbol ranges !-/ :-@ [-` {-~.
var xP = "\\p{P}\\u0021-\\u002F\\u003A-\\u0040\\u005B-\\u0060\\u007B-\\u007E";

// Matches strings that consist solely of punctuation characters.
// The `g` flag is intentionally omitted: this regex is only used through
// `.test()`, and a global regex carries `lastIndex` across calls, so a
// successful match made the next call start past index 0 and wrongly fail the
// `^` anchor (consecutive punctuation tokens alternated true/false).
var rA = new RegExp(`^[${xP}]+$`, "u");
if(Q.push(B),i){let P=ms(G[Y]+f,2),se;if(Y+1<G.length){se=ms(G[Y+1]+f,2);let ie=this.decode([B]);rA.test(ie)&&(se=ms(Math.min(P+n,se),2))}else se=null;K.push([P,se])}}if("stride"in C){let[Y,B,P]=C.stride;f+=Y-P}Q.length>0?(x.push(Q),i&&k.push(K)):x.every(Y=>Y.length===0)&&(d=l(),x=[],Q=[],k=[],K=[])}if(x.length>0){if(o&&r)throw new Error("Whisper did not predict an ending timestamp, which can happen if audio is cut off in the middle of a word. Also make sure WhisperTimeStampLogitsProcessor was used during generation.");let[C,v]=this.findLongestCommonSequence(x,k),G=this.decode(C);d.text=G,i&&(d.words=this.collateWordTimestamps(C,v,a)),u.push(d)}let T=Object.create(null),z=u.map(C=>C.text).join("");if(r||s){for(let C=0;C<u.length;++C){let v=u[C];r||delete v.timestamp,s||delete v.language}if(i){let C=[];for(let v of u)for(let G of v.words)C.push(G);T={chunks:C}}else T={chunks:u}}return[z,T]}findLongestCommonSequence(e,r=null){let s=e[0],n=s.length,o=[],a=Array.isArray(r)&&r.length>0,i=a?[]:null,l=a?r[0]:null;for(let u=1;u<e.length;++u){let d=e[u],f=0,m=[n,n,0,0],_=d.length;for(let T=1;T<n+_;++T){let z=Math.max(0,n-T),C=Math.min(n,n+_-T),v=s.slice(z,C),G=Math.max(0,T-n),X=Math.min(_,T),V=d.slice(G,X);if(v.length!==V.length)throw new Error("There is a bug within whisper `decode_asr` function, please report it. 
Dropping to prevent bad inference.");let Q;a?Q=v.filter((B,P)=>B===V[P]&&l[z+P]<=r[u][G+P]).length:Q=v.filter((B,P)=>B===V[P]).length;let K=T/1e4,Y=Q/T+K;Q>1&&Y>f&&(f=Y,m=[z,C,G,X])}let[w,x,k,E]=m,M=Math.floor((x+w)/2),I=Math.floor((E+k)/2);o.push(...s.slice(0,M)),s=d.slice(I),n=s.length,a&&(i.push(...l.slice(0,M)),l=r[u].slice(I))}return o.push(...s),a?(i.push(...l),[o,i]):[o,[]]}collateWordTimestamps(e,r,s){let[n,o,a]=this.combineTokensIntoWords(e,s),i=[];for(let l=0;l<n.length;++l){let u=a[l];i.push({text:n[l],timestamp:[r[u.at(0)][0],r[u.at(-1)][1]]})}return i}combineTokensIntoWords(e,r,s=`"'\u201C\xA1\xBF([{-`,n=`"'.\u3002,\uFF0C!\uFF01?\uFF1F:\uFF1A\u201D)]}\u3001`){r=r??"english";let o,a,i;return["chinese","japanese","thai","lao","myanmar"].includes(r)?[o,a,i]=this.splitTokensOnUnicode(e):[o,a,i]=this.splitTokensOnSpaces(e),this.mergePunctuations(o,a,i,s,n)}decode(e,r){let s;return r?.decode_with_timestamps?(e instanceof U&&(e=$0(e)),s=this.decodeWithTimestamps(e,r)):s=super.decode(e,r),s}decodeWithTimestamps(e,r){let s=r?.time_precision??.02,n=this.all_special_ids.at(-1)+1,o=[[]];for(let a of e)if(a=Number(a),a>=n){let i=((a-n)*s).toFixed(2);o.push(`<|${i}|>`),o.push([])}else o[o.length-1].push(a);return o=o.map(a=>typeof a=="string"?a:super.decode(a,r)),o.join("")}splitTokensOnUnicode(e){let r=this.decode(e,{decode_with_timestamps:!0}),s="\uFFFD",n=[],o=[],a=[],i=[],l=[],u=0;for(let d=0;d<e.length;++d){let f=e[d];i.push(f),l.push(d);let m=this.decode(i,{decode_with_timestamps:!0});(!m.includes(s)||r[u+m.indexOf(s)]===s)&&(n.push(m),o.push(i),a.push(l),i=[],l=[],u+=m.length)}return[n,o,a]}splitTokensOnSpaces(e){let[r,s,n]=this.splitTokensOnUnicode(e),o=[],a=[],i=[];for(let l=0;l<r.length;++l){let u=r[l],d=s[l],f=n[l],m=d[0]>=this._tokenizer.token_to_id("<|endoftext|>"),_=u.startsWith(" "),w=u.trim(),x=rA.test(w);if(m||_||x||o.length===0)o.push(u),a.push(d),i.push(f);else{let 
k=o.length-1;o[k]+=u,a[k].push(...d),i[k].push(...f)}}return[o,a,i]}mergePunctuations(e,r,s,n,o){let a=structuredClone(e),i=structuredClone(r),l=structuredClone(s),u=a.length-2,d=a.length-1;for(;u>=0;)a[u].startsWith(" ")&&n.includes(a[u].trim())?(a[d]=a[u]+a[d],i[d]=dt(i[u],i[d]),l[d]=dt(l[u],l[d]),a[u]="",i[u]=[],l[u]=[]):d=u,--u;for(u=0,d=1;d<a.length;)!a[u].endsWith(" ")&&o.includes(a[d])?(a[u]+=a[d],i[u]=dt(i[u],i[d]),l[u]=dt(l[u],l[d]),a[d]="",i[d]=[],l[d]=[]):u=d,++d;return[a.filter(f=>f),i.filter(f=>f.length>0),l.filter(f=>f.length>0)]}};var xp=class extends j{};var yp=class extends j{return_token_type_ids=!0;constructor(e,r){super(e,r),console.warn('WARNING: `XLMTokenizer` is not yet supported by Hugging Face\'s "fast" tokenizers library. Therefore, you may experience slightly inaccurate results.')}};var J=class{static async from_pretrained(e,{progress_callback:r=null,config:s=null,cache_dir:n=null,local_files_only:o=!1,revision:a="main"}={}){let[i,l]=await N0(e,{progress_callback:r,config:s,cache_dir:n,local_files_only:o,revision:a}),u=l.tokenizer_class?.replace(/Fast$/,"")??"PreTrainedTokenizer",d=U0[u];return d||(console.warn(`Unknown tokenizer class "${u}", attempting to construct from base class.`),d=j),new d(i,l)}};var kn="https://github.com/huggingface/transformers.js/issues/new/choose";var _i="preprocessor_config.json",En=_i,sA="processor_config.json",nA="chat_template.jinja";var ne=class extends Je{static classes=["image_processor_class","tokenizer_class","feature_extractor_class"];static uses_processor_config=!1;static uses_chat_template_file=!1;constructor(e,r,s){super(),this.config=e,this.components=r,this.chat_template=s}get image_processor(){return this.components.image_processor}get tokenizer(){return this.components.tokenizer}get feature_extractor(){return this.components.feature_extractor}apply_chat_template(e,r={}){if(!this.tokenizer)throw new Error("Unable to apply chat template without a tokenizer.");return 
/**
 * Assert that raw audio was supplied as a floating-point typed array.
 *
 * @param {*} t The audio input to validate.
 * @param {string} e Name of the calling feature extractor, used in the error message.
 * @returns {void}
 * @throws {Error} If `t` is neither a `Float32Array` nor a `Float64Array`.
 */
function He(t, e) {
  const isFloatArray = [Float32Array, Float64Array].some((ctor) => t instanceof ctor);
  if (isFloatArray) {
    return;
  }
  // Report the constructor name when there is one, otherwise the primitive type.
  const received = t?.constructor?.name ?? typeof t;
  throw new Error(`${e} expects input to be a Float32Array or a Float64Array, but got ${received} instead. If using the feature extractor directly, remember to use \`read_audio(url, sampling_rate)\` to obtain the raw audio data of the file/url.`);
}
/**
 * Return `r` evenly spaced values over the closed interval [`t`, `e`].
 *
 * @param {number} t First value.
 * @param {number} e Last value (included when `r > 1`).
 * @param {number} r Number of samples.
 * @returns {Float64Array} The samples; `[t]` when `r` is 1, empty when `r` is 0.
 */
function cA(t, e, r) {
  // With a single sample there is no interval to divide. Without this guard the
  // step would be (e - t) / 0, and `step * 0` would produce NaN.
  const step = r > 1 ? (e - t) / (r - 1) : 0;
  return Float64Array.from({ length: r }, (_, index) => t + step * index);
}
/**
 * Convert a spectrogram to decibels in place: `factor * (log10(x) - log10(reference))`.
 *
 * @param {Float32Array|Float64Array|number[]} t Spectrogram values; overwritten with the result.
 * @param {number} e Multiplicative factor applied to the log ratio.
 * @param {number} r Reference value that maps to 0 dB; must be > 0.
 * @param {number} s Lower clamp applied to both the input values and the reference; must be > 0.
 * @param {number|null} n If not `null`, values more than `n` dB below the peak are raised to `peak - n`; must be > 0.
 * @returns {Float32Array|Float64Array|number[]} The same array `t`.
 * @throws {Error} If `r`, `s` or a non-null `n` is not strictly positive.
 */
function pA(t, e, r, s, n) {
  if (r <= 0) {
    throw new Error("reference must be greater than zero");
  }
  if (s <= 0) {
    throw new Error("min_value must be greater than zero");
  }

  const logReference = Math.log10(Math.max(s, r));

  for (let i = 0; i < t.length; ++i) {
    // The reference is subtracted in the log domain, AFTER taking log10 of the
    // clamped value. Subtracting inside the log (as before) is only correct
    // when the reference is exactly 1.
    t[i] = e * (Math.log10(Math.max(s, t[i])) - logReference);
  }

  if (n !== null) {
    if (n <= 0) {
      throw new Error("db_range must be greater than zero");
    }
    // Limit the dynamic range relative to the loudest value.
    const floor = Te(t)[0] - n;
    for (let i = 0; i < t.length; ++i) {
      t[i] = Math.max(t[i], floor);
    }
  }

  return t;
}
Specify `power` to fix this issue.");if(!d)throw new Error("`preemphasis_htk_flavor=false` is not currently supported.");if(a)switch(i){case"reflect":{let L=Math.floor((n-1)/2)+1;t=AP(t,L,L);break}case"constant":{let L=Math.floor(n/2),R=new t.constructor(t.length+2*L);R.set(t,L),t=R;break}default:throw new Error(`pad_mode="${i}" not implemented yet.`)}let G=Math.floor(1+Math.floor((t.length-r)/s));M!==null&&G<M&&(G=M);let X=l?Math.floor(n/2)+1:n,V=G,Q=G;I!==null&&(I>G?T&&(Q=I):Q=V=I);let K=new uu(n),Y=new Float64Array(n),B=new Float64Array(K.outputBufferSize),P=new Float32Array(X*Q);for(let L=0;L<V;++L){let R=L*s,te=Math.min(t.length-R,r);te!==r&&Y.fill(0,0,r);for(let ue=0;ue<te;++ue)Y[ue]=t[R+ue];if(E){let ue=0;for(let Pe=0;Pe<te;++Pe)ue+=Y[Pe];let Be=ue/te;for(let Pe=0;Pe<te;++Pe)Y[Pe]-=Be}if(u!==null){for(let ue=te-1;ue>=1;--ue)Y[ue]-=u*Y[ue-1];Y[0]*=1-u}for(let ue=0;ue<e.length;++ue)Y[ue]*=e[ue];K.realTransform(B,Y);for(let ue=0;ue<X;++ue){let Be=ue<<1;P[ue*Q+L]=B[Be]**2+B[Be+1]**2}}if(o!==null&&o!==2){let L=o/2;for(let R=0;R<P.length;++R)P[R]**=L}let se=f.length,ie=await I0(new U("float32",f.flat(),[se,X]),new U("float32",P,[X,Q]));z&&(ie=ie.transpose(1,0));let S=ie.data;for(let L=0;L<S.length;++L)S[L]=C+Math.max(m,S[L]);if(o!==null&&_!==null){let L=Math.min(S.length,V*se);switch(_){case"log":for(let R=0;R<L;++R)S[R]=Math.log(S[R]);break;case"log10":for(let R=0;R<L;++R)S[R]=Math.log10(S[R]);break;case"dB":if(o===1)MP(S,w,x,k);else if(o===2)TP(S,w,x,k);else throw new Error(`Cannot use log_mel option '${_}' with power ${o}`);break;default:throw new Error(`log_mel must be one of null, 'log', 'log10' or 'dB'. 
/**
 * Creates a window of `t` points.
 *
 * @param {number} t Window length.
 * @param {string} e Window type: "boxcar", "hann", "hann_window", "hamming" or "povey".
 * @param {Object} [options]
 * @param {boolean} [options.periodic=true] When true, a window of `t + 1` points is
 *   generated and its last point dropped.
 * @param {number|null} [options.frame_length=null] Only validated against `t`; the window
 *   is not padded to this length.
 * @param {boolean} [options.center=true] Accepted but not used by this implementation.
 * @returns {Float64Array} The window values.
 * @throws {Error} On an unknown window type, or when `t > frame_length`.
 */
function Mt(t, e, { periodic = true, frame_length = null, center = true } = {}) {
  const length = periodic ? t + 1 : t;
  let window;
  switch (e) {
    case "boxcar":
      window = new Float64Array(length).fill(1);
      break;
    case "hann":
    case "hann_window":
      window = lA(length);
      break;
    case "hamming":
      window = yP(length);
      break;
    case "povey":
      window = lA(length).map((value) => Math.pow(value, 0.85));
      break;
    default:
      throw new Error(`Unknown window type ${e}.`);
  }
  if (periodic) {
    window = window.subarray(0, t);
  }
  if (frame_length === null) {
    return window;
  }
  if (t > frame_length) {
    throw new Error(`Length of the window (${t}) may not be larger than frame_length (${frame_length})`);
  }
  return window;
}

/**
 * Encodes chunks of samples as a WAV blob: a 44-byte header followed by the
 * chunk bytes. The header declares format tag 3, 1 channel, 32 bits per sample.
 *
 * @param {Float32Array[]} t Sample chunks, written in order.
 * @param {number} e Sampling rate in Hz.
 * @returns {Blob} Blob of type "audio/wav".
 */
function SP(t, e) {
  const totalSamples = t.reduce((sum, chunk) => sum + chunk.length, 0);
  const header = new ArrayBuffer(44);
  const view = new DataView(header);

  vp(view, 0, "RIFF");
  view.setUint32(4, 36 + totalSamples * 4, true);
  vp(view, 8, "WAVE");
  vp(view, 12, "fmt ");
  view.setUint32(16, 16, true);
  view.setUint16(20, 3, true);
  view.setUint16(22, 1, true);
  view.setUint32(24, e, true);
  view.setUint32(28, e * 4, true);
  view.setUint16(32, 4, true);
  view.setUint16(34, 32, true);
  vp(view, 36, "data");
  view.setUint32(40, totalSamples * 4, true);

  // Pass the typed-array views themselves, not `chunk.buffer`: for a subarray
  // the backing buffer also holds samples outside the view, which would be
  // written to the file and contradict the sizes declared in the header.
  return new Blob([header, ...t], { type: "audio/wav" });
}

/** Writes the UTF-16 code units of `r` as single bytes into DataView `t`, starting at offset `e`. */
function vp(t, e, r) {
  for (let i = 0; i < r.length; ++i) {
    t.setUint8(e + i, r.charCodeAt(i));
  }
}

/** Audio samples (a single array or a list of chunks) paired with a sampling rate. */
var An = class {
  /**
   * @param {Float32Array|Float32Array[]} e Samples, or a list of sample chunks.
   * @param {number} r Sampling rate in Hz.
   */
  constructor(e, r) {
    this.audio = e;
    this.sampling_rate = r;
  }

  /**
   * The samples as one array. A list of chunks is concatenated into a new
   * Float32Array; a single chunk or a non-list value is returned as-is.
   */
  get data() {
    if (!Array.isArray(this.audio)) {
      return this.audio;
    }
    if (this.audio.length === 0) {
      return new Float32Array(0);
    }
    if (this.audio.length === 1) {
      return this.audio[0];
    }
    const total = this.audio.reduce((sum, chunk) => sum + chunk.length, 0);
    const merged = new Float32Array(total);
    let offset = 0;
    for (const chunk of this.audio) {
      merged.set(chunk, offset);
      offset += chunk.length;
    }
    return merged;
  }

  /** Encodes the audio as a WAV blob. */
  toBlob() {
    const chunks = this.audio instanceof Float32Array ? [this.audio] : this.audio;
    return SP(chunks, this.sampling_rate);
  }

  /** Passes the destination `e` and the WAV blob to the `bp` helper. */
  async save(e) {
    return bp(e, this.toBlob());
  }
};
/** Feature extractor that reshapes raw audio into a `[1, channels, samples]` float32 tensor. */
var Mn = class extends ze {
  /**
   * @param {Float32Array|Float64Array} e Audio samples; validated by `He`.
   * @returns {Promise<{input_values: U}>} Tensor of dims `[1, feature_size, e.length / feature_size]`.
   * @throws {Error} When the number of samples is not a multiple of `config.feature_size`.
   */
  async _call(e) {
    He(e, "EncodecFeatureExtractor");
    if (e instanceof Float64Array) {
      e = new Float32Array(e);
    }

    const numChannels = this.config.feature_size;
    if (e.length % numChannels !== 0) {
      throw new Error(`The length of the audio data must be a multiple of the number of channels (${numChannels}).`);
    }

    const dims = [1, numChannels, e.length / numChannels];
    return { input_values: new U("float32", e, dims) };
  }
};

/** Feature extractor that wraps raw audio in a `[1, samples]` float32 tensor. */
var Ap = class extends ze {
  /**
   * @param {Float32Array|Float64Array} e Audio samples; validated by `He`.
   * @returns {Promise<{input_values: U}>} Tensor of dims `[1, e.length]`.
   */
  async _call(e) {
    He(e, "ChatterboxFeatureExtractor");
    if (e instanceof Float64Array) {
      e = new Float32Array(e);
    }
    const dims = [1, e.length];
    return { input_values: new U("float32", e, dims) };
  }
};
/** Same behaviour as `Mn`; exists under a separate name. */
var Tn = class extends Mn {};

/** Log-mel feature extractor configured entirely from `this.config`. */
var Tp = class extends ze {
  /** Precomputes the mel filter bank and the analysis window from the config. */
  constructor(e) {
    super(e);
    const {
      fft_length,
      feature_size,
      min_frequency,
      max_frequency,
      sampling_rate,
      frame_length,
    } = this.config;
    this.mel_filters = yt(
      Math.floor(1 + fft_length / 2),
      feature_size,
      min_frequency,
      max_frequency,
      sampling_rate,
      null,
      "htk",
      false,
    );
    this.window = Mt(frame_length, "hann");
  }

  /**
   * Computes the log-mel spectrogram of `e`.
   *
   * @param {Float32Array|Float64Array} e Audio samples.
   * @param {number} r Accepted for signature compatibility; not used here.
   * @returns {Promise<U>} Result of the spectrogram helper `At`, requested transposed.
   */
  async _extract_fbank_features(e, r) {
    const { config } = this;
    return At(e, this.window, config.frame_length, config.hop_length, {
      fft_length: config.fft_length,
      center: false,
      onesided: true,
      preemphasis: config.preemphasis,
      preemphasis_htk_flavor: config.preemphasis_htk_flavor,
      mel_filters: this.mel_filters,
      log_mel: "log",
      mel_floor: config.mel_floor,
      remove_dc_offset: false,
      transpose: true,
    });
  }

  /**
   * Optionally truncates and pads the audio, then extracts features.
   *
   * @param {Float32Array|Float64Array} e Audio samples; validated by `He`.
   * @param {Object} [options]
   * @param {number} [options.max_length=480000] Maximum number of samples kept when truncating.
   * @param {boolean} [options.truncation=true] Whether to cut audio longer than `max_length`.
   * @param {boolean} [options.padding=true] Whether to pad up to a multiple of `pad_to_multiple_of`.
   * @param {number} [options.pad_to_multiple_of=128] Padding granularity in samples.
   * @returns {Promise<{input_features: U, input_features_mask: U}>}
   */
  async _call(e, { max_length = 48e4, truncation = true, padding = true, pad_to_multiple_of = 128 } = {}) {
    He(e, "Gemma3nAudioFeatureExtractor");

    if (truncation && e.length > max_length) {
      e = e.slice(0, max_length);
    }

    if (padding && e.length % pad_to_multiple_of !== 0) {
      const padLength = pad_to_multiple_of - (e.length % pad_to_multiple_of);
      const padded = new Float64Array(e.length + padLength);
      padded.set(e);
      // A fresh Float64Array is already zero-filled.
      if (this.config.padding_value !== 0) {
        padded.fill(this.config.padding_value, e.length);
      }
      e = padded;
    }

    const features = await this._extract_fbank_features(e, this.config.max_length);
    // Build the mask from the leading dim before `unsqueeze_` changes the dims in place.
    const mask = Ge([1, features.dims[0]], true);
    return { input_features: features.unsqueeze_(0), input_features_mask: mask };
  }
};

/** Feature extractor that wraps raw audio in a `[1, samples]` float32 tensor. */
var Sp = class extends ze {
  /**
   * @param {Float32Array|Float64Array} e Audio samples; validated by `He`.
   * @returns {Promise<{input_values: U}>} Tensor of dims `[1, e.length]`.
   */
  async _call(e) {
    He(e, "MoonshineFeatureExtractor");
    if (e instanceof Float64Array) {
      e = new Float32Array(e);
    }
    const dims = [1, e.length];
    return { input_values: new U("float32", e, dims) };
  }
};
/** Feature extractor for raw audio plus speaker-diarization post-processing. */
var Sn = class extends ze {
  /**
   * @param {Float32Array|Float64Array} e Audio samples; validated by `He`.
   * @returns {Promise<{input_values: U}>} Tensor of dims `[1, 1, e.length]`.
   */
  async _call(e) {
    He(e, "PyAnnoteFeatureExtractor");
    if (e instanceof Float64Array) {
      e = new Float32Array(e);
    }
    const dims = [1, 1, e.length];
    return { input_values: new U("float32", e, dims) };
  }

  /**
   * Converts a sample count to a (possibly fractional) frame count using
   * `config.offset` and `config.step`.
   *
   * @param {number} e Number of samples.
   * @returns {number}
   */
  samples_to_frames(e) {
    return (e - this.config.offset) / this.config.step;
  }

  /**
   * Groups consecutive frames that share the same top-scoring class into segments.
   *
   * @param {U} e Per-frame scores; `e.tolist()` must yield one list of frames per batch item.
   * @param {number} r Number of samples in the audio that produced `e`.
   * @returns {Array<Array<{id: number, start: number, end: number, confidence: number}>>}
   *   One segment list per batch item. `start`/`end` are frame indices scaled by
   *   `r / samples_to_frames(r) / sampling_rate`; `confidence` is the mean top
   *   score over the segment's frames.
   */
  post_process_speaker_diarization(e, r) {
    const frameScale = r / this.samples_to_frames(r) / this.config.sampling_rate;

    const results = [];
    for (const frames of e.tolist()) {
      const segments = [];
      let currentId = -1;
      for (let frame = 0; frame < frames.length; ++frame) {
        const probabilities = Oe(frames[frame]);
        const [score, id] = Te(probabilities);
        const [start, end] = [frame, frame + 1];

        if (id !== currentId) {
          // The top class changed: open a new segment.
          currentId = id;
          segments.push({ id, start, end, score });
        } else {
          // Same class as the previous frame: extend the open segment.
          segments.at(-1).end = end;
          segments.at(-1).score += score;
        }
      }

      results.push(
        segments.map(({ id, start, end, score }) => ({
          id,
          start: start * frameScale,
          end: end * frameScale,
          confidence: score / (end - start),
        })),
      );
    }
    return results;
  }
};
/** Same behaviour as `Tn`; exists under a separate name. */
var Cp = class extends Tn {};

/** Feature extractor with no behaviour beyond its base class. */
var Pp = class extends ze {};

/** Feature extractor that optionally normalizes raw audio and adds an all-ones attention mask. */
var zp = class extends ze {
  /**
   * Shifts `e` to zero mean and scales it to unit (population) variance.
   *
   * @param {Float32Array} e Input values.
   * @returns {Float32Array} New array; `e` is not modified.
   */
  _zero_mean_unit_var_norm(e) {
    const mean = e.reduce((sum, value) => sum + value, 0) / e.length;
    const variance = e.reduce((sum, value) => sum + (value - mean) ** 2, 0) / e.length;
    // 1e-7 keeps the divisor non-zero for constant input.
    const scale = Math.sqrt(variance + 1e-7);
    return e.map((value) => (value - mean) / scale);
  }

  /**
   * @param {Float32Array|Float64Array} e Audio samples; validated by `He`.
   * @returns {Promise<{input_values: U, attention_mask: U}>} Both tensors have dims `[1, samples]`.
   */
  async _call(e) {
    He(e, "Wav2Vec2FeatureExtractor");
    if (e instanceof Float64Array) {
      e = new Float32Array(e);
    }

    let values = e;
    if (this.config.do_normalize) {
      values = this._zero_mean_unit_var_norm(values);
    }

    const dims = [1, values.length];
    return {
      input_values: new U("float32", values, dims),
      attention_mask: new U("int64", new BigInt64Array(values.length).fill(1n), dims),
    };
  }
};
r=this.config.sampling_rate,s=yt(257,this.config.num_mel_bins,20,Math.floor(r/2),r,null,"kaldi",!0);this.mel_filters=s,this.window=Mt(400,"hamming",{periodic:!1}),this.min_num_frames=this.config.min_num_frames}async _extract_fbank_features(e){return e=e.map(r=>r*32768),At(e,this.window,400,160,{fft_length:512,power:2,center:!1,preemphasis:.97,mel_filters:this.mel_filters,log_mel:"log",mel_floor:1192092955078125e-22,remove_dc_offset:!0,transpose:!0,min_num_frames:this.min_num_frames})}async _call(e){He(e,"WeSpeakerFeatureExtractor");let r=(await this._extract_fbank_features(e)).unsqueeze_(0);if(this.config.fbank_centering_span===null){let s=r.mean(1).data,n=r.data,[o,a,i]=r.dims;for(let l=0;l<o;++l){let u=l*a*i,d=l*i;for(let f=0;f<a;++f){let m=u+f*i;for(let _=0;_<i;++_)n[m+_]-=s[d+_]}}}return{input_features:r}}};var Np=class extends ze{constructor(e){super(e),this.config.mel_filters??=yt(Math.floor(1+this.config.n_fft/2),this.config.feature_size,0,8e3,this.config.sampling_rate,"slaney","slaney"),this.window=Mt(this.config.n_fft,"hann")}async _extract_fbank_features(e){let r=await At(e,this.window,this.config.n_fft,this.config.hop_length,{power:2,mel_filters:this.config.mel_filters,log_mel:"log10",max_num_frames:Math.min(Math.floor(e.length/this.config.hop_length),this.config.nb_max_frames)}),s=r.data,n=Te(s)[0];for(let o=0;o<s.length;++o)s[o]=(Math.max(s[o],n-8)+4)/4;return r}async _call(e,{max_length:r=null}={}){He(e,"WhisperFeatureExtractor");let s,n=r??this.config.n_samples;return e.length>n?(e.length>this.config.n_samples&&console.warn("Attempting to extract features for audio longer than 30 seconds. 
/** Factory that instantiates the feature extractor class named in a model's config. */
var Ze = class {
  /**
   * Loads the config via `it` and constructs the class registered in `gi`
   * under its `feature_extractor_type`.
   *
   * @param {string} e Model identifier or path, forwarded to `it`.
   * @param {Object} [r={}] Loading options, forwarded to `it`.
   * @returns {Promise<Object>} The feature extractor instance.
   * @throws {Error} When the config names a type that is not registered.
   */
  static async from_pretrained(e, r = {}) {
    const config = await it(e, _i, true, r);
    const type = config.feature_extractor_type;
    const ExtractorClass = gi[type];
    if (!ExtractorClass) {
      throw new Error(`Unknown feature_extractor_type: '${type}'. Please report this at ${kn}.`);
    }
    return new ExtractorClass(config);
  }
};

/** Processor that merges tokenizer output with optional feature-extractor output. */
var $p = class extends ne {
  static tokenizer_class = J;
  static feature_extractor_class = Ze;

  /**
   * @param {*} e Input passed to the tokenizer.
   * @param {*} [r=null] Input passed to the feature extractor; skipped when falsy.
   * @returns {Promise<Object>} Tokenizer fields, overridden by feature-extractor fields on key clashes.
   */
  async _call(e, r = null) {
    const textInputs = this.tokenizer(e);
    const featureInputs = r ? await this.feature_extractor(r) : {};
    return { ...textInputs, ...featureInputs };
  }
};

// Image backend selection. `As` creates a canvas, `dA` is the ImageData
// constructor and `Vr` loads an image; which of them are set depends on the
// environment detected below.
var Rp = Ur(require("sharp"), 1);
var As;
var dA;
var Vr;
var Zt = be.IS_BROWSER_ENV || be.IS_WEBWORKER_ENV;

if (Zt) {
  As = (t, e) => {
    if (!self.OffscreenCanvas) {
      throw new Error("OffscreenCanvas not supported by this browser.");
    }
    return new self.OffscreenCanvas(t, e);
  };
  Vr = self.createImageBitmap;
  dA = self.ImageData;
} else if (Rp.default) {
  // Decodes a sharp pipeline into a raw image, then restores the channel
  // count reported by the metadata if decoding changed it.
  Vr = async (t) => {
    const metadata = await t.metadata();
    const sourceChannels = metadata.channels;
    const { data, info } = await t.rotate().raw().toBuffer({ resolveWithObject: true });
    const image = new Xe(new Uint8ClampedArray(data), info.width, info.height, info.channels);
    if (sourceChannels !== undefined && sourceChannels !== info.channels) {
      image.convert(sourceChannels);
    }
    return image;
  };
} else {
  throw new Error("Unable to load image processing library.");
}
supported in browser environments.");let s=e.getContext("2d").getImageData(0,0,e.width,e.height).data;return new t(s,e.width,e.height,4)}static async fromURL(e){let r=await fn(e);if(r.status!==200)throw new Error(`Unable to read image from "${e}" (${r.status} ${r.statusText})`);let s=await r.blob();return this.fromBlob(s)}static async fromBlob(e){if(Zt){let r=await Vr(e),s=As(r.width,r.height).getContext("2d");return s.drawImage(r,0,0),new this(s.getImageData(0,0,r.width,r.height).data,r.width,r.height,4)}else{let r=(0,Rp.default)(await e.arrayBuffer());return await Vr(r)}}static fromTensor(e,r="CHW"){if(e.dims.length!==3)throw new Error(`Tensor should have 3 dimensions, but has ${e.dims.length} dimensions.`);if(r==="CHW")e=e.transpose(1,2,0);else if(r!=="HWC")throw new Error(`Unsupported channel format: ${r}`);if(!(e.data instanceof Uint8ClampedArray||e.data instanceof Uint8Array))throw new Error(`Unsupported tensor type: ${e.type}`);switch(e.dims[2]){case 1:case 2:case 3:case 4:return new t(e.data,e.dims[1],e.dims[0],e.dims[2]);default:throw new Error(`Unsupported number of channels: ${e.dims[2]}`)}}grayscale(){if(this.channels===1)return this;let e=new Uint8ClampedArray(this.width*this.height*1);switch(this.channels){case 3:case 4:for(let r=0,s=0;r<this.data.length;r+=this.channels){let n=this.data[r],o=this.data[r+1],a=this.data[r+2];e[s++]=Math.round(.2989*n+.587*o+.114*a)}break;default:throw new Error(`Conversion failed due to unsupported number of channels: ${this.channels}`)}return this._update(e,this.width,this.height,1)}rgb(){if(this.channels===3)return this;let e=new Uint8ClampedArray(this.width*this.height*3);switch(this.channels){case 1:for(let r=0,s=0;r<this.data.length;++r)e[s++]=this.data[r],e[s++]=this.data[r],e[s++]=this.data[r];break;case 4:for(let r=0,s=0;r<this.data.length;r+=4)e[s++]=this.data[r],e[s++]=this.data[r+1],e[s++]=this.data[r+2];break;default:throw new Error(`Conversion failed due to unsupported number of channels: 
${this.channels}`)}return this._update(e,this.width,this.height,3)}rgba(){if(this.channels===4)return this;let e=new Uint8ClampedArray(this.width*this.height*4);switch(this.channels){case 1:for(let r=0,s=0;r<this.data.length;++r)e[s++]=this.data[r],e[s++]=this.data[r],e[s++]=this.data[r],e[s++]=255;break;case 3:for(let r=0,s=0;r<this.data.length;r+=3)e[s++]=this.data[r],e[s++]=this.data[r+1],e[s++]=this.data[r+2],e[s++]=255;break;default:throw new Error(`Conversion failed due to unsupported number of channels: ${this.channels}`)}return this._update(e,this.width,this.height,4)}putAlpha(e){if(e.width!==this.width||e.height!==this.height)throw new Error(`Expected mask size to be ${this.width}x${this.height}, but got ${e.width}x${e.height}`);if(e.channels!==1)throw new Error(`Expected mask to have 1 channel, but got ${e.channels}`);let r=this.data,s=e.data,n=this.width*this.height;if(this.channels===3){let o=new Uint8ClampedArray(n*4);for(let a=0,i=0,l=0;a<n;++a)o[l++]=r[i++],o[l++]=r[i++],o[l++]=r[i++],o[l++]=s[a];return this._update(o,this.width,this.height,4)}else if(this.channels===4){for(let o=0;o<n;++o)r[4*o+3]=s[o];return this}throw new Error(`Expected image to have 3 or 4 channels, but got ${this.channels}`)}async resize(e,r,{resample:s=2}={}){if(this.width===e&&this.height===r)return this;let n=IP[s]??s,o=Ty(e),a=Ty(r);if(o&&a)return this;if(o?e=r/this.height*this.width:a&&(r=e/this.width*this.height),Zt){let i=this.channels,l=this.toCanvas(),u=As(e,r).getContext("2d");return u.drawImage(l,0,0,e,r),new t(u.getImageData(0,0,e,r).data,e,r,4).convert(i)}else{let i=this.toSharp();switch(n){case"box":case"hamming":(n==="box"||n==="hamming")&&(console.warn(`Resampling method ${n} is not yet supported. 
Using bilinear instead.`),n="bilinear");case"nearest":case"bilinear":case"bicubic":i=i.affine([e/this.width,0,0,r/this.height],{interpolator:n});break;case"lanczos":i=i.resize({width:e,height:r,fit:"fill",kernel:"lanczos3"});break;default:throw new Error(`Resampling method ${n} is not supported.`)}return await Vr(i)}}async pad([e,r,s,n]){if(e=Math.max(e,0),r=Math.max(r,0),s=Math.max(s,0),n=Math.max(n,0),e===0&&r===0&&s===0&&n===0)return this;if(Zt){let o=this.channels,a=this.toCanvas(),i=this.width+e+r,l=this.height+s+n,u=As(i,l).getContext("2d");return u.drawImage(a,0,0,this.width,this.height,e,s,this.width,this.height),new t(u.getImageData(0,0,i,l).data,i,l,4).convert(o)}else{let o=this.toSharp().extend({left:e,right:r,top:s,bottom:n});return await Vr(o)}}async crop([e,r,s,n]){if(e=Math.max(e,0),r=Math.max(r,0),s=Math.min(s,this.width-1),n=Math.min(n,this.height-1),e===0&&r===0&&s===this.width-1&&n===this.height-1)return this;let o=s-e+1,a=n-r+1;if(Zt){let i=this.channels,l=this.toCanvas(),u=As(o,a).getContext("2d");return u.drawImage(l,e,r,o,a,0,0,o,a),new t(u.getImageData(0,0,o,a).data,o,a,4).convert(i)}else{let i=this.toSharp().extract({left:e,top:r,width:o,height:a});return await Vr(i)}}async center_crop(e,r){if(this.width===e&&this.height===r)return this;let s=(this.width-e)/2,n=(this.height-r)/2;if(Zt){let o=this.channels,a=this.toCanvas(),i=As(e,r).getContext("2d"),l=0,u=0,d=0,f=0;return s>=0?l=s:d=-s,n>=0?u=n:f=-n,i.drawImage(a,l,u,e,r,d,f,e,r),new t(i.getImageData(0,0,e,r).data,e,r,4).convert(o)}else{let o=this.toSharp();if(s>=0&&n>=0)o=o.extract({left:Math.floor(s),top:Math.floor(n),width:e,height:r});else if(s<=0&&n<=0){let a=Math.floor(-n),i=Math.floor(-s);o=o.extend({top:a,left:i,right:e-this.width-i,bottom:r-this.height-a})}else{let a=[0,0],i=0;n<0?(a[0]=Math.floor(-n),a[1]=r-this.height-a[0]):i=Math.floor(n);let 
l=[0,0],u=0;s<0?(l[0]=Math.floor(-s),l[1]=e-this.width-l[0]):u=Math.floor(s),o=o.extend({top:a[0],bottom:a[1],left:l[0],right:l[1]}).extract({left:u,top:i,width:e,height:r})}return await Vr(o)}}async toBlob(e="image/png",r=1){if(!Zt)throw new Error("toBlob() is only supported in browser environments.");return await this.toCanvas().convertToBlob({type:e,quality:r})}toTensor(e="CHW"){let r=new U("uint8",new Uint8Array(this.data),[this.height,this.width,this.channels]);if(e!=="HWC")if(e==="CHW")r=r.permute(2,0,1);else throw new Error(`Unsupported channel format: ${e}`);return r}toCanvas(){if(!Zt)throw new Error("toCanvas() is only supported in browser environments.");let e=this.clone().rgba(),r=As(e.width,e.height),s=new dA(e.data,e.width,e.height);return r.getContext("2d").putImageData(s,0,0),r}split(){let{data:e,width:r,height:s,channels:n}=this,o=e.constructor,a=e.length/n,i=Array.from({length:n},()=>new o(a));for(let l=0;l<a;++l){let u=n*l;for(let d=0;d<n;++d)i[d][l]=e[u+d]}return i.map(l=>new t(l,r,s,1))}_update(e,r,s,n=null){return this.data=e,this.width=r,this.height=s,n!==null&&(this.channels=n),this}clone(){return new t(this.data.slice(),this.width,this.height,this.channels)}convert(e){if(this.channels===e)return this;switch(e){case 1:this.grayscale();break;case 3:this.rgb();break;case 4:this.rgba();break;default:throw new Error(`Conversion failed due to unsupported number of channels: ${this.channels}`)}return this}async save(e){if(Zt){if(be.IS_WEBWORKER_ENV)throw new Error("Unable to save an image from a Web Worker.");let r=e.split(".").pop().toLowerCase(),s=CP.get(r)??"image/png",n=await this.toBlob(s);return bp(e,n)}else if(be.IS_FS_AVAILABLE)await this.toSharp().toFile(e);else throw new Error("Unable to save the image because filesystem is disabled in this environment.")}toSharp(){if(Zt)throw new Error("toSharp() is only supported in server-side 
/**
 * Rounds `t` to a multiple of `e`, keeping the result within `[r, s]` where possible.
 *
 * @param {number} t Value to constrain.
 * @param {number} e Required multiple.
 * @param {number} [r=0] Minimum; if the result is below it, round up instead.
 * @param {number|null} [s=null] Maximum; if the rounded result exceeds it, round down instead.
 * @returns {number}
 */
function mA(t, e, r = 0, s = null) {
  const ratio = t / e;
  // `gk` is the bundle's rounding helper.
  let result = gk(ratio) * e;
  if (s !== null && result > s) {
    result = Math.floor(ratio) * e;
  }
  if (result < r) {
    result = Math.ceil(ratio) * e;
  }
  return result;
}

/**
 * Rounds both dimensions down to a multiple of `r`, but never below `r` itself.
 *
 * @param {[number, number]} size Pair of dimensions.
 * @param {number} r Required divisor.
 * @returns {[number, number]}
 */
function D0([t, e], r) {
  const floorToMultiple = (value) => Math.max(Math.floor(value / r), 1) * r;
  return [floorToMultiple(t), floorToMultiple(e)];
}

/**
 * Converts a `[center_x, center_y, width, height]` box to `[x0, y0, x1, y1]` corners.
 *
 * @param {ArrayLike<number>} box
 * @returns {number[]}
 */
function F0([t, e, r, s]) {
  const halfWidth = r / 2;
  const halfHeight = s / 2;
  return [t - halfWidth, e - halfHeight, t + halfWidth, e + halfHeight];
}

/**
 * Turns raw detection outputs into per-image boxes, class ids and scores.
 *
 * @param {{logits: U, pred_boxes: U}} t Model outputs; `logits.dims` is `[batch, queries, classes]`.
 * @param {number} [e=0.5] Score threshold.
 * @param {Array<[number, number]>|null} [r=null] Per-image sizes used to scale the boxes.
 * @param {boolean} [s=false] When true, every class whose sigmoid score exceeds `e` is kept;
 *   otherwise only the arg-max class is considered, and the last class index is skipped.
 * @returns {Array<{boxes: number[][], classes: number[], scores: number[]}>}
 * @throws {Error} When `r` is given but its length differs from the batch size.
 */
function Hr(t, e = 0.5, r = null, s = false) {
  const logits = t.logits;
  const predBoxes = t.pred_boxes;
  const [batchSize, numQueries, numClasses] = logits.dims;

  if (r !== null && r.length !== batchSize) {
    throw Error("Make sure that you pass in as many target sizes as the batch dimension of the logits");
  }

  const results = [];
  for (let b = 0; b < batchSize; ++b) {
    const targetSize = r !== null ? r[b] : null;
    const detections = { boxes: [], classes: [], scores: [] };
    const imageLogits = logits[b];
    const imageBoxes = predBoxes[b];

    for (let q = 0; q < numQueries; ++q) {
      const queryLogits = imageLogits[q];
      const keptClasses = [];
      let scores;

      if (s) {
        scores = queryLogits.sigmoid().data;
        for (let c = 0; c < scores.length; ++c) {
          if (scores[c] > e) {
            keptClasses.push(c);
          }
        }
      } else {
        const bestClass = Te(queryLogits.data)[1];
        if (bestClass === numClasses - 1) {
          continue;
        }
        scores = Oe(queryLogits.data);
        if (scores[bestClass] < e) {
          continue;
        }
        keptClasses.push(bestClass);
      }

      for (const classId of keptClasses) {
        let box = F0(imageBoxes[q].data);
        if (targetSize !== null) {
          // Box entries alternate x, y while `(i + 1) % 2` alternates 1, 0,
          // so x values are scaled by targetSize[1] and y values by targetSize[0].
          box = box.map((value, i) => value * targetSize[(i + 1) % 2]);
        }
        detections.boxes.push(box);
        detections.classes.push(classId);
        detections.scores.push(scores[classId]);
      }
    }
    results.push(detections);
  }
  return results;
}

/**
 * Builds a per-pixel arg-max label map for every image in the batch.
 *
 * @param {{logits: U}} t Model outputs; the first logits dim is the batch.
 * @param {Array<[number, number]>|null} [e=null] Optional per-image sizes the logits are
 *   resized to (bilinear) before taking the arg-max.
 * @returns {Array<{segmentation: U, labels: number[]}>} `labels` lists the class ids that
 *   occur in the map, in ascending order.
 * @throws {Error} When `e` is given but its length differs from the batch size.
 */
function Up(t, e = null) {
  const logits = t.logits;
  const batchSize = logits.dims[0];

  if (e !== null && e.length !== batchSize) {
    throw Error("Make sure that you pass in as many target sizes as the batch dimension of the logits");
  }

  const results = [];
  for (let b = 0; b < batchSize; ++b) {
    const targetSize = e !== null ? e[b] : null;

    let classMaps = logits[b];
    if (targetSize !== null) {
      classMaps = Su(classMaps, targetSize, "bilinear", false);
    }
    const [height, width] = targetSize ?? classMaps.dims.slice(-2);

    const segmentation = new U("int32", new Int32Array(height * width), [height, width]);

    // Running maximum, kept in the data of class 0 (overwritten in place).
    const best = classMaps[0].data;
    const labelData = segmentation.data;
    for (let c = 1; c < classMaps.dims[0]; ++c) {
      const candidate = classMaps[c].data;
      for (let i = 0; i < candidate.length; ++i) {
        if (candidate[i] > best[i]) {
          best[i] = candidate[i];
          labelData[i] = c;
        }
      }
    }

    // Mark each class id that appears, then drop the unused slots.
    const seen = new Array(classMaps.dims[0]);
    for (let i = 0; i < labelData.length; ++i) {
      const classId = labelData[i];
      seen[classId] = classId;
    }
    const labels = seen.filter((classId) => classId !== undefined);

    results.push({ segmentation, labels });
  }
  return results;
}

/**
 * Keeps the queries whose top class is not `s` and whose top score exceeds `r`.
 *
 * @param {U} t Class logits, one row per query.
 * @param {U} e Mask predictions, one entry per query.
 * @param {number} r Score threshold.
 * @param {number} s Class index to discard.
 * @returns {[Array, number[], number[]]} Kept masks, their scores and their class ids.
 */
function PP(t, e, r, s) {
  const keptMasks = [];
  const keptScores = [];
  const keptLabels = [];

  for (let q = 0; q < t.dims[0]; ++q) {
    const queryLogits = t[q];
    const queryMask = e[q];

    const label = Te(queryLogits.data)[1];
    if (label === s) {
      continue;
    }

    const score = Oe(queryLogits.data)[label];
    if (score > r) {
      keptMasks.push(queryMask);
      keptScores.push(score);
      keptLabels.push(label);
    }
  }
  return [keptMasks, keptScores, keptLabels];
}
/**
 * Merges per-query masks into one segmentation map plus per-segment metadata.
 *
 * @param {U[]} t Mask predictions, one per kept query (scaled in place by their scores).
 * @param {number[]} e Score of each mask.
 * @param {number[]} r Class id of each mask.
 * @param {number} s Mask threshold forwarded to `zP`.
 * @param {number} n Overlap threshold forwarded to `zP`.
 * @param {Set<number>|null} [o=null] Accepted but not used by this implementation.
 * @param {[number, number]|null} [a=null] Optional size the masks are resized to (bilinear).
 * @returns {[U, Array<{id: number, label_id: number, score: number}>]}
 *   The int32 segmentation map (0 where no segment was assigned) and the segment list.
 */
function LP(t, e, r, s, n, o = null, a = null) {
  const [height, width] = a ?? t[0].dims;
  const segmentation = new U("int32", new Int32Array(height * width), [height, width]);
  const segments = [];

  if (a !== null) {
    for (let i = 0; i < t.length; ++i) {
      t[i] = Su(t[i], a, "bilinear", false);
    }
  }

  // Per pixel: index of the query with the highest score-weighted mask value.
  const bestQuery = new Int32Array(t[0].data.length);
  const bestValue = new Float32Array(t[0].data.length);
  for (let q = 0; q < t.length; ++q) {
    const score = e[q];
    const maskData = t[q].data;
    for (let p = 0; p < maskData.length; ++p) {
      maskData[p] *= score;
      if (maskData[p] > bestValue[p]) {
        bestQuery[p] = q;
        bestValue[p] = maskData[p];
      }
    }
  }

  let segmentId = 0;
  const segmentationData = segmentation.data;
  for (let q = 0; q < r.length; ++q) {
    const labelId = r[q];
    const [isValid, pixelIndices] = zP(bestQuery, t, q, s, n);
    if (!isValid) {
      continue;
    }

    ++segmentId;
    for (const pixel of pixelIndices) {
      segmentationData[pixel] = segmentId;
    }
    segments.push({ id: segmentId, label_id: labelId, score: e[q] });
  }

  return [segmentation, segments];
}

/**
 * Picks output dimensions that are multiples of `r`, whose product lies
 * within `[s, n]`, and that approximately preserve the input aspect ratio.
 *
 * @param {number} t Input height.
 * @param {number} e Input width.
 * @param {number} [r=28] Required divisor of both output dimensions.
 * @param {number} [s=3136] Minimum number of output pixels.
 * @param {number} [n=1003520] Maximum number of output pixels.
 * @returns {[number, number]} `[height, width]`, in that order.
 * @throws {Error} When a side is smaller than `r` or the aspect ratio exceeds 200.
 */
function NP(t, e, r = 28, s = 3136, n = 784 * 1280) {
  if (t < r || e < r) {
    throw new Error(`height:${t} or width:${e} must be larger than factor:${r}`);
  }
  if (Math.max(t, e) / Math.min(t, e) > 200) {
    throw new Error(`absolute aspect ratio must be smaller than 200, got ${Math.max(t, e) / Math.min(t, e)}`);
  }

  let height = Math.round(t / r) * r;
  let width = Math.round(e / r) * r;
  const area = height * width;

  if (area > n) {
    // Too large: shrink both sides by the same ratio, rounding down.
    const shrink = Math.sqrt((t * e) / n);
    height = Math.floor(t / shrink / r) * r;
    width = Math.floor(e / shrink / r) * r;
  } else if (area < s) {
    // Too small: grow both sides by the same ratio, rounding up.
    const grow = Math.sqrt(s / (t * e));
    height = Math.ceil((t * grow) / r) * r;
    width = Math.ceil((e * grow) / r) * r;
  }
  return [height, width];
}
/**
 * Placeholder for instance-segmentation post-processing.
 *
 * @param {Object} t Model outputs (unused).
 * @param {number} [e=0.5] Score threshold (unused).
 * @param {Array<[number, number]>|null} [r=null] Target sizes (unused).
 * @throws {Error} Always: the operation is not implemented.
 */
function Dp(t, e = 0.5, r = null) {
  const message = "`post_process_instance_segmentation` is not yet implemented.";
  throw new Error(message);
}
x=0;x<s.width;++x)(m[w+x]-n)/a<i&&(l=Math.min(l,x),u=Math.min(u,_),d=Math.max(d,x),f=Math.max(f,_))}return e=await e.crop([l,u,d,f]),e}pad_image(e,r,s,{mode:n="constant",center:o=!1,constant_values:a=0}={}){let[i,l,u]=r,d,f;if(typeof s=="number"?(d=s,f=s):s==="square"?d=f=Math.max(i,l):(d=s.width,f=s.height),d!==l||f!==i){let m=new Float32Array(d*f*u);if(Array.isArray(a))for(let x=0;x<m.length;++x)m[x]=a[x%u];else a!==0&&m.fill(a);let[_,w]=o?[Math.floor((d-l)/2),Math.floor((f-i)/2)]:[0,0];for(let x=0;x<i;++x){let k=(x+w)*d,E=x*l;for(let M=0;M<l;++M){let I=(k+M+_)*u,T=(E+M)*u;for(let z=0;z<u;++z)m[I+z]=e[T+z]}}if(n==="symmetric"){if(o)throw new Error("`center` padding is not supported when `mode` is set to `symmetric`.");let x=i-1,k=l-1;for(let E=0;E<f;++E){let M=E*d,I=un(E,x)*l;for(let T=0;T<d;++T){if(E<i&&T<l)continue;let z=(M+T)*u,C=(I+un(T,k))*u;for(let v=0;v<u;++v)m[z+v]=e[C+v]}}}e=m,r=[f,d,u]}return[e,r]}rescale(e){for(let r=0;r<e.length;++r)e[r]=this.rescale_factor*e[r]}get_resize_output_image_size(e,r){let[s,n]=e.size,o,a;if(this.do_thumbnail){let{height:i,width:l}=r;o=Math.min(i,l)}else Number.isInteger(r)?(o=r,a=this.config.max_size??o):r!==void 0&&(o=r.shortest_edge,a=r.longest_edge);if(o!==void 0||a!==void 0){let i=o===void 0?1:Math.max(o/s,o/n),l=s*i,u=n*i,d=a===void 0?1:Math.min(a/l,a/u),f=Math.floor(Number((l*d).toFixed(2))),m=Math.floor(Number((u*d).toFixed(2)));return this.size_divisibility!==void 0&&([f,m]=D0([f,m],this.size_divisibility)),[f,m]}else if(r!==void 0&&r.width!==void 0&&r.height!==void 0){let i=r.width,l=r.height;if(this.config.keep_aspect_ratio&&this.config.ensure_multiple_of){let u=l/n,d=i/s;Math.abs(1-d)<Math.abs(1-u)?u=d:d=u,l=mA(u*n,this.config.ensure_multiple_of),i=mA(d*s,this.config.ensure_multiple_of)}return[i,l]}else{if(this.size_divisibility!==void 0)return D0([s,n],this.size_divisibility);if(this.min_pixels!==void 0&&this.max_pixels!==void 0){let i=this.config.patch_size*this.config.merge_size;return 
NP(n,s,i,this.min_pixels,this.max_pixels)}else throw new Error(`Could not resize image due to unsupported \`this.size\` option in config: ${JSON.stringify(r)}`)}}async resize(e){let[r,s]=this.get_resize_output_image_size(e,this.size);return await e.resize(r,s,{resample:this.resample})}async preprocess(e,{do_normalize:r=null,do_pad:s=null,do_convert_rgb:n=null,do_convert_grayscale:o=null,do_flip_channel_order:a=null}={}){this.do_crop_margin&&(e=await this.crop_margin(e));let[i,l]=e.size;if(n??this.do_convert_rgb?e=e.rgb():o&&(e=e.grayscale()),this.do_resize&&(e=await this.resize(e)),this.do_thumbnail&&(e=await this.thumbnail(e,this.size,this.resample)),this.do_center_crop){let _,w;Number.isInteger(this.crop_size)?(_=this.crop_size,w=this.crop_size):(_=this.crop_size.width,w=this.crop_size.height),e=await e.center_crop(_,w)}let u=[e.height,e.width],d=Float32Array.from(e.data),f=[e.height,e.width,e.channels];if(this.do_rescale&&this.rescale(d),r??this.do_normalize){let _=this.image_mean;Array.isArray(this.image_mean)||(_=new Array(e.channels).fill(_));let w=this.image_std;if(Array.isArray(this.image_std)||(w=new Array(e.channels).fill(w)),_.length!==e.channels||w.length!==e.channels)throw new Error(`When set to arrays, the length of \`image_mean\` (${_.length}) and \`image_std\` (${w.length}) must match the number of channels in the image (${e.channels}).`);for(let x=0;x<d.length;x+=e.channels)for(let k=0;k<e.channels;++k)d[x+k]=(d[x+k]-_[k])/w[k]}if(s??this.do_pad){if(this.pad_size)[d,f]=this.pad_image(d,[e.height,e.width,e.channels],this.pad_size);else if(this.size_divisibility){let[_,w]=D0([f[1],f[0]],this.size_divisibility);[d,f]=this.pad_image(d,f,{width:_,height:w})}}if(a??this.do_flip_channel_order){if(f[2]!==3)throw new Error("Flipping channel order is only supported for RGB images.");for(let _=0;_<d.length;_+=3){let w=d[_];d[_]=d[_+2],d[_+2]=w}}let m=new U("float32",d,f).permute(2,0,1);return{original_size:[l,i],reshaped_input_size:u,pixel_values:m}}async 
_call(e,...r){Array.isArray(e)||(e=[e]);let s=await Promise.all(e.map(o=>this.preprocess(o)));return{pixel_values:zt(s.map(o=>o.pixel_values),0),original_sizes:s.map(o=>o.original_size),reshaped_input_sizes:s.map(o=>o.reshaped_input_size)}}static async from_pretrained(e,r={}){let s=await it(e,En,!0,r);return new this(s)}};var Cn={};cs(Cn,{BeitFeatureExtractor:()=>Fp,BitImageProcessor:()=>jp,CLIPFeatureExtractor:()=>qp,CLIPImageProcessor:()=>wi,ChineseCLIPFeatureExtractor:()=>Gp,ConvNextFeatureExtractor:()=>Wp,ConvNextImageProcessor:()=>xi,DINOv3ViTImageProcessor:()=>Xp,DPTFeatureExtractor:()=>Yp,DPTImageProcessor:()=>vi,DeiTFeatureExtractor:()=>Vp,DeiTImageProcessor:()=>yi,DetrFeatureExtractor:()=>Hp,DetrImageProcessor:()=>bi,DonutFeatureExtractor:()=>Kp,DonutImageProcessor:()=>Ms,EfficientNetImageProcessor:()=>Qp,GLPNFeatureExtractor:()=>Jp,GroundingDinoImageProcessor:()=>Zp,Idefics3ImageProcessor:()=>ki,ImageFeatureExtractor:()=>W,ImageProcessor:()=>W,JinaCLIPImageProcessor:()=>td,LlavaOnevisionImageProcessor:()=>rd,Mask2FormerImageProcessor:()=>nd,MaskFormerFeatureExtractor:()=>sd,MaskFormerImageProcessor:()=>Ts,MobileNetV1FeatureExtractor:()=>od,MobileNetV1ImageProcessor:()=>Ei,MobileNetV2FeatureExtractor:()=>ad,MobileNetV2ImageProcessor:()=>Ai,MobileNetV3FeatureExtractor:()=>id,MobileNetV3ImageProcessor:()=>Mi,MobileNetV4FeatureExtractor:()=>ld,MobileNetV4ImageProcessor:()=>Ti,MobileViTFeatureExtractor:()=>cd,MobileViTImageProcessor:()=>Si,NougatImageProcessor:()=>ud,OwlViTFeatureExtractor:()=>pd,OwlViTImageProcessor:()=>Ss,Owlv2ImageProcessor:()=>dd,Phi3VImageProcessor:()=>fd,PixtralImageProcessor:()=>md,PvtImageProcessor:()=>hd,Qwen2VLImageProcessor:()=>_d,RTDetrImageProcessor:()=>gd,Sam2ImageProcessor:()=>In,Sam3ImageProcessor:()=>In,SamImageProcessor:()=>In,SapiensFeatureExtractor:()=>wd,SapiensImageProcessor:()=>Oi,SegformerFeatureExtractor:()=>xd,SegformerImageProcessor:()=>Ii,SiglipImageProcessor:()=>yd,SmolVLMImageProcessor:()=>ki,Swin2SRImageProcessor:
()=>bd,VLMImageProcessor:()=>ed,ViTFeatureExtractor:()=>vd,ViTImageProcessor:()=>Ci,VitMatteImageProcessor:()=>kd,VitPoseImageProcessor:()=>Ed,YolosFeatureExtractor:()=>Ad,YolosImageProcessor:()=>Pi});var Fp=class extends W{};var jp=class extends W{};var Gp=class extends W{};var wi=class extends W{},qp=class extends wi{};var xi=class extends W{constructor(e){super(e),this.crop_pct=this.config.crop_pct??224/256}async resize(e){let r=this.size?.shortest_edge;if(r===void 0)throw new Error("Size dictionary must contain 'shortest_edge' key.");if(r<384){let s=Math.floor(r/this.crop_pct),[n,o]=this.get_resize_output_image_size(e,{shortest_edge:s});e=await e.resize(n,o,{resample:this.resample}),e=await e.center_crop(r,r)}else e=await e.resize(r,r,{resample:this.resample});return e}},Wp=class extends xi{};var yi=class extends W{},Vp=class extends yi{};var bi=class extends W{async _call(e){let r=await super._call(e),s=[r.pixel_values.dims[0],64,64],n=Ge(s,1n);return{...r,pixel_mask:n}}post_process_object_detection(...e){return Hr(...e)}post_process_panoptic_segmentation(...e){return Bp(...e)}post_process_instance_segmentation(...e){return Dp(...e)}},Hp=class extends bi{};var Xp=class extends W{};var Ms=class extends W{pad_image(e,r,s,n={}){let[o,a,i]=r,l=this.image_mean;Array.isArray(this.image_mean)||(l=new Array(i).fill(l));let u=this.image_std;Array.isArray(u)||(u=new Array(i).fill(l));let d=l.map((f,m)=>-f/u[m]);return super.pad_image(e,r,s,{center:!0,constant_values:d,...n})}},Kp=class extends Ms{};var vi=class extends W{},Yp=class extends vi{};var Qp=class extends W{constructor(e){super(e),this.include_top=this.config.include_top??!0,this.include_top&&(this.image_std=this.image_std.map(r=>r*r))}};var Jp=class extends W{};var Zp=class extends W{async _call(e){let r=await super._call(e),s=r.pixel_values.dims,n=rt([s[0],s[2],s[3]]);return{...r,pixel_mask:n}}};var ki=class extends 
W{constructor(e){super(e),this.do_image_splitting=e.do_image_splitting??!0,this.max_image_size=e.max_image_size}get_resize_for_vision_encoder(e,r){let[s,n]=e.dims.slice(-2),o=n/s;return n>=s?(n=Math.ceil(n/r)*r,s=Math.floor(n/o),s=Math.ceil(s/r)*r):(s=Math.ceil(s/r)*r,n=Math.floor(s*o),n=Math.ceil(n/r)*r),{height:s,width:n}}async _call(e,{do_image_splitting:r=null,return_row_col_info:s=!1}={}){let n;if(!Array.isArray(e))n=[[e]];else{if(e.length===0||!e[0])throw new Error("No images provided.");Array.isArray(e[0])?n=e:n=[e]}let o=[],a=[],i=[],l=[],u=[];for(let E of n){let M=await Promise.all(E.map(z=>this.preprocess(z)));l.push(...M.map(z=>z.original_size)),u.push(...M.map(z=>z.reshaped_input_size)),M.forEach(z=>z.pixel_values.unsqueeze_(0));let{longest_edge:I}=this.max_image_size,T;if(r??this.do_image_splitting){let z=new Array(M.length),C=new Array(M.length);T=await Promise.all(M.map(async(v,G)=>{let X=this.get_resize_for_vision_encoder(v.pixel_values,I),V=await Pt(v.pixel_values,{size:[X.height,X.width]}),{frames:Q,num_splits_h:K,num_splits_w:Y}=await this.split_image(V,this.max_image_size);return z[G]=K,C[G]=Y,Ee(Q,0)})),a.push(z),i.push(C)}else{let z=[I,I];T=await Promise.all(M.map(C=>Pt(C.pixel_values,{size:z}))),a.push(new Array(M.length).fill(0)),i.push(new Array(M.length).fill(0))}o.push(Ee(T,0))}let d=o.length,[f,m,_,w]=o[0].dims,x,k;if(d===1)x=o[0].unsqueeze_(0),k=Ge([d,f,_,w],!0);else{let E=Math.max(...o.map(T=>T.dims.at(0)));k=Ge([d,E,_,w],!0);let M=k.data,I=E*_*w;for(let T=0;T<d;++T){let z=o[T].dims[0];if(z<E){o[T]=Ee([o[T],Ge([E-z,m,_,w],0)],0);let C=T*I+z*_*w,v=(T+1)*I;M.fill(!1,C,v)}}x=zt(o,0)}return{pixel_values:x,pixel_attention_mask:k,original_sizes:l,reshaped_input_sizes:u,...s?{rows:a,cols:i}:{}}}async split_image(e,{longest_edge:r}){let s=r,n=r,o=[],[a,i]=e.dims.slice(-2),l=0,u=0;if(a>s||i>n){l=Math.ceil(a/s),u=Math.ceil(i/n);let d=Math.ceil(a/l),f=Math.ceil(i/u);for(let w=0;w<l;++w)for(let x=0;x<u;++x){let 
k,E,M,I;w===l-1?(E=a-d,I=a):(E=w*d,I=(w+1)*d),x===u-1?(k=i-f,M=i):(k=x*f,M=(x+1)*f);let C=await di(e,[E,k],[I,M],[2,3]);o.push(C)}let m=s,_=n;(a!==m||i!==_)&&(e=await Pt(e,{size:[m,_]}))}return o.push(e),{frames:o,num_splits_h:l,num_splits_w:u}}};var ed=class extends W{constructor(e){super({do_pad:!0,pad_size:{width:e.image_size,height:e.image_size},...e}),this.constant_values=this.config.background_color.map(r=>r*this.rescale_factor)}pad_image(e,r,s,n){return super.pad_image(e,r,s,{constant_values:this.constant_values,center:!0,...n})}};var td=class extends W{constructor(e){let{resize_mode:r,fill_color:s,interpolation:n,size:o,...a}=e,i=r==="squash"?{width:o,height:o}:r==="shortest"?{shortest_edge:o}:{longest_edge:o},l=n==="bicubic"?3:2;super({...a,size:i,resample:l,do_center_crop:!0,crop_size:o,do_normalize:!0})}};var rd=class extends W{};var Ts=class extends W{post_process_panoptic_segmentation(...e){return Bp(...e)}post_process_instance_segmentation(...e){return Dp(...e)}},sd=class extends Ts{};var nd=class extends Ts{};var Ei=class extends W{},od=class extends Ei{};var Ai=class extends W{},ad=class extends Ai{};var Mi=class extends W{},id=class extends Mi{};var Ti=class extends W{},ld=class extends Ti{};var Si=class extends W{},cd=class extends Si{};var ud=class extends Ms{};var Ss=class extends W{post_process_object_detection(...e){return Hr(...e)}},pd=class extends Ss{};var dd=class extends Ss{};var Lt=336,$P=[2,3],{ceil:j0,floor:On,sqrt:G0}=Math,fd=class extends W{constructor(e){super({...e,do_normalize:!0,do_pad:!0,pad_size:"custom",do_convert_rgb:!0,do_resize:!0}),this._num_crops=e.num_crops}calc_num_image_tokens_from_image_size(e,r){let{num_img_tokens:s}=this.config;return On((On(r/Lt)*On(e/Lt)+1)*s+1+(On(r/Lt)+1)*G0(s))}get_resize_output_image_size(e,r){let s=this._num_crops,[n,o]=e.size,a=n/o,i=1;for(;i*Math.ceil(i/a)<=s;)i+=1;i-=1;let 
l=Math.floor(i*336),u=Math.floor(l/a);return[l,u]}pad_image(e,r,s,n={}){let[o,a]=r,i=Lt*j0(o/Lt),l=Lt*j0(a/Lt),u=[1,1,1].map((d,f)=>(d-this.image_mean[f])/this.image_std[f]);return super.pad_image(e,r,{width:l,height:i},{center:!0,constant_values:u,...n})}async _call(e,{num_crops:r=null}={}){if(this._num_crops=r??=this.config.num_crops,r<4||G0(r)%1!==0)throw new Error("num_crops must be a square number >= 4");Array.isArray(e)||(e=[e]);let s=e.length,n=await Promise.all(e.map(m=>this.preprocess(m))),o=n.map(m=>m.original_size),a=n.map(m=>m.reshaped_input_size),i=[];for(let{pixel_values:m}of n){m.unsqueeze_(0);let[_,w]=m.dims.slice(-2),x=await Pt(m,{size:[Lt,Lt],mode:"bicubic"});if(r>0){let k=[],E=G0(r),M=On(w/E),I=On(_/E);for(let z=0;z<E;++z)for(let C=0;C<E;++C){let v,G,X,V;z===E-1?(G=_-I,V=_):(G=z*I,V=(z+1)*I),C===E-1?(v=w-M,X=w):(v=C*M,X=(C+1)*M);let Y=await di(m,[G,v],[V,X],$P);k.push(Y)}let T=await Pt(Ee(k,0),{size:[Lt,Lt],mode:"bicubic"});i.push(Ee([x,T],0))}else i.push(x)}let l=zt(i,0),u=a.map(m=>m.map(_=>Lt*j0(_/Lt))),d=new U("int64",u.flat(),[s,2]),f=u.map(([m,_])=>this.calc_num_image_tokens_from_image_size(_,m));return{pixel_values:l,original_sizes:o,reshaped_input_sizes:a,image_sizes:d,num_img_tokens:f}}};var md=class extends W{get_resize_output_image_size(e,r){let{longest_edge:s}=r;if(s===void 0)throw new Error("size must contain 'longest_edge'");let[n,o]=e.size,a=Math.max(n,o)/s,i=n,l=o;a>1&&(i=Math.floor(n/a),l=Math.floor(o/a));let{patch_size:u,spatial_merge_size:d}=this.config;if(!d)throw new Error("config must contain 'spatial_merge_size'");let f=u*d,m=Math.floor((i-1)/f)+1,_=Math.floor((l-1)/f)+1;return[m*f,_*f]}};var hd=class extends W{};var _d=class extends W{async _call(e,...r){let{pixel_values:s,original_sizes:n,reshaped_input_sizes:o}=await super._call(e,...r),a=s,{temporal_patch_size:i,merge_size:l,patch_size:u}=this.config;a.dims[0]===1&&(a=Ee(Array.from({length:i},()=>a),0));let 
d=a.dims[0]/i,f=a.dims[1],m=Math.floor(a.dims[2]/u),_=Math.floor(a.dims[3]/u),w=a.view(d,i,f,Math.floor(m/l),l,u,Math.floor(_/l),l,u).permute(0,3,6,4,7,2,1,5,8).view(d*m*_,f*i*u*u),x=new U("int64",[d,m,_],[1,3]);return{pixel_values:w,image_grid_thw:x,original_sizes:n,reshaped_input_sizes:o}}};var gd=class extends W{post_process_object_detection(...e){return Hr(...e)}};var In=class extends W{reshape_input_points(e,r,s,n=!1){e=structuredClone(e);let o=Sy(e);if(o.length===3)n||(o=[1,...o]),e=[e];else if(o.length!==4)throw Error("The input_points must be a 4D tensor of shape `batch_size`, `point_batch_size`, `nb_points_per_image`, `2`.");for(let a=0;a<e.length;++a){let[i,l]=r[a],[u,d]=s[a],f=[d/l,u/i];for(let m=0;m<e[a].length;++m)for(let _=0;_<e[a][m].length;++_)for(let w=0;w<e[a][m][_].length;++w)e[a][m][_][w]*=f[w%2]}return new U("float32",Float32Array.from(e.flat(1/0)),o)}add_input_labels(e,r){let s=Sy(e);if(s.length===2)s=[1,...s],e=[e];else if(s.length!==3)throw Error("The input_points must be a 4D tensor of shape `batch_size`, `point_batch_size`, `nb_points_per_image`, `2`.");if(s.some((n,o)=>n!==r.dims[o]))throw Error(`The first ${s.length} dimensions of 'input_points' and 'input_labels' must be the same.`);return new U("int64",e.flat(1/0).map(BigInt),s)}async _call(e,{input_points:r=null,input_labels:s=null,input_boxes:n=null}={}){let o=await super._call(e);if(r&&(o.input_points=this.reshape_input_points(r,o.original_sizes,o.reshaped_input_sizes)),s){if(!o.input_points)throw Error("`input_points` must be provided if `input_labels` are provided.");o.input_labels=this.add_input_labels(s,o.input_points)}return n&&(o.input_boxes=this.reshape_input_points(n,o.original_sizes,o.reshaped_input_sizes,!0)),o}async post_process_masks(e,r,s,{mask_threshold:n=0,binarize:o=!0,pad_size:a=null}={}){let i=[];a=a??this.pad_size??this.size;let l=[a.height,a.width];for(let u=0;u<r.length;++u){let d=r[u],f=s[u],m=await 
Pt(e[u],{mode:"bilinear",size:l});if(m=m.slice(null,null,[0,f[0]],[0,f[1]]),m=await Pt(m,{mode:"bilinear",size:d}),o){let _=m.data,w=new Uint8Array(_.length);for(let x=0;x<_.length;++x)_[x]>n&&(w[x]=1);m=new U("bool",w,m.dims)}i.push(m)}return i}generate_crop_boxes(e,r,{crop_n_layers:s=0,overlap_ratio:n=512/1500,points_per_crop:o=32,crop_n_points_downscale_factor:a=1}={}){}};var Oi=class extends W{post_process_semantic_segmentation(...e){return Up(...e)}},wd=class extends Oi{};var Ii=class extends W{post_process_semantic_segmentation(...e){return Up(...e)}},xd=class extends Ii{};var yd=class extends W{};var bd=class extends W{pad_image(e,r,s,n={}){let[o,a,i]=r;return super.pad_image(e,r,{width:a+(s-a%s)%s,height:o+(s-o%s)%s},{mode:"symmetric",center:!1,constant_values:-1,...n})}};var Ci=class extends W{},vd=class extends Ci{};var kd=class extends W{async _call(e,r){Array.isArray(e)||(e=[e]),Array.isArray(r)||(r=[r]);let s=await Promise.all(e.map(a=>this.preprocess(a))),n=await Promise.all(r.map(a=>this.preprocess(a,{do_normalize:!1,do_convert_rgb:!1,do_convert_grayscale:!0})));return{pixel_values:zt(s.map((a,i)=>Ee([a.pixel_values,n[i].pixel_values],0)),0),original_sizes:s.map(a=>a.original_size),reshaped_input_sizes:s.map(a=>a.reshaped_input_size)}}};var Ed=class extends W{post_process_pose_estimation(e,r,{threshold:s=null}={}){let n=e.tolist(),[o,a,i,l]=e.dims,u=[];for(let d=0;d<o;++d){let f=n[d],m=r[d],_=[];for(let w=0;w<m.length;++w){let x=m[w],k=[],E=[],M=[],I=x.at(-2)/l,T=x.at(-1)/i;for(let z=0;z<f.length;++z){let[C,v]=[0,0],G=0,X=-1/0,V=f[z];for(let K=0;K<V.length;++K){let Y=V[K];for(let B=0;B<Y.length;++B){let P=Y[B];G+=P,X=Math.max(X,P),C+=(B+.5)*P,v+=K*P}}if(s!=null&&X<s)continue;let Q=[I*C/G,T*v/G];k.push(Q),M.push(z),E.push(X)}_.push({bbox:x,scores:E,labels:M,keypoints:k})}u.push(_)}return u}};var Pi=class extends W{post_process_object_detection(...e){return Hr(...e)}},Ad=class extends Pi{};var Le=class{static async from_pretrained(e,r={}){let s=await 
it(e,En,!0,r),n=s.image_processor_type??s.feature_extractor_type,o=Cn[n?.replace(/Fast$/,"")];return o||(n!==void 0&&console.warn(`Image processor type '${n}' not found, assuming base ImageProcessor. Please report this at ${kn}.`),o=W),new o(s)}};var Md=class extends ne{static tokenizer_class=J;static image_processor_class=Le;constructor(e,r,s){super(e,r,s);let{tasks_answer_post_processing_type:n,task_prompts_without_inputs:o,task_prompts_with_input:a}=this.image_processor.config;this.tasks_answer_post_processing_type=new Map(Object.entries(n??{})),this.task_prompts_without_inputs=new Map(Object.entries(o??{})),this.task_prompts_with_input=new Map(Object.entries(a??{})),this.regexes={quad_boxes:/(.+?)<loc_(\d+)><loc_(\d+)><loc_(\d+)><loc_(\d+)><loc_(\d+)><loc_(\d+)><loc_(\d+)><loc_(\d+)>/gm,bboxes:/([^<]+)?<loc_(\d+)><loc_(\d+)><loc_(\d+)><loc_(\d+)>/gm},this.size_per_bin=1e3}construct_prompts(e){typeof e=="string"&&(e=[e]);let r=[];for(let s of e)if(this.task_prompts_without_inputs.has(s))r.push(this.task_prompts_without_inputs.get(s));else{for(let[n,o]of this.task_prompts_with_input)if(s.includes(n)){r.push(o.replaceAll("{input}",s).replaceAll(n,""));break}r.length!==e.length&&r.push(s)}return r}post_process_generation(e,r,s){let n=this.tasks_answer_post_processing_type.get(r)??"pure_text";e=e.replaceAll("<s>","").replaceAll("</s>","");let o;switch(n){case"pure_text":o=e;break;case"description_with_bboxes":case"bboxes":case"phrase_grounding":case"ocr":let a=n==="ocr"?"quad_boxes":"bboxes",i=e.matchAll(this.regexes[a]),l=[],u=[];for(let[d,f,...m]of i)l.push(f?f.trim():l.at(-1)??""),u.push(m.map((_,w)=>(Number(_)+.5)/this.size_per_bin*s[w%2]));o={labels:l,[a]:u};break;default:throw new Error(`Task "${r}" (of type "${n}") not yet implemented.`)}return{[r]:o}}async _call(e,r=null,s={}){if(!e&&!r)throw new Error("Either text or images must be provided");let n=await this.image_processor(e,s),o=r?this.tokenizer(this.construct_prompts(r),s):{};return{...n,...o}}};var 
Td=class extends ne{static image_processor_class=Le;static feature_extractor_class=Ze;static tokenizer_class=J;static uses_processor_config=!0;static uses_chat_template_file=!0;constructor(e,r,s){super(e,r,s),this.audio_seq_length=this.config.audio_seq_length,this.image_seq_length=this.config.image_seq_length;let{audio_token_id:n,boa_token:o,audio_token:a,eoa_token:i,image_token_id:l,boi_token:u,image_token:d,eoi_token:f}=this.tokenizer.config;this.audio_token_id=n,this.boa_token=o,this.audio_token=a;let m=a.repeat(this.audio_seq_length);this.full_audio_sequence=`
|
|
16
16
|
|
|
17
17
|
${o}${m}${i}
|
|
18
18
|
|
|
@@ -24,6 +24,6 @@ ${u}${_}${f}
|
|
|
24
24
|
`}return a+=`
|
|
25
25
|
${s}${o}`+n.repeat(t)+`${s}`,a}function BP(t,e,r,s){return`${e}${s}`+r.repeat(t)+`${e}`}function DP(t,e,r,s,n,o){return t===0&&e===0?BP(r,s,n,o):UP(r,t,e,s,n,o)}var zi=class extends ne{static image_processor_class=Le;static tokenizer_class=J;static uses_processor_config=!0;fake_image_token="<fake_token_around_image>";image_token="<image>";global_img_token="<global-img>";async _call(e,r=null,s={}){s.return_row_col_info??=!0;let n;r&&(n=await this.image_processor(r,s)),Array.isArray(e)||(e=[e]);let o=n.rows??[new Array(e.length).fill(0)],a=n.cols??[new Array(e.length).fill(0)],i=this.config.image_seq_len,l=[],u=[];for(let f=0;f<e.length;++f){let m=e[f],_=o[f],w=a[f];l.push(nk(m,this.image_token));let x=_.map((M,I)=>DP(M,w[I],i,this.fake_image_token,this.image_token,this.global_img_token)),k=m.split(this.image_token);if(k.length===0)throw new Error("The image token should be present in the text.");let E=k[0];for(let M=0;M<x.length;++M)E+=x[M]+k[M+1];u.push(E)}return{...this.tokenizer(u),...n}}};var Od=class extends ne{static image_processor_class=Le;static tokenizer_class=J;static uses_processor_config=!0;constructor(e,r,s){super(e,r,s),this.image_tag=this.config.image_tag,this.image_start_tag=this.config.image_start_tag,this.image_end_tag=this.config.image_end_tag,this.num_image_tokens=this.config.num_image_tokens}async _call(e,{images:r=null,chat_template:s="default"}={}){r?Array.isArray(r)||(r=[r]):r=await Promise.all(e.filter(k=>k.images).flatMap(k=>k.images).map(k=>Xe.read(k)));let n=this.tokenizer,o=n.apply_chat_template(e,{tokenize:!1,add_generation_prompt:!0,chat_template:s}),a=k=>n.encode(k,{add_special_tokens:!1}),i=o.split(this.image_tag),l=i.length-1;if(r.length!==l)throw new Error(`Number of images provided (${r.length}) does not match number of "${this.image_tag}" image tags (${l})`);let[u,d,f]=n.convert_tokens_to_ids([this.image_tag,this.image_start_tag,this.image_end_tag]),m=a(i[0]),_=new Array(m.length).fill(!1);for(let k=1;k<i.length;++k){let E=new 
Array(this.num_image_tokens).fill(u),M=a(i[k]);m=dt(m,[d],E,[f],M);let I=new Array(this.num_image_tokens).fill(!0);_=dt(_,[!1],I,[!1],new Array(M.length).fill(!1))}let w=[1,m.length],x={input_ids:new U("int64",m,w),attention_mask:new U("int64",new Array(m.length).fill(1),w),images_seq_mask:new U("bool",_,w),images_emb_mask:new U("bool",new Array(l*this.num_image_tokens).fill(!0),[1,l,this.num_image_tokens])};if(r&&r.length>0){let k=await this.image_processor(r);return k.pixel_values.unsqueeze_(0),{...x,...k}}return x}};var Id=class extends ne{static tokenizer_class=J;static image_processor_class=Le;async _call(e=null,r=null,s={}){if(!e&&!r)throw new Error("Either text or images must be provided");let n=e?this.tokenizer(e,s):{},o=r?await this.image_processor(r,s):{};return{...n,...o}}};var Cd=class extends ne{static tokenizer_class=J;static image_processor_class=Le;static uses_processor_config=!0;async _call(e,r=null,s={}){let n=await this.image_processor(e,s);if(r){let[a,i]=n.pixel_values.dims.slice(-2),{image_token:l,patch_size:u,num_additional_image_tokens:d}=this.config,f=Math.floor(a/u)*Math.floor(i/u)+d;r=structuredClone(r),Array.isArray(r)||(r=[r]);for(let m=0;m<r.length;++m)r[m]=r[m].replace(l,l.repeat(f))}let o=r?this.tokenizer(r,s):{};return{...n,...o}}};var hA={char:["char_decode",1],bpe:["bpe_decode",2],wp:["wp_decode",102]},Pd=class extends ne{static tokenizer_class=J;static image_processor_class=Le;get char_tokenizer(){return this.components.char_tokenizer}get bpe_tokenizer(){return this.components.bpe_tokenizer}get wp_tokenizer(){return this.components.wp_tokenizer}_decode_helper(e,r){if(!hA.hasOwnProperty(r))throw new Error(`Format ${r} is not supported.`);let[s,n]=hA[r],o=this[s].bind(this),[a,i]=e.dims,l=[],u=[],d=e.tolist();for(let m=0;m<a;++m){let _=d[m],w=[],x=[];for(let E=1;E<i;++E){let[M,I]=Te(Oe(_[E]));if(x.push(M),I==n)break;w.push(I)}let k=x.length>0?x.reduce((E,M)=>E*M,1):0;u.push(w),l.push(k)}return[o(u),l]}char_decode(e){return 
this.char_tokenizer.batch_decode(e).map(r=>r.replaceAll(" ",""))}bpe_decode(e){return this.bpe_tokenizer.batch_decode(e)}wp_decode(e){return this.wp_tokenizer.batch_decode(e).map(r=>r.replaceAll(" ",""))}batch_decode([e,r,s]){let[n,o]=this._decode_helper(e,"char"),[a,i]=this._decode_helper(r,"bpe"),[l,u]=this._decode_helper(s,"wp"),d=[],f=[];for(let m=0;m<n.length;++m){let[_,w]=Te([o[m],i[m],u[m]]);d.push([n[m],a[m],l[m]][w]),f.push(_)}return{generated_text:d,scores:f,char_preds:n,bpe_preds:a,wp_preds:l}}static async from_pretrained(...e){let r=await super.from_pretrained(...e),s=await J.from_pretrained("Xenova/gpt2"),n=await J.from_pretrained("Xenova/bert-base-uncased");return r.components={image_processor:r.image_processor,char_tokenizer:r.tokenizer,bpe_tokenizer:s,wp_tokenizer:n},r}async _call(e,r=null){let s=await this.image_processor(e);return r&&(s.labels=this.tokenizer(r).input_ids),s}};var zd=class extends ne{static tokenizer_class=J;static feature_extractor_class=Ze;async _call(e){return await this.feature_extractor(e)}};var Ld=class extends ne{static tokenizer_class=J;static image_processor_class=Le};var Pn="<image>";function FP(t,e,r,s,n){return`${s.repeat(r*n)}${e}${t}
|
|
26
26
|
`}var Nd=class extends ne{static tokenizer_class=J;static image_processor_class=Le;static uses_processor_config=!1;async _call(e,r=null,s={}){r||(console.warn("You are using PaliGemma without a text prefix. It will perform as a picture-captioning model."),r=""),Array.isArray(e)||(e=[e]),Array.isArray(r)||(r=[r]);let n=this.tokenizer.bos_token,o=this.image_processor.config.image_seq_length,a;r.some(u=>u.includes(Pn))?a=r.map(u=>{let d=u.replaceAll(Pn,Pn.repeat(o)),f=d.lastIndexOf(Pn),m=f===-1?0:f+Pn.length;return d.slice(0,m)+n+d.slice(m)+`
|
|
27
|
-
`}):(console.warn("You are passing both `text` and `images` to `PaliGemmaProcessor`. The processor expects special image tokens in the text, as many tokens as there are images per each text. It is recommended to add `<image>` tokens in the very beginning of your text. For this call, we will infer how many images each text has and add special tokens."),a=r.map(u=>FP(u,n,o,Pn,e.length)));let i=this.tokenizer(a,s);return{...await this.image_processor(e,s),...i}}};var _A="<|image|>",jP=/<\|image_\d+\|>/g,$d=class extends ne{static image_processor_class=Le;static tokenizer_class=J;async _call(e,r=null,{padding:s=!0,truncation:n=!0,num_crops:o=null}={}){Array.isArray(e)||(e=[e]);let a,i;if(r){i=await this.image_processor(r,{num_crops:o});let{num_img_tokens:l}=i,u=e.map((f,m)=>f.split(jP).join(_A.repeat(l[m])));a=this.tokenizer(u,{padding:s,truncation:n});let d=this.tokenizer._tokenizer.token_to_id(_A);a.input_ids.map_(f=>f==d?-f:f)}else a=this.tokenizer(e);return{...a,...i}}};var Rd=class extends ne{static tokenizer_class=J;static image_processor_class=Le;static uses_processor_config=!0;async _call(e,r=null,s={}){let n=await this.image_processor(e,s);if(r){let[a,i]=n.pixel_values.dims.slice(-2),{image_token:l,image_break_token:u,image_end_token:d,patch_size:f,spatial_merge_size:m}=this.config,_=f*m,w=Math.floor(a/_),x=Math.floor(i/_);r=structuredClone(r),Array.isArray(r)||(r=[r]);for(let k=0;k<r.length;++k){let E=l.repeat(x),M=E+u,I=E+d,T=M.repeat(w-1)+I;r[k]=r[k].replace(l,T)}}let o=r?this.tokenizer(r,s):{};return{...n,...o}}};var Ud=class extends ne{static feature_extractor_class=Sn;async _call(e){return await this.feature_extractor(e)}post_process_speaker_diarization(...e){return this.feature_extractor.post_process_speaker_diarization(...e)}get sampling_rate(){return this.feature_extractor.config.sampling_rate}};var Bd=class extends ne{static image_processor_class=Le;static tokenizer_class=J;async _call(e,r=null,...s){Array.isArray(e)||(e=[e]);let n,o;if(r&&(n=await 
this.image_processor(r),o=n.image_grid_thw),o){let i=this.image_processor.config.merge_size**2,l=0,u=o.tolist();e=e.map(d=>{for(;d.includes("<|image_pad|>");){let f=Number(u[l++].reduce((m,_)=>m*_,1n));d=d.replace("<|image_pad|>","<|placeholder|>".repeat(Math.floor(f/i)))}return d.replaceAll("<|placeholder|>","<|image_pad|>")})}return{...this.tokenizer(e),...n}}};var zn=class extends ne{static image_processor_class=Le;async _call(...e){return await this.image_processor(...e)}post_process_masks(...e){return this.image_processor.post_process_masks(...e)}reshape_input_points(...e){return this.image_processor.reshape_input_points(...e)}};var Li=class extends zn{},Dd=class extends Li{};var Fd=class extends ne{static tokenizer_class=J;static feature_extractor_class=Ze;async _call(e){return await this.feature_extractor(e)}};var jd=class extends ne{static tokenizer_class=J;static feature_extractor_class=Ze;static uses_processor_config=!0;async _call(e,r=null,s={}){if(Array.isArray(e))throw new Error("Batched inputs are not supported yet.");let n={};if(r){let a=r.length,{input_features:i}=await this.feature_extractor(r,{...s,max_length:a}),l=Math.round(a/this.config.encoder_ds_factor+1e-4),u=1+Math.ceil(l/this.config.stack_factor);n.audio_token_len=[u],n.audio_values=i;let d=this.config.audio_placeholder;if(!e.includes(d))throw new Error(`The input text does not contain the image token ${d}.`);e=e.replaceAll(d,d.repeat(u))}return{...this.tokenizer(e,{add_special_tokens:!1,...s}),...n}}};var Gd="[AUDIO]",GP="[BEGIN_AUDIO]",qP=375;function WP(t,e){let r=[];for(let s=0;s<t.length;s+=e)r.push(t.subarray(s,Math.min(s+e,t.length)));return r}var qd=class extends ne{static tokenizer_class=J;static feature_extractor_class=Ze;static uses_processor_config=!1;async _call(e,r=null,s={}){if(Array.isArray(e))throw new Error("Batched inputs are not supported yet.");let n={};if(r){if(!e.includes(Gd))throw new Error(`The input text does not contain the audio token 
${Gd}.`);Array.isArray(r)||(r=[r]);let a=e.split(Gd),i=a.length-1;if(i!==r.length)throw new Error(`The number of audio inputs (${r.length}) does not match the number of audio tokens in the text (${i}).`);let l=this.feature_extractor.config.n_samples,u=r.map(w=>WP(w,l)),d=u.map(w=>w.length),f=u.flat(),m=(await Promise.all(f.map(w=>this.feature_extractor(w,s)))).map(w=>w.input_features);n.audio_values=m.length>1?Ee(m,0):m[0];let _=a[0];for(let w=0;w<d.length;++w){_+=GP;for(let x=0;x<d[w];++x)_+=Gd.repeat(qP);_+=a[w+1]}e=_}return{...this.tokenizer(e,{add_special_tokens:!1,...s}),...n}}};var Wd=class extends ne{static tokenizer_class=J;static feature_extractor_class=Ze;async _call(e){return await this.feature_extractor(e)}};var Vd=class extends ne{static tokenizer_class=J;static feature_extractor_class=Ze;async _call(e){return await this.feature_extractor(e)}};var Hd=class extends ne{static tokenizer_class=J;static feature_extractor_class=Ze;async _call(e){return await this.feature_extractor(e)}};var lt=class{static async from_pretrained(e,r={}){let s=await it(e,En,!0,r),{image_processor_type:n,feature_extractor_type:o,processor_class:a}=s;if(a&&Xd[a])return Xd[a].from_pretrained(e,r);if(!n&&!o)throw new Error("No `image_processor_type` or `feature_extractor_type` found in the config.");let i={};if(n){let u=Cn[n.replace(/Fast$/,"")];if(!u)throw new Error(`Unknown image_processor_type: '${n}'.`);i.image_processor=new u(s)}if(o){let u=Cn[o];if(u)i.image_processor=new u(s);else{let d=gi[o];if(!d)throw new Error(`Unknown feature_extractor_type: '${o}'.`);i.feature_extractor=new d(s)}}let l={};return new ne(l,i,null)}};async function VP(t,e){return await it(t,"config.json",!0,e)}function Ln(t){let 
e={},r={};switch(t.model_type){case"llava":case"paligemma":case"gemma3":case"florence2":case"llava_onevision":case"idefics3":case"ultravox":case"voxtral":case"smolvlm":case"gemma3n":case"chatterbox":case"mistral3":r=Ln(t.text_config);break;case"moondream1":r=Ln(t.phi_config);break;case"musicgen":r=Ln(t.decoder);break;case"multi_modality":r=Ln(t.language_config);break;case"gpt2":case"gptj":case"jais":case"codegen":case"gpt_bigcode":e.num_heads="n_head",e.num_layers="n_layer",e.hidden_size="n_embd";break;case"gpt_neox":case"stablelm":case"opt":case"falcon":case"modernbert-decoder":e.num_heads="num_attention_heads",e.num_layers="num_hidden_layers",e.hidden_size="hidden_size";break;case"gpt_oss":case"llama":case"llama4_text":case"nanochat":case"apertus":case"arcee":case"lfm2":case"lfm2_moe":case"smollm3":case"olmo":case"olmo2":case"olmo3":case"mobilellm":case"granite":case"granitemoehybrid":case"cohere":case"mistral":case"starcoder2":case"qwen2":case"qwen2_vl":case"phi":case"phi3":case"phi3_v":case"llava_qwen2":e.num_heads="num_key_value_heads",e.num_layers="num_hidden_layers",e.hidden_size="hidden_size",e.num_attention_heads="num_attention_heads",e.dim_kv="head_dim";break;case"qwen3":case"gemma":case"gemma2":case"vaultgemma":case"gemma3_text":case"gemma3n_text":case"glm":case"helium":case"ernie4_5":case"hunyuan_v1_dense":case"falcon_h1":case"ministral":case"ministral3":e.num_heads="num_key_value_heads",e.num_layers="num_hidden_layers",e.dim_kv="head_dim";break;case"openelm":e.num_heads="num_kv_heads",e.num_layers="num_transformer_layers",e.dim_kv="head_dim";break;case"gpt_neo":case"donut-swin":e.num_heads="num_heads",e.num_layers="num_layers",e.hidden_size="hidden_size";break;case"bloom":e.num_heads="n_head",e.num_layers="n_layer",e.hidden_size="hidden_size";break;case"mpt":e.num_heads="n_heads",e.num_layers="n_layers",e.hidden_size="d_model";break;case"exaone":e.num_heads="num_key_value_heads",e.num_layers="num_layers",e.dim_kv="head_dim",e.num_attention_heads="num_at
tention_heads";break;case"youtu":e.num_heads="num_key_value_heads",e.num_layers="num_hidden_layers",e.dim_kv="qk_head_dim",e.num_attention_heads="num_attention_heads";break;case"t5":case"mt5":case"longt5":e.num_decoder_layers="num_decoder_layers",e.num_decoder_heads="num_heads",e.decoder_dim_kv="d_kv",e.num_encoder_layers="num_layers",e.num_encoder_heads="num_heads",e.encoder_dim_kv="d_kv";break;case"bart":case"mbart":case"marian":case"whisper":case"lite-whisper":case"m2m_100":case"blenderbot":case"blenderbot-small":case"florence2_language":e.num_decoder_layers="decoder_layers",e.num_decoder_heads="decoder_attention_heads",e.decoder_hidden_size="d_model",e.num_encoder_layers="encoder_layers",e.num_encoder_heads="encoder_attention_heads",e.encoder_hidden_size="d_model";break;case"speecht5":e.num_decoder_layers="decoder_layers",e.num_decoder_heads="decoder_attention_heads",e.decoder_hidden_size="hidden_size",e.num_encoder_layers="encoder_layers",e.num_encoder_heads="encoder_attention_heads",e.encoder_hidden_size="hidden_size";break;case"trocr":e.num_encoder_layers=e.num_decoder_layers="decoder_layers",e.num_encoder_heads=e.num_decoder_heads="decoder_attention_heads",e.encoder_hidden_size=e.decoder_hidden_size="d_model";break;case"musicgen_decoder":e.num_encoder_layers=e.num_decoder_layers="num_hidden_layers",e.num_encoder_heads=e.num_decoder_heads="num_attention_heads",e.encoder_hidden_size=e.decoder_hidden_size="hidden_size";break;case"moonshine":e.num_decoder_layers="decoder_num_hidden_layers",e.num_decoder_heads="decoder_num_key_value_heads",e.num_encoder_layers="encoder_num_hidden_layers",e.num_encoder_heads="encoder_num_key_value_heads",e.encoder_hidden_size=e.decoder_hidden_size="hidden_size";break;case"vision-encoder-decoder":let n=Ln(t.decoder),o="num_decoder_layers"in n,a=at(t,["model_type","is_encoder_decoder"]);return 
o?(a.num_decoder_layers=n.num_decoder_layers,a.num_decoder_heads=n.num_decoder_heads,a.decoder_hidden_size=n.decoder_hidden_size,a.num_encoder_layers=n.num_encoder_layers,a.num_encoder_heads=n.num_encoder_heads,a.encoder_hidden_size=n.encoder_hidden_size):(a.num_layers=n.num_layers,a.num_heads=n.num_heads,a.hidden_size=n.hidden_size),a}let s={...r,...at(t,["model_type","multi_query","is_encoder_decoder"])};for(let n in e)s[n]=t[e[n]];return s}function Kd(t,e){if(["lfm2","lfm2_moe"].includes(t.model_type)){let r=e?.prefix??"past_key_values",s=r==="present"?"present":"past",n={},{layer_types:o,num_attention_heads:a,num_key_value_heads:i,hidden_size:l,conv_L_cache:u}=t,d=l/a,f=e?.batch_size??1;for(let m=0;m<o.length;++m)if(o[m]==="full_attention")for(let _ of["key","value"])n[`${r}.${m}.${_}`]=[f,i,0,d];else if(o[m]==="conv")n[`${s}_conv.${m}`]=[f,l,u];else throw new Error(`Unsupported layer type: ${o[m]}`);return n}else if(["granitemoehybrid","falcon_h1"].includes(t.model_type)){let r=e?.prefix??"past_key_values",s=r==="present"?"present":"past",n={},{layer_types:o,num_hidden_layers:a,num_attention_heads:i,num_key_value_heads:l,hidden_size:u,mamba_d_conv:d,mamba_n_heads:f,mamba_d_head:m,mamba_d_state:_,mamba_n_groups:w,mamba_expand:x,mamba_d_ssm:k}=t,E=u/i,M=e?.batch_size??1,I=(k??x*u)+2*w*_;for(let T=0;T<a;++T)if((!o||o[T]==="mamba")&&(n[`${s}_conv.${T}`]=[M,I,d],n[`${s}_ssm.${T}`]=[M,f,m,_]),!o||o[T]==="attention")for(let z of["key","value"])n[`${r}.${T}.${z}`]=[M,l,0,E];return n}return HP(t,e)}function HP(t,{prefix:e="past_key_values",batch_size:r=1}={}){let s={},n=t.normalized_config;if(n.is_encoder_decoder&&"num_encoder_heads"in n&&"num_decoder_heads"in n){let o=n.encoder_dim_kv??n.encoder_hidden_size/n.num_encoder_heads,a=n.decoder_dim_kv??n.decoder_hidden_size/n.num_decoder_heads,i=[r,n.num_encoder_heads,0,o],l=[r,n.num_decoder_heads,0,a];for(let 
u=0;u<n.num_decoder_layers;++u)s[`${e}.${u}.encoder.key`]=i,s[`${e}.${u}.encoder.value`]=i,s[`${e}.${u}.decoder.key`]=l,s[`${e}.${u}.decoder.value`]=l}else{let o=n.num_heads,a=n.num_layers,i=n.dim_kv??n.hidden_size/(n.num_attention_heads??o);if(n.model_type==="falcon"){let l=[r*o,0,i];for(let u=0;u<a;++u)s[`${e}.${u}.key`]=l,s[`${e}.${u}.value`]=l}else if(n.multi_query){let l=[r*o,0,2*i];for(let u=0;u<a;++u)s[`${e}.${u}.key_value`]=l}else if(n.model_type==="bloom"){let l=[r*o,i,0],u=[r*o,0,i];for(let d=0;d<a;++d)s[`${e}.${d}.key`]=l,s[`${e}.${d}.value`]=u}else if(n.model_type==="openelm")for(let l=0;l<a;++l){let u=[r,o[l],0,i];s[`${e}.${l}.key`]=u,s[`${e}.${l}.value`]=u}else{let l=[r,o,0,i];for(let u=0;u<a;++u)s[`${e}.${u}.key`]=l,s[`${e}.${u}.value`]=l}}return s}var Ni=class t{model_type=null;is_encoder_decoder=!1;max_position_embeddings;"transformers.js_config";constructor(e){Object.assign(this,e),this.normalized_config=Ln(this)}static async from_pretrained(e,{progress_callback:r=null,config:s=null,cache_dir:n=null,local_files_only:o=!1,revision:a="main"}={}){s&&!(s instanceof t)&&(s=new t(s));let i=s??await VP(e,{progress_callback:r,config:s,cache_dir:n,local_files_only:o,revision:a});return new this(i)}},Xr=class{static async from_pretrained(...e){return Ni.from_pretrained(...e)}};async function gA(t,e,r,s){let n=`${e}${s}.onnx`,o=`${r.subfolder??""}/${n}`;return await ei(t,o,!0,r,be.IS_NODE_ENV)}async function wA(t,e,r,s,n,o={}){let a=`${e}${r}.onnx`,i=be.IS_NODE_ENV,l=[];if(n){let u;typeof n=="object"?n.hasOwnProperty(a)?u=n[a]:n.hasOwnProperty(e)?u=n[e]:u=!1:u=n;let d=+u;if(d>iu)throw new Error(`The number of external data chunks (${d}) exceeds the maximum allowed value (${iu}).`);for(let f=0;f<d;++f){let m=`${a}_data${f===0?"":"_"+f}`,_=`${s.subfolder??""}/${m}`;l.push(new Promise(async(w,x)=>{let k=await ei(t,_,!0,s,i);w(k instanceof Uint8Array?{path:m,data:k}:m)}))}}else o.externalData!==void 0&&(l=o.externalData.map(async u=>{if(typeof 
u.data=="string"){let d=await ei(t,u.data,!0,s);return{...u,data:d}}return u}));return Promise.all(l)}async function XP(t,e,r,s=!1){let n=r.config?.["transformers.js_config"]??{},o=r.device??n.device;o&&typeof o!="string"&&(o.hasOwnProperty(e)?o=o[e]:(console.warn(`device not specified for "${e}". Using the default device.`),o=null));let a=o??(be.IS_NODE_ENV?"cpu":"wasm"),i=HE(a),l=n.device_config??{};l.hasOwnProperty(a)&&(n={...n,...l[a]});let u=r.dtype??n.dtype;if(typeof u!="string"&&(u&&u.hasOwnProperty(e)?u=u[e]:(u=T0[a]??mt.fp32,console.warn(`dtype not specified for "${e}". Using the default dtype (${u}) for this device (${a}).`))),u===mt.auto){let z=n.dtype;typeof z!="string"&&(z=z?.[e]),z&&z!==mt.auto&&mt.hasOwnProperty(z)?u=z:u=T0[a]??mt.fp32}let d=u;if(S0.hasOwnProperty(d)){if(a==="webgpu"&&!be.IS_NODE_ENV&&d===mt.fp16&&!await YE())throw new Error(`The device (${a}) does not support fp16.`)}else throw new Error(`Invalid dtype: ${d}. Should be one of: ${Object.keys(mt).join(", ")}`);let f=n.kv_cache_dtype,m=f?typeof f=="string"?f:f[d]??"float32":void 0;if(m&&!["float32","float16"].includes(m))throw new Error(`Invalid kv_cache_dtype: ${m}. Should be one of: float32, float16`);let _=S0[d],w={...r.session_options};w.executionProviders??=i;let x=n.free_dimension_overrides;x?w.freeDimensionOverrides??=x:a.startsWith("webnn")&&!w.freeDimensionOverrides&&console.warn(`WebNN does not currently support dynamic shapes and requires 'free_dimension_overrides' to be set in config.json, preferably as a field within config["transformers.js_config"]["device_config"]["${a}"]. 
When 'free_dimension_overrides' is not set, you may experience significant performance degradation.`);let k=gA(t,e,r,_),E=r.use_external_data_format??n.use_external_data_format,M=await wA(t,e,_,r,E,w);if(M.length>0&&!be.IS_NODE_ENV&&(w.externalData=M),s&&a==="webgpu"&&f!==!1){let z=Kd(r.config,{prefix:"present"});if(Object.keys(z).length>0&&!ui()){let C={};for(let v in z)C[v]="gpu-buffer";w.preferredOutputLocation=C}}return{buffer_or_path:await k,session_options:w,session_config:{dtype:d,kv_cache_dtype:m,device:a}}}async function bt(t,e,r,s=void 0){return Object.fromEntries(await Promise.all(Object.keys(e).map(async n=>{let{buffer_or_path:o,session_options:a,session_config:i}=await XP(t,e[n],r,n===s),l=await Eu(o,a,i);return[n,l]})))}function xA(t){for(let e in t)Mu(t[e])?t[e]=new U(t[e]):typeof t[e]=="object"&&xA(t[e]);return t}async function ce(t,e){let r=KP(t,e);try{let s=Object.fromEntries(Object.entries(r).map(([o,a])=>{let i=a.ort_tensor;return be.IS_NODE_ENV&&typeof Float16Array<"u"&&i.cpuData instanceof Float16Array&&(i.cpuData=new Uint16Array(i.cpuData.buffer)),[o,i]})),n=await Au(t,s);return xA(n)}catch(s){let n=Object.fromEntries(Object.entries(r).map(([o,a])=>{let i={type:a.type,dims:a.dims,location:a.location};return i.location!=="gpu-buffer"&&(i.data=a.data),[o,i]}));throw console.error(`An error occurred during model execution: "${s}".`),console.error("Inputs given to model:",n),s}}function KP(t,e){let r=Object.create(null),s=[];for(let a of t.inputNames){let i=e[a];if(!(i instanceof U)){s.push(a);continue}r[a]=ui()?i.clone():i}if(s.length>0)throw new Error(`An error occurred during model execution: "Missing the following inputs: ${s.join(", ")}.`);let n=Object.keys(e).length,o=t.inputNames.length;if(n>o){let a=Object.keys(e).filter(i=>!t.inputNames.includes(i));console.warn(`WARNING: Too many inputs were provided (${n} > ${o}). 
The following inputs will be ignored: "${a.join(", ")}".`)}return r}var Ne=class{};var F=class extends Ne{constructor({logits:e,...r}){super(),this.logits=e;let s=Object.values(r);s.length>0&&(this.attentions=s)}},_e=class extends Ne{constructor({logits:e}){super(),this.logits=e}},we=class extends Ne{constructor({logits:e}){super(),this.logits=e}},Ae=class extends Ne{constructor({start_logits:e,end_logits:r}){super(),this.start_logits=e,this.end_logits=r}},gt=class extends Ne{constructor({logits:e}){super(),this.logits=e}};var Yd=class extends Ne{constructor({alphas:e}){super(),this.alphas=e}};var Nt=class extends Je{_call(e,r){throw Error("`_call` should be implemented in a subclass")}},Nn=class extends Je{_call(e,r){throw Error("`_call` should be implemented in a subclass")}},Kr=class extends Je{constructor(){super(),this.processors=[]}push(e){this.processors.push(e)}extend(e){this.processors.push(...e)}_call(e,r){let s=r;for(let n of this.processors)s=n(e,s);return s}[Symbol.iterator](){return this.processors.values()}},$i=class extends Nt{constructor(e){super(),this.bos_token_id=e}_call(e,r){for(let s=0;s<e.length;++s)if(e[s].length===1){let n=r[s].data;n.fill(-1/0),n[this.bos_token_id]=0}return r}},Ri=class extends Nt{constructor(e,r){super(),this.max_length=e,this.eos_token_id=Array.isArray(r)?r:[r]}_call(e,r){for(let s=0;s<e.length;++s)if(e[s].length===this.max_length-1){let n=r[s].data;n.fill(-1/0);for(let o of this.eos_token_id)n[o]=0}return r}},Os=class extends Nt{constructor(e,r){super(),this.begin_suppress_tokens=e,this.begin_index=r}_call(e,r){for(let s=0;s<e.length;++s)if(e[s].length===this.begin_index){let n=r[s].data;for(let o of this.begin_suppress_tokens)n[o]=-1/0}return r}},Ui=class extends 
Nt{constructor(e,r){super(),this.eos_token_id=Array.isArray(e.eos_token_id)?e.eos_token_id[0]:e.eos_token_id,this.no_timestamps_token_id=e.no_timestamps_token_id,this.timestamp_begin=this.no_timestamps_token_id+1,this.begin_index=r.length,r.at(-1)===this.no_timestamps_token_id&&(this.begin_index-=1),this.max_initial_timestamp_index=e.max_initial_timestamp_index}_call(e,r){for(let s=0;s<e.length;++s){let n=r[s].data;if(n[this.no_timestamps_token_id]=-1/0,e[s].length===this.begin_index-1){n.fill(-1/0),n[this.timestamp_begin]=0;continue}let o=e[s].slice(this.begin_index),a=o.length>=1&&o[o.length-1]>=this.timestamp_begin,i=o.length<2||o[o.length-2]>=this.timestamp_begin;if(a&&(i?n.subarray(this.timestamp_begin).fill(-1/0):n.subarray(0,this.eos_token_id).fill(-1/0)),e[s].length===this.begin_index&&this.max_initial_timestamp_index!==null){let f=this.timestamp_begin+this.max_initial_timestamp_index;n.subarray(f+1).fill(-1/0)}let l=pu(n),u=Math.log(l.subarray(this.timestamp_begin).map(Math.exp).reduce((f,m)=>f+m)),d=Te(l.subarray(0,this.timestamp_begin))[0];u>d&&n.subarray(0,this.timestamp_begin).fill(-1/0)}return r}},Bi=class extends Nt{constructor(e){super(),this.no_repeat_ngram_size=e}getNgrams(e){let r=e.length,s=[];for(let o=0;o<r+1-this.no_repeat_ngram_size;++o){let a=[];for(let i=0;i<this.no_repeat_ngram_size;++i)a.push(e[o+i]);s.push(a.map(Number))}let n=new Map;for(let o of s){let a=o.slice(0,o.length-1),i=JSON.stringify(a),l=n.get(i)??[];l.push(o[o.length-1]),n.set(i,l)}return n}getGeneratedNgrams(e,r){let s=r.slice(r.length+1-this.no_repeat_ngram_size,r.length);return e.get(JSON.stringify(s.map(Number)))??[]}calcBannedNgramTokens(e){let r=[];if(e.length+1<this.no_repeat_ngram_size)return r;{let s=this.getNgrams(e);return this.getGeneratedNgrams(s,e)}}_call(e,r){for(let s=0;s<e.length;++s){let n=r[s].data,o=this.calcBannedNgramTokens(e[s]);for(let a of o)n[a]=-1/0}return r}},Di=class extends Nt{constructor(e){super(),this.penalty=e}_call(e,r){for(let 
s=0;s<e.length;++s){let n=r[s].data;for(let o of new Set(e[s])){let a=Number(o);n[a]<0?n[a]*=this.penalty:n[a]/=this.penalty}}return r}},Fi=class extends Nt{constructor(e,r){super(),this.min_length=e,this.eos_token_id=Array.isArray(r)?r:[r]}_call(e,r){for(let s=0;s<e.length;++s)if(e[s].length<this.min_length){let n=r[s].data;for(let o of this.eos_token_id)n[o]=-1/0}return r}},ji=class extends Nt{constructor(e,r,s){super(),this.prompt_length_to_skip=e,this.min_new_tokens=r,this.eos_token_id=Array.isArray(s)?s:[s]}_call(e,r){for(let s=0;s<e.length;++s)if(e[s].length-this.prompt_length_to_skip<this.min_new_tokens){let o=r[s].data;for(let a of this.eos_token_id)o[a]=-1/0}return r}},Gi=class extends Nt{constructor(e,r){super(),this.bad_words_ids=e,this.eos_token_id=Array.isArray(r)?r:[r]}_call(e,r){for(let s=0;s<e.length;++s){let n=r[s].data,o=e[s];for(let a of this.bad_words_ids){if(o.length<a.length-1)continue;let i=!0;for(let l=1;l<=a.length-1;++l)if(a.at(-l-1)!=o.at(-l)){i=!1;break}i&&(n[a.at(-1)]=-1/0)}}return r}},qi=class extends Nt{constructor(e){if(super(),e<=1)throw new Error(`Require guidance scale >1 to use the classifier free guidance processor, got guidance scale ${e}.`);this.guidance_scale=e}_call(e,r){if(r.dims[0]!==2*e.length)throw new Error(`Logits should have twice the batch size of the input ids, the first half of batches corresponding to the conditional inputs, and the second half of batches corresponding to the unconditional inputs. 
Got batch size ${r.dims[0]} for the logits and ${e.length} for the input ids.`);let s=e.length,n=r.slice([0,s],null),o=r.slice([s,r.dims[0]],null);for(let a=0;a<o.data.length;++a)o.data[a]+=(n.data[a]-o.data[a])*this.guidance_scale;return o}},Wi=class extends Nn{constructor(e){if(super(),typeof e!="number"||e<=0){let r=`\`temperature\` (=${e}) must be a strictly positive float, otherwise your next token scores will be invalid.`;e===0&&(r+=" If you're looking for greedy decoding strategies, set `do_sample=false`.")}this.temperature=e}_call(e,r){let s=r.data;for(let n=0;n<s.length;++n)s[n]/=this.temperature;return r}},q0=class extends Nn{constructor(e,{filter_value:r=-1/0,min_tokens_to_keep:s=1}={}){if(super(),e<0||e>1)throw new Error(`\`top_p\` must be a float > 0 and < 1, but is ${e}`);if(!Number.isInteger(s)||s<1)throw new Error(`\`min_tokens_to_keep\` must be a positive integer, but is ${s}`);this.top_p=e,this.filter_value=r,this.min_tokens_to_keep=s}},W0=class extends Nn{constructor(e,{filter_value:r=-1/0,min_tokens_to_keep:s=1}={}){if(super(),!Number.isInteger(e)||e<0)throw new Error(`\`top_k\` must be a positive integer, but is ${e}`);this.top_k=Math.max(e,s),this.filter_value=r}};var 
$n=class{max_length=20;max_new_tokens=null;min_length=0;min_new_tokens=null;early_stopping=!1;max_time=null;do_sample=!1;num_beams=1;num_beam_groups=1;penalty_alpha=null;use_cache=!0;temperature=1;top_k=50;top_p=1;typical_p=1;epsilon_cutoff=0;eta_cutoff=0;diversity_penalty=0;repetition_penalty=1;encoder_repetition_penalty=1;length_penalty=1;no_repeat_ngram_size=0;bad_words_ids=null;force_words_ids=null;renormalize_logits=!1;constraints=null;forced_bos_token_id=null;forced_eos_token_id=null;remove_invalid_values=!1;exponential_decay_length_penalty=null;suppress_tokens=null;streamer=null;begin_suppress_tokens=null;forced_decoder_ids=null;guidance_scale=null;num_return_sequences=1;output_attentions=!1;output_hidden_states=!1;output_scores=!1;return_dict_in_generate=!1;pad_token_id=null;bos_token_id=null;eos_token_id=null;encoder_no_repeat_ngram_size=0;decoder_start_token_id=null;generation_kwargs={};constructor(e){Object.assign(this,at(e,Object.getOwnPropertyNames(this)))}};var Is=class extends Je{_call(e,r){throw Error("StoppingCriteria needs to be subclassed")}},Vi=class t extends Je{constructor(){super(),this.criteria=[]}push(e){this.criteria.push(e)}extend(e){e instanceof t?e=e.criteria:e instanceof Is&&(e=[e]),this.criteria.push(...e)}_call(e,r){let s=new Array(e.length).fill(!1);for(let n of this.criteria){let o=n(e,r);for(let a=0;a<s.length;++a)s[a]||=o[a]}return s}[Symbol.iterator](){return this.criteria.values()}},Hi=class extends Is{constructor(e,r=null){super(),this.max_length=e,this.max_position_embeddings=r}_call(e){return e.map(r=>r.length>=this.max_length)}},Xi=class extends Is{constructor(e){super(),Array.isArray(e)||(e=[e]),this.eos_token_id=e}_call(e,r){return e.map(s=>{let n=s.at(-1);return this.eos_token_id.some(o=>n==o)})}},V0=class extends Is{constructor(){super(),this.interrupted=!1}interrupt(){this.interrupted=!0}reset(){this.interrupted=!1}_call(e,r){return new Array(e.length).fill(this.interrupted)}};var Cs=class extends 
Je{constructor(e){super(),this.generation_config=e}async _call(e){return this.sample(e)}async sample(e){throw Error("sample should be implemented in subclasses.")}getLogits(e,r){let s=e.dims.at(-1),n=e.data;if(r===-1)n=n.slice(-s);else{let o=r*s;n=n.slice(o,o+s)}return n}randomSelect(e){let r=0;for(let n=0;n<e.length;++n)r+=e[n];let s=Math.random()*r;for(let n=0;n<e.length;++n)if(s-=e[n],s<=0)return n;return 0}static getSampler(e){if(e.do_sample)return new X0(e);if(e.num_beams>1)return new K0(e);if(e.num_return_sequences>1)throw Error(`num_return_sequences has to be 1 when doing greedy search, but is ${e.num_return_sequences}.`);return new H0(e)}},H0=class extends Cs{async sample(e){let r=Te(e.data)[1];return[[BigInt(r),0]]}},X0=class extends Cs{async sample(e){let r=e.dims.at(-1);this.generation_config.top_k>0&&(r=Math.min(this.generation_config.top_k,r));let[s,n]=await Gt(e,r),o=Oe(s.data);return Array.from({length:this.generation_config.num_beams},()=>{let a=this.randomSelect(o);return[n.data[a],Math.log(o[a])]})}},K0=class extends Cs{async sample(e){let r=e.dims.at(-1);this.generation_config.top_k>0&&(r=Math.min(this.generation_config.top_k,r));let[s,n]=await Gt(e,r),o=Oe(s.data);return Array.from({length:this.generation_config.num_beams},(a,i)=>[n.data[i],Math.log(o[i])])}};var Ki=null;function bA(t){Ki=t}function Y0(t){if(t instanceof U)return t;if(t.length===0)throw Error("items must be non-empty");if(Array.isArray(t[0])){if(t.some(e=>e.length!==t[0].length))throw Error("Unable to create tensor, you should probably activate truncation and/or padding with 'padding=True' and/or 'truncation=True' to have batched tensors with the same length.");return new U("int64",BigInt64Array.from(t.flat().map(e=>BigInt(e))),[t.length,t[0].length])}else return new U("int64",BigInt64Array.from(t.map(e=>BigInt(e))),[1,t.length])}function Q0(t){return new U("bool",[t],[1])}var 
H={EncoderOnly:0,EncoderDecoder:1,Seq2Seq:2,Vision2Seq:3,DecoderOnly:4,DecoderOnlyWithoutHead:5,MaskGeneration:6,ImageTextToText:7,Musicgen:8,MultiModality:9,Phi3V:10,AudioTextToText:11,AutoEncoder:12,ImageAudioTextToText:13,Supertonic:14,Chatterbox:15},yA={[H.DecoderOnly]:{can_generate:!0,forward:Tt,prepare_inputs:Yi},[H.DecoderOnlyWithoutHead]:{can_generate:!1,forward:Tt,prepare_inputs:Yi},[H.Seq2Seq]:{can_generate:!0,forward:Qd,prepare_inputs:Qi},[H.Vision2Seq]:{can_generate:!0,forward:Qd,prepare_inputs:Qi},[H.Musicgen]:{can_generate:!0,forward:Qd},[H.EncoderDecoder]:{can_generate:!1,forward:Qd},[H.ImageTextToText]:{can_generate:!0,forward:JP,prepare_inputs:Jd},[H.AudioTextToText]:{can_generate:!0,forward:QP,prepare_inputs:Jd},[H.Phi3V]:{can_generate:!0,prepare_inputs:Jd},[H.ImageAudioTextToText]:{can_generate:!0,prepare_inputs:Jd},[H.MultiModality]:{can_generate:!0},[H.AutoEncoder]:{can_generate:!1,forward:YP},[H.Chatterbox]:{can_generate:!0,forward:qt},default:{can_generate:!1,forward:qt}},zs=new Map,Zd=new Map,Ps=new Map,y=class extends Je{main_input_name="input_ids";forward_params=["input_ids","attention_mask"];_return_dict_in_generate_keys=null;constructor(e,r,s){super(),this.config=e,this.sessions=r,this.configs=s;let n=Ps.get(this.constructor),o=zs.get(n),a=yA[o]??yA.default;this.can_generate=a.can_generate,this._forward=a.forward,this._prepare_inputs_for_generation=a.prepare_inputs,this.can_generate&&this.forward_params.push("past_key_values"),this.custom_config=this.config["transformers.js_config"]??{}}async dispose(){let e=[];for(let r of Object.values(this.sessions))e.push(r.release?.());return await Promise.all(e)}static async from_pretrained(e,{progress_callback:r=null,config:s=null,cache_dir:n=null,local_files_only:o=!1,revision:a="main",model_file_name:i=null,subfolder:l="onnx",device:u=null,dtype:d=null,use_external_data_format:f=null,session_options:m={}}={}){let 
_={progress_callback:r,config:s,cache_dir:n,local_files_only:o,revision:a,model_file_name:i,subfolder:l,device:u,dtype:d,use_external_data_format:f,session_options:m},w=Ps.get(this),x=zs.get(w);s=_.config=await Xr.from_pretrained(e,_);let k;if(x===H.DecoderOnly)k=await Promise.all([bt(e,{model:_.model_file_name??"model"},_,"model"),xr(e,{generation_config:"generation_config.json"},_)]);else if(x===H.Seq2Seq||x===H.Vision2Seq)k=await Promise.all([bt(e,{model:"encoder_model",decoder_model_merged:"decoder_model_merged"},_,"decoder_model_merged"),xr(e,{generation_config:"generation_config.json"},_)]);else if(x===H.MaskGeneration)k=await Promise.all([bt(e,{model:"vision_encoder",prompt_encoder_mask_decoder:"prompt_encoder_mask_decoder"},_)]);else if(x===H.EncoderDecoder)k=await Promise.all([bt(e,{model:"encoder_model",decoder_model_merged:"decoder_model_merged"},_,"decoder_model_merged")]);else if(x===H.ImageTextToText){let E={embed_tokens:"embed_tokens",vision_encoder:"vision_encoder",decoder_model_merged:"decoder_model_merged"};s.is_encoder_decoder&&(E.model="encoder_model"),k=await Promise.all([bt(e,E,_,"decoder_model_merged"),xr(e,{generation_config:"generation_config.json"},_)])}else if(x===H.AudioTextToText){let E={embed_tokens:"embed_tokens",audio_encoder:"audio_encoder",decoder_model_merged:"decoder_model_merged"};k=await Promise.all([bt(e,E,_,"decoder_model_merged"),xr(e,{generation_config:"generation_config.json"},_)])}else if(x===H.ImageAudioTextToText){let E={embed_tokens:"embed_tokens",audio_encoder:"audio_encoder",vision_encoder:"vision_encoder",decoder_model_merged:"decoder_model_merged"};k=await Promise.all([bt(e,E,_),xr(e,{generation_config:"generation_config.json"},_)])}else if(x===H.Musicgen)k=await Promise.all([bt(e,{model:"text_encoder",decoder_model_merged:"decoder_model_merged",encodec_decode:"encodec_decode"},_,"decoder_model_merged"),xr(e,{generation_config:"generation_config.json"},_)]);else if(x===H.MultiModality)k=await 
Promise.all([bt(e,{prepare_inputs_embeds:"prepare_inputs_embeds",model:"language_model",lm_head:"lm_head",gen_head:"gen_head",gen_img_embeds:"gen_img_embeds",image_decode:"image_decode"},_,"model"),xr(e,{generation_config:"generation_config.json"},_)]);else if(x===H.Phi3V)k=await Promise.all([bt(e,{prepare_inputs_embeds:"prepare_inputs_embeds",model:"model",vision_encoder:"vision_encoder"},_,"model"),xr(e,{generation_config:"generation_config.json"},_)]);else if(x===H.Chatterbox)k=await Promise.all([bt(e,{embed_tokens:"embed_tokens",speech_encoder:"speech_encoder",model:"language_model",conditional_decoder:"conditional_decoder"},_,"model"),xr(e,{generation_config:"generation_config.json"},_)]);else if(x===H.AutoEncoder)k=await Promise.all([bt(e,{encoder_model:"encoder_model",decoder_model:"decoder_model"},_)]);else if(x===H.Supertonic)k=await Promise.all([bt(e,{text_encoder:"text_encoder",latent_denoiser:"latent_denoiser",voice_decoder:"voice_decoder"},_)]);else{if(x===void 0){let E=w??s?.model_type;E!=="custom"&&console.warn(`Model type for '${E}' not found, assuming encoder-only architecture. 
Please report this at ${kn}.`)}k=await Promise.all([bt(e,{model:_.model_file_name??"model"},_)])}return new this(s,...k)}async _call(e){return await this.forward(e)}async forward(e){return await this._forward(this,e)}get generation_config(){return this.configs?.generation_config??null}_get_logits_processor(e,r,s=null){let n=new Kr;if(e.repetition_penalty!==null&&e.repetition_penalty!==1&&n.push(new Di(e.repetition_penalty)),e.no_repeat_ngram_size!==null&&e.no_repeat_ngram_size>0&&n.push(new Bi(e.no_repeat_ngram_size)),e.bad_words_ids!==null&&n.push(new Gi(e.bad_words_ids,e.eos_token_id)),e.min_length!==null&&e.eos_token_id!==null&&e.min_length>0&&n.push(new Fi(e.min_length,e.eos_token_id)),e.min_new_tokens!==null&&e.eos_token_id!==null&&e.min_new_tokens>0&&n.push(new ji(r,e.min_new_tokens,e.eos_token_id)),e.forced_bos_token_id!==null&&n.push(new $i(e.forced_bos_token_id)),e.forced_eos_token_id!==null&&n.push(new Ri(e.max_length,e.forced_eos_token_id)),e.begin_suppress_tokens!==null){let o=r>1||e.forced_bos_token_id===null?r:r+1;n.push(new Os(e.begin_suppress_tokens,o))}return e.guidance_scale!==null&&e.guidance_scale>1&&n.push(new qi(e.guidance_scale)),e.temperature===0&&e.do_sample&&(console.warn("`do_sample` changed to false because `temperature: 0` implies greedy sampling (always selecting the most likely token), which is incompatible with `do_sample: true`."),e.do_sample=!1),e.do_sample&&e.temperature!==null&&e.temperature!==1&&n.push(new Wi(e.temperature)),s!==null&&n.extend(s),n}_prepare_generation_config(e,r,s=$n){let n={...this.config};for(let a of["decoder","generator","text_config"])a in n&&Object.assign(n,n[a]);let o=new s(n);return Object.assign(o,this.generation_config??{}),e&&Object.assign(o,e),r&&Object.assign(o,at(r,Object.getOwnPropertyNames(o))),o}_get_stopping_criteria(e,r=null){let s=new Vi;return e.max_length!==null&&s.push(new Hi(e.max_length,this.config.max_position_embeddings??null)),e.eos_token_id!==null&&s.push(new 
Xi(e.eos_token_id)),r&&s.extend(r),s}_validate_model_class(){if(!this.can_generate){let e=[Ki.MODEL_FOR_CAUSAL_LM_MAPPING_NAMES,Ki.MODEL_FOR_VISION_2_SEQ_MAPPING_NAMES,Ki.MODEL_FOR_SEQ_TO_SEQ_CAUSAL_LM_MAPPING_NAMES,Ki.MODEL_FOR_SPEECH_SEQ_2_SEQ_MAPPING_NAMES].filter(Boolean),r=Ps.get(this.constructor),s=new Set,n=this.config.model_type;for(let a of e){let i=a?.get(n);i&&s.add(i)}let o=`The current model class (${r}) is not compatible with \`.generate()\`, as it doesn't have a language model head.`;throw s.size>0&&(o+=` Please use the following class instead: ${[...s].join(", ")}`),Error(o)}}prepare_inputs_for_generation(...e){if(!this._prepare_inputs_for_generation)throw new Error("prepare_inputs_for_generation is not implemented for this model.");return this._prepare_inputs_for_generation(this,...e)}_update_model_kwargs_for_generation({generated_input_ids:e,outputs:r,model_inputs:s,is_encoder_decoder:n}){return s.past_key_values=this.getPastKeyValues(r,s.past_key_values),s.input_ids=new U("int64",e.flat(),[e.length,1]),n?"decoder_attention_mask"in s:s.attention_mask=Ee([s.attention_mask,rt([s.attention_mask.dims[0],1])],1),s.position_ids=null,s}_prepare_model_inputs({inputs:e,bos_token_id:r,model_kwargs:s}){let n=at(s,this.forward_params),o=this.main_input_name;if(o in n){if(e)throw new Error("`inputs`: {inputs}` were passed alongside {input_name} which is not allowed. 
Make sure to either pass {inputs} or {input_name}=...")}else n[o]=e;return{inputs_tensor:n[o],model_inputs:n,model_input_name:o}}async _prepare_encoder_decoder_kwargs_for_generation({inputs_tensor:e,model_inputs:r,model_input_name:s,generation_config:n}){if(this.sessions.model.inputNames.includes("inputs_embeds")&&!r.inputs_embeds&&"_prepare_inputs_embeds"in this){let{input_ids:a,pixel_values:i,attention_mask:l,...u}=r,d=await this._prepare_inputs_embeds(r);r={...u,...at(d,["inputs_embeds","attention_mask"])}}let{last_hidden_state:o}=await qt(this,r);if(n.guidance_scale!==null&&n.guidance_scale>1)o=Ee([o,yn(o,0)],0),"attention_mask"in r&&(r.attention_mask=Ee([r.attention_mask,Cu(r.attention_mask)],0));else if(r.decoder_input_ids){let a=Y0(r.decoder_input_ids).dims[0];if(a!==o.dims[0]){if(o.dims[0]!==1)throw new Error(`The encoder outputs have a different batch size (${o.dims[0]}) than the decoder inputs (${a}).`);o=Ee(Array.from({length:a},()=>o),0)}}return r.encoder_outputs=o,r}_prepare_decoder_input_ids_for_generation({batch_size:e,model_input_name:r,model_kwargs:s,decoder_start_token_id:n,bos_token_id:o,generation_config:a}){let{decoder_input_ids:i,...l}=s;if(!(i instanceof U)){if(i)Array.isArray(i[0])||(i=Array.from({length:e},()=>i));else if(n??=o,this.config.model_type==="musicgen")i=Array.from({length:e*this.config.decoder.num_codebooks},()=>[n]);else if(Array.isArray(n)){if(n.length!==e)throw new Error(`\`decoder_start_token_id\` expcted to have length ${e} but got ${n.length}`);i=n}else i=Array.from({length:e},()=>[n]);i=Y0(i)}return s.decoder_attention_mask=mi(i),{input_ids:i,model_inputs:l}}async generate({inputs:e=null,generation_config:r=null,logits_processor:s=null,stopping_criteria:n=null,streamer:o=null,...a}){this._validate_model_class(),r=this._prepare_generation_config(r,a);let{inputs_tensor:i,model_inputs:l,model_input_name:u}=this._prepare_model_inputs({inputs:e,model_kwargs:a}),d=this.config.is_encoder_decoder;d&&("encoder_outputs"in 
l||(l=await this._prepare_encoder_decoder_kwargs_for_generation({inputs_tensor:i,model_inputs:l,model_input_name:u,generation_config:r})));let f;d?{input_ids:f,model_inputs:l}=this._prepare_decoder_input_ids_for_generation({batch_size:l[u].dims.at(0),model_input_name:u,model_kwargs:l,decoder_start_token_id:r.decoder_start_token_id,bos_token_id:r.bos_token_id,generation_config:r}):f=l[u];let m=f.dims.at(-1);r.max_new_tokens!==null&&(r.max_length=m+r.max_new_tokens);let _=this._get_logits_processor(r,m,s),w=this._get_stopping_criteria(r,n),x=l[u].dims.at(0),k=Cs.getSampler(r),E=new Array(x).fill(0),M=f.tolist();o&&o.put(M);let I,T={},z={};for(;;){if(l=this.prepare_inputs_for_generation(M,l,r),I=await this.forward(l),r.return_dict_in_generate)if(r.output_attentions){let K=this.getAttentions(I);for(let Y in K)Y in T||(T[Y]=[]),T[Y].push(K[Y])}else this._return_dict_in_generate_keys&&Object.assign(z,at(I,this._return_dict_in_generate_keys));let G=I.logits.slice(null,-1,null).to("float32"),X=_(M,G),V=[];for(let K=0;K<X.dims.at(0);++K){let Y=X[K],B=await k(Y);for(let[P,se]of B){let ie=BigInt(P);E[K]+=se,M[K].push(ie),V.push([ie]);break}}if(o&&o.put(V),w(M).every(K=>K))break;l=this._update_model_kwargs_for_generation({generated_input_ids:V,outputs:I,model_inputs:l,is_encoder_decoder:d})}o&&o.end();let C=this.getPastKeyValues(I,l.past_key_values,!0),v=new U("int64",M.flat(),[M.length,M[0].length]);if(r.return_dict_in_generate)return{sequences:v,past_key_values:C,...T,...z};for(let G of Object.values(I))G.location==="gpu-buffer"&&G.dispose();return v}getPastKeyValues(e,r,s=!1){let n=Object.create(null);for(let o in e)if(o.startsWith("present")){let a=o.replace("present_ssm","past_ssm").replace("present_conv","past_conv").replace("present","past_key_values"),i=o.includes("encoder");if(i&&r?n[a]=r[a]:n[a]=e[o],r&&(!i||s)){let l=r[a];l.location==="gpu-buffer"&&l.dispose()}}return n}getAttentions(e){let r={};for(let s 
of["cross_attentions","encoder_attentions","decoder_attentions"])for(let n in e)n.startsWith(s)&&(s in r||(r[s]=[]),r[s].push(e[n]));return r}addPastKeyValues(e,r){if(r)Object.assign(e,r);else{let s=this.sessions.decoder_model_merged??this.sessions.model,n=(e[this.main_input_name]??e.attention_mask)?.dims?.[0]??1,o=s?.config?.kv_cache_dtype??"float32",a=o==="float16"?xn.float16:xn.float32,i=Kd(this.config,{batch_size:n});for(let l in i){let u=i[l].reduce((d,f)=>d*f,1);e[l]=new U(o,new a(u),i[l])}}}async encode_image({pixel_values:e}){return(await ce(this.sessions.vision_encoder,{pixel_values:e})).image_features}async encode_text({input_ids:e}){return(await ce(this.sessions.embed_tokens,{input_ids:e})).inputs_embeds}async encode_audio({audio_values:e}){return(await ce(this.sessions.audio_encoder,{audio_values:e})).audio_features}};async function Qd(t,e){let{encoder_outputs:r,input_ids:s,decoder_input_ids:n,...o}=e;if(!r){let a=at(e,t.sessions.model.inputNames);r=(await qt(t,a)).last_hidden_state}return o.input_ids=n,o.encoder_hidden_states=r,t.sessions.decoder_model_merged.inputNames.includes("encoder_attention_mask")&&(o.encoder_attention_mask=e.attention_mask),await Tt(t,o,!0)}async function qt(t,e){let r=t.sessions.model,s=at(e,r.inputNames);if(r.inputNames.includes("inputs_embeds")&&!s.inputs_embeds){if(!e.input_ids)throw new Error("Both `input_ids` and `inputs_embeds` are missing in the model inputs.");s.inputs_embeds=await t.encode_text({input_ids:e.input_ids})}if(r.inputNames.includes("token_type_ids")&&!s.token_type_ids){if(!s.input_ids)throw new Error("Both `input_ids` and `token_type_ids` are missing in the model inputs.");s.token_type_ids=Cu(s.input_ids)}if(r.inputNames.includes("pixel_mask")&&!s.pixel_mask){if(!s.pixel_values)throw new Error("Both `pixel_values` and `pixel_mask` are missing in the model inputs.");let n=s.pixel_values.dims;s.pixel_mask=rt([n[0],n[2],n[3]])}return await ce(r,s)}async function YP(t,e){let r=await t.encode(e);return await 
t.decode(r)}async function Tt(t,e,r=!1){let s=t.sessions[r?"decoder_model_merged":"model"],{past_key_values:n,...o}=e;if(s.inputNames.includes("use_cache_branch")&&(o.use_cache_branch=Q0(!!n)),s.inputNames.includes("position_ids")&&o.attention_mask&&!o.position_ids){let i=["paligemma","gemma3_text","gemma3"].includes(t.config.model_type)?1:0;o.position_ids=ZP(o,n,i)}t.addPastKeyValues(o,n);let a=at(o,s.inputNames);return await ce(s,a)}async function vA(t,{encode_function:e,merge_function:r,modality_input_name:s,modality_output_name:n,input_ids:o=null,attention_mask:a=null,position_ids:i=null,inputs_embeds:l=null,past_key_values:u=null,generation_config:d=null,logits_processor:f=null,...m}){let _=m[s];if(!l){if(l=await t.encode_text({input_ids:o,...m}),_&&o.dims[1]!==1){let x=await e({[s]:_,...m});({inputs_embeds:l,attention_mask:a}=r({[n]:x,inputs_embeds:l,input_ids:o,attention_mask:a}))}else if(u&&_&&o.dims[1]===1){let x=o.dims[1],k=Object.values(u)[0].dims.at(-2);a=Ee([rt([o.dims[0],k]),a.slice(null,[a.dims[1]-x,a.dims[1]])],1)}}if(!i&&t.config.model_type==="qwen2_vl"){let{image_grid_thw:x,video_grid_thw:k}=m;[i]=t.get_rope_index(o,x,k,a)}return await Tt(t,{inputs_embeds:l,past_key_values:u,attention_mask:a,position_ids:i,generation_config:d,logits_processor:f},!0)}async function QP(t,e){return await vA(t,{...e,modality_input_name:"audio_values",modality_output_name:"audio_features",encode_function:t.encode_audio.bind(t),merge_function:t._merge_input_ids_with_audio_features.bind(t)})}async function JP(t,e){return await vA(t,{...e,modality_input_name:"pixel_values",modality_output_name:"image_features",encode_function:t.encode_image.bind(t),merge_function:t._merge_input_ids_with_image_features.bind(t)})}function J0(t,e=0){let[r,s]=t.dims,n=t.data,o=new BigInt64Array(n.length);for(let a=0;a<r;++a){let i=a*s,l=BigInt(e);for(let u=0;u<s;++u){let d=i+u;n[d]===0n?o[d]=BigInt(1):(o[d]=l,l+=n[d])}}return{data:o,dims:t.dims}}function 
ZP(t,e=null,r=0){let{input_ids:s,inputs_embeds:n,attention_mask:o}=t,{data:a,dims:i}=J0(o,r),l=new U("int64",a,i);if(e){let u=-(s??n).dims.at(1);l=l.slice(null,[u,null])}return l}function Yi(t,e,r,s){let n=r.past_key_values?Object.values(r.past_key_values)[0].dims.at(-2):0;if(!r.attention_mask){let o;for(let a of["input_ids","inputs_embeds","position_ids"])if(r[a]){o=r[a].dims;break}if(!o)throw new Error("attention_mask is not provided, and unable to infer its shape from model inputs.");r.attention_mask=rt([o[0],n+o[1]])}if(r.past_key_values){let{input_ids:o,attention_mask:a}=r;a&&a.dims[1]>o.dims[1]||n<o.dims[1]&&(r.input_ids=o.slice(null,[n,null]))}return r}function Qi(t,e,r,s){return r.past_key_values&&(e=e.map(n=>[n.at(-1)])),{...r,decoder_input_ids:Y0(e)}}function Jd(t,...e){return t.config.is_encoder_decoder?Qi(t,...e):Yi(t,...e)}function kA({modality_token_id:t,inputs_embeds:e,modality_features:r,input_ids:s,attention_mask:n}){let o=s.tolist().map(u=>u.reduce((d,f,m)=>(f==t&&d.push(m),d),[])),a=o.reduce((u,d)=>u+d.length,0),i=r.dims[0];if(a!==i)throw new Error(`Number of tokens and features do not match: tokens: ${a}, features ${i}`);let l=0;for(let u=0;u<o.length;++u){let d=o[u],f=e[u];for(let m=0;m<d.length;++m)f[d[m]].data.set(r[l++].data)}return{inputs_embeds:e,attention_mask:n}}function ur({image_token_id:t,inputs_embeds:e,image_features:r,input_ids:s,attention_mask:n}){return kA({modality_token_id:t,inputs_embeds:e,modality_features:r,input_ids:s,attention_mask:n})}function ef({audio_token_id:t,inputs_embeds:e,audio_features:r,input_ids:s,attention_mask:n}){return kA({modality_token_id:t,inputs_embeds:e,modality_features:r,input_ids:s,attention_mask:n})}async function xr(t,e,r){return Object.fromEntries(await Promise.all(Object.keys(e).map(async s=>{let n=await it(t,e[s],!1,r);return[s,n]})))}var 
Yl={};cs(Yl,{ASTForAudioClassification:()=>pf,ASTModel:()=>uf,ASTPreTrainedModel:()=>Bn,AlbertForMaskedLM:()=>nf,AlbertForQuestionAnswering:()=>sf,AlbertForSequenceClassification:()=>rf,AlbertModel:()=>tf,AlbertPreTrainedModel:()=>Yr,ApertusForCausalLM:()=>af,ApertusModel:()=>of,ApertusPreTrainedModel:()=>Rn,ArceeForCausalLM:()=>cf,ArceeModel:()=>lf,ArceePreTrainedModel:()=>Un,BartForConditionalGeneration:()=>ff,BartForSequenceClassification:()=>mf,BartModel:()=>df,BartPretrainedModel:()=>Ls,BeitForImageClassification:()=>_f,BeitModel:()=>hf,BeitPreTrainedModel:()=>Dn,BertForMaskedLM:()=>wf,BertForQuestionAnswering:()=>bf,BertForSequenceClassification:()=>xf,BertForTokenClassification:()=>yf,BertModel:()=>gf,BertPreTrainedModel:()=>yr,BlenderbotForConditionalGeneration:()=>kf,BlenderbotModel:()=>vf,BlenderbotPreTrainedModel:()=>Fn,BlenderbotSmallForConditionalGeneration:()=>Af,BlenderbotSmallModel:()=>Ef,BlenderbotSmallPreTrainedModel:()=>jn,BloomForCausalLM:()=>Tf,BloomModel:()=>Mf,BloomPreTrainedModel:()=>Gn,CLIPModel:()=>Nf,CLIPPreTrainedModel:()=>er,CLIPSegForImageSegmentation:()=>Df,CLIPSegModel:()=>Bf,CLIPSegPreTrainedModel:()=>Xn,CLIPTextModel:()=>$f,CLIPTextModelWithProjection:()=>Hn,CLIPVisionModel:()=>Rf,CLIPVisionModelWithProjection:()=>Uf,CamembertForMaskedLM:()=>Of,CamembertForQuestionAnswering:()=>Pf,CamembertForSequenceClassification:()=>If,CamembertForTokenClassification:()=>Cf,CamembertModel:()=>Sf,CamembertPreTrainedModel:()=>br,ChatterboxModel:()=>qn,ChatterboxPreTrainedModel:()=>Ji,ChineseCLIPModel:()=>zf,ChineseCLIPPreTrainedModel:()=>Zi,ClapAudioModelWithProjection:()=>Vn,ClapModel:()=>Lf,ClapPreTrainedModel:()=>Ns,ClapTextModelWithProjection:()=>Wn,CodeGenForCausalLM:()=>jf,CodeGenModel:()=>Ff,CodeGenPreTrainedModel:()=>Kn,CohereForCausalLM:()=>qf,CohereModel:()=>Gf,CoherePreTrainedModel:()=>Yn,ConvBertForMaskedLM:()=>Vf,ConvBertForQuestionAnswering:()=>Kf,ConvBertForSequenceClassification:()=>Hf,ConvBertForTokenClassification:()=>Xf,ConvBertM
odel:()=>Wf,ConvBertPreTrainedModel:()=>vr,ConvNextForImageClassification:()=>Qf,ConvNextModel:()=>Yf,ConvNextPreTrainedModel:()=>Qn,ConvNextV2ForImageClassification:()=>Zf,ConvNextV2Model:()=>Jf,ConvNextV2PreTrainedModel:()=>Jn,DFineForObjectDetection:()=>sm,DFineModel:()=>rm,DFinePreTrainedModel:()=>eo,DINOv3ConvNextModel:()=>Tm,DINOv3ConvNextPreTrainedModel:()=>al,DINOv3ViTModel:()=>Sm,DINOv3ViTPreTrainedModel:()=>il,DPTForDepthEstimation:()=>$m,DPTModel:()=>Nm,DPTPreTrainedModel:()=>ao,DacDecoderModel:()=>ro,DacDecoderOutput:()=>tl,DacEncoderModel:()=>to,DacEncoderOutput:()=>el,DacModel:()=>nm,DacPreTrainedModel:()=>$s,DebertaForMaskedLM:()=>am,DebertaForQuestionAnswering:()=>cm,DebertaForSequenceClassification:()=>im,DebertaForTokenClassification:()=>lm,DebertaModel:()=>om,DebertaPreTrainedModel:()=>kr,DebertaV2ForMaskedLM:()=>pm,DebertaV2ForQuestionAnswering:()=>mm,DebertaV2ForSequenceClassification:()=>dm,DebertaV2ForTokenClassification:()=>fm,DebertaV2Model:()=>um,DebertaV2PreTrainedModel:()=>Er,DecisionTransformerModel:()=>hm,DecisionTransformerPreTrainedModel:()=>rl,DeiTForImageClassification:()=>gm,DeiTModel:()=>_m,DeiTPreTrainedModel:()=>so,DepthAnythingForDepthEstimation:()=>wm,DepthAnythingPreTrainedModel:()=>sl,DepthProForDepthEstimation:()=>xm,DepthProPreTrainedModel:()=>nl,DetrForObjectDetection:()=>bm,DetrForSegmentation:()=>vm,DetrModel:()=>ym,DetrObjectDetectionOutput:()=>Us,DetrPreTrainedModel:()=>Rs,DetrSegmentationOutput:()=>ol,Dinov2ForImageClassification:()=>Em,Dinov2Model:()=>km,Dinov2PreTrainedModel:()=>no,Dinov2WithRegistersForImageClassification:()=>Mm,Dinov2WithRegistersModel:()=>Am,Dinov2WithRegistersPreTrainedModel:()=>oo,DistilBertForMaskedLM:()=>zm,DistilBertForQuestionAnswering:()=>Pm,DistilBertForSequenceClassification:()=>Im,DistilBertForTokenClassification:()=>Cm,DistilBertModel:()=>Om,DistilBertPreTrainedModel:()=>Ar,DonutSwinModel:()=>Lm,DonutSwinPreTrainedModel:()=>ll,EdgeTamModel:()=>xw,EfficientNetForImageClassification:()=
>Um,EfficientNetModel:()=>Rm,EfficientNetPreTrainedModel:()=>io,ElectraForMaskedLM:()=>Dm,ElectraForQuestionAnswering:()=>Gm,ElectraForSequenceClassification:()=>Fm,ElectraForTokenClassification:()=>jm,ElectraModel:()=>Bm,ElectraPreTrainedModel:()=>Mr,Ernie4_5ForCausalLM:()=>Wm,Ernie4_5Model:()=>qm,Ernie4_5PretrainedModel:()=>lo,EsmForMaskedLM:()=>Hm,EsmForSequenceClassification:()=>Xm,EsmForTokenClassification:()=>Km,EsmModel:()=>Vm,EsmPreTrainedModel:()=>Qr,ExaoneForCausalLM:()=>Qm,ExaoneModel:()=>Ym,ExaonePreTrainedModel:()=>co,FalconForCausalLM:()=>Zm,FalconH1ForCausalLM:()=>th,FalconH1Model:()=>eh,FalconH1PreTrainedModel:()=>po,FalconModel:()=>Jm,FalconPreTrainedModel:()=>uo,FastViTForImageClassification:()=>sh,FastViTModel:()=>rh,FastViTPreTrainedModel:()=>fo,Florence2ForConditionalGeneration:()=>nh,Florence2PreTrainedModel:()=>cl,GLPNForDepthEstimation:()=>mh,GLPNModel:()=>fh,GLPNPreTrainedModel:()=>xo,GPT2LMHeadModel:()=>Eh,GPT2Model:()=>kh,GPT2PreTrainedModel:()=>Eo,GPTBigCodeForCausalLM:()=>_h,GPTBigCodeModel:()=>hh,GPTBigCodePreTrainedModel:()=>yo,GPTJForCausalLM:()=>Mh,GPTJModel:()=>Ah,GPTJPreTrainedModel:()=>Ao,GPTNeoForCausalLM:()=>wh,GPTNeoModel:()=>gh,GPTNeoPreTrainedModel:()=>bo,GPTNeoXForCausalLM:()=>yh,GPTNeoXModel:()=>xh,GPTNeoXPreTrainedModel:()=>vo,Gemma2ForCausalLM:()=>lh,Gemma2Model:()=>ih,Gemma2PreTrainedModel:()=>ho,Gemma3ForCausalLM:()=>uh,Gemma3Model:()=>ch,Gemma3PreTrainedModel:()=>_o,Gemma3nForConditionalGeneration:()=>go,Gemma3nPreTrainedModel:()=>ul,GemmaForCausalLM:()=>ah,GemmaModel:()=>oh,GemmaPreTrainedModel:()=>mo,GlmForCausalLM:()=>dh,GlmModel:()=>ph,GlmPreTrainedModel:()=>wo,GptOssForCausalLM:()=>vh,GptOssModel:()=>bh,GptOssPreTrainedModel:()=>ko,GraniteForCausalLM:()=>Sh,GraniteModel:()=>Th,GraniteMoeHybridForCausalLM:()=>Ih,GraniteMoeHybridModel:()=>Oh,GraniteMoeHybridPreTrainedModel:()=>To,GranitePreTrainedModel:()=>Mo,GroundingDinoForObjectDetection:()=>Ch,GroundingDinoPreTrainedModel:()=>pl,GroupViTModel:()=>Ph,GroupViTPreT
rainedModel:()=>dl,HeliumForCausalLM:()=>Lh,HeliumModel:()=>zh,HeliumPreTrainedModel:()=>So,HieraForImageClassification:()=>$h,HieraModel:()=>Nh,HieraPreTrainedModel:()=>Oo,HubertForCTC:()=>Gh,HubertForSequenceClassification:()=>qh,HubertModel:()=>jh,HubertPreTrainedModel:()=>Fh,HunYuanDenseV1ForCausalLM:()=>Vh,HunYuanDenseV1Model:()=>Wh,HunYuanDenseV1PreTrainedModel:()=>Io,IJepaForImageClassification:()=>Kh,IJepaModel:()=>Xh,IJepaPreTrainedModel:()=>Co,Idefics3ForConditionalGeneration:()=>ml,Idefics3PreTrainedModel:()=>fl,JAISLMHeadModel:()=>Qh,JAISModel:()=>Yh,JAISPreTrainedModel:()=>Po,JinaCLIPModel:()=>Jh,JinaCLIPPreTrainedModel:()=>Bs,JinaCLIPTextModel:()=>zo,JinaCLIPVisionModel:()=>Zh,Lfm2ForCausalLM:()=>t_,Lfm2Model:()=>e_,Lfm2MoeForCausalLM:()=>s_,Lfm2MoeModel:()=>r_,Lfm2MoePreTrainedModel:()=>No,Lfm2PreTrainedModel:()=>Lo,LiteWhisperForConditionalGeneration:()=>Cx,Llama4ForCausalLM:()=>a_,Llama4PreTrainedModel:()=>hl,LlamaForCausalLM:()=>o_,LlamaModel:()=>n_,LlamaPreTrainedModel:()=>$o,LlavaForConditionalGeneration:()=>Ds,LlavaOnevisionForConditionalGeneration:()=>Ds,LlavaPreTrainedModel:()=>_l,LlavaQwen2ForCausalLM:()=>l_,LongT5ForConditionalGeneration:()=>u_,LongT5Model:()=>c_,LongT5PreTrainedModel:()=>Ro,M2M100ForConditionalGeneration:()=>d_,M2M100Model:()=>p_,M2M100PreTrainedModel:()=>Uo,MBartForCausalLM:()=>y_,MBartForConditionalGeneration:()=>w_,MBartForSequenceClassification:()=>x_,MBartModel:()=>g_,MBartPreTrainedModel:()=>Jr,MPNetForMaskedLM:()=>ng,MPNetForQuestionAnswering:()=>ig,MPNetForSequenceClassification:()=>og,MPNetForTokenClassification:()=>ag,MPNetModel:()=>sg,MPNetPreTrainedModel:()=>Tr,MT5ForConditionalGeneration:()=>pg,MT5Model:()=>ug,MT5PreTrainedModel:()=>Yo,MarianMTModel:()=>m_,MarianModel:()=>f_,MarianPreTrainedModel:()=>Bo,MaskFormerForInstanceSegmentation:()=>__,MaskFormerModel:()=>h_,MaskFormerPreTrainedModel:()=>Do,Metric3DForDepthEstimation:()=>b_,Metric3DPreTrainedModel:()=>gl,Metric3Dv2ForDepthEstimation:()=>v_,Metric3Dv2Pre
TrainedModel:()=>wl,MgpstrForSceneTextRecognition:()=>k_,MgpstrModelOutput:()=>xl,MgpstrPreTrainedModel:()=>yl,MimiDecoderModel:()=>jo,MimiDecoderOutput:()=>vl,MimiEncoderModel:()=>Fo,MimiEncoderOutput:()=>bl,MimiModel:()=>E_,MimiPreTrainedModel:()=>Fs,MistralForCausalLM:()=>M_,MistralModel:()=>A_,MistralPreTrainedModel:()=>Go,MobileBertForMaskedLM:()=>S_,MobileBertForQuestionAnswering:()=>I_,MobileBertForSequenceClassification:()=>O_,MobileBertModel:()=>T_,MobileBertPreTrainedModel:()=>Zr,MobileLLMForCausalLM:()=>P_,MobileLLMModel:()=>C_,MobileLLMPreTrainedModel:()=>qo,MobileNetV1ForImageClassification:()=>L_,MobileNetV1ForSemanticSegmentation:()=>N_,MobileNetV1Model:()=>z_,MobileNetV1PreTrainedModel:()=>js,MobileNetV2ForImageClassification:()=>R_,MobileNetV2ForSemanticSegmentation:()=>U_,MobileNetV2Model:()=>$_,MobileNetV2PreTrainedModel:()=>Gs,MobileNetV3ForImageClassification:()=>D_,MobileNetV3ForSemanticSegmentation:()=>F_,MobileNetV3Model:()=>B_,MobileNetV3PreTrainedModel:()=>qs,MobileNetV4ForImageClassification:()=>G_,MobileNetV4ForSemanticSegmentation:()=>q_,MobileNetV4Model:()=>j_,MobileNetV4PreTrainedModel:()=>Ws,MobileViTForImageClassification:()=>V_,MobileViTModel:()=>W_,MobileViTPreTrainedModel:()=>Wo,MobileViTV2ForImageClassification:()=>X_,MobileViTV2Model:()=>H_,MobileViTV2PreTrainedModel:()=>Vo,ModernBertDecoderForCausalLM:()=>eg,ModernBertDecoderModel:()=>Z_,ModernBertDecoderPreTrainedModel:()=>Ho,ModernBertForMaskedLM:()=>Y_,ModernBertForSequenceClassification:()=>Q_,ModernBertForTokenClassification:()=>J_,ModernBertModel:()=>K_,ModernBertPreTrainedModel:()=>es,Moondream1ForConditionalGeneration:()=>i_,MoonshineForConditionalGeneration:()=>rg,MoonshineModel:()=>tg,MoonshinePreTrainedModel:()=>Xo,MptForCausalLM:()=>cg,MptModel:()=>lg,MptPreTrainedModel:()=>Ko,MultiModalityCausalLM:()=>dg,MultiModalityPreTrainedModel:()=>kl,MusicgenForCausalLM:()=>mg,MusicgenForConditionalGeneration:()=>Jo,MusicgenModel:()=>fg,MusicgenPreTrainedModel:()=>Qo,NanoChat
ForCausalLM:()=>_g,NanoChatModel:()=>hg,NanoChatPreTrainedModel:()=>Zo,NeoBertForMaskedLM:()=>wg,NeoBertForQuestionAnswering:()=>bg,NeoBertForSequenceClassification:()=>xg,NeoBertForTokenClassification:()=>yg,NeoBertModel:()=>gg,NeoBertPreTrainedModel:()=>Sr,NomicBertModel:()=>vg,NomicBertPreTrainedModel:()=>El,OPTForCausalLM:()=>Pg,OPTModel:()=>Cg,OPTPreTrainedModel:()=>na,Olmo2ForCausalLM:()=>Mg,Olmo2Model:()=>Ag,Olmo2PreTrainedModel:()=>ta,Olmo3ForCausalLM:()=>Sg,Olmo3Model:()=>Tg,Olmo3PreTrainedModel:()=>ra,OlmoForCausalLM:()=>Eg,OlmoModel:()=>kg,OlmoPreTrainedModel:()=>ea,OpenELMForCausalLM:()=>Ig,OpenELMModel:()=>Og,OpenELMPreTrainedModel:()=>sa,OwlViTForObjectDetection:()=>$g,OwlViTModel:()=>Ng,OwlViTPreTrainedModel:()=>aa,Owlv2ForObjectDetection:()=>Lg,Owlv2Model:()=>zg,Owlv2PreTrainedModel:()=>oa,PaliGemmaForConditionalGeneration:()=>Rg,PaliGemmaPreTrainedModel:()=>Al,ParakeetForCTC:()=>Ug,ParakeetPreTrainedModel:()=>Ml,PatchTSMixerForPrediction:()=>Dg,PatchTSMixerModel:()=>Bg,PatchTSMixerPreTrainedModel:()=>ia,PatchTSTForPrediction:()=>jg,PatchTSTModel:()=>Fg,PatchTSTPreTrainedModel:()=>la,Phi3ForCausalLM:()=>Vg,Phi3Model:()=>Wg,Phi3PreTrainedModel:()=>ua,Phi3VForCausalLM:()=>pa,Phi3VPreTrainedModel:()=>Tl,PhiForCausalLM:()=>qg,PhiModel:()=>Gg,PhiPreTrainedModel:()=>ca,PreTrainedModel:()=>y,PvtForImageClassification:()=>Xg,PvtModel:()=>Hg,PvtPreTrainedModel:()=>da,PyAnnoteForAudioFrameClassification:()=>Yg,PyAnnoteModel:()=>Kg,PyAnnotePreTrainedModel:()=>fa,Qwen2ForCausalLM:()=>Jg,Qwen2Model:()=>Qg,Qwen2PreTrainedModel:()=>ma,Qwen2VLForConditionalGeneration:()=>Zg,Qwen2VLPreTrainedModel:()=>Sl,Qwen3ForCausalLM:()=>tw,Qwen3Model:()=>ew,Qwen3PreTrainedModel:()=>ha,RFDetrForObjectDetection:()=>ow,RFDetrModel:()=>nw,RFDetrObjectDetectionOutput:()=>Ol,RFDetrPreTrainedModel:()=>ga,RTDetrForObjectDetection:()=>tm,RTDetrModel:()=>em,RTDetrObjectDetectionOutput:()=>tr,RTDetrPreTrainedModel:()=>Zn,RTDetrV2ForObjectDetection:()=>gw,RTDetrV2Model:()=>_w,RTDetrV2Object
DetectionOutput:()=>Il,RTDetrV2PreTrainedModel:()=>wa,ResNetForImageClassification:()=>sw,ResNetModel:()=>rw,ResNetPreTrainedModel:()=>_a,RoFormerForMaskedLM:()=>dw,RoFormerForQuestionAnswering:()=>hw,RoFormerForSequenceClassification:()=>fw,RoFormerForTokenClassification:()=>mw,RoFormerModel:()=>pw,RoFormerPreTrainedModel:()=>Ir,RobertaForMaskedLM:()=>iw,RobertaForQuestionAnswering:()=>uw,RobertaForSequenceClassification:()=>lw,RobertaForTokenClassification:()=>cw,RobertaModel:()=>aw,RobertaPreTrainedModel:()=>Or,Sam2ImageSegmentationOutput:()=>zl,Sam2Model:()=>xa,Sam2PreTrainedModel:()=>Ll,Sam3TrackerModel:()=>yw,SamImageSegmentationOutput:()=>Cl,SamModel:()=>ww,SamPreTrainedModel:()=>Pl,SapiensForDepthEstimation:()=>vw,SapiensForNormalEstimation:()=>kw,SapiensForSemanticSegmentation:()=>bw,SapiensPreTrainedModel:()=>Vs,SegformerForImageClassification:()=>Aw,SegformerForSemanticSegmentation:()=>Mw,SegformerModel:()=>Ew,SegformerPreTrainedModel:()=>Hs,SiglipModel:()=>Tw,SiglipPreTrainedModel:()=>ya,SiglipTextModel:()=>ba,SiglipVisionModel:()=>Sw,SmolLM3ForCausalLM:()=>Iw,SmolLM3Model:()=>Ow,SmolLM3PreTrainedModel:()=>va,SmolVLMForConditionalGeneration:()=>Hh,SnacDecoderModel:()=>Ea,SnacEncoderModel:()=>ka,SnacModel:()=>Cw,SnacPreTrainedModel:()=>Xs,SpeechT5ForSpeechToText:()=>zw,SpeechT5ForTextToSpeech:()=>Lw,SpeechT5HifiGan:()=>Nw,SpeechT5Model:()=>Pw,SpeechT5PreTrainedModel:()=>Ks,SqueezeBertForMaskedLM:()=>Rw,SqueezeBertForQuestionAnswering:()=>Bw,SqueezeBertForSequenceClassification:()=>Uw,SqueezeBertModel:()=>$w,SqueezeBertPreTrainedModel:()=>ts,StableLmForCausalLM:()=>Fw,StableLmModel:()=>Dw,StableLmPreTrainedModel:()=>Aa,Starcoder2ForCausalLM:()=>Gw,Starcoder2Model:()=>jw,Starcoder2PreTrainedModel:()=>Ma,StyleTextToSpeech2Model:()=>qw,StyleTextToSpeech2PreTrainedModel:()=>Nl,SupertonicForConditionalGeneration:()=>Ta,SupertonicPreTrainedModel:()=>$l,Swin2SRForImageSuperResolution:()=>Kw,Swin2SRModel:()=>Xw,Swin2SRPreTrainedModel:()=>Sa,SwinForImageClassificat
ion:()=>Vw,SwinForSemanticSegmentation:()=>Hw,SwinModel:()=>Ww,SwinPreTrainedModel:()=>Ys,T5ForConditionalGeneration:()=>Qw,T5Model:()=>Yw,T5PreTrainedModel:()=>Oa,TableTransformerForObjectDetection:()=>Zw,TableTransformerModel:()=>Jw,TableTransformerObjectDetectionOutput:()=>Rl,TableTransformerPreTrainedModel:()=>Ia,TrOCRForCausalLM:()=>ex,TrOCRPreTrainedModel:()=>Ul,UltravoxModel:()=>Dl,UltravoxPreTrainedModel:()=>Bl,UniSpeechForCTC:()=>sx,UniSpeechForSequenceClassification:()=>nx,UniSpeechModel:()=>rx,UniSpeechPreTrainedModel:()=>Qs,UniSpeechSatForAudioFrameClassification:()=>lx,UniSpeechSatForCTC:()=>ax,UniSpeechSatForSequenceClassification:()=>ix,UniSpeechSatModel:()=>ox,UniSpeechSatPreTrainedModel:()=>rs,VaultGemmaForCausalLM:()=>ux,VaultGemmaModel:()=>cx,VaultGemmaPreTrainedModel:()=>Ca,ViTForImageClassification:()=>fx,ViTMAEModel:()=>mx,ViTMAEPreTrainedModel:()=>Fl,ViTMSNForImageClassification:()=>_x,ViTMSNModel:()=>hx,ViTMSNPreTrainedModel:()=>za,ViTModel:()=>dx,ViTPreTrainedModel:()=>Pa,VisionEncoderDecoderModel:()=>px,VitMatteForImageMatting:()=>gx,VitMattePreTrainedModel:()=>jl,VitPoseForPoseEstimation:()=>wx,VitPosePreTrainedModel:()=>Gl,VitsModel:()=>xx,VitsModelOutput:()=>ql,VitsPreTrainedModel:()=>Wl,VoxtralForConditionalGeneration:()=>tx,Wav2Vec2BertForCTC:()=>bx,Wav2Vec2BertForSequenceClassification:()=>vx,Wav2Vec2BertModel:()=>yx,Wav2Vec2BertPreTrainedModel:()=>Js,Wav2Vec2ForAudioFrameClassification:()=>Dh,Wav2Vec2ForCTC:()=>Uh,Wav2Vec2ForSequenceClassification:()=>Bh,Wav2Vec2Model:()=>Rh,Wav2Vec2PreTrainedModel:()=>Wt,WavLMForAudioFrameClassification:()=>Tx,WavLMForCTC:()=>Ex,WavLMForSequenceClassification:()=>Ax,WavLMForXVector:()=>Mx,WavLMModel:()=>kx,WavLMPreTrainedModel:()=>Cr,WeSpeakerResNetModel:()=>Sx,WeSpeakerResNetPreTrainedModel:()=>Hl,WhisperForConditionalGeneration:()=>Xl,WhisperModel:()=>Ix,WhisperPreTrainedModel:()=>La,XLMForQuestionAnswering:()=>$x,XLMForSequenceClassification:()=>Lx,XLMForTokenClassification:()=>Nx,XLMModel:()=>Px
,XLMPreTrainedModel:()=>Pr,XLMRobertaForMaskedLM:()=>Ux,XLMRobertaForQuestionAnswering:()=>Fx,XLMRobertaForSequenceClassification:()=>Bx,XLMRobertaForTokenClassification:()=>Dx,XLMRobertaModel:()=>Rx,XLMRobertaPreTrainedModel:()=>zr,XLMWithLMHeadModel:()=>zx,XVectorOutput:()=>Vl,YolosForObjectDetection:()=>Gx,YolosModel:()=>jx,YolosObjectDetectionOutput:()=>Kl,YolosPreTrainedModel:()=>Na,YoutuForCausalLM:()=>Wx,YoutuModel:()=>qx,YoutuPreTrainedModel:()=>$a});var Yr=class extends y{},tf=class extends Yr{},rf=class extends Yr{async _call(e){return new F(await super._call(e))}},sf=class extends Yr{async _call(e){return new Ae(await super._call(e))}},nf=class extends Yr{async _call(e){return new we(await super._call(e))}};var Rn=class extends y{},of=class extends Rn{},af=class extends Rn{};var Un=class extends y{},lf=class extends Un{},cf=class extends Un{};var Bn=class extends y{},uf=class extends Bn{},pf=class extends Bn{};var Ls=class extends y{},df=class extends Ls{},ff=class extends Ls{},mf=class extends Ls{async _call(e){return new F(await super._call(e))}};var Dn=class extends y{},hf=class extends Dn{},_f=class extends Dn{async _call(e){return new F(await super._call(e))}};var yr=class extends y{},gf=class extends yr{},wf=class extends yr{async _call(e){return new we(await super._call(e))}},xf=class extends yr{async _call(e){return new F(await super._call(e))}},yf=class extends yr{async _call(e){return new _e(await super._call(e))}},bf=class extends yr{async _call(e){return new Ae(await super._call(e))}};var Fn=class extends y{},vf=class extends Fn{},kf=class extends Fn{};var jn=class extends y{},Ef=class extends jn{},Af=class extends jn{};var Gn=class extends y{},Mf=class extends Gn{},Tf=class extends Gn{};var br=class extends y{},Sf=class extends br{},Of=class extends br{async _call(e){return new we(await super._call(e))}},If=class extends br{async _call(e){return new F(await super._call(e))}},Cf=class extends br{async _call(e){return new _e(await 
super._call(e))}},Pf=class extends br{async _call(e){return new Ae(await super._call(e))}};var ez=4299n,EA=6561n,Ji=class extends y{forward_params=["input_ids","inputs_embeds","attention_mask","position_ids","audio_values","exaggeration","audio_features","audio_tokens","speaker_embeddings","speaker_features","past_key_values"];main_input_name="input_ids";_return_dict_in_generate_keys=["audio_tokens","speaker_embeddings","speaker_features"]},qn=class extends Ji{async encode_speech(e){return ce(this.sessions.speech_encoder,{audio_values:e})}async forward({input_ids:e=null,attention_mask:r=null,audio_values:s=null,exaggeration:n=null,position_ids:o=null,inputs_embeds:a=null,past_key_values:i=null,generation_config:l=null,logits_processor:u=null,audio_features:d=null,audio_tokens:f=null,speaker_embeddings:m=null,speaker_features:_=null,...w}){let x;if(!a){let E=this.sessions.embed_tokens.inputNames,M={input_ids:e};if(E.includes("exaggeration")){if(!(n instanceof U)){let I=e.dims[0];if(n==null)n=Ge([I],.5);else if(typeof n=="number")n=Ge([I],n);else if(Array.isArray(n))n=new U("float32",n,[I]);else throw new Error("Unsupported type for `exaggeration` input")}M.exaggeration=n}if(E.includes("position_ids")&&(M.position_ids=o),{inputs_embeds:a}=await ce(this.sessions.embed_tokens,M),d&&f&&m&&_&&(x={audio_features:d,audio_tokens:f,speaker_embeddings:m,speaker_features:_}),x||s)x??=await this.encode_speech(s),a=Ee([x.audio_features,a],1),r=rt([a.dims[0],a.dims[1]]);else{let I=a.dims[1];if(!i||I!==1)throw new Error("Incorrect state encountered during generation.");let T=Object.values(i)[0].dims.at(-2);r=rt([a.dims[0],T+I])}}return{...await Tt(this,{inputs_embeds:a,past_key_values:i,attention_mask:r,generation_config:l,logits_processor:u},!1),...x}}prepare_inputs_for_generation(e,r,s){if(!r.position_ids&&this.sessions.embed_tokens.inputNames.includes("position_ids"))if(r.input_ids.dims[1]===1){let 
n=Array.from({length:e.length},(o,a)=>e[a].length-e[a].findLastIndex(i=>i==EA)-1);r.position_ids=new U("int64",n,[e.length,1])}else{let o=r.input_ids.tolist().map(a=>{let i=0;return a.map(l=>l>=EA?0:i++)});r.position_ids=new U("int64",o.flat(),r.input_ids.dims)}return r.input_ids.dims[1]===1&&(delete r.audio_values,delete r.audio_features,delete r.audio_tokens,delete r.speaker_embeddings,delete r.speaker_features),Yi(this,e,r,s)}async generate(e){let{sequences:r,audio_tokens:s,speaker_embeddings:n,speaker_features:o}=await super.generate({...e,return_dict_in_generate:!0}),a=r.slice(null,[e.input_ids.dims[1],-1]),i=Ge([a.dims[0],3],ez),l=Ee([s,a,i],1),{waveform:u}=await ce(this.sessions.conditional_decoder,{speech_tokens:l,speaker_features:o,speaker_embeddings:n});return u}};var Zi=class extends y{},zf=class extends Zi{};var Ns=class extends y{},Lf=class extends Ns{},Wn=class extends Ns{static async from_pretrained(e,r={}){return super.from_pretrained(e,{...r,model_file_name:r.model_file_name??"text_model"})}},Vn=class extends Ns{static async from_pretrained(e,r={}){return super.from_pretrained(e,{...r,model_file_name:r.model_file_name??"audio_model"})}};var er=class extends y{},Nf=class extends er{},$f=class extends er{static async from_pretrained(e,r={}){return super.from_pretrained(e,{...r,model_file_name:r.model_file_name??"text_model"})}},Hn=class extends er{static async from_pretrained(e,r={}){return super.from_pretrained(e,{...r,model_file_name:r.model_file_name??"text_model"})}},Rf=class extends er{static async from_pretrained(e,r={}){return super.from_pretrained(e,{...r,model_file_name:r.model_file_name??"vision_model"})}},Uf=class extends er{static async from_pretrained(e,r={}){return super.from_pretrained(e,{...r,model_file_name:r.model_file_name??"vision_model"})}};var Xn=class extends y{},Bf=class extends Xn{},Df=class extends Xn{};var Kn=class extends y{},Ff=class extends Kn{},jf=class extends Kn{};var Yn=class extends y{},Gf=class extends 
Yn{},qf=class extends Yn{};var vr=class extends y{},Wf=class extends vr{},Vf=class extends vr{async _call(e){return new we(await super._call(e))}},Hf=class extends vr{async _call(e){return new F(await super._call(e))}},Xf=class extends vr{async _call(e){return new _e(await super._call(e))}},Kf=class extends vr{async _call(e){return new Ae(await super._call(e))}};var Qn=class extends y{},Yf=class extends Qn{},Qf=class extends Qn{async _call(e){return new F(await super._call(e))}};var Jn=class extends y{},Jf=class extends Jn{},Zf=class extends Jn{async _call(e){return new F(await super._call(e))}};var Zn=class extends y{},em=class extends Zn{},tm=class extends Zn{async _call(e){return new tr(await super._call(e))}},tr=class extends Ne{constructor({logits:e,pred_boxes:r}){super(),this.logits=e,this.pred_boxes=r}};var eo=class extends y{},rm=class extends eo{},sm=class extends eo{async _call(e){return new tr(await super._call(e))}};var el=class extends Ne{constructor({audio_codes:e}){super(),this.audio_codes=e}},tl=class extends Ne{constructor({audio_values:e}){super(),this.audio_values=e}},$s=class extends y{main_input_name="input_values";forward_params=["input_values"]},nm=class extends $s{async encode(e){return new el(await ce(this.sessions.encoder_model,e))}async decode(e){return new tl(await ce(this.sessions.decoder_model,e))}},to=class extends $s{static async from_pretrained(e,r={}){return super.from_pretrained(e,{...r,model_file_name:r.model_file_name??"encoder_model"})}},ro=class extends $s{static async from_pretrained(e,r={}){return super.from_pretrained(e,{...r,model_file_name:r.model_file_name??"decoder_model"})}};var kr=class extends y{},om=class extends kr{},am=class extends kr{async _call(e){return new we(await super._call(e))}},im=class extends kr{async _call(e){return new F(await super._call(e))}},lm=class extends kr{async _call(e){return new _e(await super._call(e))}},cm=class extends kr{async _call(e){return new Ae(await super._call(e))}};var Er=class 
extends y{},um=class extends Er{},pm=class extends Er{async _call(e){return new we(await super._call(e))}},dm=class extends Er{async _call(e){return new F(await super._call(e))}},fm=class extends Er{async _call(e){return new _e(await super._call(e))}},mm=class extends Er{async _call(e){return new Ae(await super._call(e))}};var rl=class extends y{},hm=class extends rl{};var so=class extends y{},_m=class extends so{},gm=class extends so{async _call(e){return new F(await super._call(e))}};var sl=class extends y{},wm=class extends sl{};var nl=class extends y{},xm=class extends nl{};var Rs=class extends y{},ym=class extends Rs{},bm=class extends Rs{async _call(e){return new Us(await super._call(e))}},vm=class extends Rs{async _call(e){return new ol(await super._call(e))}},Us=class extends Ne{constructor({logits:e,pred_boxes:r}){super(),this.logits=e,this.pred_boxes=r}},ol=class extends Ne{constructor({logits:e,pred_boxes:r,pred_masks:s}){super(),this.logits=e,this.pred_boxes=r,this.pred_masks=s}};var no=class extends y{},km=class extends no{},Em=class extends no{async _call(e){return new F(await super._call(e))}};var oo=class extends y{},Am=class extends oo{},Mm=class extends oo{async _call(e){return new F(await super._call(e))}};var al=class extends y{},Tm=class extends al{};var il=class extends y{},Sm=class extends il{};var Ar=class extends y{},Om=class extends Ar{},Im=class extends Ar{async _call(e){return new F(await super._call(e))}},Cm=class extends Ar{async _call(e){return new _e(await super._call(e))}},Pm=class extends Ar{async _call(e){return new Ae(await super._call(e))}},zm=class extends Ar{async _call(e){return new we(await super._call(e))}};var ll=class extends y{},Lm=class extends ll{};var ao=class extends y{},Nm=class extends ao{},$m=class extends ao{};var io=class extends y{},Rm=class extends io{},Um=class extends io{async _call(e){return new F(await super._call(e))}};var Mr=class extends y{},Bm=class extends Mr{},Dm=class extends Mr{async 
_call(e){return new we(await super._call(e))}},Fm=class extends Mr{async _call(e){return new F(await super._call(e))}},jm=class extends Mr{async _call(e){return new _e(await super._call(e))}},Gm=class extends Mr{async _call(e){return new Ae(await super._call(e))}};var lo=class extends y{},qm=class extends lo{},Wm=class extends lo{};var Qr=class extends y{},Vm=class extends Qr{},Hm=class extends Qr{async _call(e){return new we(await super._call(e))}},Xm=class extends Qr{async _call(e){return new F(await super._call(e))}},Km=class extends Qr{async _call(e){return new _e(await super._call(e))}};var co=class extends y{},Ym=class extends co{},Qm=class extends co{};var uo=class extends y{},Jm=class extends uo{},Zm=class extends uo{};var po=class extends y{},eh=class extends po{},th=class extends po{};var fo=class extends y{},rh=class extends fo{},sh=class extends fo{async _call(e){return new F(await super._call(e))}};var cl=class extends y{forward_params=["input_ids","inputs_embeds","attention_mask","pixel_values","encoder_outputs","decoder_input_ids","decoder_inputs_embeds","decoder_attention_mask","past_key_values"];main_input_name="inputs_embeds"},nh=class extends cl{_merge_input_ids_with_image_features({inputs_embeds:e,image_features:r,input_ids:s,attention_mask:n}){return{inputs_embeds:Ee([r,e],1),attention_mask:Ee([rt(r.dims.slice(0,2)),n],1)}}async _prepare_inputs_embeds({input_ids:e,pixel_values:r,inputs_embeds:s,attention_mask:n}){if(!e&&!r)throw new Error("Either `input_ids` or `pixel_values` should be provided.");let o,a;return e&&(o=await this.encode_text({input_ids:e})),r&&(a=await this.encode_image({pixel_values:r})),o&&a?{inputs_embeds:s,attention_mask:n}=this._merge_input_ids_with_image_features({inputs_embeds:o,image_features:a,input_ids:e,attention_mask:n}):s=o||a,{inputs_embeds:s,attention_mask:n}}async 
forward({input_ids:e,pixel_values:r,attention_mask:s,decoder_input_ids:n,decoder_attention_mask:o,encoder_outputs:a,past_key_values:i,inputs_embeds:l,decoder_inputs_embeds:u}){if(l||({inputs_embeds:l,attention_mask:s}=await this._prepare_inputs_embeds({input_ids:e,pixel_values:r,inputs_embeds:l,attention_mask:s})),!a){let{last_hidden_state:f}=await qt(this,{inputs_embeds:l,attention_mask:s});a=f}if(!u){if(!n)throw new Error("Either `decoder_input_ids` or `decoder_inputs_embeds` should be provided.");u=await this.encode_text({input_ids:n})}return await Tt(this,{inputs_embeds:u,attention_mask:o,encoder_attention_mask:s,encoder_hidden_states:a,past_key_values:i},!0)}};var mo=class extends y{},oh=class extends mo{},ah=class extends mo{};var ho=class extends y{},ih=class extends ho{},lh=class extends ho{};var _o=class extends y{},ch=class extends _o{},uh=class extends _o{};var ul=class extends y{forward_params=["input_ids","attention_mask","inputs_embeds","per_layer_inputs","position_ids","pixel_values","input_features","input_features_mask","past_key_values"]},go=class extends ul{async forward({input_ids:e=null,attention_mask:r=null,pixel_values:s=null,input_features:n=null,input_features_mask:o=null,position_ids:a=null,inputs_embeds:i=null,per_layer_inputs:l=null,past_key_values:u=null,generation_config:d=null,logits_processor:f=null,...m}){if((!i||!l)&&({inputs_embeds:i,per_layer_inputs:l}=await ce(this.sessions.embed_tokens,{input_ids:e}),e.dims[1]!==1)){if(s){let{image_features:w}=await ce(this.sessions.vision_encoder,{pixel_values:s});({inputs_embeds:i,attention_mask:r}=this._merge_input_ids_with_image_features({image_features:w,inputs_embeds:i,input_ids:e,attention_mask:r}))}if(n){let{audio_features:w}=await ce(this.sessions.audio_encoder,{input_features:n,input_features_mask:o});({inputs_embeds:i,attention_mask:r}=this._merge_input_ids_with_audio_features({audio_features:w,inputs_embeds:i,input_ids:e,attention_mask:r}))}}return await 
Tt(this,{inputs_embeds:i,per_layer_inputs:l,past_key_values:u,attention_mask:r,position_ids:a,generation_config:d,logits_processor:f},!0)}_merge_input_ids_with_image_features(e){let r=e.image_features.dims.at(-1),s=e.image_features.view(-1,r);return ur({image_token_id:this.config.image_token_id,...e,image_features:s})}_merge_input_ids_with_audio_features(e){let r=e.audio_features.dims.at(-1),s=e.audio_features.view(-1,r);return ef({audio_token_id:this.config.audio_token_id,...e,audio_features:s})}};var wo=class extends y{},ph=class extends wo{},dh=class extends wo{};var xo=class extends y{},fh=class extends xo{},mh=class extends xo{};var yo=class extends y{},hh=class extends yo{},_h=class extends yo{};var bo=class extends y{},gh=class extends bo{},wh=class extends bo{};var vo=class extends y{},xh=class extends vo{},yh=class extends vo{};var ko=class extends y{},bh=class extends ko{},vh=class extends ko{};var Eo=class extends y{},kh=class extends Eo{},Eh=class extends Eo{};var Ao=class extends y{},Ah=class extends Ao{},Mh=class extends Ao{};var Mo=class extends y{},Th=class extends Mo{},Sh=class extends Mo{};var To=class extends y{},Oh=class extends To{},Ih=class extends To{};var pl=class extends y{},Ch=class extends pl{};var dl=class extends y{},Ph=class extends dl{};var So=class extends y{},zh=class extends So{},Lh=class extends So{};var Oo=class extends y{},Nh=class extends Oo{},$h=class extends Oo{async _call(e){return new F(await super._call(e))}};var Wt=class extends y{},Rh=class extends Wt{},Uh=class extends Wt{async _call(e){return new gt(await super._call(e))}},Bh=class extends Wt{async _call(e){return new F(await super._call(e))}},Dh=class extends Wt{async _call(e){return new _e(await super._call(e))}};var Fh=class extends y{},jh=class extends Wt{},Gh=class extends Wt{async _call(e){return new gt(await super._call(e))}},qh=class extends Wt{async _call(e){return new F(await super._call(e))}};var Io=class extends y{},Wh=class extends Io{},Vh=class extends 
Io{};var fl=class extends y{forward_params=["input_ids","attention_mask","pixel_values","pixel_attention_mask","position_ids","past_key_values"]},ml=class extends fl{async encode_image({pixel_values:e,pixel_attention_mask:r}){return(await ce(this.sessions.vision_encoder,{pixel_values:e,pixel_attention_mask:r})).image_features}_merge_input_ids_with_image_features(e){let r=e.image_features.dims.at(-1),s=e.image_features.view(-1,r);return ur({image_token_id:this.config.image_token_id,...e,image_features:s})}},Hh=class extends ml{};var Co=class extends y{},Xh=class extends Co{},Kh=class extends Co{async _call(e){return new F(await super._call(e))}};var Po=class extends y{},Yh=class extends Po{},Qh=class extends Po{};var Bs=class extends y{},Jh=class extends Bs{async forward(e){let r=!e.input_ids,s=!e.pixel_values;if(r&&s)throw new Error("Either `input_ids` or `pixel_values` should be provided.");if(r&&(e.input_ids=rt([e.pixel_values.dims[0],1])),s){let{image_size:u}=this.config.vision_config;e.pixel_values=Ge([0,3,u,u],0)}let{text_embeddings:n,image_embeddings:o,l2norm_text_embeddings:a,l2norm_image_embeddings:i}=await super.forward(e),l={};return r||(l.text_embeddings=n,l.l2norm_text_embeddings=a),s||(l.image_embeddings=o,l.l2norm_image_embeddings=i),l}},zo=class extends Bs{static async from_pretrained(e,r={}){return super.from_pretrained(e,{...r,model_file_name:r.model_file_name??"text_model"})}},Zh=class extends Bs{static async from_pretrained(e,r={}){return super.from_pretrained(e,{...r,model_file_name:r.model_file_name??"vision_model"})}};var Lo=class extends y{},e_=class extends Lo{},t_=class extends Lo{};var No=class extends y{},r_=class extends No{},s_=class extends No{};var $o=class extends y{},n_=class extends $o{},o_=class extends $o{};var hl=class extends y{},a_=class extends hl{};var _l=class extends y{forward_params=["input_ids","attention_mask","pixel_values","position_ids","past_key_values"]},Ds=class extends 
_l{_merge_input_ids_with_image_features(e){let r=e.image_features.dims.at(-1),s=e.image_features.view(-1,r);return ur({image_token_id:this.config.image_token_index,...e,image_features:s})}},i_=class extends Ds{},l_=class extends Ds{};var Ro=class extends y{},c_=class extends Ro{},u_=class extends Ro{};var Uo=class extends y{},p_=class extends Uo{},d_=class extends Uo{};var Bo=class extends y{},f_=class extends Bo{},m_=class extends Bo{};var Do=class extends y{},h_=class extends Do{},__=class extends Do{};var Jr=class extends y{},g_=class extends Jr{},w_=class extends Jr{},x_=class extends Jr{async _call(e){return new F(await super._call(e))}},y_=class extends Jr{};var gl=class extends y{},b_=class extends gl{};var wl=class extends y{},v_=class extends wl{};var xl=class extends Ne{constructor({char_logits:e,bpe_logits:r,wp_logits:s}){super(),this.char_logits=e,this.bpe_logits=r,this.wp_logits=s}get logits(){return[this.char_logits,this.bpe_logits,this.wp_logits]}},yl=class extends y{},k_=class extends yl{async _call(e){return new xl(await super._call(e))}};var bl=class extends Ne{constructor({audio_codes:e}){super(),this.audio_codes=e}},vl=class extends Ne{constructor({audio_values:e}){super(),this.audio_values=e}},Fs=class extends y{main_input_name="input_values";forward_params=["input_values"]},E_=class extends Fs{async encode(e){return new bl(await ce(this.sessions.encoder_model,e))}async decode(e){return new vl(await ce(this.sessions.decoder_model,e))}},Fo=class extends Fs{static async from_pretrained(e,r={}){return super.from_pretrained(e,{...r,model_file_name:r.model_file_name??"encoder_model"})}},jo=class extends Fs{static async from_pretrained(e,r={}){return super.from_pretrained(e,{...r,model_file_name:r.model_file_name??"decoder_model"})}};var Go=class extends y{},A_=class extends Go{},M_=class extends Go{};var Zr=class extends y{},T_=class extends Zr{},S_=class extends Zr{async _call(e){return new we(await super._call(e))}},O_=class extends Zr{async 
_call(e){return new F(await super._call(e))}},I_=class extends Zr{async _call(e){return new Ae(await super._call(e))}};var qo=class extends y{},C_=class extends qo{},P_=class extends qo{};var js=class extends y{},z_=class extends js{},L_=class extends js{async _call(e){return new F(await super._call(e))}},N_=class extends js{};var Gs=class extends y{},$_=class extends Gs{},R_=class extends Gs{async _call(e){return new F(await super._call(e))}},U_=class extends Gs{};var qs=class extends y{},B_=class extends qs{},D_=class extends qs{async _call(e){return new F(await super._call(e))}},F_=class extends qs{};var Ws=class extends y{},j_=class extends Ws{},G_=class extends Ws{async _call(e){return new F(await super._call(e))}},q_=class extends Ws{};var Wo=class extends y{},W_=class extends Wo{},V_=class extends Wo{async _call(e){return new F(await super._call(e))}};var Vo=class extends y{},H_=class extends Vo{},X_=class extends Vo{async _call(e){return new F(await super._call(e))}};var es=class extends y{},K_=class extends es{},Y_=class extends es{async _call(e){return new we(await super._call(e))}},Q_=class extends es{async _call(e){return new F(await super._call(e))}},J_=class extends es{async _call(e){return new _e(await super._call(e))}};var Ho=class extends y{},Z_=class extends Ho{},eg=class extends Ho{};var Xo=class extends y{requires_attention_mask=!1;main_input_name="input_values";forward_params=["input_values","decoder_input_ids","past_key_values"]},tg=class extends Xo{},rg=class extends Xo{};var Tr=class extends y{},sg=class extends Tr{},ng=class extends Tr{async _call(e){return new we(await super._call(e))}},og=class extends Tr{async _call(e){return new F(await super._call(e))}},ag=class extends Tr{async _call(e){return new _e(await super._call(e))}},ig=class extends Tr{async _call(e){return new Ae(await super._call(e))}};var Ko=class extends y{},lg=class extends Ko{},cg=class extends Ko{};var Yo=class extends y{},ug=class extends Yo{},pg=class extends Yo{};var 
kl=class extends y{},dg=class extends kl{forward_params=["input_ids","pixel_values","images_seq_mask","images_emb_mask","attention_mask","position_ids","past_key_values"];constructor(...e){super(...e),this._generation_mode="text"}async forward(e){let r=this._generation_mode??"text",s;if(r==="text"||!e.past_key_values){let l=this.sessions.prepare_inputs_embeds,u=at(e,l.inputNames);s=await ce(l,u)}else{let l=this.sessions.gen_img_embeds,u=at({image_ids:e.input_ids},l.inputNames);s=await ce(l,u)}let n={...e,...s},o=await Tt(this,n),a=this.sessions[r==="text"?"lm_head":"gen_head"];if(!a)throw new Error(`Unable to find "${a}" generation head`);let i=await ce(a,at(o,a.inputNames));return{...s,...o,...i}}prepare_inputs_for_generation(e,r,s){let n=!!r.past_key_values;return s.guidance_scale!==null&&s.guidance_scale>1&&(n?r.input_ids=Ee([r.input_ids,r.input_ids],0):(r.input_ids=Ee([r.input_ids,yn(r.input_ids,BigInt(s.pad_token_id))],0),r.attention_mask=Ee([r.attention_mask,yn(r.attention_mask,0n)],0))),(n||!r.pixel_values)&&(r.pixel_values=Ge([0,0,3,384,384],1)),n&&(r.images_seq_mask=new U("bool",new Array(1).fill(!0).fill(!1,0,1),[1,1]),r.images_emb_mask=new U("bool",new Array(0).fill(!1),[1,1,0])),r}async generate(e){return this._generation_mode="text",super.generate(e)}async generate_images(e){this._generation_mode="image";let r=(e.inputs??e[this.main_input_name]).dims[1],n=(await super.generate(e)).slice(null,[r,null]),o=this.sessions.image_decode,{decoded_image:a}=await ce(o,{generated_tokens:n}),i=a.add_(1).mul_(255/2).clamp_(0,255).to("uint8"),l=[];for(let u of i){let d=Xe.fromTensor(u);l.push(d)}return l}};var Qo=class extends y{},fg=class extends Qo{},mg=class extends Qo{},Jo=class extends y{forward_params=["input_ids","attention_mask","encoder_outputs","decoder_input_ids","decoder_attention_mask","past_key_values"];_apply_and_filter_by_delay_pattern_mask(e){let[r,s]=e.dims,n=this.config.decoder.num_codebooks,o=s-n,a=0;for(let 
u=0;u<e.size;++u){if(e.data[u]==this.config.decoder.pad_token_id)continue;let d=u%s,f=Math.floor(u/s)%n,m=d-f;m>0&&m<=o&&(e.data[a++]=e.data[u])}let i=Math.floor(r/n),l=a/(i*n);return new U(e.type,e.data.slice(0,a),[i,n,l])}prepare_inputs_for_generation(e,r,s){let n=BigInt(this.config.decoder.pad_token_id),o=structuredClone(e);for(let a=0;a<o.length;++a)for(let i=0;i<o[a].length;++i)a%this.config.decoder.num_codebooks>=i&&(o[a][i]=n);return s.guidance_scale!==null&&s.guidance_scale>1&&(o=o.concat(o)),Qi(this,o,r,s)}async generate(e){let r=await super.generate(e),s=this._apply_and_filter_by_delay_pattern_mask(r).unsqueeze_(0),{audio_values:n}=await ce(this.sessions.encodec_decode,{audio_codes:s});return n}};var Zo=class extends y{},hg=class extends Zo{},_g=class extends Zo{};var Sr=class extends y{},gg=class extends Sr{},wg=class extends Sr{async _call(e){return new we(await super._call(e))}},xg=class extends Sr{async _call(e){return new F(await super._call(e))}},yg=class extends Sr{async _call(e){return new _e(await super._call(e))}},bg=class extends Sr{async _call(e){return new Ae(await super._call(e))}};var El=class extends y{},vg=class extends El{};var ea=class extends y{},kg=class extends ea{},Eg=class extends ea{};var ta=class extends y{},Ag=class extends ta{},Mg=class extends ta{};var ra=class extends y{},Tg=class extends ra{},Sg=class extends ra{};var sa=class extends y{},Og=class extends sa{},Ig=class extends sa{};var na=class extends y{},Cg=class extends na{},Pg=class extends na{};var oa=class extends y{},zg=class extends oa{},Lg=class extends oa{};var aa=class extends y{},Ng=class extends aa{},$g=class extends aa{};var Al=class extends y{forward_params=["input_ids","attention_mask","pixel_values","position_ids","past_key_values"]},Rg=class extends Al{_merge_input_ids_with_image_features(e){let r=e.image_features.dims.at(-1),s=e.image_features.view(-1,r);return ur({image_token_id:this.config.image_token_index,...e,image_features:s})}};var Ml=class extends 
y{},Ug=class extends Ml{async _call(e){return new gt(await super._call(e))}};var ia=class extends y{},Bg=class extends ia{},Dg=class extends ia{};var la=class extends y{},Fg=class extends la{},jg=class extends la{};var ca=class extends y{},Gg=class extends ca{},qg=class extends ca{};var ua=class extends y{},Wg=class extends ua{},Vg=class extends ua{};var Tl=class extends y{forward_params=["input_ids","inputs_embeds","attention_mask","position_ids","pixel_values","image_sizes","past_key_values"]},pa=class extends Tl{async forward({input_ids:e=null,attention_mask:r=null,pixel_values:s=null,image_sizes:n=null,position_ids:o=null,inputs_embeds:a=null,past_key_values:i=null,generation_config:l=null,logits_processor:u=null,...d}){if(!a){let m;if(s&&e.dims[1]!==1){if(!n)throw new Error("`image_sizes` must be provided when `pixel_values` is provided.");({image_features:m}=await ce(this.sessions.vision_encoder,{pixel_values:s,image_sizes:n}))}else{let _=this.config.normalized_config.hidden_size;m=new U("float32",[],[0,_])}({inputs_embeds:a}=await ce(this.sessions.prepare_inputs_embeds,{input_ids:e,image_features:m}))}return await Tt(this,{inputs_embeds:a,past_key_values:i,attention_mask:r,position_ids:o,generation_config:l,logits_processor:u},!1)}};var da=class extends y{},Hg=class extends da{},Xg=class extends da{async _call(e){return new F(await super._call(e))}};var fa=class extends y{},Kg=class extends fa{},Yg=class extends fa{async _call(e){return new _e(await super._call(e))}};var ma=class extends y{},Qg=class extends ma{},Jg=class extends ma{};var Sl=class extends y{forward_params=["input_ids","attention_mask","position_ids","past_key_values","pixel_values","image_grid_thw"]},Zg=class extends Sl{get_rope_index(e,r,s,n){let{vision_config:o,image_token_id:a,video_token_id:i,vision_start_token_id:l}=this.config,u=o.spatial_merge_size??2,d=[];if(r||s){let f=e.tolist();n||(n=mi(e));let 
m=n.tolist(),_=Array.from({length:3},M=>Array.from({length:e.dims[0]},I=>Array.from({length:e.dims[1]},T=>1))),w=r?r.tolist():[],x=s?s.tolist():[],k=0,E=0;for(let M=0;M<f.length;++M){let I=f[M].filter((S,L)=>m[M][L]==1),z=I.reduce((S,L,R)=>(L==l&&S.push(R),S),[]).map(S=>I[S+1]),C=z.filter(S=>S==a).length,v=z.filter(S=>S==i).length,G=[],X=0,V=C,Q=v;for(let S=0;S<z.length;++S){let L=I.findIndex((Et,tt)=>tt>X&&Et==a),R=I.findIndex((Et,tt)=>tt>X&&Et==i),te=V>0&&L!==-1?L:I.length+1,ue=Q>0&&R!==-1?R:I.length+1,Be,Pe,vt,Qe;te<ue?([Pe,vt,Qe]=w[k],++k,--V,Be=te):([Pe,vt,Qe]=x[E],++E,--Q,Be=ue);let[et,st,Me]=[Number(Pe),Math.floor(Number(vt)/u),Math.floor(Number(Qe)/u)],xe=Be-X,qe=G.length>0?Te(G.at(-1))[0]+1:0;G.push(Array.from({length:3*xe},(Et,tt)=>qe+tt%xe));let kt=xe+qe,ge=et*st*Me,$e=Array.from({length:ge},(Et,tt)=>kt+Math.floor(tt/(st*Me))),Nr=Array.from({length:ge},(Et,tt)=>kt+Math.floor(tt/Me)%st),ns=Array.from({length:ge},(Et,tt)=>kt+tt%Me);G.push([$e,Nr,ns].flat()),X=Be+ge}if(X<I.length){let S=G.length>0?Te(G.at(-1))[0]+1:0,L=I.length-X;G.push(Array.from({length:3*L},(R,te)=>S+te%L))}let K=G.reduce((S,L)=>S+L.length,0),Y=new Array(K),B=0;for(let S=0;S<3;++S)for(let L=0;L<G.length;++L){let R=G[L],te=R.length/3;for(let ue=S*te;ue<(S+1)*te;++ue)Y[B++]=R[ue]}let P=0,se=m[M];for(let S=0;S<se.length;++S)if(se[S]==1){for(let L=0;L<3;++L)_[L][M][S]=Y[L*K/3+P];++P}let ie=Te(Y)[0];d.push(ie+1-f[M].length)}return[new U("int64",_.flat(1/0),[3,e.dims[0],e.dims[1]]),new U("int64",d,[d.length,1])]}else if(n){let{data:f,dims:m}=J0(n),_=BigInt64Array.from({length:3*f.length},(x,k)=>f[k%f.length]),w=Array.from({length:m[0]},(x,k)=>Te(f.subarray(m[1]*k,m[1]*(k+1)))[0]+1n+BigInt(m[1]));return[new U("int64",_,[3,...m]),new U("int64",w,[w.length,1])]}else{let[f,m]=e.dims,_=BigInt64Array.from({length:3*f*m},(w,x)=>BigInt(Math.floor(x%m/f)));return[new U("int64",_,[3,...e.dims]),Iu([f,1])]}}async encode_image({pixel_values:e,image_grid_thw:r}){return(await 
ce(this.sessions.vision_encoder,{pixel_values:e,grid_thw:r})).image_features}_merge_input_ids_with_image_features(e){return ur({image_token_id:this.config.image_token_id,...e})}prepare_inputs_for_generation(e,r,s){if(r.attention_mask&&!r.position_ids)if(!r.past_key_values)[r.position_ids,r.rope_deltas]=this.get_rope_index(r.input_ids,r.image_grid_thw,r.video_grid_thw,r.attention_mask);else{r.pixel_values=null;let n=BigInt(Object.values(r.past_key_values)[0].dims.at(-2)),o=r.rope_deltas.map(a=>n+a);r.position_ids=zt([o,o,o],0)}return r}};var ha=class extends y{},ew=class extends ha{},tw=class extends ha{};var _a=class extends y{},rw=class extends _a{},sw=class extends _a{async _call(e){return new F(await super._call(e))}};var ga=class extends y{},nw=class extends ga{},ow=class extends ga{async _call(e){return new Ol(await super._call(e))}},Ol=class extends tr{};var Or=class extends y{},aw=class extends Or{},iw=class extends Or{async _call(e){return new we(await super._call(e))}},lw=class extends Or{async _call(e){return new F(await super._call(e))}},cw=class extends Or{async _call(e){return new _e(await super._call(e))}},uw=class extends Or{async _call(e){return new Ae(await super._call(e))}};var Ir=class extends y{},pw=class extends Ir{},dw=class extends Ir{async _call(e){return new we(await super._call(e))}},fw=class extends Ir{async _call(e){return new F(await super._call(e))}},mw=class extends Ir{async _call(e){return new _e(await super._call(e))}},hw=class extends Ir{async _call(e){return new Ae(await super._call(e))}};var wa=class extends y{},_w=class extends wa{},gw=class extends wa{async _call(e){return new Il(await super._call(e))}},Il=class extends tr{};var Cl=class extends Ne{constructor({iou_scores:e,pred_masks:r}){super(),this.iou_scores=e,this.pred_masks=r}},Pl=class extends y{},ww=class extends Pl{async get_image_embeddings({pixel_values:e}){return await qt(this,{pixel_values:e})}async 
forward(e){!e.image_embeddings||!e.image_positional_embeddings?e={...e,...await this.get_image_embeddings(e)}:e={...e},e.input_labels??=rt(e.input_points.dims.slice(0,-1));let r={image_embeddings:e.image_embeddings,image_positional_embeddings:e.image_positional_embeddings};return e.input_points&&(r.input_points=e.input_points),e.input_labels&&(r.input_labels=e.input_labels),e.input_boxes&&(r.input_boxes=e.input_boxes),await ce(this.sessions.prompt_encoder_mask_decoder,r)}async _call(e){return new Cl(await super._call(e))}};var zl=class extends Ne{constructor({iou_scores:e,pred_masks:r,object_score_logits:s}){super(),this.iou_scores=e,this.pred_masks=r,this.object_score_logits=s}},Ll=class extends y{},xa=class extends Ll{async get_image_embeddings({pixel_values:e}){return await qt(this,{pixel_values:e})}async forward(e){let{num_feature_levels:r}=this.config.vision_config;if(Array.from({length:r},(a,i)=>`image_embeddings.${i}`).some(a=>!e[a])?e={...e,...await this.get_image_embeddings(e)}:e={...e},e.input_points){if(e.input_boxes&&e.input_boxes.dims[1]!==1)throw new Error("When both `input_points` and `input_boxes` are provided, the number of boxes per image must be 1.");let a=e.input_points.dims;e.input_labels??=rt(a.slice(0,-1)),e.input_boxes??=Ge([a[0],0,4],0)}else if(e.input_boxes){let a=e.input_boxes.dims;e.input_labels=Ge([a[0],a[1],0],-1n),e.input_points=Ge([a[0],1,0,2],0)}else throw new Error("At least one of `input_points` or `input_boxes` must be provided.");let n=this.sessions.prompt_encoder_mask_decoder,o=at(e,n.inputNames);return await ce(n,o)}async _call(e){return new zl(await super._call(e))}},xw=class extends xa{},yw=class extends xa{};var Vs=class extends y{},bw=class extends Vs{},vw=class extends Vs{},kw=class extends Vs{};var Hs=class extends y{},Ew=class extends Hs{},Aw=class extends Hs{},Mw=class extends Hs{};var ya=class extends y{},Tw=class extends ya{},ba=class extends ya{static async from_pretrained(e,r={}){return 
super.from_pretrained(e,{...r,model_file_name:r.model_file_name??"text_model"})}},Sw=class extends er{static async from_pretrained(e,r={}){return super.from_pretrained(e,{...r,model_file_name:r.model_file_name??"vision_model"})}};var va=class extends y{},Ow=class extends va{},Iw=class extends va{};var Xs=class extends y{main_input_name="input_values";forward_params=["input_values"]},Cw=class extends Xs{async encode(e){return await ce(this.sessions.encoder_model,e)}async decode(e){return await ce(this.sessions.decoder_model,e)}},ka=class extends Xs{static async from_pretrained(e,r={}){return super.from_pretrained(e,{...r,model_file_name:r.model_file_name??"encoder_model"})}},Ea=class extends Xs{static async from_pretrained(e,r={}){return super.from_pretrained(e,{...r,model_file_name:r.model_file_name??"decoder_model"})}};var Ks=class extends y{},Pw=class extends Ks{},zw=class extends Ks{},Lw=class extends Ks{async generate_speech(e,r,{threshold:s=.5,minlenratio:n=0,maxlenratio:o=20,vocoder:a=null}={}){let i={input_ids:e},{encoder_outputs:l,encoder_attention_mask:u}=await qt(this,i),d=l.dims[1]/this.config.reduction_factor,f=Math.floor(d*o),m=Math.floor(d*n),_=this.config.num_mel_bins,w=[],x=null,k=null,E=0;for(;;){++E;let T=Q0(!!k),z;k?z=k.output_sequence_out:z=new U("float32",new Float32Array(_),[1,1,_]);let C={use_cache_branch:T,output_sequence:z,encoder_attention_mask:u,speaker_embeddings:r,encoder_hidden_states:l};this.addPastKeyValues(C,x),k=await ce(this.sessions.decoder_model_merged,C),x=this.getPastKeyValues(k,x);let{prob:v,spectrum:G}=k;if(w.push(G),E>=m&&(Array.from(v.data).filter(X=>X>=s).length>0||E>=f))break}let M=Ee(w),{waveform:I}=await ce(a.sessions.model,{spectrogram:M});return{spectrogram:M,waveform:I}}},Nw=class extends y{main_input_name="spectrogram"};var ts=class extends y{},$w=class extends ts{},Rw=class extends ts{async _call(e){return new we(await super._call(e))}},Uw=class extends ts{async _call(e){return new F(await 
super._call(e))}},Bw=class extends ts{async _call(e){return new Ae(await super._call(e))}};var Aa=class extends y{},Dw=class extends Aa{},Fw=class extends Aa{};var Ma=class extends y{},jw=class extends Ma{},Gw=class extends Ma{};var Nl=class extends y{},qw=class extends Nl{};var $l=class extends y{},Ta=class extends $l{async generate_speech({input_ids:e,attention_mask:r,style:s,num_inference_steps:n=5,speed:o=1.05}){let{sampling_rate:a,chunk_compress_factor:i,base_chunk_size:l,latent_dim:u}=this.config,{last_hidden_state:d,durations:f}=await ce(this.sessions.text_encoder,{input_ids:e,attention_mask:r,style:s}),m=f.div(o).mul_(a),_=l*i,w=m.data,x=Int32Array.from(w,V=>Math.ceil(V/_)),k=Math.max(...x),E=e.dims[0],M=new BigInt64Array(E*k);for(let V=0;V<E;++V)M.fill(1n,V*k,V*k+x[V]);let I=new U("int64",M,[E,k]),T=u*i,z=T*k,C=z0([E,T,k]),v=C.data;for(let V=0;V<E;++V)if(x[V]!==k)for(let Q=0;Q<T;++Q)v.fill(0,V*z+Q*k+x[V],V*z+(Q+1)*k);let G=Ge([E],n);for(let V=0;V<n;++V){let Q=Ge([E],V);({denoised_latents:C}=await ce(this.sessions.latent_denoiser,{style:s,noisy_latents:C,latent_mask:I,encoder_outputs:d,attention_mask:r,timestep:Q,num_inference_steps:G}))}let{waveform:X}=await ce(this.sessions.voice_decoder,{latents:C});return{waveform:X,durations:m}}};var Ys=class extends y{},Ww=class extends Ys{},Vw=class extends Ys{async _call(e){return new F(await super._call(e))}},Hw=class extends Ys{};var Sa=class extends y{},Xw=class extends Sa{},Kw=class extends Sa{};var Oa=class extends y{forward_params=["input_ids","attention_mask","encoder_outputs","decoder_input_ids","decoder_attention_mask","past_key_values"]},Yw=class extends Oa{},Qw=class extends Oa{};var Ia=class extends y{},Jw=class extends Ia{},Zw=class extends Ia{async _call(e){return new Rl(await super._call(e))}},Rl=class extends Us{};var Ul=class extends y{},ex=class extends Ul{};var Bl=class extends y{forward_params=["input_ids","attention_mask","position_ids","audio_values","past_key_values"]},Dl=class extends 
Bl{_merge_input_ids_with_audio_features(e){let r=e.audio_features.dims.at(-1),s=e.audio_features.view(-1,r);return ef({audio_token_id:this.config.ignore_index??this.config.audio_token_id,...e,audio_features:s})}},tx=class extends Dl{};var Qs=class extends y{},rx=class extends Qs{},sx=class extends Qs{async _call(e){return new gt(await super._call(e))}},nx=class extends Qs{async _call(e){return new F(await super._call(e))}};var rs=class extends y{},ox=class extends rs{},ax=class extends rs{async _call(e){return new gt(await super._call(e))}},ix=class extends rs{async _call(e){return new F(await super._call(e))}},lx=class extends rs{async _call(e){return new _e(await super._call(e))}};var Ca=class extends y{},cx=class extends Ca{},ux=class extends Ca{};var px=class extends y{main_input_name="pixel_values";forward_params=["pixel_values","decoder_input_ids","encoder_hidden_states","past_key_values"]};var Pa=class extends y{},dx=class extends Pa{},fx=class extends Pa{async _call(e){return new F(await super._call(e))}};var Fl=class extends y{},mx=class extends Fl{};var za=class extends y{},hx=class extends za{},_x=class extends za{async _call(e){return new F(await super._call(e))}};var jl=class extends y{},gx=class extends jl{async _call(e){return new Yd(await super._call(e))}};var Gl=class extends y{},wx=class extends Gl{};var ql=class extends Ne{constructor({waveform:e,spectrogram:r}){super(),this.waveform=e,this.spectrogram=r}},Wl=class extends y{},xx=class extends Wl{async _call(e){return new ql(await super._call(e))}};var Js=class extends y{},yx=class extends Js{},bx=class extends Js{async _call(e){return new gt(await super._call(e))}},vx=class extends Js{async _call(e){return new F(await super._call(e))}};var Vl=class extends Ne{constructor({logits:e,embeddings:r}){super(),this.logits=e,this.embeddings=r}},Cr=class extends y{},kx=class extends Cr{},Ex=class extends Cr{async _call(e){return new gt(await super._call(e))}},Ax=class extends Cr{async _call(e){return new 
F(await super._call(e))}},Mx=class extends Cr{async _call(e){return new Vl(await super._call(e))}},Tx=class extends Cr{async _call(e){return new _e(await super._call(e))}};var Hl=class extends y{},Sx=class extends Hl{};var Ox=class extends $n{return_timestamps=null;return_token_timestamps=null;num_frames=null;alignment_heads=null;task=null;language=null;no_timestamps_token_id=null;prompt_ids=null;is_multilingual=null;lang_to_id=null;task_to_id=null;max_initial_timestamp_index=1};var La=class extends y{requires_attention_mask=!1;main_input_name="input_features";forward_params=["input_features","attention_mask","decoder_input_ids","decoder_attention_mask","past_key_values"]},Ix=class extends La{},Xl=class extends La{_prepare_generation_config(e,r){return super._prepare_generation_config(e,r,Ox)}_retrieve_init_tokens(e){let r=[e.decoder_start_token_id],s=e.language,n=e.task;if(e.is_multilingual){s||(console.warn("No language specified - defaulting to English (en)."),s="en");let a=`<|${tA(s)}|>`;r.push(e.lang_to_id[a]),r.push(e.task_to_id[n??"transcribe"])}else if(s||n)throw new Error("Cannot specify `task` or `language` for an English-only model. 
If the model is intended to be multilingual, pass `is_multilingual=true` to generate, or update the generation config.");return!e.return_timestamps&&e.no_timestamps_token_id&&r.at(-1)!==e.no_timestamps_token_id?r.push(e.no_timestamps_token_id):e.return_timestamps&&r.at(-1)===e.no_timestamps_token_id&&(console.warn("<|notimestamps|> prompt token is removed from generation_config since `return_timestamps` is set to `true`."),r.pop()),r.filter(o=>o!=null)}async generate({inputs:e=null,generation_config:r=null,logits_processor:s=null,stopping_criteria:n=null,...o}){r=this._prepare_generation_config(r,o);let a=o.decoder_input_ids??this._retrieve_init_tokens(r);if(r.return_timestamps&&(s??=new Kr,s.push(new Ui(r,a))),r.begin_suppress_tokens&&(s??=new Kr,s.push(new Os(r.begin_suppress_tokens,a.length))),r.return_token_timestamps){if(!r.alignment_heads)throw new Error("Model generation config has no `alignment_heads`, token-level timestamps not available. See https://gist.github.com/hollance/42e32852f24243b748ae6bc1f985b13a on how to add this property to the generation config.");r.task==="translate"&&console.warn("Token-level timestamps may not be reliable for task 'translate'."),r.output_attentions=!0,r.return_dict_in_generate=!0}let i=await super.generate({inputs:e,generation_config:r,logits_processor:s,decoder_input_ids:a,...o});return r.return_token_timestamps&&(i.token_timestamps=this._extract_token_timestamps(i,r.alignment_heads,r.num_frames)),i}_extract_token_timestamps(e,r,s=null,n=.02){if(!e.cross_attentions)throw new Error("Model outputs must contain cross attentions to extract timestamps. This is most likely because the model was not exported with `output_attentions=True`.");s==null&&console.warn("`num_frames` has not been set, meaning the entire audio will be analyzed. 
This may lead to inaccurate token-level timestamps for short audios (< 30 seconds).");let o=this.config.median_filter_width;o===void 0&&(console.warn("Model config has no `median_filter_width`, using default value of 7."),o=7);let a=e.cross_attentions,i=Array.from({length:this.config.decoder_layers},(x,k)=>Ee(a.map(E=>E[k]),2)),l=zt(r.map(([x,k])=>{if(x>=i.length)throw new Error(`Layer index ${x} is out of bounds for cross attentions (length ${i.length}).`);return s?i[x].slice(null,k,null,[0,s]):i[x].slice(null,k)})).transpose(1,0,2,3),[u,d]=Ou(l,-2,0,!0),f=l.clone();for(let x=0;x<f.dims[0];++x){let k=f[x];for(let E=0;E<k.dims[0];++E){let M=k[E],I=u[x][E][0].data,T=d[x][E][0].data;for(let z=0;z<M.dims[0];++z){let C=M[z].data;for(let v=0;v<C.length;++v)C[v]=(C[v]-T[v])/I[v];C.set(_k(C,o))}}}let m=[fi(f,1)],_=e.sequences.dims,w=new U("float32",new Float32Array(_[0]*_[1]),_);for(let x=0;x<_[0];++x){let k=m[x].neg().squeeze_(0),[E,M]=wk(k.tolist()),I=Array.from({length:E.length-1},(C,v)=>E[v+1]-E[v]),T=dt([1],I).map(C=>!!C),z=[];for(let C=0;C<T.length;++C)T[C]&&z.push(M[C]*n);w[x].data.set(z,1)}return w}},Cx=class extends Xl{};var Pr=class extends y{},Px=class extends Pr{},zx=class extends Pr{async _call(e){return new we(await super._call(e))}},Lx=class extends Pr{async _call(e){return new F(await super._call(e))}},Nx=class extends Pr{async _call(e){return new _e(await super._call(e))}},$x=class extends Pr{async _call(e){return new Ae(await super._call(e))}};var zr=class extends y{},Rx=class extends zr{},Ux=class extends zr{async _call(e){return new we(await super._call(e))}},Bx=class extends zr{async _call(e){return new F(await super._call(e))}},Dx=class extends zr{async _call(e){return new _e(await super._call(e))}},Fx=class extends zr{async _call(e){return new Ae(await super._call(e))}};var Na=class extends y{},jx=class extends Na{},Gx=class extends Na{async _call(e){return new Kl(await super._call(e))}},Kl=class extends 
Ne{constructor({logits:e,pred_boxes:r}){super(),this.logits=e,this.pred_boxes=r}};var $a=class extends y{},qx=class extends $a{},Wx=class extends $a{};var tz=new Map([["bert","BertModel"],["neobert","NeoBertModel"],["modernbert","ModernBertModel"],["nomic_bert","NomicBertModel"],["roformer","RoFormerModel"],["electra","ElectraModel"],["esm","EsmModel"],["convbert","ConvBertModel"],["camembert","CamembertModel"],["deberta","DebertaModel"],["deberta-v2","DebertaV2Model"],["mpnet","MPNetModel"],["albert","AlbertModel"],["distilbert","DistilBertModel"],["roberta","RobertaModel"],["xlm","XLMModel"],["xlm-roberta","XLMRobertaModel"],["clap","ClapModel"],["clip","CLIPModel"],["clipseg","CLIPSegModel"],["chinese_clip","ChineseCLIPModel"],["siglip","SiglipModel"],["jina_clip","JinaCLIPModel"],["mobilebert","MobileBertModel"],["squeezebert","SqueezeBertModel"],["wav2vec2","Wav2Vec2Model"],["wav2vec2-bert","Wav2Vec2BertModel"],["unispeech","UniSpeechModel"],["unispeech-sat","UniSpeechSatModel"],["hubert","HubertModel"],["wavlm","WavLMModel"],["audio-spectrogram-transformer","ASTModel"],["vits","VitsModel"],["pyannote","PyAnnoteModel"],["wespeaker-resnet","WeSpeakerResNetModel"],["detr","DetrModel"],["rt_detr","RTDetrModel"],["rt_detr_v2","RTDetrV2Model"],["rf_detr","RFDetrModel"],["d_fine","DFineModel"],["table-transformer","TableTransformerModel"],["vit","ViTModel"],["ijepa","IJepaModel"],["pvt","PvtModel"],["vit_msn","ViTMSNModel"],["vit_mae","ViTMAEModel"],["groupvit","GroupViTModel"],["fastvit","FastViTModel"],["mobilevit","MobileViTModel"],["mobilevitv2","MobileViTV2Model"],["owlvit","OwlViTModel"],["owlv2","Owlv2Model"],["beit","BeitModel"],["deit","DeiTModel"],["hiera","HieraModel"],["convnext","ConvNextModel"],["convnextv2","ConvNextV2Model"],["dinov2","Dinov2Model"],["dinov2_with_registers","Dinov2WithRegistersModel"],["dinov3_vit","DINOv3ViTModel"],["dinov3_convnext","DINOv3ConvNextModel"],["resnet","ResNetModel"],["swin","SwinModel"],["swin2sr","Swin2SRModel"],["don
ut-swin","DonutSwinModel"],["yolos","YolosModel"],["dpt","DPTModel"],["glpn","GLPNModel"],["hifigan","SpeechT5HifiGan"],["efficientnet","EfficientNetModel"],["decision_transformer","DecisionTransformerModel"],["patchtst","PatchTSTModel"],["patchtsmixer","PatchTSMixerModel"],["mobilenet_v1","MobileNetV1Model"],["mobilenet_v2","MobileNetV2Model"],["mobilenet_v3","MobileNetV3Model"],["mobilenet_v4","MobileNetV4Model"],["maskformer","MaskFormerModel"],["mgp-str","MgpstrForSceneTextRecognition"],["style_text_to_speech_2","StyleTextToSpeech2Model"]]),rz=new Map([["t5","T5Model"],["longt5","LongT5Model"],["mt5","MT5Model"],["bart","BartModel"],["mbart","MBartModel"],["marian","MarianModel"],["whisper","WhisperModel"],["m2m_100","M2M100Model"],["blenderbot","BlenderbotModel"],["blenderbot-small","BlenderbotSmallModel"]]),sz=new Map([["mimi","MimiModel"],["dac","DacModel"],["snac","SnacModel"]]),nz=new Map([["bloom","BloomModel"],["jais","JAISModel"],["gpt2","GPT2Model"],["gpt_oss","GptOssModel"],["gptj","GPTJModel"],["gpt_bigcode","GPTBigCodeModel"],["gpt_neo","GPTNeoModel"],["gpt_neox","GPTNeoXModel"],["codegen","CodeGenModel"],["llama","LlamaModel"],["apertus","ApertusModel"],["nanochat","NanoChatModel"],["arcee","ArceeModel"],["lfm2","Lfm2Model"],["lfm2_moe","Lfm2MoeModel"],["smollm3","SmolLM3Model"],["exaone","ExaoneModel"],["olmo","OlmoModel"],["olmo2","Olmo2Model"],["olmo3","Olmo3Model"],["mobilellm","MobileLLMModel"],["granite","GraniteModel"],["granitemoehybrid","GraniteMoeHybridModel"],["cohere","CohereModel"],["gemma","GemmaModel"],["gemma2","Gemma2Model"],["vaultgemma","VaultGemmaModel"],["gemma3_text","Gemma3Model"],["helium","HeliumModel"],["glm","GlmModel"],["openelm","OpenELMModel"],["qwen2","Qwen2Model"],["qwen3","Qwen3Model"],["phi","PhiModel"],["phi3","Phi3Model"],["mpt","MptModel"],["opt","OPTModel"],["mistral","MistralModel"],["ministral","MinistralModel"],["ministral3","Ministral3Model"],["ernie4_5","Ernie4_5_Model"],["starcoder2","Starcoder2Model"],["f
alcon","FalconModel"],["falcon_h1","FalconH1Model"],["stablelm","StableLmModel"],["modernbert-decoder","ModernBertDecoderModel"],["hunyuan_v1_dense","HunYuanDenseV1Model"],["youtu","YoutuModel"]]),AA=new Map([["speecht5","SpeechT5ForSpeechToText"],["whisper","WhisperForConditionalGeneration"],["lite-whisper","LiteWhisperForConditionalGeneration"],["moonshine","MoonshineForConditionalGeneration"]]),MA=new Map([["speecht5","SpeechT5ForTextToSpeech"]]),TA=new Map([["vits","VitsModel"],["musicgen","MusicgenForConditionalGeneration"],["supertonic","SupertonicForConditionalGeneration"]]),SA=new Map([["bert","BertForSequenceClassification"],["neobert","NeoBertForSequenceClassification"],["modernbert","ModernBertForSequenceClassification"],["roformer","RoFormerForSequenceClassification"],["electra","ElectraForSequenceClassification"],["esm","EsmForSequenceClassification"],["convbert","ConvBertForSequenceClassification"],["camembert","CamembertForSequenceClassification"],["deberta","DebertaForSequenceClassification"],["deberta-v2","DebertaV2ForSequenceClassification"],["mpnet","MPNetForSequenceClassification"],["albert","AlbertForSequenceClassification"],["distilbert","DistilBertForSequenceClassification"],["roberta","RobertaForSequenceClassification"],["xlm","XLMForSequenceClassification"],["xlm-roberta","XLMRobertaForSequenceClassification"],["bart","BartForSequenceClassification"],["mbart","MBartForSequenceClassification"],["mobilebert","MobileBertForSequenceClassification"],["squeezebert","SqueezeBertForSequenceClassification"]]),OA=new 
Map([["bert","BertForTokenClassification"],["neobert","NeoBertForTokenClassification"],["modernbert","ModernBertForTokenClassification"],["roformer","RoFormerForTokenClassification"],["electra","ElectraForTokenClassification"],["esm","EsmForTokenClassification"],["convbert","ConvBertForTokenClassification"],["camembert","CamembertForTokenClassification"],["deberta","DebertaForTokenClassification"],["deberta-v2","DebertaV2ForTokenClassification"],["mpnet","MPNetForTokenClassification"],["distilbert","DistilBertForTokenClassification"],["roberta","RobertaForTokenClassification"],["xlm","XLMForTokenClassification"],["xlm-roberta","XLMRobertaForTokenClassification"]]),IA=new Map([["t5","T5ForConditionalGeneration"],["longt5","LongT5ForConditionalGeneration"],["mt5","MT5ForConditionalGeneration"],["bart","BartForConditionalGeneration"],["mbart","MBartForConditionalGeneration"],["marian","MarianMTModel"],["m2m_100","M2M100ForConditionalGeneration"],["blenderbot","BlenderbotForConditionalGeneration"],["blenderbot-small","BlenderbotSmallForConditionalGeneration"]]),CA=new 
Map([["bloom","BloomForCausalLM"],["gpt2","GPT2LMHeadModel"],["gpt_oss","GptOssForCausalLM"],["jais","JAISLMHeadModel"],["gptj","GPTJForCausalLM"],["gpt_bigcode","GPTBigCodeForCausalLM"],["gpt_neo","GPTNeoForCausalLM"],["gpt_neox","GPTNeoXForCausalLM"],["codegen","CodeGenForCausalLM"],["llama","LlamaForCausalLM"],["nanochat","NanoChatForCausalLM"],["apertus","ApertusForCausalLM"],["llama4_text","Llama4ForCausalLM"],["arcee","ArceeForCausalLM"],["lfm2","Lfm2ForCausalLM"],["lfm2_moe","Lfm2MoeForCausalLM"],["smollm3","SmolLM3ForCausalLM"],["exaone","ExaoneForCausalLM"],["olmo","OlmoForCausalLM"],["olmo2","Olmo2ForCausalLM"],["olmo3","Olmo3ForCausalLM"],["mobilellm","MobileLLMForCausalLM"],["granite","GraniteForCausalLM"],["granitemoehybrid","GraniteMoeHybridForCausalLM"],["cohere","CohereForCausalLM"],["gemma","GemmaForCausalLM"],["gemma2","Gemma2ForCausalLM"],["vaultgemma","VaultGemmaForCausalLM"],["gemma3_text","Gemma3ForCausalLM"],["helium","HeliumForCausalLM"],["glm","GlmForCausalLM"],["openelm","OpenELMForCausalLM"],["qwen2","Qwen2ForCausalLM"],["qwen3","Qwen3ForCausalLM"],["phi","PhiForCausalLM"],["phi3","Phi3ForCausalLM"],["mpt","MptForCausalLM"],["opt","OPTForCausalLM"],["mbart","MBartForCausalLM"],["mistral","MistralForCausalLM"],["ministral","MinistralForCausalLM"],["ministral3","Ministral3ForCausalLM"],["ernie4_5","Ernie4_5_ForCausalLM"],["starcoder2","Starcoder2ForCausalLM"],["falcon","FalconForCausalLM"],["falcon_h1","FalconH1ForCausalLM"],["trocr","TrOCRForCausalLM"],["stablelm","StableLmForCausalLM"],["modernbert-decoder","ModernBertDecoderForCausalLM"],["hunyuan_v1_dense","HunYuanDenseV1ForCausalLM"],["youtu","YoutuForCausalLM"],["phi3_v","Phi3VForCausalLM"]]),oz=new Map([["multi_modality","MultiModalityCausalLM"]]),PA=new 
Map([["bert","BertForMaskedLM"],["neobert","NeoBertForMaskedLM"],["modernbert","ModernBertForMaskedLM"],["roformer","RoFormerForMaskedLM"],["electra","ElectraForMaskedLM"],["esm","EsmForMaskedLM"],["convbert","ConvBertForMaskedLM"],["camembert","CamembertForMaskedLM"],["deberta","DebertaForMaskedLM"],["deberta-v2","DebertaV2ForMaskedLM"],["mpnet","MPNetForMaskedLM"],["albert","AlbertForMaskedLM"],["distilbert","DistilBertForMaskedLM"],["roberta","RobertaForMaskedLM"],["xlm","XLMWithLMHeadModel"],["xlm-roberta","XLMRobertaForMaskedLM"],["mobilebert","MobileBertForMaskedLM"],["squeezebert","SqueezeBertForMaskedLM"]]),
/* The Map literal above completes PA (exported from Ce as MODEL_FOR_MASKED_LM_MAPPING_NAMES). */
/* zA: question-answering table (MODEL_FOR_QUESTION_ANSWERING_MAPPING_NAMES). Both PA and zA are paired with H.EncoderOnly in Z0. */
zA=new Map([["bert","BertForQuestionAnswering"],["neobert","NeoBertForQuestionAnswering"],["roformer","RoFormerForQuestionAnswering"],["electra","ElectraForQuestionAnswering"],["convbert","ConvBertForQuestionAnswering"],["camembert","CamembertForQuestionAnswering"],["deberta","DebertaForQuestionAnswering"],["deberta-v2","DebertaV2ForQuestionAnswering"],["mpnet","MPNetForQuestionAnswering"],["albert","AlbertForQuestionAnswering"],["distilbert","DistilBertForQuestionAnswering"],["roberta","RobertaForQuestionAnswering"],["xlm","XLMForQuestionAnswering"],["xlm-roberta","XLMRobertaForQuestionAnswering"],["mobilebert","MobileBertForQuestionAnswering"],["squeezebert","SqueezeBertForQuestionAnswering"]]),
/* LA: table paired with H.Vision2Seq in Z0 and exported as MODEL_FOR_VISION_2_SEQ_MAPPING_NAMES. The NA declarator started at the end of this line continues on the next line. */
LA=new Map([["vision-encoder-decoder","VisionEncoderDecoderModel"],["idefics3","Idefics3ForConditionalGeneration"],["smolvlm","SmolVLMForConditionalGeneration"]]),NA=new 
Map([["llava","LlavaForConditionalGeneration"],["llava_onevision","LlavaOnevisionForConditionalGeneration"],["moondream1","Moondream1ForConditionalGeneration"],["florence2","Florence2ForConditionalGeneration"],["qwen2-vl","Qwen2VLForConditionalGeneration"],["idefics3","Idefics3ForConditionalGeneration"],["smolvlm","SmolVLMForConditionalGeneration"],["paligemma","PaliGemmaForConditionalGeneration"],["llava_qwen2","LlavaQwen2ForCausalLM"],["gemma3n","Gemma3nForConditionalGeneration"],["mistral3","Mistral3ForConditionalGeneration"]]),
/* The Map literal above completes NA (paired with H.ImageTextToText in Z0; exported as MODEL_FOR_IMAGE_TEXT_TO_TEXT_MAPPING_NAMES). */
/* $A: paired with H.AudioTextToText in Z0; exported as MODEL_FOR_AUDIO_TEXT_TO_TEXT_MAPPING_NAMES. */
$A=new Map([["ultravox","UltravoxModel"],["voxtral","VoxtralForConditionalGeneration"]]),
/* az: exported as MODEL_FOR_DOCUMENT_QUESTION_ANSWERING_MAPPING_NAMES. It does not appear in the Z0 list; its only class name is also an entry of LA, which is in Z0. */
az=new Map([["vision-encoder-decoder","VisionEncoderDecoderModel"]]),
/* RA: image-classification table (H.EncoderOnly in Z0; MODEL_FOR_IMAGE_CLASSIFICATION_MAPPING_NAMES). The UA declarator started at the end of this line continues on the next line. */
RA=new Map([["vit","ViTForImageClassification"],["ijepa","IJepaForImageClassification"],["pvt","PvtForImageClassification"],["vit_msn","ViTMSNForImageClassification"],["fastvit","FastViTForImageClassification"],["mobilevit","MobileViTForImageClassification"],["mobilevitv2","MobileViTV2ForImageClassification"],["beit","BeitForImageClassification"],["deit","DeiTForImageClassification"],["hiera","HieraForImageClassification"],["convnext","ConvNextForImageClassification"],["convnextv2","ConvNextV2ForImageClassification"],["dinov2","Dinov2ForImageClassification"],["dinov2_with_registers","Dinov2WithRegistersForImageClassification"],["resnet","ResNetForImageClassification"],["swin","SwinForImageClassification"],["segformer","SegformerForImageClassification"],["efficientnet","EfficientNetForImageClassification"],["mobilenet_v1","MobileNetV1ForImageClassification"],["mobilenet_v2","MobileNetV2ForImageClassification"],["mobilenet_v3","MobileNetV3ForImageClassification"],["mobilenet_v4","MobileNetV4ForImageClassification"]]),UA=new 
Map([["detr","DetrForObjectDetection"],["rt_detr","RTDetrForObjectDetection"],["rt_detr_v2","RTDetrV2ForObjectDetection"],["rf_detr","RFDetrForObjectDetection"],["d_fine","DFineForObjectDetection"],["table-transformer","TableTransformerForObjectDetection"],["yolos","YolosForObjectDetection"]]),
/* The Map literal above completes UA (MODEL_FOR_OBJECT_DETECTION_MAPPING_NAMES). BA is the zero-shot object-detection table. */
BA=new Map([["owlvit","OwlViTForObjectDetection"],["owlv2","Owlv2ForObjectDetection"],["grounding-dino","GroundingDinoForObjectDetection"]]),
/* Ra / DA / FA: image, semantic and universal segmentation tables (see the matching keys of Ce). Ra is also the table that the eb loop later in the file adds extra model types to. */
Ra=new Map([["detr","DetrForSegmentation"],["clipseg","CLIPSegForImageSegmentation"]]),DA=new Map([["segformer","SegformerForSemanticSegmentation"],["sapiens","SapiensForSemanticSegmentation"],["swin","SwinForSemanticSegmentation"],["mobilenet_v1","MobileNetV1ForSemanticSegmentation"],["mobilenet_v2","MobileNetV2ForSemanticSegmentation"],["mobilenet_v3","MobileNetV3ForSemanticSegmentation"],["mobilenet_v4","MobileNetV4ForSemanticSegmentation"]]),FA=new Map([["detr","DetrForSegmentation"],["maskformer","MaskFormerForInstanceSegmentation"]]),
/* jA: mask-generation table, the only table in this line paired with a non-EncoderOnly type (H.MaskGeneration) in Z0. */
jA=new Map([["sam","SamModel"],["sam2","Sam2Model"],["edgetam","EdgeTamModel"],["sam3_tracker","Sam3TrackerModel"]]),
/* Audio tables: GA (CTC), qA (audio classification), WA (x-vector), VA (audio frame classification), as named by their Ce keys. The HA declarator started at the end of this line continues on the next line. */
GA=new Map([["wav2vec2","Wav2Vec2ForCTC"],["wav2vec2-bert","Wav2Vec2BertForCTC"],["unispeech","UniSpeechForCTC"],["unispeech-sat","UniSpeechSatForCTC"],["wavlm","WavLMForCTC"],["hubert","HubertForCTC"],["parakeet_ctc","ParakeetForCTC"]]),qA=new Map([["wav2vec2","Wav2Vec2ForSequenceClassification"],["wav2vec2-bert","Wav2Vec2BertForSequenceClassification"],["unispeech","UniSpeechForSequenceClassification"],["unispeech-sat","UniSpeechSatForSequenceClassification"],["wavlm","WavLMForSequenceClassification"],["hubert","HubertForSequenceClassification"],["audio-spectrogram-transformer","ASTForAudioClassification"]]),WA=new Map([["wavlm","WavLMForXVector"]]),VA=new Map([["unispeech-sat","UniSpeechSatForAudioFrameClassification"],["wavlm","WavLMForAudioFrameClassification"],["wav2vec2","Wav2Vec2ForAudioFrameClassification"],["pyannote","PyAnnoteForAudioFrameClassification"]]),HA=new 
Map([["vitmatte","VitMatteForImageMatting"]]),
/* The Map literal above completes HA (MODEL_FOR_IMAGE_MATTING_MAPPING_NAMES). iz holds the PatchTST* prediction classes; it is in Z0 but not in Ce. */
iz=new Map([["patchtst","PatchTSTForPrediction"],["patchtsmixer","PatchTSMixerForPrediction"]]),
/* XA (image-to-image), KA (depth estimation), YA (normal estimation), QA (pose estimation), JA (image feature extraction), as named by their Ce keys. */
XA=new Map([["swin2sr","Swin2SRForImageSuperResolution"]]),KA=new Map([["dpt","DPTForDepthEstimation"],["depth_anything","DepthAnythingForDepthEstimation"],["glpn","GLPNForDepthEstimation"],["sapiens","SapiensForDepthEstimation"],["depth_pro","DepthProForDepthEstimation"],["metric3d","Metric3DForDepthEstimation"],["metric3dv2","Metric3Dv2ForDepthEstimation"]]),YA=new Map([["sapiens","SapiensForNormalEstimation"]]),QA=new Map([["vitpose","VitPoseForPoseEstimation"]]),JA=new Map([["clip","CLIPVisionModelWithProjection"],["siglip","SiglipVisionModel"],["jina_clip","JinaCLIPVisionModel"]]),
/* Z0: ordered list of [table, H.<type>] pairs. The loop below walks it, and the pr class later in the file uses Z0.map(e=>e[0]) as its MODEL_CLASS_MAPPINGS, so the order here is also pr's lookup order. */
Z0=[[tz,H.EncoderOnly],[rz,H.EncoderDecoder],[nz,H.DecoderOnlyWithoutHead],[sz,H.AutoEncoder],[SA,H.EncoderOnly],[OA,H.EncoderOnly],[IA,H.Seq2Seq],[AA,H.Seq2Seq],[CA,H.DecoderOnly],[oz,H.MultiModality],[PA,H.EncoderOnly],[zA,H.EncoderOnly],[LA,H.Vision2Seq],[NA,H.ImageTextToText],[$A,H.AudioTextToText],[RA,H.EncoderOnly],[Ra,H.EncoderOnly],[FA,H.EncoderOnly],[DA,H.EncoderOnly],[HA,H.EncoderOnly],[iz,H.EncoderOnly],[XA,H.EncoderOnly],[KA,H.EncoderOnly],[YA,H.EncoderOnly],[QA,H.EncoderOnly],[UA,H.EncoderOnly],[BA,H.EncoderOnly],[jA,H.MaskGeneration],[GA,H.EncoderOnly],[qA,H.EncoderOnly],[MA,H.Seq2Seq],[TA,H.EncoderOnly],[WA,H.EncoderOnly],[VA,H.EncoderOnly],[JA,H.EncoderOnly]];
/* Registration pass: for every class name r in every table, record name -> type in zs, look the class up by name in Yl, then record class -> name in Ps and name -> class in Zd. zs, Ps, Zd and Yl are defined outside this view. */
for(let[t,e]of Z0)for(let r of t.values()){zs.set(r,e);let s=Yl[r];Ps.set(s,r),Zd.set(r,s)}var 
lz=[["MusicgenForConditionalGeneration",Jo,H.Musicgen],["Phi3VForCausalLM",pa,H.Phi3V],["CLIPTextModelWithProjection",Hn,H.EncoderOnly],["SiglipTextModel",ba,H.EncoderOnly],["JinaCLIPTextModel",zo,H.EncoderOnly],["ClapTextModelWithProjection",Wn,H.EncoderOnly],["ClapAudioModelWithProjection",Vn,H.EncoderOnly],["DacEncoderModel",to,H.EncoderOnly],["DacDecoderModel",ro,H.EncoderOnly],["MimiEncoderModel",Fo,H.EncoderOnly],["MimiDecoderModel",jo,H.EncoderOnly],["SnacEncoderModel",ka,H.EncoderOnly],["SnacDecoderModel",Ea,H.EncoderOnly],["Gemma3nForConditionalGeneration",go,H.ImageAudioTextToText],["SupertonicForConditionalGeneration",Ta,H.Supertonic],["ChatterboxModel",qn,H.Chatterbox]];
/* lz (above) lists [class name, class, type] triples that are registered directly into zs / Ps / Zd. This runs after the Z0 loop, so for names present in both (e.g. "Phi3VForCausalLM") the zs.set call here is the later one. */
for(let[t,e,r]of lz)zs.set(t,r),Ps.set(e,t),Zd.set(t,e);
/* eb: model types that all point at the Ra table. The loop adds each type to Ra with the class name "PreTrainedModel" and registers the type string itself in zs and Zd (with class y). pr.from_pretrained later uses eb.has(model_type) to skip its "Unknown model class" warning. */
var eb=new Map([["modnet",Ra],["birefnet",Ra],["isnet",Ra],["ben",Ra]]);for(let[t,e]of eb.entries())e.set(t,"PreTrainedModel"),zs.set(t,H.EncoderOnly),Zd.set(t,y);zs.set("PreTrainedModel",H.EncoderOnly);Ps.set(y,"PreTrainedModel");
/* Ce: object exposing the tables above under descriptive MODEL_FOR_*_MAPPING_NAMES keys; the literal continues on the next line. */
var Ce={MODEL_FOR_SEQUENCE_CLASSIFICATION_MAPPING_NAMES:SA,MODEL_FOR_TOKEN_CLASSIFICATION_MAPPING_NAMES:OA,MODEL_FOR_TEXT_TO_SPECTROGRAM_MAPPING_NAMES:MA,MODEL_FOR_TEXT_TO_WAVEFORM_MAPPING_NAMES:TA,MODEL_FOR_MASKED_LM_MAPPING_NAMES:PA,MODEL_FOR_QUESTION_ANSWERING_MAPPING_NAMES:zA,MODEL_FOR_IMAGE_CLASSIFICATION_MAPPING_NAMES:RA,MODEL_FOR_IMAGE_SEGMENTATION_MAPPING_NAMES:Ra,MODEL_FOR_SEMANTIC_SEGMENTATION_MAPPING_NAMES:DA,MODEL_FOR_UNIVERSAL_SEGMENTATION_MAPPING_NAMES:FA,MODEL_FOR_OBJECT_DETECTION_MAPPING_NAMES:UA,MODEL_FOR_ZERO_SHOT_OBJECT_DETECTION_MAPPING_NAMES:BA,MODEL_FOR_MASK_GENERATION_MAPPING_NAMES:jA,MODEL_FOR_CTC_MAPPING_NAMES:GA,MODEL_FOR_AUDIO_CLASSIFICATION_MAPPING_NAMES:qA,MODEL_FOR_AUDIO_XVECTOR_MAPPING_NAMES:WA,MODEL_FOR_AUDIO_FRAME_CLASSIFICATION_MAPPING_NAMES:VA,MODEL_FOR_DOCUMENT_QUESTION_ANSWERING_MAPPING_NAMES:az,MODEL_FOR_IMAGE_MATTING_MAPPING_NAMES:HA,MODEL_FOR_IMAGE_TO_IMAGE_MAPPING_NAMES:XA,MODEL_FOR_DEPTH_ESTIMATION_MAPPING_NAMES:KA,MODEL_FOR_NORMAL_ESTIMATION_MAPPING_NAMES:YA,MODEL_
FOR_POSE_ESTIMATION_MAPPING_NAMES:QA,MODEL_FOR_IMAGE_FEATURE_EXTRACTION_MAPPING_NAMES:JA,MODEL_FOR_IMAGE_TEXT_TO_TEXT_MAPPING_NAMES:NA,MODEL_FOR_AUDIO_TEXT_TO_TEXT_MAPPING_NAMES:$A,MODEL_FOR_SEQ_TO_SEQ_CAUSAL_LM_MAPPING_NAMES:IA,MODEL_FOR_SPEECH_SEQ_2_SEQ_MAPPING_NAMES:AA,MODEL_FOR_CAUSAL_LM_MAPPING_NAMES:CA,MODEL_FOR_VISION_2_SEQ_MAPPING_NAMES:LA};bA(Ce);var Se=class{static MODEL_CLASS_MAPPINGS=null;static BASE_IF_FAIL=!1;static async from_pretrained(e,{progress_callback:r=null,config:s=null,cache_dir:n=null,local_files_only:o=!1,revision:a="main",model_file_name:i=null,subfolder:l="onnx",device:u=null,dtype:d=null,use_external_data_format:f=null,session_options:m={}}={}){let _={progress_callback:r,config:s,cache_dir:n,local_files_only:o,revision:a,model_file_name:i,subfolder:l,device:u,dtype:d,use_external_data_format:f,session_options:m};if(_.config=await Xr.from_pretrained(e,_),!this.MODEL_CLASS_MAPPINGS)throw new Error("`MODEL_CLASS_MAPPINGS` not implemented for this type of `AutoClass`: "+this.name);let w=_.config.model_type;for(let x of this.MODEL_CLASS_MAPPINGS){let k=x.get(w);if(!k){for(let E of x.values())if(E[0]===w){k=E;break}if(!k)continue}return await Yl[k].from_pretrained(e,_)}if(this.BASE_IF_FAIL)return eb.has(w)||console.warn(`Unknown model class "${w}", attempting to construct from base class.`),await y.from_pretrained(e,_);throw Error(`Unsupported model type: ${w}`)}},pr=class extends Se{static MODEL_CLASS_MAPPINGS=Z0.map(e=>e[0]);static BASE_IF_FAIL=!0},Ua=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_SEQUENCE_CLASSIFICATION_MAPPING_NAMES]},Ql=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_TOKEN_CLASSIFICATION_MAPPING_NAMES]},Zs=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_SEQ_TO_SEQ_CAUSAL_LM_MAPPING_NAMES]},Jl=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_SPEECH_SEQ_2_SEQ_MAPPING_NAMES]},Zl=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_TEXT_TO_SPECTROGRAM_MAPPING_NAMES]},ec=class 
extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_TEXT_TO_WAVEFORM_MAPPING_NAMES]},
/* Every declarator on this line is a task-specific loader: a subclass of Se whose MODEL_CLASS_MAPPINGS holds exactly one table from Ce. The t2 registry later in the file wires them to pipelines, e.g. tc -> "text-generation", rc -> "fill-mask", sc -> "question-answering", nc -> "image-to-text", oc -> "image-classification". */
tc=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_CAUSAL_LM_MAPPING_NAMES]},rc=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_MASKED_LM_MAPPING_NAMES]},sc=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_QUESTION_ANSWERING_MAPPING_NAMES]},nc=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_VISION_2_SEQ_MAPPING_NAMES]},oc=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_IMAGE_CLASSIFICATION_MAPPING_NAMES]},
/* Ba, Da, Fa: image, semantic and universal segmentation loaders. t2 lists them as [Ba,Da,Fa] for both "image-segmentation" and "background-removal", so they are tried in that order. */
Ba=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_IMAGE_SEGMENTATION_MAPPING_NAMES]},Da=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_SEMANTIC_SEGMENTATION_MAPPING_NAMES]},Fa=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_UNIVERSAL_SEGMENTATION_MAPPING_NAMES]},ac=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_OBJECT_DETECTION_MAPPING_NAMES]},ic=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_ZERO_SHOT_OBJECT_DETECTION_MAPPING_NAMES]},tb=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_MASK_GENERATION_MAPPING_NAMES]},lc=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_CTC_MAPPING_NAMES]},cc=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_AUDIO_CLASSIFICATION_MAPPING_NAMES]},rb=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_AUDIO_XVECTOR_MAPPING_NAMES]},sb=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_AUDIO_FRAME_CLASSIFICATION_MAPPING_NAMES]},uc=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_DOCUMENT_QUESTION_ANSWERING_MAPPING_NAMES]},nb=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_IMAGE_MATTING_MAPPING_NAMES]},pc=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_IMAGE_TO_IMAGE_MAPPING_NAMES]},dc=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_DEPTH_ESTIMATION_MAPPING_NAMES]},ob=class extends Se{static 
MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_NORMAL_ESTIMATION_MAPPING_NAMES]},ab=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_POSE_ESTIMATION_MAPPING_NAMES]},fc=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_IMAGE_FEATURE_EXTRACTION_MAPPING_NAMES]},ib=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_IMAGE_TEXT_TO_TEXT_MAPPING_NAMES]},lb=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_AUDIO_TEXT_TO_TEXT_MAPPING_NAMES]};
/* Ye(t): wraps a single input into an array and loads every element with Xe.read, concurrently via Promise.all. Always resolves to an array. */
async function Ye(t){return Array.isArray(t)||(t=[t]),await Promise.all(t.map(e=>Xe.read(e)))}
/* ss(t, e): wraps a single input into an array; strings and URL objects are passed to kp(item, e), Float64Array inputs are copied into a Float32Array, and anything else is passed through unchanged. Callers in this file pass the feature extractor's sampling_rate as e. */
async function ss(t,e){return Array.isArray(t)||(t=[t]),await Promise.all(t.map(r=>typeof r=="string"||r instanceof URL?kp(r,e):r instanceof Float64Array?new Float32Array(r):r))}
/* mc(t, e): turns a 4-element array into {xmin, ymin, xmax, ymax}. When e is truthy each value is first truncated to a 32-bit integer with |0. */
function mc(t,e){e&&(t=t.map(a=>a|0));let[r,s,n,o]=t;return{xmin:r,ymin:s,xmax:n,ymax:o}}
/* pe: base class of all pipelines below. Stores task, model and the optional tokenizer / processor; dispose() disposes the model only. */
var pe=class extends Je{constructor({task:e,model:r,tokenizer:s=null,processor:n=null}){super(),this.task=e,this.model=r,this.tokenizer=s,this.processor=n}async dispose(){await this.model.dispose()}};
/* hc: pipeline registered under "text-classification" in t2. Logits go through sigmoid when config.problem_type is "multi_label_classification", otherwise through Oe (defined elsewhere; presumably softmax, to be confirmed). Gt(scores, top_k) is used as a [values, indices] pair. With top_k === 1 the per-input results are flattened into one array. */
var hc=class extends pe{async _call(e,{top_k:r=1}={}){let s=this.tokenizer(e,{padding:!0,truncation:!0}),n=await this.model(s),{problem_type:o,id2label:a}=this.model.config,i=o==="multi_label_classification"?u=>u.sigmoid():u=>new U("float32",Oe(u.data),u.dims),l=[];for(let u of n.logits){let d=i(u),f=await Gt(d,r),m=f[0].tolist(),w=f[1].tolist().map((x,k)=>({label:a?a[x]:`LABEL_${x}`,score:m[k]}));r===1?l.push(...w):l.push(w)}return Array.isArray(e)||r===1?l:l[0]}};
/* _c: pipeline registered under "token-classification". For every token it takes index 1 of Te(logits) as the predicted label id, skips labels listed in ignore_labels and tokens that decode to an empty string. The method body continues on the next line. */
var _c=class extends pe{async _call(e,{ignore_labels:r=["O"]}={}){let s=Array.isArray(e),n=this.tokenizer(s?e:[e],{padding:!0,truncation:!0}),a=(await this.model(n)).logits,i=this.model.config.id2label,l=[];for(let u=0;u<a.dims[0];++u){let d=n.input_ids[u],f=a[u],m=[];for(let _=0;_<f.dims[0];++_){let w=f[_],x=Te(w.data)[1],k=i?i[x]:`LABEL_${x}`;if(r.includes(k))continue;let E=this.tokenizer.decode([d[_].item()],{skip_special_tokens:!0});if(E==="")continue;let 
M=Oe(w.data);m.push({entity:k,score:M[x],index:_,word:E})}l.push(m)}return s?l:l[0]}};var gc=class extends pe{async _call(e,r,{top_k:s=1}={}){let n=this.tokenizer(e,{text_pair:r,padding:!0,truncation:!0}),o=Array.isArray(e),{start_logits:a,end_logits:i}=await this.model(n),l=n.input_ids.tolist(),u=n.attention_mask.tolist(),{all_special_ids:d,sep_token_id:f}=this.tokenizer,m=[];for(let _=0;_<a.dims[0];++_){let w=l[_],x=w.findIndex(C=>C==f),k=a[_].tolist(),E=i[_].tolist();for(let C=1;C<k.length;++C)(u[_]==0||C<=x||d.findIndex(v=>v==w[C])!==-1)&&(k[C]=-1/0,E[C]=-1/0);let M=Oe(k).map((C,v)=>[C,v]),I=Oe(E).map((C,v)=>[C,v]);M[0][0]=0,I[0][0]=0;let T=sk(M,I).filter(C=>C[0][1]<=C[1][1]).map(C=>[C[0][1],C[1][1],C[0][0]*C[1][0]]).sort((C,v)=>v[2]-C[2]),z=[];for(let C=0;C<Math.min(T.length,s);++C){let[v,G,X]=T[C],V=w.slice(v,G+1),Q=this.tokenizer.decode(V,{skip_special_tokens:!0});z.push({answer:Q,score:X})}s===1?m.push(...z):m.push(z)}return o?m:m[0]}};var wc=class extends pe{async _call(e,{top_k:r=5}={}){let{mask_token_id:s,mask_token:n}=this.tokenizer,o=this.tokenizer(e,{padding:!0,truncation:!0}),{logits:a}=await this.model(o),i=[],l=o.input_ids.tolist();for(let u=0;u<l.length;++u){let d=l[u],f=d.findIndex(k=>k==s);if(f===-1)throw Error(`Mask token (${n}) not found in text.`);let m=a[u][f],_=await Gt(new U("float32",Oe(m.data),m.dims),r),w=_[0].tolist(),x=_[1].tolist();i.push(x.map((k,E)=>{let M=d.slice();return M[f]=k,{score:w[E],token:Number(k),token_str:this.tokenizer.decode([k]),sequence:this.tokenizer.decode(M,{skip_special_tokens:!0})}}))}return Array.isArray(e)?i:i[0]}};var Lr=class extends pe{_key="generated_text";async _call(e,r={}){Array.isArray(e)||(e=[e]),this.model.config.prefix&&(e=e.map(l=>this.model.config.prefix+l));let s=this.model.config.task_specific_params;s&&s[this.task]&&s[this.task].prefix&&(e=e.map(l=>s[this.task].prefix+l));let n=this.tokenizer,o={padding:!0,truncation:!0},a;this.task==="translation"&&"_build_translation_inputs"in 
n?a=n._build_translation_inputs(e,o,r):a=n(e,o);let i=await this.model.generate({...a,...r});return n.batch_decode(i,{skip_special_tokens:!0}).map(l=>({[this._key]:l}))}};var xc=class extends Lr{_key="summary_text"};var yc=class extends Lr{_key="translation_text"};function ZA(t){return Array.isArray(t)&&t.every(e=>"role"in e&&"content"in e)}var bc=class extends pe{async _call(e,r={}){let s=!1,n=!1,o=r.add_special_tokens??(this.tokenizer.add_bos_token||this.tokenizer.add_eos_token)??!1,a=r.tokenizer_encode_kwargs,i;if(typeof e=="string")i=e=[e];else if(Array.isArray(e)&&e.every(w=>typeof w=="string"))s=!0,i=e;else{if(ZA(e))e=[e];else if(Array.isArray(e)&&e.every(ZA))s=!0;else throw new Error("Input must be a string, an array of strings, a Chat, or an array of Chats");n=!0,i=e.map(w=>this.tokenizer.apply_chat_template(w,{tokenize:!1,add_generation_prompt:!0,...a})),o=!1,a=void 0}let l=n?!1:r.return_full_text??!0;this.tokenizer.padding_side="left";let u=this.tokenizer(i,{add_special_tokens:o,padding:!0,truncation:!0,...a}),d=await this.model.generate({...u,...r}),f=this.tokenizer.batch_decode(d,{skip_special_tokens:!0}),m;!l&&u.input_ids.dims.at(-1)>0&&(m=this.tokenizer.batch_decode(u.input_ids,{skip_special_tokens:!0}).map(w=>w.length));let _=Array.from({length:e.length},w=>[]);for(let w=0;w<f.length;++w){let x=Math.floor(w/d.dims[0]*e.length);m&&(f[w]=f[w].slice(m[x])),_[x].push({generated_text:n?[...e[x],{role:"assistant",content:f[w]}]:f[w]})}return!s&&_.length===1?_[0]:_}};var vc=class extends pe{constructor(e){super(e),this.label2id=Object.fromEntries(Object.entries(this.model.config.label2id).map(([r,s])=>[r.toLowerCase(),s])),this.entailment_id=this.label2id.entailment,this.entailment_id===void 0&&(console.warn("Could not find 'entailment' in label2id mapping. 
Using 2 as entailment_id."),this.entailment_id=2),this.contradiction_id=this.label2id.contradiction??this.label2id.not_entailment,this.contradiction_id===void 0&&(console.warn("Could not find 'contradiction' in label2id mapping. Using 0 as contradiction_id."),this.contradiction_id=0)}async _call(e,r,{hypothesis_template:s="This example is {}.",multi_label:n=!1}={}){let o=Array.isArray(e);o||(e=[e]),Array.isArray(r)||(r=[r]);let a=r.map(u=>s.replace("{}",u)),i=n||r.length===1,l=[];for(let u of e){let d=[];for(let _ of a){let w=this.tokenizer(u,{text_pair:_,padding:!0,truncation:!0}),x=await this.model(w);i?d.push([x.logits.data[this.contradiction_id],x.logits.data[this.entailment_id]]):d.push(x.logits.data[this.entailment_id])}let m=(i?d.map(_=>Oe(_)[1]):Oe(d)).map((_,w)=>[_,w]).sort((_,w)=>w[0]-_[0]);l.push({sequence:u,labels:m.map(_=>r[_[1]]),scores:m.map(_=>_[0])})}return o?l:l[0]}};var kc=class extends pe{async _call(e,{top_k:r=5}={}){let s=this.processor.feature_extractor.config.sampling_rate,n=await ss(e,s),o=this.model.config.id2label,a=[];for(let i of n){let l=await this.processor(i),d=(await this.model(l)).logits[0],f=await Gt(new U("float32",Oe(d.data),d.dims),r),m=f[0].tolist(),w=f[1].tolist().map((x,k)=>({label:o?o[x]:`LABEL_${x}`,score:m[k]}));a.push(w)}return Array.isArray(e)?a:a[0]}};var Ec=class extends pe{async _call(e,r,{hypothesis_template:s="This is a sound of {}."}={}){let n=!Array.isArray(e);n&&(e=[e]);let o=r.map(d=>s.replace("{}",d)),a=this.tokenizer(o,{padding:!0,truncation:!0}),i=this.processor.feature_extractor.config.sampling_rate,l=await ss(e,i),u=[];for(let d of l){let f=await this.processor(d),m=await this.model({...a,...f}),_=Oe(m.logits_per_audio.data);u.push([..._].map((w,x)=>({score:w,label:r[x]})))}return n?u[0]:u}};var Ac=class extends pe{async _call(e,r={}){switch(this.model.config.model_type){case"whisper":case"lite-whisper":return 
this._call_whisper(e,r);case"wav2vec2":case"wav2vec2-bert":case"unispeech":case"unispeech-sat":case"hubert":case"parakeet_ctc":return this._call_wav2vec2(e,r);case"moonshine":return this._call_moonshine(e,r);default:throw new Error(`AutomaticSpeechRecognitionPipeline does not support model type '${this.model.config.model_type}'.`)}}
/* _call_wav2vec2(e, r): path for the CTC-style model types listed in the switch above. The language and task options are not supported and only produce a warning. For each audio input it takes index 1 of Te(frame logits) as the token id per frame, decodes the ids with the tokenizer and trims the text. Returns {text} or an array of {text}. */
async _call_wav2vec2(e,r){r.language&&console.warn('`language` parameter is not yet supported for `wav2vec2` models, defaulting to "English".'),r.task&&console.warn('`task` parameter is not yet supported for `wav2vec2` models, defaulting to "transcribe".');let s=!Array.isArray(e),n=s?[e]:e,o=this.processor.feature_extractor.config.sampling_rate,a=await ss(n,o),i=[];for(let l of a){let u=await this.processor(l),f=(await this.model(u)).logits[0],m=[];for(let w of f)m.push(Te(w.data)[1]);let _=this.tokenizer.decode(m,{skip_special_tokens:!0}).trim();i.push({text:_})}return s?i[0]:i}
/* _call_whisper(e, r): reads return_timestamps, chunk_length_s, force_full_sequences and stride_length_s from r. return_timestamps === "word" switches generation to token-level timestamps. When chunk_length_s > 0 the audio is cut into windows of chunk_length_s seconds that advance by (chunk - 2 * stride) samples; stride_length_s defaults to chunk_length_s / 6 and must be smaller than chunk_length_s. Each window records [length, left stride, right stride], with the stride set to 0 at the start and end of the audio. Without chunking the whole audio is a single window. The per-window generation loop continues on the next line. */
async _call_whisper(e,r){let s=r.return_timestamps??!1,n=r.chunk_length_s??0,o=r.force_full_sequences??!1,a=r.stride_length_s??null,i={...r};s==="word"&&(i.return_token_timestamps=!0,i.return_timestamps=!1);let l=!Array.isArray(e),u=l?[e]:e,d=this.processor.feature_extractor.config,f=d.chunk_length/this.model.config.max_source_positions,m=d.hop_length,_=d.sampling_rate,w=await ss(u,_),x=[];for(let k of w){let E=[];if(n>0){if(a===null)a=n/6;else if(n<=a)throw Error("`chunk_length_s` must be larger than `stride_length_s`.");let T=_*n,z=_*a,C=T-2*z,v=0;for(;;){let G=v+T,X=k.subarray(v,G),V=await this.processor(X),Q=v===0,K=G>=k.length;if(E.push({stride:[X.length,Q?0:z,K?0:z],input_features:V.input_features,is_last:K}),K)break;v+=C}}else E=[{stride:[k.length,0,0],input_features:(await this.processor(k)).input_features,is_last:!0}];for(let T of E){i.num_frames=Math.floor(T.stride[0]/m);let z=await 
this.model.generate({inputs:T.input_features,...i});s==="word"?(T.tokens=z.sequences.tolist()[0],T.token_timestamps=z.token_timestamps.tolist()[0].map(C=>ms(C,2))):T.tokens=z[0].tolist(),T.stride=T.stride.map(C=>C/_)}let[M,I]=this.tokenizer._decode_asr(E,{time_precision:f,return_timestamps:s,force_full_sequences:o});x.push({text:M,...I})}return l?x[0]:x}async _call_moonshine(e,r){let s=!Array.isArray(e),n=s?[e]:e,o=this.processor.feature_extractor.config.sampling_rate,a=await ss(n,o),i=[];for(let l of a){let u=await this.processor(l),d=Math.floor(l.length/o)*6,f=await this.model.generate({max_new_tokens:d,...r,...u}),m=this.processor.batch_decode(f,{skip_special_tokens:!0})[0];i.push({text:m})}return s?i[0]:i}};var Mc=class extends pe{DEFAULT_VOCODER_ID="Xenova/speecht5_hifigan";constructor(e){super(e),this.vocoder=e.vocoder??null}async _prepare_speaker_embeddings(e,r){if((typeof e=="string"||e instanceof URL)&&(e=new Float32Array(await(await fetch(e)).arrayBuffer())),e instanceof Float32Array)e=new U("float32",e,[e.length]);else if(!(e instanceof U))throw new Error("Speaker embeddings must be a `Tensor`, `Float32Array`, `string`, or `URL`.");if(r>1){if(e.dims[0]===1)e=e.repeat(r,1);else if(e.dims[0]!==r)throw new Error(`Expected speaker embeddings batch size to be 1 or ${r}, but got ${e.dims[0]}.`)}return e}_postprocess_waveform(e,r,s,n=null){let o=r.data,[a,i]=r.dims,l=n?n.data:null,u=[];for(let d=0;d<a;++d){let f=l?Math.min(Math.ceil(l[d]),i):i,m=d*i;u.push(new An(o.slice(m,m+f),s))}return Array.isArray(e)?u:u[0]}async _call(e,r){return this.processor?this._call_text_to_spectrogram(e,r):this.model.config.model_type==="supertonic"?this._call_supertonic(e,r):this._call_text_to_waveform(e)}async _call_supertonic(e,{speaker_embeddings:r,num_inference_steps:s,speed:n}){if(!r)throw new Error("Speaker embeddings must be provided for Supertonic 
models.");let{sampling_rate:o,style_dim:a}=this.model.config,i=this.tokenizer(e,{padding:!0,truncation:!0}),l=i.input_ids.dims[0];r=await this._prepare_speaker_embeddings(r,l),r=r.view(l,-1,a);let{waveform:u,durations:d}=await this.model.generate_speech({...i,style:r,num_inference_steps:s,speed:n});return this._postprocess_waveform(e,u,o,d)}async _call_text_to_waveform(e){let r=this.tokenizer(e,{padding:!0,truncation:!0}),{waveform:s}=await this.model(r),n=this.model.config.sampling_rate;return this._postprocess_waveform(e,s,n)}async _call_text_to_spectrogram(e,{speaker_embeddings:r}){this.vocoder||(console.log("No vocoder specified, using default HifiGan vocoder."),this.vocoder=await pr.from_pretrained(this.DEFAULT_VOCODER_ID,{dtype:"fp32"}));let{input_ids:s}=this.tokenizer(e,{padding:!0,truncation:!0}),n=s.dims[0];r=await this._prepare_speaker_embeddings(r,n),r=r.view(n,-1);let{waveform:o}=await this.model.generate_speech(s,r,{vocoder:this.vocoder}),a=this.processor.feature_extractor.config.sampling_rate;return this._postprocess_waveform(e,o,a)}};var Tc=class extends pe{async _call(e,r={}){let s=Array.isArray(e),n=await Ye(e),{pixel_values:o}=await this.processor(n),a=[];for(let i of o){i.dims=[1,...i.dims];let l=await this.model.generate({inputs:i,...r}),u=this.tokenizer.batch_decode(l,{skip_special_tokens:!0}).map(d=>({generated_text:d.trim()}));a.push(u)}return s?a:a[0]}};var Sc=class extends pe{async _call(e,{top_k:r=5}={}){let s=await Ye(e),{pixel_values:n}=await this.processor(s),o=await this.model({pixel_values:n}),{id2label:a}=this.model.config,i=[];for(let l of o.logits){let u=await Gt(new U("float32",Oe(l.data),l.dims),r),d=u[0].tolist(),m=u[1].tolist().map((_,w)=>({label:a?a[_]:`LABEL_${_}`,score:d[w]}));i.push(m)}return Array.isArray(e)?i:i[0]}};var e2={panoptic:"post_process_panoptic_segmentation",instance:"post_process_instance_segmentation",semantic:"post_process_semantic_segmentation"},en=class extends pe{async 
_call(e,{threshold:r=.5,mask_threshold:s=.5,overlap_mask_area_threshold:n=.8,label_ids_to_fuse:o=null,target_sizes:a=null,subtask:i=null}={}){if(Array.isArray(e)&&e.length!==1)throw Error("Image segmentation pipeline currently only supports a batch size of 1.");let u=await Ye(e),d=u.map(M=>[M.height,M.width]),f=await this.processor(u),{inputNames:m,outputNames:_}=this.model.sessions.model;if(!m.includes("pixel_values")){if(m.length!==1)throw Error(`Expected a single input name, but got ${m.length} inputs: ${m}.`);let M=m[0];if(M in f)throw Error(`Input name ${M} already exists in the inputs.`);f[M]=f.pixel_values}let w=await this.model(f),x=null;if(i!==null)x=e2[i];else if(this.processor.image_processor){for(let[M,I]of Object.entries(e2))if(I in this.processor.image_processor){x=this.processor.image_processor[I].bind(this.processor.image_processor),i=M;break}}let k=this.model.config.id2label,E=[];if(i)if(i==="panoptic"||i==="instance"){let M=x(w,r,s,n,o,a??d)[0],I=M.segmentation;for(let T of M.segments_info){let z=new Uint8ClampedArray(I.data.length);for(let v=0;v<I.data.length;++v)I.data[v]===T.id&&(z[v]=255);let C=new Xe(z,I.dims[1],I.dims[0],1);E.push({score:T.score,label:k[T.label_id],mask:C})}}else if(i==="semantic"){let{segmentation:M,labels:I}=x(w,a??d)[0];for(let T of I){let z=new Uint8ClampedArray(M.data.length);for(let v=0;v<M.data.length;++v)M.data[v]===T&&(z[v]=255);let C=new Xe(z,M.dims[1],M.dims[0],1);E.push({score:null,label:k[T],mask:C})}}else throw Error(`Subtask ${i} not supported.`);else{let I=w[_[0]];for(let T=0;T<d.length;++T){let z=d[T],C=I[T];C.data.some(G=>G<-1e-5||G>1+1e-5)&&C.sigmoid_();let v=await Xe.fromTensor(C.mul_(255).to("uint8")).resize(z[1],z[0]);E.push({label:null,score:null,mask:v})}}return E}};var Oc=class extends en{async _call(e,r={}){let s=await Ye(e),n=await super._call(e,r),o=s.map((a,i)=>{let l=a.clone();return l.putAlpha(n[i].mask),l});return Array.isArray(e)?o:o[0]}};var Ic=class extends pe{async 
_call(e,r,{hypothesis_template:s="This is a photo of {}"}={}){let n=Array.isArray(e),o=await Ye(e),a=r.map(m=>s.replace("{}",m)),i=this.tokenizer(a,{padding:this.model.config.model_type==="siglip"?"max_length":!0,truncation:!0}),{pixel_values:l}=await this.processor(o),u=await this.model({...i,pixel_values:l}),d=this.model.config.model_type==="siglip"?m=>m.sigmoid().data:m=>Oe(m.data),f=[];for(let m of u.logits_per_image){let w=[...d(m)].map((x,k)=>({score:x,label:r[k]}));w.sort((x,k)=>k.score-x.score),f.push(w)}return n?f:f[0]}};var Cc=class extends pe{async _call(e,{threshold:r=.9,percentage:s=!1}={}){let n=Array.isArray(e);if(n&&e.length!==1)throw Error("Object detection pipeline currently only supports a batch size of 1.");let o=await Ye(e),a=s?null:o.map(_=>[_.height,_.width]),{pixel_values:i,pixel_mask:l}=await this.processor(o),u=await this.model({pixel_values:i,pixel_mask:l}),d=this.processor.image_processor.post_process_object_detection(u,r,a),{id2label:f}=this.model.config,m=d.map(_=>_.boxes.map((w,x)=>({score:_.scores[x],label:f[_.classes[x]],box:mc(w,!s)})));return n?m:m[0]}};var Pc=class extends pe{async _call(e,r,{threshold:s=.1,top_k:n=null,percentage:o=!1}={}){let a=Array.isArray(e),i=await Ye(e),l=this.tokenizer(r,{padding:!0,truncation:!0}),u=await this.processor(i),d=[];for(let f=0;f<i.length;++f){let m=i[f],_=o?null:[[m.height,m.width]],w=u.pixel_values[f].unsqueeze_(0),x=await this.model({...l,pixel_values:w}),k;if("post_process_grounded_object_detection"in this.processor){let E=this.processor.post_process_grounded_object_detection(x,l.input_ids,{box_threshold:s,text_threshold:s,target_sizes:_})[0];k=E.boxes.map((M,I)=>({score:E.scores[I],label:E.labels[I],box:mc(M,!o)}))}else{let E=this.processor.image_processor.post_process_object_detection(x,s,_,!0)[0];k=E.boxes.map((M,I)=>({score:E.scores[I],label:r[E.classes[I]],box:mc(M,!o)}))}k.sort((E,M)=>M.score-E.score),n!==null&&(k=k.slice(0,n)),d.push(k)}return a?d:d[0]}};var zc=class extends 
pe{async _call(e,r,s={}){
/* Document question answering (class zc, registered under "document-question-answering"); batch size 1 only. Builds the decoder prompt from the question r, generates with max_length taken from config.decoder.max_position_embeddings (overridable through s), and extracts the text between <s_answer> and </s_answer> from the decoded output. Returns [{answer}] where answer is null when no such span is found. */
if(Array.isArray(e)){if(e.length!==1)throw Error("Document Question Answering pipeline currently only supports a batch size of 1.");e=e[0]}let n=(await Ye(e))[0],{pixel_values:o}=await this.processor(n),a=`<s_docvqa><s_question>${r}</s_question><s_answer>`,i=this.tokenizer(a,{add_special_tokens:!1,padding:!0,truncation:!0}).input_ids,l=await this.model.generate({inputs:o,max_length:this.model.config.decoder.max_position_embeddings,decoder_input_ids:i,...s}),d=this.tokenizer.batch_decode(l)[0].match(/<s_answer>(.*?)<\/s_answer>/),f=null;return d&&d.length>=2&&(f=d[1].trim()),[{answer:f}]}};
/* Lc: pipeline registered under "image-to-image". Each reconstruction tensor is squeezed, clamped to [0, 1], scaled to 0..255, rounded and converted to an image. */
var Lc=class extends pe{async _call(e){let r=await Ye(e),s=await this.processor(r),n=await this.model(s),o=[];for(let a of n.reconstruction){let i=a.squeeze().clamp_(0,1).mul_(255).round_().to("uint8");o.push(Xe.fromTensor(i))}return Array.isArray(e)?o:o[0]}};
/* Nc: pipeline registered under "depth-estimation". The predicted depth is resized (bilinear) to the input image size via Pt; predicted_depth is that resized tensor and depth is an 8-bit image obtained by min-max scaling it to 0..255. NOTE(review): when max equals min the scaling divides by zero; confirm whether constant depth maps can occur. */
var Nc=class extends pe{async _call(e){let r=await Ye(e),s=await this.processor(r),{predicted_depth:n}=await this.model(s),o=[];for(let a=0;a<r.length;++a){let i=n[a],[l,u]=i.dims.slice(-2),[d,f]=r[a].size,m=(await Pt(i.view(1,1,l,u),{size:[f,d],mode:"bilinear"})).view(f,d),_=m.min().item(),w=m.max().item(),x=m.sub(_).div_(w-_).mul_(255).to("uint8").unsqueeze(0),k=Xe.fromTensor(x);o.push({predicted_depth:m,depth:k})}return Array.isArray(e)?o:o[0]}};
/* $c: pipeline registered under "feature-extraction". Takes last_hidden_state, else logits, else token_embeddings from the model output; pooling is one of "none", "mean" (C0 with the attention mask), "first_token"/"cls" or "last_token"/"eos"; normalize applies normalize(2, -1); quantize passes the result and the precision to L0. */
var $c=class extends pe{async _call(e,{pooling:r="none",normalize:s=!1,quantize:n=!1,precision:o="binary"}={}){let a=this.tokenizer(e,{padding:!0,truncation:!0}),i=await this.model(a),l=i.last_hidden_state??i.logits??i.token_embeddings;switch(r){case"none":break;case"mean":l=C0(l,a.attention_mask);break;case"first_token":case"cls":l=l.slice(null,0);break;case"last_token":case"eos":l=l.slice(null,-1);break;default:throw Error(`Pooling method '${r}' not supported.`)}return s&&(l=l.normalize(2,-1)),n&&(l=L0(l,o)),l}};
/* Rc: pipeline registered under "image-feature-extraction"; its body continues on the next line. */
var Rc=class extends pe{async _call(e,{pool:r=null}={}){let s=await Ye(e),{pixel_values:n}=await this.processor(s),o=await 
this.model({pixel_values:n}),a;if(r){if(!("pooler_output"in o))throw Error("No pooled output was returned. Make sure the model has a 'pooler' layer when using the 'pool' option.");a=o.pooler_output}else a=o.last_hidden_state??o.logits??o.image_embeds;return a}};
/* t2: frozen registry keyed by task name. Each entry names the pipeline class, the loader class used for the model (an array means "try these in order"), the optional tokenizer / processor classes (null inside a processor array means "no processor for that candidate"), a default model id with an optional default dtype, and a type tag. The literal continues on the next line. */
var t2=Object.freeze({"text-classification":{tokenizer:J,pipeline:hc,model:Ua,default:{model:"Xenova/distilbert-base-uncased-finetuned-sst-2-english"},type:"text"},"token-classification":{tokenizer:J,pipeline:_c,model:Ql,default:{model:"Xenova/bert-base-multilingual-cased-ner-hrl"},type:"text"},"question-answering":{tokenizer:J,pipeline:gc,model:sc,default:{model:"Xenova/distilbert-base-cased-distilled-squad"},type:"text"},"fill-mask":{tokenizer:J,pipeline:wc,model:rc,default:{model:"onnx-community/ettin-encoder-32m-ONNX",dtype:"fp32"},type:"text"},summarization:{tokenizer:J,pipeline:xc,model:Zs,default:{model:"Xenova/distilbart-cnn-6-6"},type:"text"},translation:{tokenizer:J,pipeline:yc,model:Zs,default:{model:"Xenova/t5-small"},type:"text"},"text2text-generation":{tokenizer:J,pipeline:Lr,model:Zs,default:{model:"Xenova/flan-t5-small"},type:"text"},"text-generation":{tokenizer:J,pipeline:bc,model:tc,default:{model:"onnx-community/Qwen3-0.6B-ONNX",dtype:"q4"},type:"text"},"zero-shot-classification":{tokenizer:J,pipeline:vc,model:Ua,default:{model:"Xenova/distilbert-base-uncased-mnli"},type:"text"},"audio-classification":{pipeline:kc,model:cc,processor:lt,default:{model:"Xenova/wav2vec2-base-superb-ks"},type:"audio"},"zero-shot-audio-classification":{tokenizer:J,pipeline:Ec,model:pr,processor:lt,default:{model:"Xenova/clap-htsat-unfused"},type:"multimodal"},"automatic-speech-recognition":{tokenizer:J,pipeline:Ac,model:[Jl,lc],processor:lt,default:{model:"Xenova/whisper-tiny.en"},type:"multimodal"},"text-to-audio":{tokenizer:J,pipeline:Mc,model:[ec,Zl],processor:[lt,null],default:{model:"onnx-community/Supertonic-TTS-ONNX",dtype:"fp32"},type:"text"},"image-to-text":{tokenizer:J,pipeline:Tc,model:nc,processor:lt
,default:{model:"Xenova/vit-gpt2-image-captioning"},type:"multimodal"},"image-classification":{pipeline:Sc,model:oc,processor:lt,default:{model:"Xenova/vit-base-patch16-224"},type:"multimodal"},"image-segmentation":{pipeline:en,model:[Ba,Da,Fa],processor:lt,default:{model:"Xenova/detr-resnet-50-panoptic"},type:"multimodal"},"background-removal":{pipeline:Oc,model:[Ba,Da,Fa],processor:lt,default:{model:"Xenova/modnet"},type:"image"},"zero-shot-image-classification":{tokenizer:J,pipeline:Ic,model:pr,processor:lt,default:{model:"Xenova/clip-vit-base-patch32"},type:"multimodal"},"object-detection":{pipeline:Cc,model:ac,processor:lt,default:{model:"Xenova/detr-resnet-50"},type:"multimodal"},"zero-shot-object-detection":{tokenizer:J,pipeline:Pc,model:ic,processor:lt,default:{model:"Xenova/owlvit-base-patch32"},type:"multimodal"},"document-question-answering":{tokenizer:J,pipeline:zc,model:uc,processor:lt,default:{model:"Xenova/donut-base-finetuned-docvqa"},type:"multimodal"},"image-to-image":{pipeline:Lc,model:pc,processor:lt,default:{model:"Xenova/swin2SR-classical-sr-x2-64"},type:"image"},"depth-estimation":{pipeline:Nc,model:dc,processor:lt,default:{model:"onnx-community/depth-anything-v2-small"},type:"image"},"feature-extraction":{tokenizer:J,pipeline:$c,model:pr,default:{model:"onnx-community/all-MiniLM-L6-v2-ONNX",dtype:"fp32"},type:"text"},"image-feature-extraction":{processor:lt,pipeline:Rc,model:[fc,pr],default:{model:"onnx-community/dinov3-vits16-pretrain-lvd1689m-ONNX",dtype:"fp32"},type:"image"}}),cz=Object.freeze({"sentiment-analysis":"text-classification",ner:"token-classification",asr:"automatic-speech-recognition","text-to-speech":"text-to-audio",embeddings:"feature-extraction"});async function uz(t,e=null,{progress_callback:r=null,config:s=null,cache_dir:n=null,local_files_only:o=!1,revision:a="main",device:i=null,dtype:l=null,subfolder:u="onnx",use_external_data_format:d=null,model_file_name:f=null,session_options:m={}}={}){t=cz[t]??t;let 
_=t2[t.split("_",1)[0]];if(!_)throw Error(`Unsupported pipeline: ${t}. Must be one of [${Object.keys(t2)}]`);e||(e=_.default.model,console.log(`No model specified. Using default model: "${e}".`),!l&&_.default.dtype&&(l=_.default.dtype));let w={progress_callback:r,config:s,cache_dir:n,local_files_only:o,revision:a,device:i,dtype:l,subfolder:u,use_external_data_format:d,model_file_name:f,session_options:m},x=new Map([["tokenizer",_.tokenizer],["model",_.model],["processor",_.processor]]),k=await pz(x,e,w);k.task=t,wr(r,{status:"ready",task:t,model:e});let E=_.pipeline;return new E(k)}async function pz(t,e,r){let s=Object.create(null),n=[];for(let[o,a]of t.entries()){if(!a)continue;let i;Array.isArray(a)?i=new Promise(async(l,u)=>{let d;for(let f of a){if(f===null){l(null);return}try{l(await f.from_pretrained(e,r));return}catch(m){if(m.message?.includes("Unsupported model type"))d=m;else if(m.message?.includes("Could not locate file"))d=m;else{u(m);return}}}u(d)}):i=a.from_pretrained(e,r),s[o]=i,n.push(i)}await Promise.all(n);for(let[o,a]of Object.entries(s))s[o]=await a;return s}var dz=t=>t>=19968&&t<=40959||t>=13312&&t<=19903||t>=131072&&t<=173791||t>=173824&&t<=177983||t>=177984&&t<=178207||t>=178208&&t<=183983||t>=63744&&t<=64255||t>=194560&&t<=195103,Vx=class{put(e){throw Error("Not implemented")}end(){throw Error("Not implemented")}},r2=be.IS_PROCESS_AVAILABLE?t=>process.stdout.write(t):t=>console.log(t),Hx=class extends Vx{constructor(e,{skip_prompt:r=!1,callback_function:s=null,token_callback_function:n=null,skip_special_tokens:o=!0,decode_kwargs:a={},...i}={}){super(),this.tokenizer=e,this.skip_prompt=r,this.callback_function=s??r2,this.token_callback_function=n,this.decode_kwargs={skip_special_tokens:o,...a,...i},this.token_cache=[],this.print_len=0,this.next_tokens_are_prompt=!0}put(e){if(e.length>1)throw Error("TextStreamer only supports batch size of 1");let r=this.next_tokens_are_prompt;if(r&&(this.next_tokens_are_prompt=!1,this.skip_prompt))return;let 
s=e[0];this.token_callback_function?.(s),this.token_cache=dt(this.token_cache,s);let n=this.tokenizer.decode(this.token_cache,this.decode_kwargs),o;r||n.endsWith(`
|
|
27
|
+
`}):(console.warn("You are passing both `text` and `images` to `PaliGemmaProcessor`. The processor expects special image tokens in the text, as many tokens as there are images per each text. It is recommended to add `<image>` tokens in the very beginning of your text. For this call, we will infer how many images each text has and add special tokens."),a=r.map(u=>FP(u,n,o,Pn,e.length)));let i=this.tokenizer(a,s);return{...await this.image_processor(e,s),...i}}};var _A="<|image|>",jP=/<\|image_\d+\|>/g,$d=class extends ne{static image_processor_class=Le;static tokenizer_class=J;async _call(e,r=null,{padding:s=!0,truncation:n=!0,num_crops:o=null}={}){Array.isArray(e)||(e=[e]);let a,i;if(r){i=await this.image_processor(r,{num_crops:o});let{num_img_tokens:l}=i,u=e.map((f,m)=>f.split(jP).join(_A.repeat(l[m])));a=this.tokenizer(u,{padding:s,truncation:n});let d=this.tokenizer._tokenizer.token_to_id(_A);a.input_ids.map_(f=>f==d?-f:f)}else a=this.tokenizer(e);return{...a,...i}}};var Rd=class extends ne{static tokenizer_class=J;static image_processor_class=Le;static uses_processor_config=!0;async _call(e,r=null,s={}){let n=await this.image_processor(e,s);if(r){let[a,i]=n.pixel_values.dims.slice(-2),{image_token:l,image_break_token:u,image_end_token:d,patch_size:f,spatial_merge_size:m}=this.config,_=f*m,w=Math.floor(a/_),x=Math.floor(i/_);r=structuredClone(r),Array.isArray(r)||(r=[r]);for(let k=0;k<r.length;++k){let E=l.repeat(x),M=E+u,I=E+d,T=M.repeat(w-1)+I;r[k]=r[k].replace(l,T)}}let o=r?this.tokenizer(r,s):{};return{...n,...o}}};var Ud=class extends ne{static feature_extractor_class=Sn;async _call(e){return await this.feature_extractor(e)}post_process_speaker_diarization(...e){return this.feature_extractor.post_process_speaker_diarization(...e)}get sampling_rate(){return this.feature_extractor.config.sampling_rate}};var Bd=class extends ne{static image_processor_class=Le;static tokenizer_class=J;async _call(e,r=null,...s){Array.isArray(e)||(e=[e]);let n,o;if(r&&(n=await 
this.image_processor(r),o=n.image_grid_thw),o){let i=this.image_processor.config.merge_size**2,l=0,u=o.tolist();e=e.map(d=>{for(;d.includes("<|image_pad|>");){let f=Number(u[l++].reduce((m,_)=>m*_,1n));d=d.replace("<|image_pad|>","<|placeholder|>".repeat(Math.floor(f/i)))}return d.replaceAll("<|placeholder|>","<|image_pad|>")})}return{...this.tokenizer(e),...n}}};var zn=class extends ne{static image_processor_class=Le;async _call(...e){return await this.image_processor(...e)}post_process_masks(...e){return this.image_processor.post_process_masks(...e)}reshape_input_points(...e){return this.image_processor.reshape_input_points(...e)}};var Li=class extends zn{},Dd=class extends Li{};var Fd=class extends ne{static tokenizer_class=J;static feature_extractor_class=Ze;async _call(e){return await this.feature_extractor(e)}};var jd=class extends ne{static tokenizer_class=J;static feature_extractor_class=Ze;static uses_processor_config=!0;async _call(e,r=null,s={}){if(Array.isArray(e))throw new Error("Batched inputs are not supported yet.");let n={};if(r){let a=r.length,{input_features:i}=await this.feature_extractor(r,{...s,max_length:a}),l=Math.round(a/this.config.encoder_ds_factor+1e-4),u=1+Math.ceil(l/this.config.stack_factor);n.audio_token_len=[u],n.audio_values=i;let d=this.config.audio_placeholder;if(!e.includes(d))throw new Error(`The input text does not contain the image token ${d}.`);e=e.replaceAll(d,d.repeat(u))}return{...this.tokenizer(e,{add_special_tokens:!1,...s}),...n}}};var Gd="[AUDIO]",GP="[BEGIN_AUDIO]",qP=375;function WP(t,e){let r=[];for(let s=0;s<t.length;s+=e)r.push(t.subarray(s,Math.min(s+e,t.length)));return r}var qd=class extends ne{static tokenizer_class=J;static feature_extractor_class=Ze;static uses_processor_config=!1;async _call(e,r=null,s={}){if(Array.isArray(e))throw new Error("Batched inputs are not supported yet.");let n={};if(r){if(!e.includes(Gd))throw new Error(`The input text does not contain the audio token 
${Gd}.`);Array.isArray(r)||(r=[r]);let a=e.split(Gd),i=a.length-1;if(i!==r.length)throw new Error(`The number of audio inputs (${r.length}) does not match the number of audio tokens in the text (${i}).`);let l=this.feature_extractor.config.n_samples,u=r.map(w=>WP(w,l)),d=u.map(w=>w.length),f=u.flat(),m=(await Promise.all(f.map(w=>this.feature_extractor(w,s)))).map(w=>w.input_features);n.audio_values=m.length>1?Ee(m,0):m[0];let _=a[0];for(let w=0;w<d.length;++w){_+=GP;for(let x=0;x<d[w];++x)_+=Gd.repeat(qP);_+=a[w+1]}e=_}return{...this.tokenizer(e,{add_special_tokens:!1,...s}),...n}}};var Wd=class extends ne{static tokenizer_class=J;static feature_extractor_class=Ze;async _call(e){return await this.feature_extractor(e)}};var Vd=class extends ne{static tokenizer_class=J;static feature_extractor_class=Ze;async _call(e){return await this.feature_extractor(e)}};var Hd=class extends ne{static tokenizer_class=J;static feature_extractor_class=Ze;async _call(e){return await this.feature_extractor(e)}};var lt=class{static async from_pretrained(e,r={}){let s=await it(e,En,!0,r),{image_processor_type:n,feature_extractor_type:o,processor_class:a}=s;if(a&&Xd[a])return Xd[a].from_pretrained(e,r);if(!n&&!o)throw new Error("No `image_processor_type` or `feature_extractor_type` found in the config.");let i={};if(n){let u=Cn[n.replace(/Fast$/,"")];if(!u)throw new Error(`Unknown image_processor_type: '${n}'.`);i.image_processor=new u(s)}if(o){let u=Cn[o];if(u)i.image_processor=new u(s);else{let d=gi[o];if(!d)throw new Error(`Unknown feature_extractor_type: '${o}'.`);i.feature_extractor=new d(s)}}let l={};return new ne(l,i,null)}};async function VP(t,e){return await it(t,"config.json",!0,e)}function Ln(t){let 
e={},r={};switch(t.model_type){case"llava":case"paligemma":case"gemma3":case"florence2":case"llava_onevision":case"idefics3":case"ultravox":case"voxtral":case"smolvlm":case"gemma3n":case"chatterbox":case"mistral3":r=Ln(t.text_config);break;case"moondream1":r=Ln(t.phi_config);break;case"musicgen":r=Ln(t.decoder);break;case"multi_modality":r=Ln(t.language_config);break;case"gpt2":case"gptj":case"jais":case"codegen":case"gpt_bigcode":e.num_heads="n_head",e.num_layers="n_layer",e.hidden_size="n_embd";break;case"gpt_neox":case"stablelm":case"opt":case"falcon":case"modernbert-decoder":e.num_heads="num_attention_heads",e.num_layers="num_hidden_layers",e.hidden_size="hidden_size";break;case"gpt_oss":case"llama":case"llama4_text":case"nanochat":case"apertus":case"arcee":case"lfm2":case"lfm2_moe":case"smollm3":case"olmo":case"olmo2":case"olmo3":case"mobilellm":case"granite":case"granitemoehybrid":case"cohere":case"mistral":case"starcoder2":case"qwen2":case"qwen2_vl":case"phi":case"phi3":case"phi3_v":case"llava_qwen2":e.num_heads="num_key_value_heads",e.num_layers="num_hidden_layers",e.hidden_size="hidden_size",e.num_attention_heads="num_attention_heads",e.dim_kv="head_dim";break;case"qwen3":case"gemma":case"gemma2":case"vaultgemma":case"gemma3_text":case"gemma3n_text":case"glm":case"helium":case"ernie4_5":case"hunyuan_v1_dense":case"falcon_h1":case"ministral":case"ministral3":e.num_heads="num_key_value_heads",e.num_layers="num_hidden_layers",e.dim_kv="head_dim";break;case"openelm":e.num_heads="num_kv_heads",e.num_layers="num_transformer_layers",e.dim_kv="head_dim";break;case"gpt_neo":case"donut-swin":e.num_heads="num_heads",e.num_layers="num_layers",e.hidden_size="hidden_size";break;case"bloom":e.num_heads="n_head",e.num_layers="n_layer",e.hidden_size="hidden_size";break;case"mpt":e.num_heads="n_heads",e.num_layers="n_layers",e.hidden_size="d_model";break;case"exaone":e.num_heads="num_key_value_heads",e.num_layers="num_layers",e.dim_kv="head_dim",e.num_attention_heads="num_at
tention_heads";break;case"youtu":e.num_heads="num_key_value_heads",e.num_layers="num_hidden_layers",e.dim_kv="qk_head_dim",e.num_attention_heads="num_attention_heads";break;case"t5":case"mt5":case"longt5":e.num_decoder_layers="num_decoder_layers",e.num_decoder_heads="num_heads",e.decoder_dim_kv="d_kv",e.num_encoder_layers="num_layers",e.num_encoder_heads="num_heads",e.encoder_dim_kv="d_kv";break;case"bart":case"mbart":case"marian":case"whisper":case"lite-whisper":case"m2m_100":case"blenderbot":case"blenderbot-small":case"florence2_language":e.num_decoder_layers="decoder_layers",e.num_decoder_heads="decoder_attention_heads",e.decoder_hidden_size="d_model",e.num_encoder_layers="encoder_layers",e.num_encoder_heads="encoder_attention_heads",e.encoder_hidden_size="d_model";break;case"speecht5":e.num_decoder_layers="decoder_layers",e.num_decoder_heads="decoder_attention_heads",e.decoder_hidden_size="hidden_size",e.num_encoder_layers="encoder_layers",e.num_encoder_heads="encoder_attention_heads",e.encoder_hidden_size="hidden_size";break;case"trocr":e.num_encoder_layers=e.num_decoder_layers="decoder_layers",e.num_encoder_heads=e.num_decoder_heads="decoder_attention_heads",e.encoder_hidden_size=e.decoder_hidden_size="d_model";break;case"musicgen_decoder":e.num_encoder_layers=e.num_decoder_layers="num_hidden_layers",e.num_encoder_heads=e.num_decoder_heads="num_attention_heads",e.encoder_hidden_size=e.decoder_hidden_size="hidden_size";break;case"moonshine":e.num_decoder_layers="decoder_num_hidden_layers",e.num_decoder_heads="decoder_num_key_value_heads",e.num_encoder_layers="encoder_num_hidden_layers",e.num_encoder_heads="encoder_num_key_value_heads",e.encoder_hidden_size=e.decoder_hidden_size="hidden_size";break;case"vision-encoder-decoder":let n=Ln(t.decoder),o="num_decoder_layers"in n,a=at(t,["model_type","is_encoder_decoder"]);return 
o?(a.num_decoder_layers=n.num_decoder_layers,a.num_decoder_heads=n.num_decoder_heads,a.decoder_hidden_size=n.decoder_hidden_size,a.num_encoder_layers=n.num_encoder_layers,a.num_encoder_heads=n.num_encoder_heads,a.encoder_hidden_size=n.encoder_hidden_size):(a.num_layers=n.num_layers,a.num_heads=n.num_heads,a.hidden_size=n.hidden_size),a}let s={...r,...at(t,["model_type","multi_query","is_encoder_decoder"])};for(let n in e)s[n]=t[e[n]];return s}function Kd(t,e){if(["lfm2","lfm2_moe"].includes(t.model_type)){let r=e?.prefix??"past_key_values",s=r==="present"?"present":"past",n={},{layer_types:o,num_attention_heads:a,num_key_value_heads:i,hidden_size:l,conv_L_cache:u}=t,d=l/a,f=e?.batch_size??1;for(let m=0;m<o.length;++m)if(o[m]==="full_attention")for(let _ of["key","value"])n[`${r}.${m}.${_}`]=[f,i,0,d];else if(o[m]==="conv")n[`${s}_conv.${m}`]=[f,l,u];else throw new Error(`Unsupported layer type: ${o[m]}`);return n}else if(["granitemoehybrid","falcon_h1"].includes(t.model_type)){let r=e?.prefix??"past_key_values",s=r==="present"?"present":"past",n={},{layer_types:o,num_hidden_layers:a,num_attention_heads:i,num_key_value_heads:l,hidden_size:u,mamba_d_conv:d,mamba_n_heads:f,mamba_d_head:m,mamba_d_state:_,mamba_n_groups:w,mamba_expand:x,mamba_d_ssm:k}=t,E=u/i,M=e?.batch_size??1,I=(k??x*u)+2*w*_;for(let T=0;T<a;++T)if((!o||o[T]==="mamba")&&(n[`${s}_conv.${T}`]=[M,I,d],n[`${s}_ssm.${T}`]=[M,f,m,_]),!o||o[T]==="attention")for(let z of["key","value"])n[`${r}.${T}.${z}`]=[M,l,0,E];return n}return HP(t,e)}function HP(t,{prefix:e="past_key_values",batch_size:r=1}={}){let s={},n=t.normalized_config;if(n.is_encoder_decoder&&"num_encoder_heads"in n&&"num_decoder_heads"in n){let o=n.encoder_dim_kv??n.encoder_hidden_size/n.num_encoder_heads,a=n.decoder_dim_kv??n.decoder_hidden_size/n.num_decoder_heads,i=[r,n.num_encoder_heads,0,o],l=[r,n.num_decoder_heads,0,a];for(let 
u=0;u<n.num_decoder_layers;++u)s[`${e}.${u}.encoder.key`]=i,s[`${e}.${u}.encoder.value`]=i,s[`${e}.${u}.decoder.key`]=l,s[`${e}.${u}.decoder.value`]=l}else{let o=n.num_heads,a=n.num_layers,i=n.dim_kv??n.hidden_size/(n.num_attention_heads??o);if(n.model_type==="falcon"){let l=[r*o,0,i];for(let u=0;u<a;++u)s[`${e}.${u}.key`]=l,s[`${e}.${u}.value`]=l}else if(n.multi_query){let l=[r*o,0,2*i];for(let u=0;u<a;++u)s[`${e}.${u}.key_value`]=l}else if(n.model_type==="bloom"){let l=[r*o,i,0],u=[r*o,0,i];for(let d=0;d<a;++d)s[`${e}.${d}.key`]=l,s[`${e}.${d}.value`]=u}else if(n.model_type==="openelm")for(let l=0;l<a;++l){let u=[r,o[l],0,i];s[`${e}.${l}.key`]=u,s[`${e}.${l}.value`]=u}else{let l=[r,o,0,i];for(let u=0;u<a;++u)s[`${e}.${u}.key`]=l,s[`${e}.${u}.value`]=l}}return s}var Ni=class t{model_type=null;is_encoder_decoder=!1;max_position_embeddings;"transformers.js_config";constructor(e){Object.assign(this,e),this.normalized_config=Ln(this)}static async from_pretrained(e,{progress_callback:r=null,config:s=null,cache_dir:n=null,local_files_only:o=!1,revision:a="main"}={}){s&&!(s instanceof t)&&(s=new t(s));let i=s??await VP(e,{progress_callback:r,config:s,cache_dir:n,local_files_only:o,revision:a});return new this(i)}},Xr=class{static async from_pretrained(...e){return Ni.from_pretrained(...e)}};async function gA(t,e,r,s){let n=`${e}${s}.onnx`,o=`${r.subfolder??""}/${n}`;return await ei(t,o,!0,r,be.IS_NODE_ENV)}async function wA(t,e,r,s,n,o={}){let a=`${e}${r}.onnx`,i=be.IS_NODE_ENV,l=[];if(n){let u;typeof n=="object"?n.hasOwnProperty(a)?u=n[a]:n.hasOwnProperty(e)?u=n[e]:u=!1:u=n;let d=+u;if(d>iu)throw new Error(`The number of external data chunks (${d}) exceeds the maximum allowed value (${iu}).`);for(let f=0;f<d;++f){let m=`${a}_data${f===0?"":"_"+f}`,_=`${s.subfolder??""}/${m}`;l.push(new Promise(async(w,x)=>{let k=await ei(t,_,!0,s,i);w(k instanceof Uint8Array?{path:m,data:k}:m)}))}}else o.externalData!==void 0&&(l=o.externalData.map(async u=>{if(typeof 
u.data=="string"){let d=await ei(t,u.data,!0,s);return{...u,data:d}}return u}));return Promise.all(l)}async function XP(t,e,r,s=!1){let n=r.config?.["transformers.js_config"]??{},o=r.device??n.device;o&&typeof o!="string"&&(o.hasOwnProperty(e)?o=o[e]:(console.warn(`device not specified for "${e}". Using the default device.`),o=null));let a=o??(be.IS_NODE_ENV?"cpu":"wasm"),i=HE(a),l=n.device_config??{};l.hasOwnProperty(a)&&(n={...n,...l[a]});let u=r.dtype??n.dtype;if(typeof u!="string"&&(u&&u.hasOwnProperty(e)?u=u[e]:(u=T0[a]??mt.fp32,console.warn(`dtype not specified for "${e}". Using the default dtype (${u}) for this device (${a}).`))),u===mt.auto){let z=n.dtype;typeof z!="string"&&(z=z?.[e]),z&&z!==mt.auto&&mt.hasOwnProperty(z)?u=z:u=T0[a]??mt.fp32}let d=u;if(S0.hasOwnProperty(d)){if(a==="webgpu"&&!be.IS_NODE_ENV&&d===mt.fp16&&!await YE())throw new Error(`The device (${a}) does not support fp16.`)}else throw new Error(`Invalid dtype: ${d}. Should be one of: ${Object.keys(mt).join(", ")}`);let f=n.kv_cache_dtype,m=f?typeof f=="string"?f:f[d]??"float32":void 0;if(m&&!["float32","float16"].includes(m))throw new Error(`Invalid kv_cache_dtype: ${m}. Should be one of: float32, float16`);let _=S0[d],w={...r.session_options};w.executionProviders??=i;let x=n.free_dimension_overrides;x?w.freeDimensionOverrides??=x:a.startsWith("webnn")&&!w.freeDimensionOverrides&&console.warn(`WebNN does not currently support dynamic shapes and requires 'free_dimension_overrides' to be set in config.json, preferably as a field within config["transformers.js_config"]["device_config"]["${a}"]. 
When 'free_dimension_overrides' is not set, you may experience significant performance degradation.`);let k=gA(t,e,r,_),E=r.use_external_data_format??n.use_external_data_format,M=await wA(t,e,_,r,E,w);if(M.length>0&&!be.IS_NODE_ENV&&(w.externalData=M),s&&a==="webgpu"&&f!==!1){let z=Kd(r.config,{prefix:"present"});if(Object.keys(z).length>0&&!ui()){let C={};for(let v in z)C[v]="gpu-buffer";w.preferredOutputLocation=C}}return{buffer_or_path:await k,session_options:w,session_config:{dtype:d,kv_cache_dtype:m,device:a}}}async function bt(t,e,r,s=void 0){return Object.fromEntries(await Promise.all(Object.keys(e).map(async n=>{let{buffer_or_path:o,session_options:a,session_config:i}=await XP(t,e[n],r,n===s),l=await Eu(o,a,i);return[n,l]})))}function xA(t){for(let e in t)Mu(t[e])?t[e]=new U(t[e]):typeof t[e]=="object"&&xA(t[e]);return t}async function ce(t,e){let r=KP(t,e);try{let s=Object.fromEntries(Object.entries(r).map(([o,a])=>{let i=a.ort_tensor;return be.IS_NODE_ENV&&typeof Float16Array<"u"&&i.cpuData instanceof Float16Array&&(i.cpuData=new Uint16Array(i.cpuData.buffer)),[o,i]})),n=await Au(t,s);return xA(n)}catch(s){let n=Object.fromEntries(Object.entries(r).map(([o,a])=>{let i={type:a.type,dims:a.dims,location:a.location};return i.location!=="gpu-buffer"&&(i.data=a.data),[o,i]}));throw console.error(`An error occurred during model execution: "${s}".`),console.error("Inputs given to model:",n),s}}function KP(t,e){let r=Object.create(null),s=[];for(let a of t.inputNames){let i=e[a];if(!(i instanceof U)){s.push(a);continue}r[a]=ui()?i.clone():i}if(s.length>0)throw new Error(`An error occurred during model execution: "Missing the following inputs: ${s.join(", ")}.`);let n=Object.keys(e).length,o=t.inputNames.length;if(n>o){let a=Object.keys(e).filter(i=>!t.inputNames.includes(i));console.warn(`WARNING: Too many inputs were provided (${n} > ${o}). 
The following inputs will be ignored: "${a.join(", ")}".`)}return r}var Ne=class{};var F=class extends Ne{constructor({logits:e,...r}){super(),this.logits=e;let s=Object.values(r);s.length>0&&(this.attentions=s)}},_e=class extends Ne{constructor({logits:e}){super(),this.logits=e}},we=class extends Ne{constructor({logits:e}){super(),this.logits=e}},Ae=class extends Ne{constructor({start_logits:e,end_logits:r}){super(),this.start_logits=e,this.end_logits=r}},gt=class extends Ne{constructor({logits:e}){super(),this.logits=e}};var Yd=class extends Ne{constructor({alphas:e}){super(),this.alphas=e}};var Nt=class extends Je{_call(e,r){throw Error("`_call` should be implemented in a subclass")}},Nn=class extends Je{_call(e,r){throw Error("`_call` should be implemented in a subclass")}},Kr=class extends Je{constructor(){super(),this.processors=[]}push(e){this.processors.push(e)}extend(e){this.processors.push(...e)}_call(e,r){let s=r;for(let n of this.processors)s=n(e,s);return s}[Symbol.iterator](){return this.processors.values()}},$i=class extends Nt{constructor(e){super(),this.bos_token_id=e}_call(e,r){for(let s=0;s<e.length;++s)if(e[s].length===1){let n=r[s].data;n.fill(-1/0),n[this.bos_token_id]=0}return r}},Ri=class extends Nt{constructor(e,r){super(),this.max_length=e,this.eos_token_id=Array.isArray(r)?r:[r]}_call(e,r){for(let s=0;s<e.length;++s)if(e[s].length===this.max_length-1){let n=r[s].data;n.fill(-1/0);for(let o of this.eos_token_id)n[o]=0}return r}},Os=class extends Nt{constructor(e,r){super(),this.begin_suppress_tokens=e,this.begin_index=r}_call(e,r){for(let s=0;s<e.length;++s)if(e[s].length===this.begin_index){let n=r[s].data;for(let o of this.begin_suppress_tokens)n[o]=-1/0}return r}},Ui=class extends 
Nt{constructor(e,r){super(),this.eos_token_id=Array.isArray(e.eos_token_id)?e.eos_token_id[0]:e.eos_token_id,this.no_timestamps_token_id=e.no_timestamps_token_id,this.timestamp_begin=this.no_timestamps_token_id+1,this.begin_index=r.length,r.at(-1)===this.no_timestamps_token_id&&(this.begin_index-=1),this.max_initial_timestamp_index=e.max_initial_timestamp_index}_call(e,r){for(let s=0;s<e.length;++s){let n=r[s].data;if(n[this.no_timestamps_token_id]=-1/0,e[s].length===this.begin_index-1){n.fill(-1/0),n[this.timestamp_begin]=0;continue}let o=e[s].slice(this.begin_index),a=o.length>=1&&o[o.length-1]>=this.timestamp_begin,i=o.length<2||o[o.length-2]>=this.timestamp_begin;if(a&&(i?n.subarray(this.timestamp_begin).fill(-1/0):n.subarray(0,this.eos_token_id).fill(-1/0)),e[s].length===this.begin_index&&this.max_initial_timestamp_index!==null){let f=this.timestamp_begin+this.max_initial_timestamp_index;n.subarray(f+1).fill(-1/0)}let l=pu(n),u=Math.log(l.subarray(this.timestamp_begin).map(Math.exp).reduce((f,m)=>f+m)),d=Te(l.subarray(0,this.timestamp_begin))[0];u>d&&n.subarray(0,this.timestamp_begin).fill(-1/0)}return r}},Bi=class extends Nt{constructor(e){super(),this.no_repeat_ngram_size=e}getNgrams(e){let r=e.length,s=[];for(let o=0;o<r+1-this.no_repeat_ngram_size;++o){let a=[];for(let i=0;i<this.no_repeat_ngram_size;++i)a.push(e[o+i]);s.push(a.map(Number))}let n=new Map;for(let o of s){let a=o.slice(0,o.length-1),i=JSON.stringify(a),l=n.get(i)??[];l.push(o[o.length-1]),n.set(i,l)}return n}getGeneratedNgrams(e,r){let s=r.slice(r.length+1-this.no_repeat_ngram_size,r.length);return e.get(JSON.stringify(s.map(Number)))??[]}calcBannedNgramTokens(e){let r=[];if(e.length+1<this.no_repeat_ngram_size)return r;{let s=this.getNgrams(e);return this.getGeneratedNgrams(s,e)}}_call(e,r){for(let s=0;s<e.length;++s){let n=r[s].data,o=this.calcBannedNgramTokens(e[s]);for(let a of o)n[a]=-1/0}return r}},Di=class extends Nt{constructor(e){super(),this.penalty=e}_call(e,r){for(let 
s=0;s<e.length;++s){let n=r[s].data;for(let o of new Set(e[s])){let a=Number(o);n[a]<0?n[a]*=this.penalty:n[a]/=this.penalty}}return r}},Fi=class extends Nt{constructor(e,r){super(),this.min_length=e,this.eos_token_id=Array.isArray(r)?r:[r]}_call(e,r){for(let s=0;s<e.length;++s)if(e[s].length<this.min_length){let n=r[s].data;for(let o of this.eos_token_id)n[o]=-1/0}return r}},ji=class extends Nt{constructor(e,r,s){super(),this.prompt_length_to_skip=e,this.min_new_tokens=r,this.eos_token_id=Array.isArray(s)?s:[s]}_call(e,r){for(let s=0;s<e.length;++s)if(e[s].length-this.prompt_length_to_skip<this.min_new_tokens){let o=r[s].data;for(let a of this.eos_token_id)o[a]=-1/0}return r}},Gi=class extends Nt{constructor(e,r){super(),this.bad_words_ids=e,this.eos_token_id=Array.isArray(r)?r:[r]}_call(e,r){for(let s=0;s<e.length;++s){let n=r[s].data,o=e[s];for(let a of this.bad_words_ids){if(o.length<a.length-1)continue;let i=!0;for(let l=1;l<=a.length-1;++l)if(a.at(-l-1)!=o.at(-l)){i=!1;break}i&&(n[a.at(-1)]=-1/0)}}return r}},qi=class extends Nt{constructor(e){if(super(),e<=1)throw new Error(`Require guidance scale >1 to use the classifier free guidance processor, got guidance scale ${e}.`);this.guidance_scale=e}_call(e,r){if(r.dims[0]!==2*e.length)throw new Error(`Logits should have twice the batch size of the input ids, the first half of batches corresponding to the conditional inputs, and the second half of batches corresponding to the unconditional inputs. 
Got batch size ${r.dims[0]} for the logits and ${e.length} for the input ids.`);let s=e.length,n=r.slice([0,s],null),o=r.slice([s,r.dims[0]],null);for(let a=0;a<o.data.length;++a)o.data[a]+=(n.data[a]-o.data[a])*this.guidance_scale;return o}},Wi=class extends Nn{constructor(e){if(super(),typeof e!="number"||e<=0){let r=`\`temperature\` (=${e}) must be a strictly positive float, otherwise your next token scores will be invalid.`;e===0&&(r+=" If you're looking for greedy decoding strategies, set `do_sample=false`.")}this.temperature=e}_call(e,r){let s=r.data;for(let n=0;n<s.length;++n)s[n]/=this.temperature;return r}},q0=class extends Nn{constructor(e,{filter_value:r=-1/0,min_tokens_to_keep:s=1}={}){if(super(),e<0||e>1)throw new Error(`\`top_p\` must be a float > 0 and < 1, but is ${e}`);if(!Number.isInteger(s)||s<1)throw new Error(`\`min_tokens_to_keep\` must be a positive integer, but is ${s}`);this.top_p=e,this.filter_value=r,this.min_tokens_to_keep=s}},W0=class extends Nn{constructor(e,{filter_value:r=-1/0,min_tokens_to_keep:s=1}={}){if(super(),!Number.isInteger(e)||e<0)throw new Error(`\`top_k\` must be a positive integer, but is ${e}`);this.top_k=Math.max(e,s),this.filter_value=r}};var 
$n=class{max_length=20;max_new_tokens=null;min_length=0;min_new_tokens=null;early_stopping=!1;max_time=null;do_sample=!1;num_beams=1;num_beam_groups=1;penalty_alpha=null;use_cache=!0;temperature=1;top_k=50;top_p=1;typical_p=1;epsilon_cutoff=0;eta_cutoff=0;diversity_penalty=0;repetition_penalty=1;encoder_repetition_penalty=1;length_penalty=1;no_repeat_ngram_size=0;bad_words_ids=null;force_words_ids=null;renormalize_logits=!1;constraints=null;forced_bos_token_id=null;forced_eos_token_id=null;remove_invalid_values=!1;exponential_decay_length_penalty=null;suppress_tokens=null;streamer=null;begin_suppress_tokens=null;forced_decoder_ids=null;guidance_scale=null;num_return_sequences=1;output_attentions=!1;output_hidden_states=!1;output_scores=!1;return_dict_in_generate=!1;pad_token_id=null;bos_token_id=null;eos_token_id=null;encoder_no_repeat_ngram_size=0;decoder_start_token_id=null;generation_kwargs={};constructor(e){Object.assign(this,at(e,Object.getOwnPropertyNames(this)))}};var Is=class extends Je{_call(e,r){throw Error("StoppingCriteria needs to be subclassed")}},Vi=class t extends Je{constructor(){super(),this.criteria=[]}push(e){this.criteria.push(e)}extend(e){e instanceof t?e=e.criteria:e instanceof Is&&(e=[e]),this.criteria.push(...e)}_call(e,r){let s=new Array(e.length).fill(!1);for(let n of this.criteria){let o=n(e,r);for(let a=0;a<s.length;++a)s[a]||=o[a]}return s}[Symbol.iterator](){return this.criteria.values()}},Hi=class extends Is{constructor(e,r=null){super(),this.max_length=e,this.max_position_embeddings=r}_call(e){return e.map(r=>r.length>=this.max_length)}},Xi=class extends Is{constructor(e){super(),Array.isArray(e)||(e=[e]),this.eos_token_id=e}_call(e,r){return e.map(s=>{let n=s.at(-1);return this.eos_token_id.some(o=>n==o)})}},V0=class extends Is{constructor(){super(),this.interrupted=!1}interrupt(){this.interrupted=!0}reset(){this.interrupted=!1}_call(e,r){return new Array(e.length).fill(this.interrupted)}};var Cs=class extends 
Je{constructor(e){super(),this.generation_config=e}async _call(e){return this.sample(e)}async sample(e){throw Error("sample should be implemented in subclasses.")}getLogits(e,r){let s=e.dims.at(-1),n=e.data;if(r===-1)n=n.slice(-s);else{let o=r*s;n=n.slice(o,o+s)}return n}randomSelect(e){let r=0;for(let n=0;n<e.length;++n)r+=e[n];let s=Math.random()*r;for(let n=0;n<e.length;++n)if(s-=e[n],s<=0)return n;return 0}static getSampler(e){if(e.do_sample)return new X0(e);if(e.num_beams>1)return new K0(e);if(e.num_return_sequences>1)throw Error(`num_return_sequences has to be 1 when doing greedy search, but is ${e.num_return_sequences}.`);return new H0(e)}},H0=class extends Cs{async sample(e){let r=Te(e.data)[1];return[[BigInt(r),0]]}},X0=class extends Cs{async sample(e){let r=e.dims.at(-1);this.generation_config.top_k>0&&(r=Math.min(this.generation_config.top_k,r));let[s,n]=await Gt(e,r),o=Oe(s.data);return Array.from({length:this.generation_config.num_beams},()=>{let a=this.randomSelect(o);return[n.data[a],Math.log(o[a])]})}},K0=class extends Cs{async sample(e){let r=e.dims.at(-1);this.generation_config.top_k>0&&(r=Math.min(this.generation_config.top_k,r));let[s,n]=await Gt(e,r),o=Oe(s.data);return Array.from({length:this.generation_config.num_beams},(a,i)=>[n.data[i],Math.log(o[i])])}};var Ki=null;function bA(t){Ki=t}function Y0(t){if(t instanceof U)return t;if(t.length===0)throw Error("items must be non-empty");if(Array.isArray(t[0])){if(t.some(e=>e.length!==t[0].length))throw Error("Unable to create tensor, you should probably activate truncation and/or padding with 'padding=True' and/or 'truncation=True' to have batched tensors with the same length.");return new U("int64",BigInt64Array.from(t.flat().map(e=>BigInt(e))),[t.length,t[0].length])}else return new U("int64",BigInt64Array.from(t.map(e=>BigInt(e))),[1,t.length])}function Q0(t){return new U("bool",[t],[1])}var 
H={EncoderOnly:0,EncoderDecoder:1,Seq2Seq:2,Vision2Seq:3,DecoderOnly:4,DecoderOnlyWithoutHead:5,MaskGeneration:6,ImageTextToText:7,Musicgen:8,MultiModality:9,Phi3V:10,AudioTextToText:11,AutoEncoder:12,ImageAudioTextToText:13,Supertonic:14,Chatterbox:15},yA={[H.DecoderOnly]:{can_generate:!0,forward:Tt,prepare_inputs:Yi},[H.DecoderOnlyWithoutHead]:{can_generate:!1,forward:Tt,prepare_inputs:Yi},[H.Seq2Seq]:{can_generate:!0,forward:Qd,prepare_inputs:Qi},[H.Vision2Seq]:{can_generate:!0,forward:Qd,prepare_inputs:Qi},[H.Musicgen]:{can_generate:!0,forward:Qd},[H.EncoderDecoder]:{can_generate:!1,forward:Qd},[H.ImageTextToText]:{can_generate:!0,forward:JP,prepare_inputs:Jd},[H.AudioTextToText]:{can_generate:!0,forward:QP,prepare_inputs:Jd},[H.Phi3V]:{can_generate:!0,prepare_inputs:Jd},[H.ImageAudioTextToText]:{can_generate:!0,prepare_inputs:Jd},[H.MultiModality]:{can_generate:!0},[H.AutoEncoder]:{can_generate:!1,forward:YP},[H.Chatterbox]:{can_generate:!0,forward:qt},default:{can_generate:!1,forward:qt}},zs=new Map,Zd=new Map,Ps=new Map,y=class extends Je{main_input_name="input_ids";forward_params=["input_ids","attention_mask"];_return_dict_in_generate_keys=null;constructor(e,r,s){super(),this.config=e,this.sessions=r,this.configs=s;let n=Ps.get(this.constructor),o=zs.get(n),a=yA[o]??yA.default;this.can_generate=a.can_generate,this._forward=a.forward,this._prepare_inputs_for_generation=a.prepare_inputs,this.can_generate&&this.forward_params.push("past_key_values"),this.custom_config=this.config["transformers.js_config"]??{}}async dispose(){let e=[];for(let r of Object.values(this.sessions))e.push(r.release?.());return await Promise.all(e)}static async from_pretrained(e,{progress_callback:r=null,config:s=null,cache_dir:n=null,local_files_only:o=!1,revision:a="main",model_file_name:i=null,subfolder:l="onnx",device:u=null,dtype:d=null,use_external_data_format:f=null,session_options:m={}}={}){let 
_={progress_callback:r,config:s,cache_dir:n,local_files_only:o,revision:a,model_file_name:i,subfolder:l,device:u,dtype:d,use_external_data_format:f,session_options:m},w=Ps.get(this),x=zs.get(w);s=_.config=await Xr.from_pretrained(e,_);let k;if(x===H.DecoderOnly)k=await Promise.all([bt(e,{model:_.model_file_name??"model"},_,"model"),xr(e,{generation_config:"generation_config.json"},_)]);else if(x===H.Seq2Seq||x===H.Vision2Seq)k=await Promise.all([bt(e,{model:"encoder_model",decoder_model_merged:"decoder_model_merged"},_,"decoder_model_merged"),xr(e,{generation_config:"generation_config.json"},_)]);else if(x===H.MaskGeneration)k=await Promise.all([bt(e,{model:"vision_encoder",prompt_encoder_mask_decoder:"prompt_encoder_mask_decoder"},_)]);else if(x===H.EncoderDecoder)k=await Promise.all([bt(e,{model:"encoder_model",decoder_model_merged:"decoder_model_merged"},_,"decoder_model_merged")]);else if(x===H.ImageTextToText){let E={embed_tokens:"embed_tokens",vision_encoder:"vision_encoder",decoder_model_merged:"decoder_model_merged"};s.is_encoder_decoder&&(E.model="encoder_model"),k=await Promise.all([bt(e,E,_,"decoder_model_merged"),xr(e,{generation_config:"generation_config.json"},_)])}else if(x===H.AudioTextToText){let E={embed_tokens:"embed_tokens",audio_encoder:"audio_encoder",decoder_model_merged:"decoder_model_merged"};k=await Promise.all([bt(e,E,_,"decoder_model_merged"),xr(e,{generation_config:"generation_config.json"},_)])}else if(x===H.ImageAudioTextToText){let E={embed_tokens:"embed_tokens",audio_encoder:"audio_encoder",vision_encoder:"vision_encoder",decoder_model_merged:"decoder_model_merged"};k=await Promise.all([bt(e,E,_),xr(e,{generation_config:"generation_config.json"},_)])}else if(x===H.Musicgen)k=await Promise.all([bt(e,{model:"text_encoder",decoder_model_merged:"decoder_model_merged",encodec_decode:"encodec_decode"},_,"decoder_model_merged"),xr(e,{generation_config:"generation_config.json"},_)]);else if(x===H.MultiModality)k=await 
Promise.all([bt(e,{prepare_inputs_embeds:"prepare_inputs_embeds",model:"language_model",lm_head:"lm_head",gen_head:"gen_head",gen_img_embeds:"gen_img_embeds",image_decode:"image_decode"},_,"model"),xr(e,{generation_config:"generation_config.json"},_)]);else if(x===H.Phi3V)k=await Promise.all([bt(e,{prepare_inputs_embeds:"prepare_inputs_embeds",model:"model",vision_encoder:"vision_encoder"},_,"model"),xr(e,{generation_config:"generation_config.json"},_)]);else if(x===H.Chatterbox)k=await Promise.all([bt(e,{embed_tokens:"embed_tokens",speech_encoder:"speech_encoder",model:"language_model",conditional_decoder:"conditional_decoder"},_,"model"),xr(e,{generation_config:"generation_config.json"},_)]);else if(x===H.AutoEncoder)k=await Promise.all([bt(e,{encoder_model:"encoder_model",decoder_model:"decoder_model"},_)]);else if(x===H.Supertonic)k=await Promise.all([bt(e,{text_encoder:"text_encoder",latent_denoiser:"latent_denoiser",voice_decoder:"voice_decoder"},_)]);else{if(x===void 0){let E=w??s?.model_type;E!=="custom"&&console.warn(`Model type for '${E}' not found, assuming encoder-only architecture. 
Please report this at ${kn}.`)}k=await Promise.all([bt(e,{model:_.model_file_name??"model"},_)])}return new this(s,...k)}async _call(e){return await this.forward(e)}async forward(e){return await this._forward(this,e)}get generation_config(){return this.configs?.generation_config??null}_get_logits_processor(e,r,s=null){let n=new Kr;if(e.repetition_penalty!==null&&e.repetition_penalty!==1&&n.push(new Di(e.repetition_penalty)),e.no_repeat_ngram_size!==null&&e.no_repeat_ngram_size>0&&n.push(new Bi(e.no_repeat_ngram_size)),e.bad_words_ids!==null&&n.push(new Gi(e.bad_words_ids,e.eos_token_id)),e.min_length!==null&&e.eos_token_id!==null&&e.min_length>0&&n.push(new Fi(e.min_length,e.eos_token_id)),e.min_new_tokens!==null&&e.eos_token_id!==null&&e.min_new_tokens>0&&n.push(new ji(r,e.min_new_tokens,e.eos_token_id)),e.forced_bos_token_id!==null&&n.push(new $i(e.forced_bos_token_id)),e.forced_eos_token_id!==null&&n.push(new Ri(e.max_length,e.forced_eos_token_id)),e.begin_suppress_tokens!==null){let o=r>1||e.forced_bos_token_id===null?r:r+1;n.push(new Os(e.begin_suppress_tokens,o))}return e.guidance_scale!==null&&e.guidance_scale>1&&n.push(new qi(e.guidance_scale)),e.temperature===0&&e.do_sample&&(console.warn("`do_sample` changed to false because `temperature: 0` implies greedy sampling (always selecting the most likely token), which is incompatible with `do_sample: true`."),e.do_sample=!1),e.do_sample&&e.temperature!==null&&e.temperature!==1&&n.push(new Wi(e.temperature)),s!==null&&n.extend(s),n}_prepare_generation_config(e,r,s=$n){let n={...this.config};for(let a of["decoder","generator","text_config"])a in n&&Object.assign(n,n[a]);let o=new s(n);return Object.assign(o,this.generation_config??{}),e&&Object.assign(o,e),r&&Object.assign(o,at(r,Object.getOwnPropertyNames(o))),o}_get_stopping_criteria(e,r=null){let s=new Vi;return e.max_length!==null&&s.push(new Hi(e.max_length,this.config.max_position_embeddings??null)),e.eos_token_id!==null&&s.push(new 
Xi(e.eos_token_id)),r&&s.extend(r),s}_validate_model_class(){if(!this.can_generate){let e=[Ki.MODEL_FOR_CAUSAL_LM_MAPPING_NAMES,Ki.MODEL_FOR_VISION_2_SEQ_MAPPING_NAMES,Ki.MODEL_FOR_SEQ_TO_SEQ_CAUSAL_LM_MAPPING_NAMES,Ki.MODEL_FOR_SPEECH_SEQ_2_SEQ_MAPPING_NAMES].filter(Boolean),r=Ps.get(this.constructor),s=new Set,n=this.config.model_type;for(let a of e){let i=a?.get(n);i&&s.add(i)}let o=`The current model class (${r}) is not compatible with \`.generate()\`, as it doesn't have a language model head.`;throw s.size>0&&(o+=` Please use the following class instead: ${[...s].join(", ")}`),Error(o)}}prepare_inputs_for_generation(...e){if(!this._prepare_inputs_for_generation)throw new Error("prepare_inputs_for_generation is not implemented for this model.");return this._prepare_inputs_for_generation(this,...e)}_update_model_kwargs_for_generation({generated_input_ids:e,outputs:r,model_inputs:s,is_encoder_decoder:n}){return s.past_key_values=this.getPastKeyValues(r,s.past_key_values),s.input_ids=new U("int64",e.flat(),[e.length,1]),n?"decoder_attention_mask"in s:s.attention_mask=Ee([s.attention_mask,rt([s.attention_mask.dims[0],1])],1),s.position_ids=null,s}_prepare_model_inputs({inputs:e,bos_token_id:r,model_kwargs:s}){let n=at(s,this.forward_params),o=this.main_input_name;if(o in n){if(e)throw new Error("`inputs`: {inputs}` were passed alongside {input_name} which is not allowed. 
Make sure to either pass {inputs} or {input_name}=...")}else n[o]=e;return{inputs_tensor:n[o],model_inputs:n,model_input_name:o}}async _prepare_encoder_decoder_kwargs_for_generation({inputs_tensor:e,model_inputs:r,model_input_name:s,generation_config:n}){if(this.sessions.model.inputNames.includes("inputs_embeds")&&!r.inputs_embeds&&"_prepare_inputs_embeds"in this){let{input_ids:a,pixel_values:i,attention_mask:l,...u}=r,d=await this._prepare_inputs_embeds(r);r={...u,...at(d,["inputs_embeds","attention_mask"])}}let{last_hidden_state:o}=await qt(this,r);if(n.guidance_scale!==null&&n.guidance_scale>1)o=Ee([o,yn(o,0)],0),"attention_mask"in r&&(r.attention_mask=Ee([r.attention_mask,Cu(r.attention_mask)],0));else if(r.decoder_input_ids){let a=Y0(r.decoder_input_ids).dims[0];if(a!==o.dims[0]){if(o.dims[0]!==1)throw new Error(`The encoder outputs have a different batch size (${o.dims[0]}) than the decoder inputs (${a}).`);o=Ee(Array.from({length:a},()=>o),0)}}return r.encoder_outputs=o,r}_prepare_decoder_input_ids_for_generation({batch_size:e,model_input_name:r,model_kwargs:s,decoder_start_token_id:n,bos_token_id:o,generation_config:a}){let{decoder_input_ids:i,...l}=s;if(!(i instanceof U)){if(i)Array.isArray(i[0])||(i=Array.from({length:e},()=>i));else if(n??=o,this.config.model_type==="musicgen")i=Array.from({length:e*this.config.decoder.num_codebooks},()=>[n]);else if(Array.isArray(n)){if(n.length!==e)throw new Error(`\`decoder_start_token_id\` expcted to have length ${e} but got ${n.length}`);i=n}else i=Array.from({length:e},()=>[n]);i=Y0(i)}return s.decoder_attention_mask=mi(i),{input_ids:i,model_inputs:l}}async generate({inputs:e=null,generation_config:r=null,logits_processor:s=null,stopping_criteria:n=null,streamer:o=null,...a}){this._validate_model_class(),r=this._prepare_generation_config(r,a);let{inputs_tensor:i,model_inputs:l,model_input_name:u}=this._prepare_model_inputs({inputs:e,model_kwargs:a}),d=this.config.is_encoder_decoder;d&&("encoder_outputs"in 
l||(l=await this._prepare_encoder_decoder_kwargs_for_generation({inputs_tensor:i,model_inputs:l,model_input_name:u,generation_config:r})));let f;d?{input_ids:f,model_inputs:l}=this._prepare_decoder_input_ids_for_generation({batch_size:l[u].dims.at(0),model_input_name:u,model_kwargs:l,decoder_start_token_id:r.decoder_start_token_id,bos_token_id:r.bos_token_id,generation_config:r}):f=l[u];let m=f.dims.at(-1);r.max_new_tokens!==null&&(r.max_length=m+r.max_new_tokens);let _=this._get_logits_processor(r,m,s),w=this._get_stopping_criteria(r,n),x=l[u].dims.at(0),k=Cs.getSampler(r),E=new Array(x).fill(0),M=f.tolist();o&&o.put(M);let I,T={},z={};for(;;){if(l=this.prepare_inputs_for_generation(M,l,r),I=await this.forward(l),r.return_dict_in_generate)if(r.output_attentions){let K=this.getAttentions(I);for(let Y in K)Y in T||(T[Y]=[]),T[Y].push(K[Y])}else this._return_dict_in_generate_keys&&Object.assign(z,at(I,this._return_dict_in_generate_keys));let G=I.logits.slice(null,-1,null).to("float32"),X=_(M,G),V=[];for(let K=0;K<X.dims.at(0);++K){let Y=X[K],B=await k(Y);for(let[P,se]of B){let ie=BigInt(P);E[K]+=se,M[K].push(ie),V.push([ie]);break}}if(o&&o.put(V),w(M).every(K=>K))break;l=this._update_model_kwargs_for_generation({generated_input_ids:V,outputs:I,model_inputs:l,is_encoder_decoder:d})}o&&o.end();let C=this.getPastKeyValues(I,l.past_key_values,!0),v=new U("int64",M.flat(),[M.length,M[0].length]);if(r.return_dict_in_generate)return{sequences:v,past_key_values:C,...T,...z};for(let G of Object.values(I))G.location==="gpu-buffer"&&G.dispose();return v}getPastKeyValues(e,r,s=!1){let n=Object.create(null);for(let o in e)if(o.startsWith("present")){let a=o.replace("present_ssm","past_ssm").replace("present_conv","past_conv").replace("present","past_key_values"),i=o.includes("encoder");if(i&&r?n[a]=r[a]:n[a]=e[o],r&&(!i||s)){let l=r[a];l.location==="gpu-buffer"&&l.dispose()}}return n}getAttentions(e){let r={};for(let s 
of["cross_attentions","encoder_attentions","decoder_attentions"])for(let n in e)n.startsWith(s)&&(s in r||(r[s]=[]),r[s].push(e[n]));return r}addPastKeyValues(e,r){if(r)Object.assign(e,r);else{let s=this.sessions.decoder_model_merged??this.sessions.model,n=(e[this.main_input_name]??e.attention_mask)?.dims?.[0]??1,o=s?.config?.kv_cache_dtype??"float32",a=o==="float16"?xn.float16:xn.float32,i=Kd(this.config,{batch_size:n});for(let l in i){let u=i[l].reduce((d,f)=>d*f,1);e[l]=new U(o,new a(u),i[l])}}}async encode_image({pixel_values:e}){return(await ce(this.sessions.vision_encoder,{pixel_values:e})).image_features}async encode_text({input_ids:e}){return(await ce(this.sessions.embed_tokens,{input_ids:e})).inputs_embeds}async encode_audio({audio_values:e}){return(await ce(this.sessions.audio_encoder,{audio_values:e})).audio_features}};async function Qd(t,e){let{encoder_outputs:r,input_ids:s,decoder_input_ids:n,...o}=e;if(!r){let a=at(e,t.sessions.model.inputNames);r=(await qt(t,a)).last_hidden_state}return o.input_ids=n,o.encoder_hidden_states=r,t.sessions.decoder_model_merged.inputNames.includes("encoder_attention_mask")&&(o.encoder_attention_mask=e.attention_mask),await Tt(t,o,!0)}async function qt(t,e){let r=t.sessions.model,s=at(e,r.inputNames);if(r.inputNames.includes("inputs_embeds")&&!s.inputs_embeds){if(!e.input_ids)throw new Error("Both `input_ids` and `inputs_embeds` are missing in the model inputs.");s.inputs_embeds=await t.encode_text({input_ids:e.input_ids})}if(r.inputNames.includes("token_type_ids")&&!s.token_type_ids){if(!s.input_ids)throw new Error("Both `input_ids` and `token_type_ids` are missing in the model inputs.");s.token_type_ids=Cu(s.input_ids)}if(r.inputNames.includes("pixel_mask")&&!s.pixel_mask){if(!s.pixel_values)throw new Error("Both `pixel_values` and `pixel_mask` are missing in the model inputs.");let n=s.pixel_values.dims;s.pixel_mask=rt([n[0],n[2],n[3]])}return await ce(r,s)}async function YP(t,e){let r=await t.encode(e);return await 
t.decode(r)}async function Tt(t,e,r=!1){let s=t.sessions[r?"decoder_model_merged":"model"],{past_key_values:n,...o}=e;if(s.inputNames.includes("use_cache_branch")&&(o.use_cache_branch=Q0(!!n)),s.inputNames.includes("position_ids")&&o.attention_mask&&!o.position_ids){let i=["paligemma","gemma3_text","gemma3"].includes(t.config.model_type)?1:0;o.position_ids=ZP(o,n,i)}t.addPastKeyValues(o,n);let a=at(o,s.inputNames);return await ce(s,a)}async function vA(t,{encode_function:e,merge_function:r,modality_input_name:s,modality_output_name:n,input_ids:o=null,attention_mask:a=null,position_ids:i=null,inputs_embeds:l=null,past_key_values:u=null,generation_config:d=null,logits_processor:f=null,...m}){let _=m[s];if(!l){if(l=await t.encode_text({input_ids:o,...m}),_&&o.dims[1]!==1){let x=await e({[s]:_,...m});({inputs_embeds:l,attention_mask:a}=r({[n]:x,inputs_embeds:l,input_ids:o,attention_mask:a}))}else if(u&&_&&o.dims[1]===1){let x=o.dims[1],k=Object.values(u)[0].dims.at(-2);a=Ee([rt([o.dims[0],k]),a.slice(null,[a.dims[1]-x,a.dims[1]])],1)}}if(!i&&t.config.model_type==="qwen2_vl"){let{image_grid_thw:x,video_grid_thw:k}=m;[i]=t.get_rope_index(o,x,k,a)}return await Tt(t,{inputs_embeds:l,past_key_values:u,attention_mask:a,position_ids:i,generation_config:d,logits_processor:f},!0)}async function QP(t,e){return await vA(t,{...e,modality_input_name:"audio_values",modality_output_name:"audio_features",encode_function:t.encode_audio.bind(t),merge_function:t._merge_input_ids_with_audio_features.bind(t)})}async function JP(t,e){return await vA(t,{...e,modality_input_name:"pixel_values",modality_output_name:"image_features",encode_function:t.encode_image.bind(t),merge_function:t._merge_input_ids_with_image_features.bind(t)})}function J0(t,e=0){let[r,s]=t.dims,n=t.data,o=new BigInt64Array(n.length);for(let a=0;a<r;++a){let i=a*s,l=BigInt(e);for(let u=0;u<s;++u){let d=i+u;n[d]===0n?o[d]=BigInt(1):(o[d]=l,l+=n[d])}}return{data:o,dims:t.dims}}function 
ZP(t,e=null,r=0){let{input_ids:s,inputs_embeds:n,attention_mask:o}=t,{data:a,dims:i}=J0(o,r),l=new U("int64",a,i);if(e){let u=-(s??n).dims.at(1);l=l.slice(null,[u,null])}return l}function Yi(t,e,r,s){let n=r.past_key_values?Object.values(r.past_key_values)[0].dims.at(-2):0;if(!r.attention_mask){let o;for(let a of["input_ids","inputs_embeds","position_ids"])if(r[a]){o=r[a].dims;break}if(!o)throw new Error("attention_mask is not provided, and unable to infer its shape from model inputs.");r.attention_mask=rt([o[0],n+o[1]])}if(r.past_key_values){let{input_ids:o,attention_mask:a}=r;a&&a.dims[1]>o.dims[1]||n<o.dims[1]&&(r.input_ids=o.slice(null,[n,null]))}return r}function Qi(t,e,r,s){return r.past_key_values&&(e=e.map(n=>[n.at(-1)])),{...r,decoder_input_ids:Y0(e)}}function Jd(t,...e){return t.config.is_encoder_decoder?Qi(t,...e):Yi(t,...e)}function kA({modality_token_id:t,inputs_embeds:e,modality_features:r,input_ids:s,attention_mask:n}){let o=s.tolist().map(u=>u.reduce((d,f,m)=>(f==t&&d.push(m),d),[])),a=o.reduce((u,d)=>u+d.length,0),i=r.dims[0];if(a!==i)throw new Error(`Number of tokens and features do not match: tokens: ${a}, features ${i}`);let l=0;for(let u=0;u<o.length;++u){let d=o[u],f=e[u];for(let m=0;m<d.length;++m)f[d[m]].data.set(r[l++].data)}return{inputs_embeds:e,attention_mask:n}}function ur({image_token_id:t,inputs_embeds:e,image_features:r,input_ids:s,attention_mask:n}){return kA({modality_token_id:t,inputs_embeds:e,modality_features:r,input_ids:s,attention_mask:n})}function ef({audio_token_id:t,inputs_embeds:e,audio_features:r,input_ids:s,attention_mask:n}){return kA({modality_token_id:t,inputs_embeds:e,modality_features:r,input_ids:s,attention_mask:n})}async function xr(t,e,r){return Object.fromEntries(await Promise.all(Object.keys(e).map(async s=>{let n=await it(t,e[s],!1,r);return[s,n]})))}var 
Yl={};cs(Yl,{ASTForAudioClassification:()=>pf,ASTModel:()=>uf,ASTPreTrainedModel:()=>Bn,AlbertForMaskedLM:()=>nf,AlbertForQuestionAnswering:()=>sf,AlbertForSequenceClassification:()=>rf,AlbertModel:()=>tf,AlbertPreTrainedModel:()=>Yr,ApertusForCausalLM:()=>af,ApertusModel:()=>of,ApertusPreTrainedModel:()=>Rn,ArceeForCausalLM:()=>cf,ArceeModel:()=>lf,ArceePreTrainedModel:()=>Un,BartForConditionalGeneration:()=>ff,BartForSequenceClassification:()=>mf,BartModel:()=>df,BartPretrainedModel:()=>Ls,BeitForImageClassification:()=>_f,BeitModel:()=>hf,BeitPreTrainedModel:()=>Dn,BertForMaskedLM:()=>wf,BertForQuestionAnswering:()=>bf,BertForSequenceClassification:()=>xf,BertForTokenClassification:()=>yf,BertModel:()=>gf,BertPreTrainedModel:()=>yr,BlenderbotForConditionalGeneration:()=>kf,BlenderbotModel:()=>vf,BlenderbotPreTrainedModel:()=>Fn,BlenderbotSmallForConditionalGeneration:()=>Af,BlenderbotSmallModel:()=>Ef,BlenderbotSmallPreTrainedModel:()=>jn,BloomForCausalLM:()=>Tf,BloomModel:()=>Mf,BloomPreTrainedModel:()=>Gn,CLIPModel:()=>Nf,CLIPPreTrainedModel:()=>er,CLIPSegForImageSegmentation:()=>Df,CLIPSegModel:()=>Bf,CLIPSegPreTrainedModel:()=>Xn,CLIPTextModel:()=>$f,CLIPTextModelWithProjection:()=>Hn,CLIPVisionModel:()=>Rf,CLIPVisionModelWithProjection:()=>Uf,CamembertForMaskedLM:()=>Of,CamembertForQuestionAnswering:()=>Pf,CamembertForSequenceClassification:()=>If,CamembertForTokenClassification:()=>Cf,CamembertModel:()=>Sf,CamembertPreTrainedModel:()=>br,ChatterboxModel:()=>qn,ChatterboxPreTrainedModel:()=>Ji,ChineseCLIPModel:()=>zf,ChineseCLIPPreTrainedModel:()=>Zi,ClapAudioModelWithProjection:()=>Vn,ClapModel:()=>Lf,ClapPreTrainedModel:()=>Ns,ClapTextModelWithProjection:()=>Wn,CodeGenForCausalLM:()=>jf,CodeGenModel:()=>Ff,CodeGenPreTrainedModel:()=>Kn,CohereForCausalLM:()=>qf,CohereModel:()=>Gf,CoherePreTrainedModel:()=>Yn,ConvBertForMaskedLM:()=>Vf,ConvBertForQuestionAnswering:()=>Kf,ConvBertForSequenceClassification:()=>Hf,ConvBertForTokenClassification:()=>Xf,ConvBertM
odel:()=>Wf,ConvBertPreTrainedModel:()=>vr,ConvNextForImageClassification:()=>Qf,ConvNextModel:()=>Yf,ConvNextPreTrainedModel:()=>Qn,ConvNextV2ForImageClassification:()=>Zf,ConvNextV2Model:()=>Jf,ConvNextV2PreTrainedModel:()=>Jn,DFineForObjectDetection:()=>sm,DFineModel:()=>rm,DFinePreTrainedModel:()=>eo,DINOv3ConvNextModel:()=>Tm,DINOv3ConvNextPreTrainedModel:()=>al,DINOv3ViTModel:()=>Sm,DINOv3ViTPreTrainedModel:()=>il,DPTForDepthEstimation:()=>$m,DPTModel:()=>Nm,DPTPreTrainedModel:()=>ao,DacDecoderModel:()=>ro,DacDecoderOutput:()=>tl,DacEncoderModel:()=>to,DacEncoderOutput:()=>el,DacModel:()=>nm,DacPreTrainedModel:()=>$s,DebertaForMaskedLM:()=>am,DebertaForQuestionAnswering:()=>cm,DebertaForSequenceClassification:()=>im,DebertaForTokenClassification:()=>lm,DebertaModel:()=>om,DebertaPreTrainedModel:()=>kr,DebertaV2ForMaskedLM:()=>pm,DebertaV2ForQuestionAnswering:()=>mm,DebertaV2ForSequenceClassification:()=>dm,DebertaV2ForTokenClassification:()=>fm,DebertaV2Model:()=>um,DebertaV2PreTrainedModel:()=>Er,DecisionTransformerModel:()=>hm,DecisionTransformerPreTrainedModel:()=>rl,DeiTForImageClassification:()=>gm,DeiTModel:()=>_m,DeiTPreTrainedModel:()=>so,DepthAnythingForDepthEstimation:()=>wm,DepthAnythingPreTrainedModel:()=>sl,DepthProForDepthEstimation:()=>xm,DepthProPreTrainedModel:()=>nl,DetrForObjectDetection:()=>bm,DetrForSegmentation:()=>vm,DetrModel:()=>ym,DetrObjectDetectionOutput:()=>Us,DetrPreTrainedModel:()=>Rs,DetrSegmentationOutput:()=>ol,Dinov2ForImageClassification:()=>Em,Dinov2Model:()=>km,Dinov2PreTrainedModel:()=>no,Dinov2WithRegistersForImageClassification:()=>Mm,Dinov2WithRegistersModel:()=>Am,Dinov2WithRegistersPreTrainedModel:()=>oo,DistilBertForMaskedLM:()=>zm,DistilBertForQuestionAnswering:()=>Pm,DistilBertForSequenceClassification:()=>Im,DistilBertForTokenClassification:()=>Cm,DistilBertModel:()=>Om,DistilBertPreTrainedModel:()=>Ar,DonutSwinModel:()=>Lm,DonutSwinPreTrainedModel:()=>ll,EdgeTamModel:()=>xw,EfficientNetForImageClassification:()=
>Um,EfficientNetModel:()=>Rm,EfficientNetPreTrainedModel:()=>io,ElectraForMaskedLM:()=>Dm,ElectraForQuestionAnswering:()=>Gm,ElectraForSequenceClassification:()=>Fm,ElectraForTokenClassification:()=>jm,ElectraModel:()=>Bm,ElectraPreTrainedModel:()=>Mr,Ernie4_5ForCausalLM:()=>Wm,Ernie4_5Model:()=>qm,Ernie4_5PretrainedModel:()=>lo,EsmForMaskedLM:()=>Hm,EsmForSequenceClassification:()=>Xm,EsmForTokenClassification:()=>Km,EsmModel:()=>Vm,EsmPreTrainedModel:()=>Qr,ExaoneForCausalLM:()=>Qm,ExaoneModel:()=>Ym,ExaonePreTrainedModel:()=>co,FalconForCausalLM:()=>Zm,FalconH1ForCausalLM:()=>th,FalconH1Model:()=>eh,FalconH1PreTrainedModel:()=>po,FalconModel:()=>Jm,FalconPreTrainedModel:()=>uo,FastViTForImageClassification:()=>sh,FastViTModel:()=>rh,FastViTPreTrainedModel:()=>fo,Florence2ForConditionalGeneration:()=>nh,Florence2PreTrainedModel:()=>cl,GLPNForDepthEstimation:()=>mh,GLPNModel:()=>fh,GLPNPreTrainedModel:()=>xo,GPT2LMHeadModel:()=>Eh,GPT2Model:()=>kh,GPT2PreTrainedModel:()=>Eo,GPTBigCodeForCausalLM:()=>_h,GPTBigCodeModel:()=>hh,GPTBigCodePreTrainedModel:()=>yo,GPTJForCausalLM:()=>Mh,GPTJModel:()=>Ah,GPTJPreTrainedModel:()=>Ao,GPTNeoForCausalLM:()=>wh,GPTNeoModel:()=>gh,GPTNeoPreTrainedModel:()=>bo,GPTNeoXForCausalLM:()=>yh,GPTNeoXModel:()=>xh,GPTNeoXPreTrainedModel:()=>vo,Gemma2ForCausalLM:()=>lh,Gemma2Model:()=>ih,Gemma2PreTrainedModel:()=>ho,Gemma3ForCausalLM:()=>uh,Gemma3Model:()=>ch,Gemma3PreTrainedModel:()=>_o,Gemma3nForConditionalGeneration:()=>go,Gemma3nPreTrainedModel:()=>ul,GemmaForCausalLM:()=>ah,GemmaModel:()=>oh,GemmaPreTrainedModel:()=>mo,GlmForCausalLM:()=>dh,GlmModel:()=>ph,GlmPreTrainedModel:()=>wo,GptOssForCausalLM:()=>vh,GptOssModel:()=>bh,GptOssPreTrainedModel:()=>ko,GraniteForCausalLM:()=>Sh,GraniteModel:()=>Th,GraniteMoeHybridForCausalLM:()=>Ih,GraniteMoeHybridModel:()=>Oh,GraniteMoeHybridPreTrainedModel:()=>To,GranitePreTrainedModel:()=>Mo,GroundingDinoForObjectDetection:()=>Ch,GroundingDinoPreTrainedModel:()=>pl,GroupViTModel:()=>Ph,GroupViTPreT
rainedModel:()=>dl,HeliumForCausalLM:()=>Lh,HeliumModel:()=>zh,HeliumPreTrainedModel:()=>So,HieraForImageClassification:()=>$h,HieraModel:()=>Nh,HieraPreTrainedModel:()=>Oo,HubertForCTC:()=>Gh,HubertForSequenceClassification:()=>qh,HubertModel:()=>jh,HubertPreTrainedModel:()=>Fh,HunYuanDenseV1ForCausalLM:()=>Vh,HunYuanDenseV1Model:()=>Wh,HunYuanDenseV1PreTrainedModel:()=>Io,IJepaForImageClassification:()=>Kh,IJepaModel:()=>Xh,IJepaPreTrainedModel:()=>Co,Idefics3ForConditionalGeneration:()=>ml,Idefics3PreTrainedModel:()=>fl,JAISLMHeadModel:()=>Qh,JAISModel:()=>Yh,JAISPreTrainedModel:()=>Po,JinaCLIPModel:()=>Jh,JinaCLIPPreTrainedModel:()=>Bs,JinaCLIPTextModel:()=>zo,JinaCLIPVisionModel:()=>Zh,Lfm2ForCausalLM:()=>t_,Lfm2Model:()=>e_,Lfm2MoeForCausalLM:()=>s_,Lfm2MoeModel:()=>r_,Lfm2MoePreTrainedModel:()=>No,Lfm2PreTrainedModel:()=>Lo,LiteWhisperForConditionalGeneration:()=>Cx,Llama4ForCausalLM:()=>a_,Llama4PreTrainedModel:()=>hl,LlamaForCausalLM:()=>o_,LlamaModel:()=>n_,LlamaPreTrainedModel:()=>$o,LlavaForConditionalGeneration:()=>Ds,LlavaOnevisionForConditionalGeneration:()=>Ds,LlavaPreTrainedModel:()=>_l,LlavaQwen2ForCausalLM:()=>l_,LongT5ForConditionalGeneration:()=>u_,LongT5Model:()=>c_,LongT5PreTrainedModel:()=>Ro,M2M100ForConditionalGeneration:()=>d_,M2M100Model:()=>p_,M2M100PreTrainedModel:()=>Uo,MBartForCausalLM:()=>y_,MBartForConditionalGeneration:()=>w_,MBartForSequenceClassification:()=>x_,MBartModel:()=>g_,MBartPreTrainedModel:()=>Jr,MPNetForMaskedLM:()=>ng,MPNetForQuestionAnswering:()=>ig,MPNetForSequenceClassification:()=>og,MPNetForTokenClassification:()=>ag,MPNetModel:()=>sg,MPNetPreTrainedModel:()=>Tr,MT5ForConditionalGeneration:()=>pg,MT5Model:()=>ug,MT5PreTrainedModel:()=>Yo,MarianMTModel:()=>m_,MarianModel:()=>f_,MarianPreTrainedModel:()=>Bo,MaskFormerForInstanceSegmentation:()=>__,MaskFormerModel:()=>h_,MaskFormerPreTrainedModel:()=>Do,Metric3DForDepthEstimation:()=>b_,Metric3DPreTrainedModel:()=>gl,Metric3Dv2ForDepthEstimation:()=>v_,Metric3Dv2Pre
TrainedModel:()=>wl,MgpstrForSceneTextRecognition:()=>k_,MgpstrModelOutput:()=>xl,MgpstrPreTrainedModel:()=>yl,MimiDecoderModel:()=>jo,MimiDecoderOutput:()=>vl,MimiEncoderModel:()=>Fo,MimiEncoderOutput:()=>bl,MimiModel:()=>E_,MimiPreTrainedModel:()=>Fs,MistralForCausalLM:()=>M_,MistralModel:()=>A_,MistralPreTrainedModel:()=>Go,MobileBertForMaskedLM:()=>S_,MobileBertForQuestionAnswering:()=>I_,MobileBertForSequenceClassification:()=>O_,MobileBertModel:()=>T_,MobileBertPreTrainedModel:()=>Zr,MobileLLMForCausalLM:()=>P_,MobileLLMModel:()=>C_,MobileLLMPreTrainedModel:()=>qo,MobileNetV1ForImageClassification:()=>L_,MobileNetV1ForSemanticSegmentation:()=>N_,MobileNetV1Model:()=>z_,MobileNetV1PreTrainedModel:()=>js,MobileNetV2ForImageClassification:()=>R_,MobileNetV2ForSemanticSegmentation:()=>U_,MobileNetV2Model:()=>$_,MobileNetV2PreTrainedModel:()=>Gs,MobileNetV3ForImageClassification:()=>D_,MobileNetV3ForSemanticSegmentation:()=>F_,MobileNetV3Model:()=>B_,MobileNetV3PreTrainedModel:()=>qs,MobileNetV4ForImageClassification:()=>G_,MobileNetV4ForSemanticSegmentation:()=>q_,MobileNetV4Model:()=>j_,MobileNetV4PreTrainedModel:()=>Ws,MobileViTForImageClassification:()=>V_,MobileViTModel:()=>W_,MobileViTPreTrainedModel:()=>Wo,MobileViTV2ForImageClassification:()=>X_,MobileViTV2Model:()=>H_,MobileViTV2PreTrainedModel:()=>Vo,ModernBertDecoderForCausalLM:()=>eg,ModernBertDecoderModel:()=>Z_,ModernBertDecoderPreTrainedModel:()=>Ho,ModernBertForMaskedLM:()=>Y_,ModernBertForSequenceClassification:()=>Q_,ModernBertForTokenClassification:()=>J_,ModernBertModel:()=>K_,ModernBertPreTrainedModel:()=>es,Moondream1ForConditionalGeneration:()=>i_,MoonshineForConditionalGeneration:()=>rg,MoonshineModel:()=>tg,MoonshinePreTrainedModel:()=>Xo,MptForCausalLM:()=>cg,MptModel:()=>lg,MptPreTrainedModel:()=>Ko,MultiModalityCausalLM:()=>dg,MultiModalityPreTrainedModel:()=>kl,MusicgenForCausalLM:()=>mg,MusicgenForConditionalGeneration:()=>Jo,MusicgenModel:()=>fg,MusicgenPreTrainedModel:()=>Qo,NanoChat
ForCausalLM:()=>_g,NanoChatModel:()=>hg,NanoChatPreTrainedModel:()=>Zo,NeoBertForMaskedLM:()=>wg,NeoBertForQuestionAnswering:()=>bg,NeoBertForSequenceClassification:()=>xg,NeoBertForTokenClassification:()=>yg,NeoBertModel:()=>gg,NeoBertPreTrainedModel:()=>Sr,NomicBertModel:()=>vg,NomicBertPreTrainedModel:()=>El,OPTForCausalLM:()=>Pg,OPTModel:()=>Cg,OPTPreTrainedModel:()=>na,Olmo2ForCausalLM:()=>Mg,Olmo2Model:()=>Ag,Olmo2PreTrainedModel:()=>ta,Olmo3ForCausalLM:()=>Sg,Olmo3Model:()=>Tg,Olmo3PreTrainedModel:()=>ra,OlmoForCausalLM:()=>Eg,OlmoModel:()=>kg,OlmoPreTrainedModel:()=>ea,OpenELMForCausalLM:()=>Ig,OpenELMModel:()=>Og,OpenELMPreTrainedModel:()=>sa,OwlViTForObjectDetection:()=>$g,OwlViTModel:()=>Ng,OwlViTPreTrainedModel:()=>aa,Owlv2ForObjectDetection:()=>Lg,Owlv2Model:()=>zg,Owlv2PreTrainedModel:()=>oa,PaliGemmaForConditionalGeneration:()=>Rg,PaliGemmaPreTrainedModel:()=>Al,ParakeetForCTC:()=>Ug,ParakeetPreTrainedModel:()=>Ml,PatchTSMixerForPrediction:()=>Dg,PatchTSMixerModel:()=>Bg,PatchTSMixerPreTrainedModel:()=>ia,PatchTSTForPrediction:()=>jg,PatchTSTModel:()=>Fg,PatchTSTPreTrainedModel:()=>la,Phi3ForCausalLM:()=>Vg,Phi3Model:()=>Wg,Phi3PreTrainedModel:()=>ua,Phi3VForCausalLM:()=>pa,Phi3VPreTrainedModel:()=>Tl,PhiForCausalLM:()=>qg,PhiModel:()=>Gg,PhiPreTrainedModel:()=>ca,PreTrainedModel:()=>y,PvtForImageClassification:()=>Xg,PvtModel:()=>Hg,PvtPreTrainedModel:()=>da,PyAnnoteForAudioFrameClassification:()=>Yg,PyAnnoteModel:()=>Kg,PyAnnotePreTrainedModel:()=>fa,Qwen2ForCausalLM:()=>Jg,Qwen2Model:()=>Qg,Qwen2PreTrainedModel:()=>ma,Qwen2VLForConditionalGeneration:()=>Zg,Qwen2VLPreTrainedModel:()=>Sl,Qwen3ForCausalLM:()=>tw,Qwen3Model:()=>ew,Qwen3PreTrainedModel:()=>ha,RFDetrForObjectDetection:()=>ow,RFDetrModel:()=>nw,RFDetrObjectDetectionOutput:()=>Ol,RFDetrPreTrainedModel:()=>ga,RTDetrForObjectDetection:()=>tm,RTDetrModel:()=>em,RTDetrObjectDetectionOutput:()=>tr,RTDetrPreTrainedModel:()=>Zn,RTDetrV2ForObjectDetection:()=>gw,RTDetrV2Model:()=>_w,RTDetrV2Object
DetectionOutput:()=>Il,RTDetrV2PreTrainedModel:()=>wa,ResNetForImageClassification:()=>sw,ResNetModel:()=>rw,ResNetPreTrainedModel:()=>_a,RoFormerForMaskedLM:()=>dw,RoFormerForQuestionAnswering:()=>hw,RoFormerForSequenceClassification:()=>fw,RoFormerForTokenClassification:()=>mw,RoFormerModel:()=>pw,RoFormerPreTrainedModel:()=>Ir,RobertaForMaskedLM:()=>iw,RobertaForQuestionAnswering:()=>uw,RobertaForSequenceClassification:()=>lw,RobertaForTokenClassification:()=>cw,RobertaModel:()=>aw,RobertaPreTrainedModel:()=>Or,Sam2ImageSegmentationOutput:()=>zl,Sam2Model:()=>xa,Sam2PreTrainedModel:()=>Ll,Sam3TrackerModel:()=>yw,SamImageSegmentationOutput:()=>Cl,SamModel:()=>ww,SamPreTrainedModel:()=>Pl,SapiensForDepthEstimation:()=>vw,SapiensForNormalEstimation:()=>kw,SapiensForSemanticSegmentation:()=>bw,SapiensPreTrainedModel:()=>Vs,SegformerForImageClassification:()=>Aw,SegformerForSemanticSegmentation:()=>Mw,SegformerModel:()=>Ew,SegformerPreTrainedModel:()=>Hs,SiglipModel:()=>Tw,SiglipPreTrainedModel:()=>ya,SiglipTextModel:()=>ba,SiglipVisionModel:()=>Sw,SmolLM3ForCausalLM:()=>Iw,SmolLM3Model:()=>Ow,SmolLM3PreTrainedModel:()=>va,SmolVLMForConditionalGeneration:()=>Hh,SnacDecoderModel:()=>Ea,SnacEncoderModel:()=>ka,SnacModel:()=>Cw,SnacPreTrainedModel:()=>Xs,SpeechT5ForSpeechToText:()=>zw,SpeechT5ForTextToSpeech:()=>Lw,SpeechT5HifiGan:()=>Nw,SpeechT5Model:()=>Pw,SpeechT5PreTrainedModel:()=>Ks,SqueezeBertForMaskedLM:()=>Rw,SqueezeBertForQuestionAnswering:()=>Bw,SqueezeBertForSequenceClassification:()=>Uw,SqueezeBertModel:()=>$w,SqueezeBertPreTrainedModel:()=>ts,StableLmForCausalLM:()=>Fw,StableLmModel:()=>Dw,StableLmPreTrainedModel:()=>Aa,Starcoder2ForCausalLM:()=>Gw,Starcoder2Model:()=>jw,Starcoder2PreTrainedModel:()=>Ma,StyleTextToSpeech2Model:()=>qw,StyleTextToSpeech2PreTrainedModel:()=>Nl,SupertonicForConditionalGeneration:()=>Ta,SupertonicPreTrainedModel:()=>$l,Swin2SRForImageSuperResolution:()=>Kw,Swin2SRModel:()=>Xw,Swin2SRPreTrainedModel:()=>Sa,SwinForImageClassificat
ion:()=>Vw,SwinForSemanticSegmentation:()=>Hw,SwinModel:()=>Ww,SwinPreTrainedModel:()=>Ys,T5ForConditionalGeneration:()=>Qw,T5Model:()=>Yw,T5PreTrainedModel:()=>Oa,TableTransformerForObjectDetection:()=>Zw,TableTransformerModel:()=>Jw,TableTransformerObjectDetectionOutput:()=>Rl,TableTransformerPreTrainedModel:()=>Ia,TrOCRForCausalLM:()=>ex,TrOCRPreTrainedModel:()=>Ul,UltravoxModel:()=>Dl,UltravoxPreTrainedModel:()=>Bl,UniSpeechForCTC:()=>sx,UniSpeechForSequenceClassification:()=>nx,UniSpeechModel:()=>rx,UniSpeechPreTrainedModel:()=>Qs,UniSpeechSatForAudioFrameClassification:()=>lx,UniSpeechSatForCTC:()=>ax,UniSpeechSatForSequenceClassification:()=>ix,UniSpeechSatModel:()=>ox,UniSpeechSatPreTrainedModel:()=>rs,VaultGemmaForCausalLM:()=>ux,VaultGemmaModel:()=>cx,VaultGemmaPreTrainedModel:()=>Ca,ViTForImageClassification:()=>fx,ViTMAEModel:()=>mx,ViTMAEPreTrainedModel:()=>Fl,ViTMSNForImageClassification:()=>_x,ViTMSNModel:()=>hx,ViTMSNPreTrainedModel:()=>za,ViTModel:()=>dx,ViTPreTrainedModel:()=>Pa,VisionEncoderDecoderModel:()=>px,VitMatteForImageMatting:()=>gx,VitMattePreTrainedModel:()=>jl,VitPoseForPoseEstimation:()=>wx,VitPosePreTrainedModel:()=>Gl,VitsModel:()=>xx,VitsModelOutput:()=>ql,VitsPreTrainedModel:()=>Wl,VoxtralForConditionalGeneration:()=>tx,Wav2Vec2BertForCTC:()=>bx,Wav2Vec2BertForSequenceClassification:()=>vx,Wav2Vec2BertModel:()=>yx,Wav2Vec2BertPreTrainedModel:()=>Js,Wav2Vec2ForAudioFrameClassification:()=>Dh,Wav2Vec2ForCTC:()=>Uh,Wav2Vec2ForSequenceClassification:()=>Bh,Wav2Vec2Model:()=>Rh,Wav2Vec2PreTrainedModel:()=>Wt,WavLMForAudioFrameClassification:()=>Tx,WavLMForCTC:()=>Ex,WavLMForSequenceClassification:()=>Ax,WavLMForXVector:()=>Mx,WavLMModel:()=>kx,WavLMPreTrainedModel:()=>Cr,WeSpeakerResNetModel:()=>Sx,WeSpeakerResNetPreTrainedModel:()=>Hl,WhisperForConditionalGeneration:()=>Xl,WhisperModel:()=>Ix,WhisperPreTrainedModel:()=>La,XLMForQuestionAnswering:()=>$x,XLMForSequenceClassification:()=>Lx,XLMForTokenClassification:()=>Nx,XLMModel:()=>Px
,XLMPreTrainedModel:()=>Pr,XLMRobertaForMaskedLM:()=>Ux,XLMRobertaForQuestionAnswering:()=>Fx,XLMRobertaForSequenceClassification:()=>Bx,XLMRobertaForTokenClassification:()=>Dx,XLMRobertaModel:()=>Rx,XLMRobertaPreTrainedModel:()=>zr,XLMWithLMHeadModel:()=>zx,XVectorOutput:()=>Vl,YolosForObjectDetection:()=>Gx,YolosModel:()=>jx,YolosObjectDetectionOutput:()=>Kl,YolosPreTrainedModel:()=>Na,YoutuForCausalLM:()=>Wx,YoutuModel:()=>qx,YoutuPreTrainedModel:()=>$a});var Yr=class extends y{},tf=class extends Yr{},rf=class extends Yr{async _call(e){return new F(await super._call(e))}},sf=class extends Yr{async _call(e){return new Ae(await super._call(e))}},nf=class extends Yr{async _call(e){return new we(await super._call(e))}};var Rn=class extends y{},of=class extends Rn{},af=class extends Rn{};var Un=class extends y{},lf=class extends Un{},cf=class extends Un{};var Bn=class extends y{},uf=class extends Bn{},pf=class extends Bn{};var Ls=class extends y{},df=class extends Ls{},ff=class extends Ls{},mf=class extends Ls{async _call(e){return new F(await super._call(e))}};var Dn=class extends y{},hf=class extends Dn{},_f=class extends Dn{async _call(e){return new F(await super._call(e))}};var yr=class extends y{},gf=class extends yr{},wf=class extends yr{async _call(e){return new we(await super._call(e))}},xf=class extends yr{async _call(e){return new F(await super._call(e))}},yf=class extends yr{async _call(e){return new _e(await super._call(e))}},bf=class extends yr{async _call(e){return new Ae(await super._call(e))}};var Fn=class extends y{},vf=class extends Fn{},kf=class extends Fn{};var jn=class extends y{},Ef=class extends jn{},Af=class extends jn{};var Gn=class extends y{},Mf=class extends Gn{},Tf=class extends Gn{};var br=class extends y{},Sf=class extends br{},Of=class extends br{async _call(e){return new we(await super._call(e))}},If=class extends br{async _call(e){return new F(await super._call(e))}},Cf=class extends br{async _call(e){return new _e(await 
super._call(e))}},Pf=class extends br{async _call(e){return new Ae(await super._call(e))}};var ez=4299n,EA=6561n,Ji=class extends y{forward_params=["input_ids","inputs_embeds","attention_mask","position_ids","audio_values","exaggeration","audio_features","audio_tokens","speaker_embeddings","speaker_features","past_key_values"];main_input_name="input_ids";_return_dict_in_generate_keys=["audio_tokens","speaker_embeddings","speaker_features"]},qn=class extends Ji{async encode_speech(e){return ce(this.sessions.speech_encoder,{audio_values:e})}async forward({input_ids:e=null,attention_mask:r=null,audio_values:s=null,exaggeration:n=null,position_ids:o=null,inputs_embeds:a=null,past_key_values:i=null,generation_config:l=null,logits_processor:u=null,audio_features:d=null,audio_tokens:f=null,speaker_embeddings:m=null,speaker_features:_=null,...w}){let x;if(!a){let E=this.sessions.embed_tokens.inputNames,M={input_ids:e};if(E.includes("exaggeration")){if(!(n instanceof U)){let I=e.dims[0];if(n==null)n=Ge([I],.5);else if(typeof n=="number")n=Ge([I],n);else if(Array.isArray(n))n=new U("float32",n,[I]);else throw new Error("Unsupported type for `exaggeration` input")}M.exaggeration=n}if(E.includes("position_ids")&&(M.position_ids=o),{inputs_embeds:a}=await ce(this.sessions.embed_tokens,M),d&&f&&m&&_&&(x={audio_features:d,audio_tokens:f,speaker_embeddings:m,speaker_features:_}),x||s)x??=await this.encode_speech(s),a=Ee([x.audio_features,a],1),r=rt([a.dims[0],a.dims[1]]);else{let I=a.dims[1];if(!i||I!==1)throw new Error("Incorrect state encountered during generation.");let T=Object.values(i)[0].dims.at(-2);r=rt([a.dims[0],T+I])}}return{...await Tt(this,{inputs_embeds:a,past_key_values:i,attention_mask:r,generation_config:l,logits_processor:u},!1),...x}}prepare_inputs_for_generation(e,r,s){if(!r.position_ids&&this.sessions.embed_tokens.inputNames.includes("position_ids"))if(r.input_ids.dims[1]===1){let 
n=Array.from({length:e.length},(o,a)=>e[a].length-e[a].findLastIndex(i=>i==EA)-1);r.position_ids=new U("int64",n,[e.length,1])}else{let o=r.input_ids.tolist().map(a=>{let i=0;return a.map(l=>l>=EA?0:i++)});r.position_ids=new U("int64",o.flat(),r.input_ids.dims)}return r.input_ids.dims[1]===1&&(delete r.audio_values,delete r.audio_features,delete r.audio_tokens,delete r.speaker_embeddings,delete r.speaker_features),Yi(this,e,r,s)}async generate(e){let{sequences:r,audio_tokens:s,speaker_embeddings:n,speaker_features:o}=await super.generate({...e,return_dict_in_generate:!0}),a=r.slice(null,[e.input_ids.dims[1],-1]),i=Ge([a.dims[0],3],ez),l=Ee([s,a,i],1),{waveform:u}=await ce(this.sessions.conditional_decoder,{speech_tokens:l,speaker_features:o,speaker_embeddings:n});return u}};var Zi=class extends y{},zf=class extends Zi{};var Ns=class extends y{},Lf=class extends Ns{},Wn=class extends Ns{static async from_pretrained(e,r={}){return super.from_pretrained(e,{...r,model_file_name:r.model_file_name??"text_model"})}},Vn=class extends Ns{static async from_pretrained(e,r={}){return super.from_pretrained(e,{...r,model_file_name:r.model_file_name??"audio_model"})}};var er=class extends y{},Nf=class extends er{},$f=class extends er{static async from_pretrained(e,r={}){return super.from_pretrained(e,{...r,model_file_name:r.model_file_name??"text_model"})}},Hn=class extends er{static async from_pretrained(e,r={}){return super.from_pretrained(e,{...r,model_file_name:r.model_file_name??"text_model"})}},Rf=class extends er{static async from_pretrained(e,r={}){return super.from_pretrained(e,{...r,model_file_name:r.model_file_name??"vision_model"})}},Uf=class extends er{static async from_pretrained(e,r={}){return super.from_pretrained(e,{...r,model_file_name:r.model_file_name??"vision_model"})}};var Xn=class extends y{},Bf=class extends Xn{},Df=class extends Xn{};var Kn=class extends y{},Ff=class extends Kn{},jf=class extends Kn{};var Yn=class extends y{},Gf=class extends 
Yn{},qf=class extends Yn{};var vr=class extends y{},Wf=class extends vr{},Vf=class extends vr{async _call(e){return new we(await super._call(e))}},Hf=class extends vr{async _call(e){return new F(await super._call(e))}},Xf=class extends vr{async _call(e){return new _e(await super._call(e))}},Kf=class extends vr{async _call(e){return new Ae(await super._call(e))}};var Qn=class extends y{},Yf=class extends Qn{},Qf=class extends Qn{async _call(e){return new F(await super._call(e))}};var Jn=class extends y{},Jf=class extends Jn{},Zf=class extends Jn{async _call(e){return new F(await super._call(e))}};var Zn=class extends y{},em=class extends Zn{},tm=class extends Zn{async _call(e){return new tr(await super._call(e))}},tr=class extends Ne{constructor({logits:e,pred_boxes:r}){super(),this.logits=e,this.pred_boxes=r}};var eo=class extends y{},rm=class extends eo{},sm=class extends eo{async _call(e){return new tr(await super._call(e))}};var el=class extends Ne{constructor({audio_codes:e}){super(),this.audio_codes=e}},tl=class extends Ne{constructor({audio_values:e}){super(),this.audio_values=e}},$s=class extends y{main_input_name="input_values";forward_params=["input_values"]},nm=class extends $s{async encode(e){return new el(await ce(this.sessions.encoder_model,e))}async decode(e){return new tl(await ce(this.sessions.decoder_model,e))}},to=class extends $s{static async from_pretrained(e,r={}){return super.from_pretrained(e,{...r,model_file_name:r.model_file_name??"encoder_model"})}},ro=class extends $s{static async from_pretrained(e,r={}){return super.from_pretrained(e,{...r,model_file_name:r.model_file_name??"decoder_model"})}};var kr=class extends y{},om=class extends kr{},am=class extends kr{async _call(e){return new we(await super._call(e))}},im=class extends kr{async _call(e){return new F(await super._call(e))}},lm=class extends kr{async _call(e){return new _e(await super._call(e))}},cm=class extends kr{async _call(e){return new Ae(await super._call(e))}};var Er=class 
extends y{},um=class extends Er{},pm=class extends Er{async _call(e){return new we(await super._call(e))}},dm=class extends Er{async _call(e){return new F(await super._call(e))}},fm=class extends Er{async _call(e){return new _e(await super._call(e))}},mm=class extends Er{async _call(e){return new Ae(await super._call(e))}};var rl=class extends y{},hm=class extends rl{};var so=class extends y{},_m=class extends so{},gm=class extends so{async _call(e){return new F(await super._call(e))}};var sl=class extends y{},wm=class extends sl{};var nl=class extends y{},xm=class extends nl{};var Rs=class extends y{},ym=class extends Rs{},bm=class extends Rs{async _call(e){return new Us(await super._call(e))}},vm=class extends Rs{async _call(e){return new ol(await super._call(e))}},Us=class extends Ne{constructor({logits:e,pred_boxes:r}){super(),this.logits=e,this.pred_boxes=r}},ol=class extends Ne{constructor({logits:e,pred_boxes:r,pred_masks:s}){super(),this.logits=e,this.pred_boxes=r,this.pred_masks=s}};var no=class extends y{},km=class extends no{},Em=class extends no{async _call(e){return new F(await super._call(e))}};var oo=class extends y{},Am=class extends oo{},Mm=class extends oo{async _call(e){return new F(await super._call(e))}};var al=class extends y{},Tm=class extends al{};var il=class extends y{},Sm=class extends il{};var Ar=class extends y{},Om=class extends Ar{},Im=class extends Ar{async _call(e){return new F(await super._call(e))}},Cm=class extends Ar{async _call(e){return new _e(await super._call(e))}},Pm=class extends Ar{async _call(e){return new Ae(await super._call(e))}},zm=class extends Ar{async _call(e){return new we(await super._call(e))}};var ll=class extends y{},Lm=class extends ll{};var ao=class extends y{},Nm=class extends ao{},$m=class extends ao{};var io=class extends y{},Rm=class extends io{},Um=class extends io{async _call(e){return new F(await super._call(e))}};var Mr=class extends y{},Bm=class extends Mr{},Dm=class extends Mr{async 
_call(e){return new we(await super._call(e))}},Fm=class extends Mr{async _call(e){return new F(await super._call(e))}},jm=class extends Mr{async _call(e){return new _e(await super._call(e))}},Gm=class extends Mr{async _call(e){return new Ae(await super._call(e))}};var lo=class extends y{},qm=class extends lo{},Wm=class extends lo{};var Qr=class extends y{},Vm=class extends Qr{},Hm=class extends Qr{async _call(e){return new we(await super._call(e))}},Xm=class extends Qr{async _call(e){return new F(await super._call(e))}},Km=class extends Qr{async _call(e){return new _e(await super._call(e))}};var co=class extends y{},Ym=class extends co{},Qm=class extends co{};var uo=class extends y{},Jm=class extends uo{},Zm=class extends uo{};var po=class extends y{},eh=class extends po{},th=class extends po{};var fo=class extends y{},rh=class extends fo{},sh=class extends fo{async _call(e){return new F(await super._call(e))}};var cl=class extends y{forward_params=["input_ids","inputs_embeds","attention_mask","pixel_values","encoder_outputs","decoder_input_ids","decoder_inputs_embeds","decoder_attention_mask","past_key_values"];main_input_name="inputs_embeds"},nh=class extends cl{_merge_input_ids_with_image_features({inputs_embeds:e,image_features:r,input_ids:s,attention_mask:n}){return{inputs_embeds:Ee([r,e],1),attention_mask:Ee([rt(r.dims.slice(0,2)),n],1)}}async _prepare_inputs_embeds({input_ids:e,pixel_values:r,inputs_embeds:s,attention_mask:n}){if(!e&&!r)throw new Error("Either `input_ids` or `pixel_values` should be provided.");let o,a;return e&&(o=await this.encode_text({input_ids:e})),r&&(a=await this.encode_image({pixel_values:r})),o&&a?{inputs_embeds:s,attention_mask:n}=this._merge_input_ids_with_image_features({inputs_embeds:o,image_features:a,input_ids:e,attention_mask:n}):s=o||a,{inputs_embeds:s,attention_mask:n}}async 
forward({input_ids:e,pixel_values:r,attention_mask:s,decoder_input_ids:n,decoder_attention_mask:o,encoder_outputs:a,past_key_values:i,inputs_embeds:l,decoder_inputs_embeds:u}){if(l||({inputs_embeds:l,attention_mask:s}=await this._prepare_inputs_embeds({input_ids:e,pixel_values:r,inputs_embeds:l,attention_mask:s})),!a){let{last_hidden_state:f}=await qt(this,{inputs_embeds:l,attention_mask:s});a=f}if(!u){if(!n)throw new Error("Either `decoder_input_ids` or `decoder_inputs_embeds` should be provided.");u=await this.encode_text({input_ids:n})}return await Tt(this,{inputs_embeds:u,attention_mask:o,encoder_attention_mask:s,encoder_hidden_states:a,past_key_values:i},!0)}};var mo=class extends y{},oh=class extends mo{},ah=class extends mo{};var ho=class extends y{},ih=class extends ho{},lh=class extends ho{};var _o=class extends y{},ch=class extends _o{},uh=class extends _o{};var ul=class extends y{forward_params=["input_ids","attention_mask","inputs_embeds","per_layer_inputs","position_ids","pixel_values","input_features","input_features_mask","past_key_values"]},go=class extends ul{async forward({input_ids:e=null,attention_mask:r=null,pixel_values:s=null,input_features:n=null,input_features_mask:o=null,position_ids:a=null,inputs_embeds:i=null,per_layer_inputs:l=null,past_key_values:u=null,generation_config:d=null,logits_processor:f=null,...m}){if((!i||!l)&&({inputs_embeds:i,per_layer_inputs:l}=await ce(this.sessions.embed_tokens,{input_ids:e}),e.dims[1]!==1)){if(s){let{image_features:w}=await ce(this.sessions.vision_encoder,{pixel_values:s});({inputs_embeds:i,attention_mask:r}=this._merge_input_ids_with_image_features({image_features:w,inputs_embeds:i,input_ids:e,attention_mask:r}))}if(n){let{audio_features:w}=await ce(this.sessions.audio_encoder,{input_features:n,input_features_mask:o});({inputs_embeds:i,attention_mask:r}=this._merge_input_ids_with_audio_features({audio_features:w,inputs_embeds:i,input_ids:e,attention_mask:r}))}}return await 
Tt(this,{inputs_embeds:i,per_layer_inputs:l,past_key_values:u,attention_mask:r,position_ids:a,generation_config:d,logits_processor:f},!0)}_merge_input_ids_with_image_features(e){let r=e.image_features.dims.at(-1),s=e.image_features.view(-1,r);return ur({image_token_id:this.config.image_token_id,...e,image_features:s})}_merge_input_ids_with_audio_features(e){let r=e.audio_features.dims.at(-1),s=e.audio_features.view(-1,r);return ef({audio_token_id:this.config.audio_token_id,...e,audio_features:s})}};var wo=class extends y{},ph=class extends wo{},dh=class extends wo{};var xo=class extends y{},fh=class extends xo{},mh=class extends xo{};var yo=class extends y{},hh=class extends yo{},_h=class extends yo{};var bo=class extends y{},gh=class extends bo{},wh=class extends bo{};var vo=class extends y{},xh=class extends vo{},yh=class extends vo{};var ko=class extends y{},bh=class extends ko{},vh=class extends ko{};var Eo=class extends y{},kh=class extends Eo{},Eh=class extends Eo{};var Ao=class extends y{},Ah=class extends Ao{},Mh=class extends Ao{};var Mo=class extends y{},Th=class extends Mo{},Sh=class extends Mo{};var To=class extends y{},Oh=class extends To{},Ih=class extends To{};var pl=class extends y{},Ch=class extends pl{};var dl=class extends y{},Ph=class extends dl{};var So=class extends y{},zh=class extends So{},Lh=class extends So{};var Oo=class extends y{},Nh=class extends Oo{},$h=class extends Oo{async _call(e){return new F(await super._call(e))}};var Wt=class extends y{},Rh=class extends Wt{},Uh=class extends Wt{async _call(e){return new gt(await super._call(e))}},Bh=class extends Wt{async _call(e){return new F(await super._call(e))}},Dh=class extends Wt{async _call(e){return new _e(await super._call(e))}};var Fh=class extends y{},jh=class extends Wt{},Gh=class extends Wt{async _call(e){return new gt(await super._call(e))}},qh=class extends Wt{async _call(e){return new F(await super._call(e))}};var Io=class extends y{},Wh=class extends Io{},Vh=class extends 
Io{};var fl=class extends y{forward_params=["input_ids","attention_mask","pixel_values","pixel_attention_mask","position_ids","past_key_values"]},ml=class extends fl{async encode_image({pixel_values:e,pixel_attention_mask:r}){return(await ce(this.sessions.vision_encoder,{pixel_values:e,pixel_attention_mask:r})).image_features}_merge_input_ids_with_image_features(e){let r=e.image_features.dims.at(-1),s=e.image_features.view(-1,r);return ur({image_token_id:this.config.image_token_id,...e,image_features:s})}},Hh=class extends ml{};var Co=class extends y{},Xh=class extends Co{},Kh=class extends Co{async _call(e){return new F(await super._call(e))}};var Po=class extends y{},Yh=class extends Po{},Qh=class extends Po{};var Bs=class extends y{},Jh=class extends Bs{async forward(e){let r=!e.input_ids,s=!e.pixel_values;if(r&&s)throw new Error("Either `input_ids` or `pixel_values` should be provided.");if(r&&(e.input_ids=rt([e.pixel_values.dims[0],1])),s){let{image_size:u}=this.config.vision_config;e.pixel_values=Ge([0,3,u,u],0)}let{text_embeddings:n,image_embeddings:o,l2norm_text_embeddings:a,l2norm_image_embeddings:i}=await super.forward(e),l={};return r||(l.text_embeddings=n,l.l2norm_text_embeddings=a),s||(l.image_embeddings=o,l.l2norm_image_embeddings=i),l}},zo=class extends Bs{static async from_pretrained(e,r={}){return super.from_pretrained(e,{...r,model_file_name:r.model_file_name??"text_model"})}},Zh=class extends Bs{static async from_pretrained(e,r={}){return super.from_pretrained(e,{...r,model_file_name:r.model_file_name??"vision_model"})}};var Lo=class extends y{},e_=class extends Lo{},t_=class extends Lo{};var No=class extends y{},r_=class extends No{},s_=class extends No{};var $o=class extends y{},n_=class extends $o{},o_=class extends $o{};var hl=class extends y{},a_=class extends hl{};var _l=class extends y{forward_params=["input_ids","attention_mask","pixel_values","position_ids","past_key_values"]},Ds=class extends 
_l{_merge_input_ids_with_image_features(e){let r=e.image_features.dims.at(-1),s=e.image_features.view(-1,r);return ur({image_token_id:this.config.image_token_index,...e,image_features:s})}},i_=class extends Ds{},l_=class extends Ds{};var Ro=class extends y{},c_=class extends Ro{},u_=class extends Ro{};var Uo=class extends y{},p_=class extends Uo{},d_=class extends Uo{};var Bo=class extends y{},f_=class extends Bo{},m_=class extends Bo{};var Do=class extends y{},h_=class extends Do{},__=class extends Do{};var Jr=class extends y{},g_=class extends Jr{},w_=class extends Jr{},x_=class extends Jr{async _call(e){return new F(await super._call(e))}},y_=class extends Jr{};var gl=class extends y{},b_=class extends gl{};var wl=class extends y{},v_=class extends wl{};var xl=class extends Ne{constructor({char_logits:e,bpe_logits:r,wp_logits:s}){super(),this.char_logits=e,this.bpe_logits=r,this.wp_logits=s}get logits(){return[this.char_logits,this.bpe_logits,this.wp_logits]}},yl=class extends y{},k_=class extends yl{async _call(e){return new xl(await super._call(e))}};var bl=class extends Ne{constructor({audio_codes:e}){super(),this.audio_codes=e}},vl=class extends Ne{constructor({audio_values:e}){super(),this.audio_values=e}},Fs=class extends y{main_input_name="input_values";forward_params=["input_values"]},E_=class extends Fs{async encode(e){return new bl(await ce(this.sessions.encoder_model,e))}async decode(e){return new vl(await ce(this.sessions.decoder_model,e))}},Fo=class extends Fs{static async from_pretrained(e,r={}){return super.from_pretrained(e,{...r,model_file_name:r.model_file_name??"encoder_model"})}},jo=class extends Fs{static async from_pretrained(e,r={}){return super.from_pretrained(e,{...r,model_file_name:r.model_file_name??"decoder_model"})}};var Go=class extends y{},A_=class extends Go{},M_=class extends Go{};var Zr=class extends y{},T_=class extends Zr{},S_=class extends Zr{async _call(e){return new we(await super._call(e))}},O_=class extends Zr{async 
_call(e){return new F(await super._call(e))}},I_=class extends Zr{async _call(e){return new Ae(await super._call(e))}};var qo=class extends y{},C_=class extends qo{},P_=class extends qo{};var js=class extends y{},z_=class extends js{},L_=class extends js{async _call(e){return new F(await super._call(e))}},N_=class extends js{};var Gs=class extends y{},$_=class extends Gs{},R_=class extends Gs{async _call(e){return new F(await super._call(e))}},U_=class extends Gs{};var qs=class extends y{},B_=class extends qs{},D_=class extends qs{async _call(e){return new F(await super._call(e))}},F_=class extends qs{};var Ws=class extends y{},j_=class extends Ws{},G_=class extends Ws{async _call(e){return new F(await super._call(e))}},q_=class extends Ws{};var Wo=class extends y{},W_=class extends Wo{},V_=class extends Wo{async _call(e){return new F(await super._call(e))}};var Vo=class extends y{},H_=class extends Vo{},X_=class extends Vo{async _call(e){return new F(await super._call(e))}};var es=class extends y{},K_=class extends es{},Y_=class extends es{async _call(e){return new we(await super._call(e))}},Q_=class extends es{async _call(e){return new F(await super._call(e))}},J_=class extends es{async _call(e){return new _e(await super._call(e))}};var Ho=class extends y{},Z_=class extends Ho{},eg=class extends Ho{};var Xo=class extends y{requires_attention_mask=!1;main_input_name="input_values";forward_params=["input_values","decoder_input_ids","past_key_values"]},tg=class extends Xo{},rg=class extends Xo{};var Tr=class extends y{},sg=class extends Tr{},ng=class extends Tr{async _call(e){return new we(await super._call(e))}},og=class extends Tr{async _call(e){return new F(await super._call(e))}},ag=class extends Tr{async _call(e){return new _e(await super._call(e))}},ig=class extends Tr{async _call(e){return new Ae(await super._call(e))}};var Ko=class extends y{},lg=class extends Ko{},cg=class extends Ko{};var Yo=class extends y{},ug=class extends Yo{},pg=class extends Yo{};var 
kl=class extends y{},dg=class extends kl{forward_params=["input_ids","pixel_values","images_seq_mask","images_emb_mask","attention_mask","position_ids","past_key_values"];constructor(...e){super(...e),this._generation_mode="text"}async forward(e){let r=this._generation_mode??"text",s;if(r==="text"||!e.past_key_values){let l=this.sessions.prepare_inputs_embeds,u=at(e,l.inputNames);s=await ce(l,u)}else{let l=this.sessions.gen_img_embeds,u=at({image_ids:e.input_ids},l.inputNames);s=await ce(l,u)}let n={...e,...s},o=await Tt(this,n),a=this.sessions[r==="text"?"lm_head":"gen_head"];if(!a)throw new Error(`Unable to find "${a}" generation head`);let i=await ce(a,at(o,a.inputNames));return{...s,...o,...i}}prepare_inputs_for_generation(e,r,s){let n=!!r.past_key_values;return s.guidance_scale!==null&&s.guidance_scale>1&&(n?r.input_ids=Ee([r.input_ids,r.input_ids],0):(r.input_ids=Ee([r.input_ids,yn(r.input_ids,BigInt(s.pad_token_id))],0),r.attention_mask=Ee([r.attention_mask,yn(r.attention_mask,0n)],0))),(n||!r.pixel_values)&&(r.pixel_values=Ge([0,0,3,384,384],1)),n&&(r.images_seq_mask=new U("bool",new Array(1).fill(!0).fill(!1,0,1),[1,1]),r.images_emb_mask=new U("bool",new Array(0).fill(!1),[1,1,0])),r}async generate(e){return this._generation_mode="text",super.generate(e)}async generate_images(e){this._generation_mode="image";let r=(e.inputs??e[this.main_input_name]).dims[1],n=(await super.generate(e)).slice(null,[r,null]),o=this.sessions.image_decode,{decoded_image:a}=await ce(o,{generated_tokens:n}),i=a.add_(1).mul_(255/2).clamp_(0,255).to("uint8"),l=[];for(let u of i){let d=Xe.fromTensor(u);l.push(d)}return l}};var Qo=class extends y{},fg=class extends Qo{},mg=class extends Qo{},Jo=class extends y{forward_params=["input_ids","attention_mask","encoder_outputs","decoder_input_ids","decoder_attention_mask","past_key_values"];_apply_and_filter_by_delay_pattern_mask(e){let[r,s]=e.dims,n=this.config.decoder.num_codebooks,o=s-n,a=0;for(let 
u=0;u<e.size;++u){if(e.data[u]==this.config.decoder.pad_token_id)continue;let d=u%s,f=Math.floor(u/s)%n,m=d-f;m>0&&m<=o&&(e.data[a++]=e.data[u])}let i=Math.floor(r/n),l=a/(i*n);return new U(e.type,e.data.slice(0,a),[i,n,l])}prepare_inputs_for_generation(e,r,s){let n=BigInt(this.config.decoder.pad_token_id),o=structuredClone(e);for(let a=0;a<o.length;++a)for(let i=0;i<o[a].length;++i)a%this.config.decoder.num_codebooks>=i&&(o[a][i]=n);return s.guidance_scale!==null&&s.guidance_scale>1&&(o=o.concat(o)),Qi(this,o,r,s)}async generate(e){let r=await super.generate(e),s=this._apply_and_filter_by_delay_pattern_mask(r).unsqueeze_(0),{audio_values:n}=await ce(this.sessions.encodec_decode,{audio_codes:s});return n}};var Zo=class extends y{},hg=class extends Zo{},_g=class extends Zo{};var Sr=class extends y{},gg=class extends Sr{},wg=class extends Sr{async _call(e){return new we(await super._call(e))}},xg=class extends Sr{async _call(e){return new F(await super._call(e))}},yg=class extends Sr{async _call(e){return new _e(await super._call(e))}},bg=class extends Sr{async _call(e){return new Ae(await super._call(e))}};var El=class extends y{},vg=class extends El{};var ea=class extends y{},kg=class extends ea{},Eg=class extends ea{};var ta=class extends y{},Ag=class extends ta{},Mg=class extends ta{};var ra=class extends y{},Tg=class extends ra{},Sg=class extends ra{};var sa=class extends y{},Og=class extends sa{},Ig=class extends sa{};var na=class extends y{},Cg=class extends na{},Pg=class extends na{};var oa=class extends y{},zg=class extends oa{},Lg=class extends oa{};var aa=class extends y{},Ng=class extends aa{},$g=class extends aa{};var Al=class extends y{forward_params=["input_ids","attention_mask","pixel_values","position_ids","past_key_values"]},Rg=class extends Al{_merge_input_ids_with_image_features(e){let r=e.image_features.dims.at(-1),s=e.image_features.view(-1,r);return ur({image_token_id:this.config.image_token_index,...e,image_features:s})}};var Ml=class extends 
y{},Ug=class extends Ml{async _call(e){return new gt(await super._call(e))}};var ia=class extends y{},Bg=class extends ia{},Dg=class extends ia{};var la=class extends y{},Fg=class extends la{},jg=class extends la{};var ca=class extends y{},Gg=class extends ca{},qg=class extends ca{};var ua=class extends y{},Wg=class extends ua{},Vg=class extends ua{};var Tl=class extends y{forward_params=["input_ids","inputs_embeds","attention_mask","position_ids","pixel_values","image_sizes","past_key_values"]},pa=class extends Tl{async forward({input_ids:e=null,attention_mask:r=null,pixel_values:s=null,image_sizes:n=null,position_ids:o=null,inputs_embeds:a=null,past_key_values:i=null,generation_config:l=null,logits_processor:u=null,...d}){if(!a){let m;if(s&&e.dims[1]!==1){if(!n)throw new Error("`image_sizes` must be provided when `pixel_values` is provided.");({image_features:m}=await ce(this.sessions.vision_encoder,{pixel_values:s,image_sizes:n}))}else{let _=this.config.normalized_config.hidden_size;m=new U("float32",[],[0,_])}({inputs_embeds:a}=await ce(this.sessions.prepare_inputs_embeds,{input_ids:e,image_features:m}))}return await Tt(this,{inputs_embeds:a,past_key_values:i,attention_mask:r,position_ids:o,generation_config:l,logits_processor:u},!1)}};var da=class extends y{},Hg=class extends da{},Xg=class extends da{async _call(e){return new F(await super._call(e))}};var fa=class extends y{},Kg=class extends fa{},Yg=class extends fa{async _call(e){return new _e(await super._call(e))}};var ma=class extends y{},Qg=class extends ma{},Jg=class extends ma{};var Sl=class extends y{forward_params=["input_ids","attention_mask","position_ids","past_key_values","pixel_values","image_grid_thw"]},Zg=class extends Sl{get_rope_index(e,r,s,n){let{vision_config:o,image_token_id:a,video_token_id:i,vision_start_token_id:l}=this.config,u=o.spatial_merge_size??2,d=[];if(r||s){let f=e.tolist();n||(n=mi(e));let 
m=n.tolist(),_=Array.from({length:3},M=>Array.from({length:e.dims[0]},I=>Array.from({length:e.dims[1]},T=>1))),w=r?r.tolist():[],x=s?s.tolist():[],k=0,E=0;for(let M=0;M<f.length;++M){let I=f[M].filter((S,L)=>m[M][L]==1),z=I.reduce((S,L,R)=>(L==l&&S.push(R),S),[]).map(S=>I[S+1]),C=z.filter(S=>S==a).length,v=z.filter(S=>S==i).length,G=[],X=0,V=C,Q=v;for(let S=0;S<z.length;++S){let L=I.findIndex((Et,tt)=>tt>X&&Et==a),R=I.findIndex((Et,tt)=>tt>X&&Et==i),te=V>0&&L!==-1?L:I.length+1,ue=Q>0&&R!==-1?R:I.length+1,Be,Pe,vt,Qe;te<ue?([Pe,vt,Qe]=w[k],++k,--V,Be=te):([Pe,vt,Qe]=x[E],++E,--Q,Be=ue);let[et,st,Me]=[Number(Pe),Math.floor(Number(vt)/u),Math.floor(Number(Qe)/u)],xe=Be-X,qe=G.length>0?Te(G.at(-1))[0]+1:0;G.push(Array.from({length:3*xe},(Et,tt)=>qe+tt%xe));let kt=xe+qe,ge=et*st*Me,$e=Array.from({length:ge},(Et,tt)=>kt+Math.floor(tt/(st*Me))),Nr=Array.from({length:ge},(Et,tt)=>kt+Math.floor(tt/Me)%st),ns=Array.from({length:ge},(Et,tt)=>kt+tt%Me);G.push([$e,Nr,ns].flat()),X=Be+ge}if(X<I.length){let S=G.length>0?Te(G.at(-1))[0]+1:0,L=I.length-X;G.push(Array.from({length:3*L},(R,te)=>S+te%L))}let K=G.reduce((S,L)=>S+L.length,0),Y=new Array(K),B=0;for(let S=0;S<3;++S)for(let L=0;L<G.length;++L){let R=G[L],te=R.length/3;for(let ue=S*te;ue<(S+1)*te;++ue)Y[B++]=R[ue]}let P=0,se=m[M];for(let S=0;S<se.length;++S)if(se[S]==1){for(let L=0;L<3;++L)_[L][M][S]=Y[L*K/3+P];++P}let ie=Te(Y)[0];d.push(ie+1-f[M].length)}return[new U("int64",_.flat(1/0),[3,e.dims[0],e.dims[1]]),new U("int64",d,[d.length,1])]}else if(n){let{data:f,dims:m}=J0(n),_=BigInt64Array.from({length:3*f.length},(x,k)=>f[k%f.length]),w=Array.from({length:m[0]},(x,k)=>Te(f.subarray(m[1]*k,m[1]*(k+1)))[0]+1n+BigInt(m[1]));return[new U("int64",_,[3,...m]),new U("int64",w,[w.length,1])]}else{let[f,m]=e.dims,_=BigInt64Array.from({length:3*f*m},(w,x)=>BigInt(Math.floor(x%m/f)));return[new U("int64",_,[3,...e.dims]),Iu([f,1])]}}async encode_image({pixel_values:e,image_grid_thw:r}){return(await 
ce(this.sessions.vision_encoder,{pixel_values:e,grid_thw:r})).image_features}_merge_input_ids_with_image_features(e){return ur({image_token_id:this.config.image_token_id,...e})}prepare_inputs_for_generation(e,r,s){if(r.attention_mask&&!r.position_ids)if(!r.past_key_values)[r.position_ids,r.rope_deltas]=this.get_rope_index(r.input_ids,r.image_grid_thw,r.video_grid_thw,r.attention_mask);else{r.pixel_values=null;let n=BigInt(Object.values(r.past_key_values)[0].dims.at(-2)),o=r.rope_deltas.map(a=>n+a);r.position_ids=zt([o,o,o],0)}return r}};var ha=class extends y{},ew=class extends ha{},tw=class extends ha{};var _a=class extends y{},rw=class extends _a{},sw=class extends _a{async _call(e){return new F(await super._call(e))}};var ga=class extends y{},nw=class extends ga{},ow=class extends ga{async _call(e){return new Ol(await super._call(e))}},Ol=class extends tr{};var Or=class extends y{},aw=class extends Or{},iw=class extends Or{async _call(e){return new we(await super._call(e))}},lw=class extends Or{async _call(e){return new F(await super._call(e))}},cw=class extends Or{async _call(e){return new _e(await super._call(e))}},uw=class extends Or{async _call(e){return new Ae(await super._call(e))}};var Ir=class extends y{},pw=class extends Ir{},dw=class extends Ir{async _call(e){return new we(await super._call(e))}},fw=class extends Ir{async _call(e){return new F(await super._call(e))}},mw=class extends Ir{async _call(e){return new _e(await super._call(e))}},hw=class extends Ir{async _call(e){return new Ae(await super._call(e))}};var wa=class extends y{},_w=class extends wa{},gw=class extends wa{async _call(e){return new Il(await super._call(e))}},Il=class extends tr{};var Cl=class extends Ne{constructor({iou_scores:e,pred_masks:r}){super(),this.iou_scores=e,this.pred_masks=r}},Pl=class extends y{},ww=class extends Pl{async get_image_embeddings({pixel_values:e}){return await qt(this,{pixel_values:e})}async 
forward(e){!e.image_embeddings||!e.image_positional_embeddings?e={...e,...await this.get_image_embeddings(e)}:e={...e},e.input_labels??=rt(e.input_points.dims.slice(0,-1));let r={image_embeddings:e.image_embeddings,image_positional_embeddings:e.image_positional_embeddings};return e.input_points&&(r.input_points=e.input_points),e.input_labels&&(r.input_labels=e.input_labels),e.input_boxes&&(r.input_boxes=e.input_boxes),await ce(this.sessions.prompt_encoder_mask_decoder,r)}async _call(e){return new Cl(await super._call(e))}};var zl=class extends Ne{constructor({iou_scores:e,pred_masks:r,object_score_logits:s}){super(),this.iou_scores=e,this.pred_masks=r,this.object_score_logits=s}},Ll=class extends y{},xa=class extends Ll{async get_image_embeddings({pixel_values:e}){return await qt(this,{pixel_values:e})}async forward(e){let{num_feature_levels:r}=this.config.vision_config;if(Array.from({length:r},(a,i)=>`image_embeddings.${i}`).some(a=>!e[a])?e={...e,...await this.get_image_embeddings(e)}:e={...e},e.input_points){if(e.input_boxes&&e.input_boxes.dims[1]!==1)throw new Error("When both `input_points` and `input_boxes` are provided, the number of boxes per image must be 1.");let a=e.input_points.dims;e.input_labels??=rt(a.slice(0,-1)),e.input_boxes??=Ge([a[0],0,4],0)}else if(e.input_boxes){let a=e.input_boxes.dims;e.input_labels=Ge([a[0],a[1],0],-1n),e.input_points=Ge([a[0],1,0,2],0)}else throw new Error("At least one of `input_points` or `input_boxes` must be provided.");let n=this.sessions.prompt_encoder_mask_decoder,o=at(e,n.inputNames);return await ce(n,o)}async _call(e){return new zl(await super._call(e))}},xw=class extends xa{},yw=class extends xa{};var Vs=class extends y{},bw=class extends Vs{},vw=class extends Vs{},kw=class extends Vs{};var Hs=class extends y{},Ew=class extends Hs{},Aw=class extends Hs{},Mw=class extends Hs{};var ya=class extends y{},Tw=class extends ya{},ba=class extends ya{static async from_pretrained(e,r={}){return 
super.from_pretrained(e,{...r,model_file_name:r.model_file_name??"text_model"})}},Sw=class extends er{static async from_pretrained(e,r={}){return super.from_pretrained(e,{...r,model_file_name:r.model_file_name??"vision_model"})}};var va=class extends y{},Ow=class extends va{},Iw=class extends va{};var Xs=class extends y{main_input_name="input_values";forward_params=["input_values"]},Cw=class extends Xs{async encode(e){return await ce(this.sessions.encoder_model,e)}async decode(e){return await ce(this.sessions.decoder_model,e)}},ka=class extends Xs{static async from_pretrained(e,r={}){return super.from_pretrained(e,{...r,model_file_name:r.model_file_name??"encoder_model"})}},Ea=class extends Xs{static async from_pretrained(e,r={}){return super.from_pretrained(e,{...r,model_file_name:r.model_file_name??"decoder_model"})}};var Ks=class extends y{},Pw=class extends Ks{},zw=class extends Ks{},Lw=class extends Ks{async generate_speech(e,r,{threshold:s=.5,minlenratio:n=0,maxlenratio:o=20,vocoder:a=null}={}){let i={input_ids:e},{encoder_outputs:l,encoder_attention_mask:u}=await qt(this,i),d=l.dims[1]/this.config.reduction_factor,f=Math.floor(d*o),m=Math.floor(d*n),_=this.config.num_mel_bins,w=[],x=null,k=null,E=0;for(;;){++E;let T=Q0(!!k),z;k?z=k.output_sequence_out:z=new U("float32",new Float32Array(_),[1,1,_]);let C={use_cache_branch:T,output_sequence:z,encoder_attention_mask:u,speaker_embeddings:r,encoder_hidden_states:l};this.addPastKeyValues(C,x),k=await ce(this.sessions.decoder_model_merged,C),x=this.getPastKeyValues(k,x);let{prob:v,spectrum:G}=k;if(w.push(G),E>=m&&(Array.from(v.data).filter(X=>X>=s).length>0||E>=f))break}let M=Ee(w),{waveform:I}=await ce(a.sessions.model,{spectrogram:M});return{spectrogram:M,waveform:I}}},Nw=class extends y{main_input_name="spectrogram"};var ts=class extends y{},$w=class extends ts{},Rw=class extends ts{async _call(e){return new we(await super._call(e))}},Uw=class extends ts{async _call(e){return new F(await 
super._call(e))}},Bw=class extends ts{async _call(e){return new Ae(await super._call(e))}};var Aa=class extends y{},Dw=class extends Aa{},Fw=class extends Aa{};var Ma=class extends y{},jw=class extends Ma{},Gw=class extends Ma{};var Nl=class extends y{},qw=class extends Nl{};var $l=class extends y{},/* Text-to-speech model that chains three sessions: text_encoder, latent_denoiser and voice_decoder. */Ta=class extends $l{/* Synthesizes speech for a batch. Options: input_ids, attention_mask, style, num_inference_steps (default 5, number of denoiser iterations) and speed (default 1.05, divides the predicted durations). Resolves to an object holding waveform and durations. */async generate_speech({input_ids:e,attention_mask:r,style:s,num_inference_steps:n=5,speed:o=1.05}){let{sampling_rate:a,chunk_compress_factor:i,base_chunk_size:l,latent_dim:u}=this.config,{last_hidden_state:d,durations:f}=await ce(this.sessions.text_encoder,{input_ids:e,attention_mask:r,style:s}),/* durations divided by speed, then multiplied in place by sampling_rate (presumably seconds to samples - TODO confirm) */m=f.div(o).mul_(a),/* size of one latent chunk */_=l*i,w=m.data,/* per-item latent length: ceil(scaled duration / chunk size) */x=Int32Array.from(w,V=>Math.ceil(V/_)),/* longest item in the batch */k=Math.max(...x),/* batch size taken from input_ids */E=e.dims[0],M=new BigInt64Array(E*k);/* latent_mask: 1 for the first x[V] positions of each row, 0 for the remainder */for(let V=0;V<E;++V)M.fill(1n,V*k,V*k+x[V]);let I=new U("int64",M,[E,k]),/* channel count of the latents */T=u*i,/* elements per batch item */z=T*k,/* initial latents come from helper z0 (presumably random noise - TODO confirm) */C=z0([E,T,k]),v=C.data;/* for items shorter than the longest one, zero every channel beyond the item length */for(let V=0;V<E;++V)if(x[V]!==k)for(let Q=0;Q<T;++Q)v.fill(0,V*z+Q*k+x[V],V*z+(Q+1)*k);/* per-item tensor holding the total step count */let G=Ge([E],n);/* iterative denoising: each step passes its index as timestep and feeds the previous denoised_latents back in as noisy_latents */for(let V=0;V<n;++V){let Q=Ge([E],V);({denoised_latents:C}=await ce(this.sessions.latent_denoiser,{style:s,noisy_latents:C,latent_mask:I,encoder_outputs:d,attention_mask:r,timestep:Q,num_inference_steps:G}))}/* decode the final latents into audio */let{waveform:X}=await ce(this.sessions.voice_decoder,{latents:C});return{waveform:X,durations:m}}};var Ys=class extends y{},Ww=class extends Ys{},Vw=class extends Ys{async _call(e){return new F(await super._call(e))}},Hw=class extends Ys{};var Sa=class extends y{},Xw=class extends Sa{},Kw=class extends Sa{};var Oa=class extends y{forward_params=["input_ids","attention_mask","encoder_outputs","decoder_input_ids","decoder_attention_mask","past_key_values"]},Yw=class extends Oa{},Qw=class extends Oa{};var Ia=class extends y{},Jw=class extends Ia{},Zw=class extends Ia{async _call(e){return new Rl(await super._call(e))}},Rl=class extends Us{};var Ul=class extends y{},ex=class extends Ul{};var Bl=class extends y{forward_params=["input_ids","attention_mask","position_ids","audio_values","past_key_values"]},Dl=class extends 
Bl{_merge_input_ids_with_audio_features(e){let r=e.audio_features.dims.at(-1),s=e.audio_features.view(-1,r);return ef({audio_token_id:this.config.ignore_index??this.config.audio_token_id,...e,audio_features:s})}},tx=class extends Dl{};var Qs=class extends y{},rx=class extends Qs{},sx=class extends Qs{async _call(e){return new gt(await super._call(e))}},nx=class extends Qs{async _call(e){return new F(await super._call(e))}};var rs=class extends y{},ox=class extends rs{},ax=class extends rs{async _call(e){return new gt(await super._call(e))}},ix=class extends rs{async _call(e){return new F(await super._call(e))}},lx=class extends rs{async _call(e){return new _e(await super._call(e))}};var Ca=class extends y{},cx=class extends Ca{},ux=class extends Ca{};var px=class extends y{main_input_name="pixel_values";forward_params=["pixel_values","decoder_input_ids","encoder_hidden_states","past_key_values"]};var Pa=class extends y{},dx=class extends Pa{},fx=class extends Pa{async _call(e){return new F(await super._call(e))}};var Fl=class extends y{},mx=class extends Fl{};var za=class extends y{},hx=class extends za{},_x=class extends za{async _call(e){return new F(await super._call(e))}};var jl=class extends y{},gx=class extends jl{async _call(e){return new Yd(await super._call(e))}};var Gl=class extends y{},wx=class extends Gl{};var ql=class extends Ne{constructor({waveform:e,spectrogram:r}){super(),this.waveform=e,this.spectrogram=r}},Wl=class extends y{},xx=class extends Wl{async _call(e){return new ql(await super._call(e))}};var Js=class extends y{},yx=class extends Js{},bx=class extends Js{async _call(e){return new gt(await super._call(e))}},vx=class extends Js{async _call(e){return new F(await super._call(e))}};var Vl=class extends Ne{constructor({logits:e,embeddings:r}){super(),this.logits=e,this.embeddings=r}},Cr=class extends y{},kx=class extends Cr{},Ex=class extends Cr{async _call(e){return new gt(await super._call(e))}},Ax=class extends Cr{async _call(e){return new 
F(await super._call(e))}},Mx=class extends Cr{async _call(e){return new Vl(await super._call(e))}},Tx=class extends Cr{async _call(e){return new _e(await super._call(e))}};var Hl=class extends y{},Sx=class extends Hl{};/* Generation config subclass used by the speech model below: adds timestamp, task and language related fields (all null by default, except max_initial_timestamp_index which is 1). */var Ox=class extends $n{return_timestamps=null;return_token_timestamps=null;num_frames=null;alignment_heads=null;task=null;language=null;no_timestamps_token_id=null;prompt_ids=null;is_multilingual=null;lang_to_id=null;task_to_id=null;max_initial_timestamp_index=1};/* Base class: main input is input_features and no attention mask is required. */var La=class extends y{requires_attention_mask=!1;main_input_name="input_features";forward_params=["input_features","attention_mask","decoder_input_ids","decoder_attention_mask","past_key_values"]},Ix=class extends La{},/* Conditional-generation class. Methods, in order: (1) _prepare_generation_config delegates to the parent with Ox as the config class. (2) _retrieve_init_tokens builds the initial decoder token list. (3) generate resolves the config, takes decoder_input_ids from the caller or from _retrieve_init_tokens, appends a timestamp logits processor when return_timestamps is set and a begin-suppress processor when begin_suppress_tokens is set, and, when return_token_timestamps is set, requires alignment_heads, enables output_attentions and return_dict_in_generate, then attaches token_timestamps to the result. (4) _extract_token_timestamps(outputs, alignment_heads, num_frames=null, n=0.02) requires cross_attentions on the outputs, falls back to a median filter width of 7 when the model config has none, normalises and filters the selected attention heads, and returns a float32 tensor shaped like outputs.sequences whose entries are jump indices multiplied by n. NOTE(review): generate destructures stopping_criteria but does not forward it to super.generate - confirm whether that is intended. NOTE(review): _extract_token_timestamps wraps the averaged weights in a one-element list but indexes that list by batch index, so batches larger than 1 look unsupported - confirm. */Xl=class extends La{_prepare_generation_config(e,r){return super._prepare_generation_config(e,r,Ox)}/* Starts from decoder_start_token_id. For multilingual configs it appends the language token (defaulting to en with a warning) and the task token (defaulting to transcribe); for non-multilingual configs it throws if a language or task was requested. Afterwards the no-timestamps token is appended or popped depending on return_timestamps, and null or undefined entries are filtered out. */_retrieve_init_tokens(e){let r=[e.decoder_start_token_id],s=e.language,n=e.task;if(e.is_multilingual){s||(console.warn("No language specified - defaulting to English (en)."),s="en");let a=`<|${tA(s)}|>`;r.push(e.lang_to_id[a]),r.push(e.task_to_id[n??"transcribe"])}else if(s||n)throw new Error("Cannot specify `task` or `language` for an English-only model. 
If the model is intended to be multilingual, pass `is_multilingual=true` to generate, or update the generation config.");return!e.return_timestamps&&e.no_timestamps_token_id&&r.at(-1)!==e.no_timestamps_token_id?r.push(e.no_timestamps_token_id):e.return_timestamps&&r.at(-1)===e.no_timestamps_token_id&&(console.warn("<|notimestamps|> prompt token is removed from generation_config since `return_timestamps` is set to `true`."),r.pop()),r.filter(o=>o!=null)}async generate({inputs:e=null,generation_config:r=null,logits_processor:s=null,stopping_criteria:n=null,...o}){r=this._prepare_generation_config(r,o);let a=o.decoder_input_ids??this._retrieve_init_tokens(r);if(r.return_timestamps&&(s??=new Kr,s.push(new Ui(r,a))),r.begin_suppress_tokens&&(s??=new Kr,s.push(new Os(r.begin_suppress_tokens,a.length))),r.return_token_timestamps){if(!r.alignment_heads)throw new Error("Model generation config has no `alignment_heads`, token-level timestamps not available. See https://gist.github.com/hollance/42e32852f24243b748ae6bc1f985b13a on how to add this property to the generation config.");r.task==="translate"&&console.warn("Token-level timestamps may not be reliable for task 'translate'."),r.output_attentions=!0,r.return_dict_in_generate=!0}let i=await super.generate({inputs:e,generation_config:r,logits_processor:s,decoder_input_ids:a,...o});return r.return_token_timestamps&&(i.token_timestamps=this._extract_token_timestamps(i,r.alignment_heads,r.num_frames)),i}_extract_token_timestamps(e,r,s=null,n=.02){if(!e.cross_attentions)throw new Error("Model outputs must contain cross attentions to extract timestamps. This is most likely because the model was not exported with `output_attentions=True`.");s==null&&console.warn("`num_frames` has not been set, meaning the entire audio will be analyzed. 
This may lead to inaccurate token-level timestamps for short audios (< 30 seconds).");let o=this.config.median_filter_width;o===void 0&&(console.warn("Model config has no `median_filter_width`, using default value of 7."),o=7);let a=e.cross_attentions,i=Array.from({length:this.config.decoder_layers},(x,k)=>Ee(a.map(E=>E[k]),2)),l=zt(r.map(([x,k])=>{if(x>=i.length)throw new Error(`Layer index ${x} is out of bounds for cross attentions (length ${i.length}).`);return s?i[x].slice(null,k,null,[0,s]):i[x].slice(null,k)})).transpose(1,0,2,3),[u,d]=Ou(l,-2,0,!0),f=l.clone();for(let x=0;x<f.dims[0];++x){let k=f[x];for(let E=0;E<k.dims[0];++E){let M=k[E],I=u[x][E][0].data,T=d[x][E][0].data;for(let z=0;z<M.dims[0];++z){let C=M[z].data;for(let v=0;v<C.length;++v)C[v]=(C[v]-T[v])/I[v];C.set(_k(C,o))}}}let m=[fi(f,1)],_=e.sequences.dims,w=new U("float32",new Float32Array(_[0]*_[1]),_);for(let x=0;x<_[0];++x){let k=m[x].neg().squeeze_(0),[E,M]=wk(k.tolist()),I=Array.from({length:E.length-1},(C,v)=>E[v+1]-E[v]),T=dt([1],I).map(C=>!!C),z=[];for(let C=0;C<T.length;++C)T[C]&&z.push(M[C]*n);w[x].data.set(z,1)}return w}},Cx=class extends Xl{};var Pr=class extends y{},Px=class extends Pr{},zx=class extends Pr{async _call(e){return new we(await super._call(e))}},Lx=class extends Pr{async _call(e){return new F(await super._call(e))}},Nx=class extends Pr{async _call(e){return new _e(await super._call(e))}},$x=class extends Pr{async _call(e){return new Ae(await super._call(e))}};var zr=class extends y{},Rx=class extends zr{},Ux=class extends zr{async _call(e){return new we(await super._call(e))}},Bx=class extends zr{async _call(e){return new F(await super._call(e))}},Dx=class extends zr{async _call(e){return new _e(await super._call(e))}},Fx=class extends zr{async _call(e){return new Ae(await super._call(e))}};var Na=class extends y{},jx=class extends Na{},Gx=class extends Na{async _call(e){return new Kl(await super._call(e))}},Kl=class extends 
Ne{constructor({logits:e,pred_boxes:r}){super(),this.logits=e,this.pred_boxes=r}};var $a=class extends y{},qx=class extends $a{},Wx=class extends $a{};var tz=new Map([["bert","BertModel"],["neobert","NeoBertModel"],["modernbert","ModernBertModel"],["nomic_bert","NomicBertModel"],["roformer","RoFormerModel"],["electra","ElectraModel"],["esm","EsmModel"],["convbert","ConvBertModel"],["camembert","CamembertModel"],["deberta","DebertaModel"],["deberta-v2","DebertaV2Model"],["mpnet","MPNetModel"],["albert","AlbertModel"],["distilbert","DistilBertModel"],["roberta","RobertaModel"],["xlm","XLMModel"],["xlm-roberta","XLMRobertaModel"],["clap","ClapModel"],["clip","CLIPModel"],["clipseg","CLIPSegModel"],["chinese_clip","ChineseCLIPModel"],["siglip","SiglipModel"],["jina_clip","JinaCLIPModel"],["mobilebert","MobileBertModel"],["squeezebert","SqueezeBertModel"],["wav2vec2","Wav2Vec2Model"],["wav2vec2-bert","Wav2Vec2BertModel"],["unispeech","UniSpeechModel"],["unispeech-sat","UniSpeechSatModel"],["hubert","HubertModel"],["wavlm","WavLMModel"],["audio-spectrogram-transformer","ASTModel"],["vits","VitsModel"],["pyannote","PyAnnoteModel"],["wespeaker-resnet","WeSpeakerResNetModel"],["detr","DetrModel"],["rt_detr","RTDetrModel"],["rt_detr_v2","RTDetrV2Model"],["rf_detr","RFDetrModel"],["d_fine","DFineModel"],["table-transformer","TableTransformerModel"],["vit","ViTModel"],["ijepa","IJepaModel"],["pvt","PvtModel"],["vit_msn","ViTMSNModel"],["vit_mae","ViTMAEModel"],["groupvit","GroupViTModel"],["fastvit","FastViTModel"],["mobilevit","MobileViTModel"],["mobilevitv2","MobileViTV2Model"],["owlvit","OwlViTModel"],["owlv2","Owlv2Model"],["beit","BeitModel"],["deit","DeiTModel"],["hiera","HieraModel"],["convnext","ConvNextModel"],["convnextv2","ConvNextV2Model"],["dinov2","Dinov2Model"],["dinov2_with_registers","Dinov2WithRegistersModel"],["dinov3_vit","DINOv3ViTModel"],["dinov3_convnext","DINOv3ConvNextModel"],["resnet","ResNetModel"],["swin","SwinModel"],["swin2sr","Swin2SRModel"],["don
ut-swin","DonutSwinModel"],["yolos","YolosModel"],["dpt","DPTModel"],["glpn","GLPNModel"],["hifigan","SpeechT5HifiGan"],["efficientnet","EfficientNetModel"],["decision_transformer","DecisionTransformerModel"],["patchtst","PatchTSTModel"],["patchtsmixer","PatchTSMixerModel"],["mobilenet_v1","MobileNetV1Model"],["mobilenet_v2","MobileNetV2Model"],["mobilenet_v3","MobileNetV3Model"],["mobilenet_v4","MobileNetV4Model"],["maskformer","MaskFormerModel"],["mgp-str","MgpstrForSceneTextRecognition"],["style_text_to_speech_2","StyleTextToSpeech2Model"]]),rz=new Map([["t5","T5Model"],["longt5","LongT5Model"],["mt5","MT5Model"],["bart","BartModel"],["mbart","MBartModel"],["marian","MarianModel"],["whisper","WhisperModel"],["m2m_100","M2M100Model"],["blenderbot","BlenderbotModel"],["blenderbot-small","BlenderbotSmallModel"]]),sz=new Map([["mimi","MimiModel"],["dac","DacModel"],["snac","SnacModel"]]),nz=new Map([["bloom","BloomModel"],["jais","JAISModel"],["gpt2","GPT2Model"],["gpt_oss","GptOssModel"],["gptj","GPTJModel"],["gpt_bigcode","GPTBigCodeModel"],["gpt_neo","GPTNeoModel"],["gpt_neox","GPTNeoXModel"],["codegen","CodeGenModel"],["llama","LlamaModel"],["apertus","ApertusModel"],["nanochat","NanoChatModel"],["arcee","ArceeModel"],["lfm2","Lfm2Model"],["lfm2_moe","Lfm2MoeModel"],["smollm3","SmolLM3Model"],["exaone","ExaoneModel"],["olmo","OlmoModel"],["olmo2","Olmo2Model"],["olmo3","Olmo3Model"],["mobilellm","MobileLLMModel"],["granite","GraniteModel"],["granitemoehybrid","GraniteMoeHybridModel"],["cohere","CohereModel"],["gemma","GemmaModel"],["gemma2","Gemma2Model"],["vaultgemma","VaultGemmaModel"],["gemma3_text","Gemma3Model"],["helium","HeliumModel"],["glm","GlmModel"],["openelm","OpenELMModel"],["qwen2","Qwen2Model"],["qwen3","Qwen3Model"],["phi","PhiModel"],["phi3","Phi3Model"],["mpt","MptModel"],["opt","OPTModel"],["mistral","MistralModel"],["ministral","MinistralModel"],["ministral3","Ministral3Model"],["ernie4_5","Ernie4_5_Model"],["starcoder2","Starcoder2Model"],["f
alcon","FalconModel"],["falcon_h1","FalconH1Model"],["stablelm","StableLmModel"],["modernbert-decoder","ModernBertDecoderModel"],["hunyuan_v1_dense","HunYuanDenseV1Model"],["youtu","YoutuModel"]]),AA=new Map([["speecht5","SpeechT5ForSpeechToText"],["whisper","WhisperForConditionalGeneration"],["lite-whisper","LiteWhisperForConditionalGeneration"],["moonshine","MoonshineForConditionalGeneration"]]),MA=new Map([["speecht5","SpeechT5ForTextToSpeech"]]),TA=new Map([["vits","VitsModel"],["musicgen","MusicgenForConditionalGeneration"],["supertonic","SupertonicForConditionalGeneration"]]),SA=new Map([["bert","BertForSequenceClassification"],["neobert","NeoBertForSequenceClassification"],["modernbert","ModernBertForSequenceClassification"],["roformer","RoFormerForSequenceClassification"],["electra","ElectraForSequenceClassification"],["esm","EsmForSequenceClassification"],["convbert","ConvBertForSequenceClassification"],["camembert","CamembertForSequenceClassification"],["deberta","DebertaForSequenceClassification"],["deberta-v2","DebertaV2ForSequenceClassification"],["mpnet","MPNetForSequenceClassification"],["albert","AlbertForSequenceClassification"],["distilbert","DistilBertForSequenceClassification"],["roberta","RobertaForSequenceClassification"],["xlm","XLMForSequenceClassification"],["xlm-roberta","XLMRobertaForSequenceClassification"],["bart","BartForSequenceClassification"],["mbart","MBartForSequenceClassification"],["mobilebert","MobileBertForSequenceClassification"],["squeezebert","SqueezeBertForSequenceClassification"]]),OA=new 
Map([["bert","BertForTokenClassification"],["neobert","NeoBertForTokenClassification"],["modernbert","ModernBertForTokenClassification"],["roformer","RoFormerForTokenClassification"],["electra","ElectraForTokenClassification"],["esm","EsmForTokenClassification"],["convbert","ConvBertForTokenClassification"],["camembert","CamembertForTokenClassification"],["deberta","DebertaForTokenClassification"],["deberta-v2","DebertaV2ForTokenClassification"],["mpnet","MPNetForTokenClassification"],["distilbert","DistilBertForTokenClassification"],["roberta","RobertaForTokenClassification"],["xlm","XLMForTokenClassification"],["xlm-roberta","XLMRobertaForTokenClassification"]]),IA=new Map([["t5","T5ForConditionalGeneration"],["longt5","LongT5ForConditionalGeneration"],["mt5","MT5ForConditionalGeneration"],["bart","BartForConditionalGeneration"],["mbart","MBartForConditionalGeneration"],["marian","MarianMTModel"],["m2m_100","M2M100ForConditionalGeneration"],["blenderbot","BlenderbotForConditionalGeneration"],["blenderbot-small","BlenderbotSmallForConditionalGeneration"]]),CA=new 
Map([["bloom","BloomForCausalLM"],["gpt2","GPT2LMHeadModel"],["gpt_oss","GptOssForCausalLM"],["jais","JAISLMHeadModel"],["gptj","GPTJForCausalLM"],["gpt_bigcode","GPTBigCodeForCausalLM"],["gpt_neo","GPTNeoForCausalLM"],["gpt_neox","GPTNeoXForCausalLM"],["codegen","CodeGenForCausalLM"],["llama","LlamaForCausalLM"],["nanochat","NanoChatForCausalLM"],["apertus","ApertusForCausalLM"],["llama4_text","Llama4ForCausalLM"],["arcee","ArceeForCausalLM"],["lfm2","Lfm2ForCausalLM"],["lfm2_moe","Lfm2MoeForCausalLM"],["smollm3","SmolLM3ForCausalLM"],["exaone","ExaoneForCausalLM"],["olmo","OlmoForCausalLM"],["olmo2","Olmo2ForCausalLM"],["olmo3","Olmo3ForCausalLM"],["mobilellm","MobileLLMForCausalLM"],["granite","GraniteForCausalLM"],["granitemoehybrid","GraniteMoeHybridForCausalLM"],["cohere","CohereForCausalLM"],["gemma","GemmaForCausalLM"],["gemma2","Gemma2ForCausalLM"],["vaultgemma","VaultGemmaForCausalLM"],["gemma3_text","Gemma3ForCausalLM"],["helium","HeliumForCausalLM"],["glm","GlmForCausalLM"],["openelm","OpenELMForCausalLM"],["qwen2","Qwen2ForCausalLM"],["qwen3","Qwen3ForCausalLM"],["phi","PhiForCausalLM"],["phi3","Phi3ForCausalLM"],["mpt","MptForCausalLM"],["opt","OPTForCausalLM"],["mbart","MBartForCausalLM"],["mistral","MistralForCausalLM"],["ministral","MinistralForCausalLM"],["ministral3","Ministral3ForCausalLM"],["ernie4_5","Ernie4_5_ForCausalLM"],["starcoder2","Starcoder2ForCausalLM"],["falcon","FalconForCausalLM"],["falcon_h1","FalconH1ForCausalLM"],["trocr","TrOCRForCausalLM"],["stablelm","StableLmForCausalLM"],["modernbert-decoder","ModernBertDecoderForCausalLM"],["hunyuan_v1_dense","HunYuanDenseV1ForCausalLM"],["youtu","YoutuForCausalLM"],["phi3_v","Phi3VForCausalLM"]]),oz=new Map([["multi_modality","MultiModalityCausalLM"]]),PA=new 
Map([["bert","BertForMaskedLM"],["neobert","NeoBertForMaskedLM"],["modernbert","ModernBertForMaskedLM"],["roformer","RoFormerForMaskedLM"],["electra","ElectraForMaskedLM"],["esm","EsmForMaskedLM"],["convbert","ConvBertForMaskedLM"],["camembert","CamembertForMaskedLM"],["deberta","DebertaForMaskedLM"],["deberta-v2","DebertaV2ForMaskedLM"],["mpnet","MPNetForMaskedLM"],["albert","AlbertForMaskedLM"],["distilbert","DistilBertForMaskedLM"],["roberta","RobertaForMaskedLM"],["xlm","XLMWithLMHeadModel"],["xlm-roberta","XLMRobertaForMaskedLM"],["mobilebert","MobileBertForMaskedLM"],["squeezebert","SqueezeBertForMaskedLM"]]),zA=new Map([["bert","BertForQuestionAnswering"],["neobert","NeoBertForQuestionAnswering"],["roformer","RoFormerForQuestionAnswering"],["electra","ElectraForQuestionAnswering"],["convbert","ConvBertForQuestionAnswering"],["camembert","CamembertForQuestionAnswering"],["deberta","DebertaForQuestionAnswering"],["deberta-v2","DebertaV2ForQuestionAnswering"],["mpnet","MPNetForQuestionAnswering"],["albert","AlbertForQuestionAnswering"],["distilbert","DistilBertForQuestionAnswering"],["roberta","RobertaForQuestionAnswering"],["xlm","XLMForQuestionAnswering"],["xlm-roberta","XLMRobertaForQuestionAnswering"],["mobilebert","MobileBertForQuestionAnswering"],["squeezebert","SqueezeBertForQuestionAnswering"]]),LA=new Map([["vision-encoder-decoder","VisionEncoderDecoderModel"],["idefics3","Idefics3ForConditionalGeneration"],["smolvlm","SmolVLMForConditionalGeneration"]]),NA=new 
Map([["llava","LlavaForConditionalGeneration"],["llava_onevision","LlavaOnevisionForConditionalGeneration"],["moondream1","Moondream1ForConditionalGeneration"],["florence2","Florence2ForConditionalGeneration"],["qwen2-vl","Qwen2VLForConditionalGeneration"],["idefics3","Idefics3ForConditionalGeneration"],["smolvlm","SmolVLMForConditionalGeneration"],["paligemma","PaliGemmaForConditionalGeneration"],["llava_qwen2","LlavaQwen2ForCausalLM"],["gemma3n","Gemma3nForConditionalGeneration"],["mistral3","Mistral3ForConditionalGeneration"]]),$A=new Map([["ultravox","UltravoxModel"],["voxtral","VoxtralForConditionalGeneration"]]),az=new Map([["vision-encoder-decoder","VisionEncoderDecoderModel"]]),RA=new Map([["vit","ViTForImageClassification"],["ijepa","IJepaForImageClassification"],["pvt","PvtForImageClassification"],["vit_msn","ViTMSNForImageClassification"],["fastvit","FastViTForImageClassification"],["mobilevit","MobileViTForImageClassification"],["mobilevitv2","MobileViTV2ForImageClassification"],["beit","BeitForImageClassification"],["deit","DeiTForImageClassification"],["hiera","HieraForImageClassification"],["convnext","ConvNextForImageClassification"],["convnextv2","ConvNextV2ForImageClassification"],["dinov2","Dinov2ForImageClassification"],["dinov2_with_registers","Dinov2WithRegistersForImageClassification"],["resnet","ResNetForImageClassification"],["swin","SwinForImageClassification"],["segformer","SegformerForImageClassification"],["efficientnet","EfficientNetForImageClassification"],["mobilenet_v1","MobileNetV1ForImageClassification"],["mobilenet_v2","MobileNetV2ForImageClassification"],["mobilenet_v3","MobileNetV3ForImageClassification"],["mobilenet_v4","MobileNetV4ForImageClassification"]]),UA=new 
Map([["detr","DetrForObjectDetection"],["rt_detr","RTDetrForObjectDetection"],["rt_detr_v2","RTDetrV2ForObjectDetection"],["rf_detr","RFDetrForObjectDetection"],["d_fine","DFineForObjectDetection"],["table-transformer","TableTransformerForObjectDetection"],["yolos","YolosForObjectDetection"]]),BA=new Map([["owlvit","OwlViTForObjectDetection"],["owlv2","Owlv2ForObjectDetection"],["grounding-dino","GroundingDinoForObjectDetection"]]),Ra=new Map([["detr","DetrForSegmentation"],["clipseg","CLIPSegForImageSegmentation"]]),DA=new Map([["segformer","SegformerForSemanticSegmentation"],["sapiens","SapiensForSemanticSegmentation"],["swin","SwinForSemanticSegmentation"],["mobilenet_v1","MobileNetV1ForSemanticSegmentation"],["mobilenet_v2","MobileNetV2ForSemanticSegmentation"],["mobilenet_v3","MobileNetV3ForSemanticSegmentation"],["mobilenet_v4","MobileNetV4ForSemanticSegmentation"]]),FA=new Map([["detr","DetrForSegmentation"],["maskformer","MaskFormerForInstanceSegmentation"]]),jA=new Map([["sam","SamModel"],["sam2","Sam2Model"],["edgetam","EdgeTamModel"],["sam3_tracker","Sam3TrackerModel"]]),GA=new Map([["wav2vec2","Wav2Vec2ForCTC"],["wav2vec2-bert","Wav2Vec2BertForCTC"],["unispeech","UniSpeechForCTC"],["unispeech-sat","UniSpeechSatForCTC"],["wavlm","WavLMForCTC"],["hubert","HubertForCTC"],["parakeet_ctc","ParakeetForCTC"]]),qA=new Map([["wav2vec2","Wav2Vec2ForSequenceClassification"],["wav2vec2-bert","Wav2Vec2BertForSequenceClassification"],["unispeech","UniSpeechForSequenceClassification"],["unispeech-sat","UniSpeechSatForSequenceClassification"],["wavlm","WavLMForSequenceClassification"],["hubert","HubertForSequenceClassification"],["audio-spectrogram-transformer","ASTForAudioClassification"]]),WA=new Map([["wavlm","WavLMForXVector"]]),VA=new Map([["unispeech-sat","UniSpeechSatForAudioFrameClassification"],["wavlm","WavLMForAudioFrameClassification"],["wav2vec2","Wav2Vec2ForAudioFrameClassification"],["pyannote","PyAnnoteForAudioFrameClassification"]]),HA=new 
Map([["vitmatte","VitMatteForImageMatting"]]),iz=new Map([["patchtst","PatchTSTForPrediction"],["patchtsmixer","PatchTSMixerForPrediction"]]),XA=new Map([["swin2sr","Swin2SRForImageSuperResolution"]]),KA=new Map([["dpt","DPTForDepthEstimation"],["depth_anything","DepthAnythingForDepthEstimation"],["glpn","GLPNForDepthEstimation"],["sapiens","SapiensForDepthEstimation"],["depth_pro","DepthProForDepthEstimation"],["metric3d","Metric3DForDepthEstimation"],["metric3dv2","Metric3Dv2ForDepthEstimation"]]),YA=new Map([["sapiens","SapiensForNormalEstimation"]]),QA=new Map([["vitpose","VitPoseForPoseEstimation"]]),JA=new Map([["clip","CLIPVisionModelWithProjection"],["siglip","SiglipVisionModel"],["jina_clip","JinaCLIPVisionModel"]]),Z0=[[tz,H.EncoderOnly],[rz,H.EncoderDecoder],[nz,H.DecoderOnlyWithoutHead],[sz,H.AutoEncoder],[SA,H.EncoderOnly],[OA,H.EncoderOnly],[IA,H.Seq2Seq],[AA,H.Seq2Seq],[CA,H.DecoderOnly],[oz,H.MultiModality],[PA,H.EncoderOnly],[zA,H.EncoderOnly],[LA,H.Vision2Seq],[NA,H.ImageTextToText],[$A,H.AudioTextToText],[RA,H.EncoderOnly],[Ra,H.EncoderOnly],[FA,H.EncoderOnly],[DA,H.EncoderOnly],[HA,H.EncoderOnly],[iz,H.EncoderOnly],[XA,H.EncoderOnly],[KA,H.EncoderOnly],[YA,H.EncoderOnly],[QA,H.EncoderOnly],[UA,H.EncoderOnly],[BA,H.EncoderOnly],[jA,H.MaskGeneration],[GA,H.EncoderOnly],[qA,H.EncoderOnly],[MA,H.Seq2Seq],[TA,H.EncoderOnly],[WA,H.EncoderOnly],[VA,H.EncoderOnly],[JA,H.EncoderOnly]];for(let[t,e]of Z0)for(let r of t.values()){zs.set(r,e);let s=Yl[r];Ps.set(s,r),Zd.set(r,s)}var 
lz=[["MusicgenForConditionalGeneration",Jo,H.Musicgen],["Phi3VForCausalLM",pa,H.Phi3V],["CLIPTextModelWithProjection",Hn,H.EncoderOnly],["SiglipTextModel",ba,H.EncoderOnly],["JinaCLIPTextModel",zo,H.EncoderOnly],["ClapTextModelWithProjection",Wn,H.EncoderOnly],["ClapAudioModelWithProjection",Vn,H.EncoderOnly],["DacEncoderModel",to,H.EncoderOnly],["DacDecoderModel",ro,H.EncoderOnly],["MimiEncoderModel",Fo,H.EncoderOnly],["MimiDecoderModel",jo,H.EncoderOnly],["SnacEncoderModel",ka,H.EncoderOnly],["SnacDecoderModel",Ea,H.EncoderOnly],["Gemma3nForConditionalGeneration",go,H.ImageAudioTextToText],["SupertonicForConditionalGeneration",Ta,H.Supertonic],["ChatterboxModel",qn,H.Chatterbox]];for(let[t,e,r]of lz)zs.set(t,r),Ps.set(e,t),Zd.set(t,e);var eb=new Map([["modnet",Ra],["birefnet",Ra],["isnet",Ra],["ben",Ra]]);for(let[t,e]of eb.entries())e.set(t,"PreTrainedModel"),zs.set(t,H.EncoderOnly),Zd.set(t,y);zs.set("PreTrainedModel",H.EncoderOnly);Ps.set(y,"PreTrainedModel");var Ce={MODEL_FOR_SEQUENCE_CLASSIFICATION_MAPPING_NAMES:SA,MODEL_FOR_TOKEN_CLASSIFICATION_MAPPING_NAMES:OA,MODEL_FOR_TEXT_TO_SPECTROGRAM_MAPPING_NAMES:MA,MODEL_FOR_TEXT_TO_WAVEFORM_MAPPING_NAMES:TA,MODEL_FOR_MASKED_LM_MAPPING_NAMES:PA,MODEL_FOR_QUESTION_ANSWERING_MAPPING_NAMES:zA,MODEL_FOR_IMAGE_CLASSIFICATION_MAPPING_NAMES:RA,MODEL_FOR_IMAGE_SEGMENTATION_MAPPING_NAMES:Ra,MODEL_FOR_SEMANTIC_SEGMENTATION_MAPPING_NAMES:DA,MODEL_FOR_UNIVERSAL_SEGMENTATION_MAPPING_NAMES:FA,MODEL_FOR_OBJECT_DETECTION_MAPPING_NAMES:UA,MODEL_FOR_ZERO_SHOT_OBJECT_DETECTION_MAPPING_NAMES:BA,MODEL_FOR_MASK_GENERATION_MAPPING_NAMES:jA,MODEL_FOR_CTC_MAPPING_NAMES:GA,MODEL_FOR_AUDIO_CLASSIFICATION_MAPPING_NAMES:qA,MODEL_FOR_AUDIO_XVECTOR_MAPPING_NAMES:WA,MODEL_FOR_AUDIO_FRAME_CLASSIFICATION_MAPPING_NAMES:VA,MODEL_FOR_DOCUMENT_QUESTION_ANSWERING_MAPPING_NAMES:az,MODEL_FOR_IMAGE_MATTING_MAPPING_NAMES:HA,MODEL_FOR_IMAGE_TO_IMAGE_MAPPING_NAMES:XA,MODEL_FOR_DEPTH_ESTIMATION_MAPPING_NAMES:KA,MODEL_FOR_NORMAL_ESTIMATION_MAPPING_NAMES:YA,MODEL_
FOR_POSE_ESTIMATION_MAPPING_NAMES:QA,MODEL_FOR_IMAGE_FEATURE_EXTRACTION_MAPPING_NAMES:JA,MODEL_FOR_IMAGE_TEXT_TO_TEXT_MAPPING_NAMES:NA,MODEL_FOR_AUDIO_TEXT_TO_TEXT_MAPPING_NAMES:$A,MODEL_FOR_SEQ_TO_SEQ_CAUSAL_LM_MAPPING_NAMES:IA,MODEL_FOR_SPEECH_SEQ_2_SEQ_MAPPING_NAMES:AA,MODEL_FOR_CAUSAL_LM_MAPPING_NAMES:CA,MODEL_FOR_VISION_2_SEQ_MAPPING_NAMES:LA};bA(Ce);var Se=class{static MODEL_CLASS_MAPPINGS=null;static BASE_IF_FAIL=!1;static async from_pretrained(e,{progress_callback:r=null,config:s=null,cache_dir:n=null,local_files_only:o=!1,revision:a="main",model_file_name:i=null,subfolder:l="onnx",device:u=null,dtype:d=null,use_external_data_format:f=null,session_options:m={}}={}){let _={progress_callback:r,config:s,cache_dir:n,local_files_only:o,revision:a,model_file_name:i,subfolder:l,device:u,dtype:d,use_external_data_format:f,session_options:m};if(_.config=await Xr.from_pretrained(e,_),!this.MODEL_CLASS_MAPPINGS)throw new Error("`MODEL_CLASS_MAPPINGS` not implemented for this type of `AutoClass`: "+this.name);let w=_.config.model_type;for(let x of this.MODEL_CLASS_MAPPINGS){let k=x.get(w);if(!k){for(let E of x.values())if(E[0]===w){k=E;break}if(!k)continue}return await Yl[k].from_pretrained(e,_)}if(this.BASE_IF_FAIL)return eb.has(w)||console.warn(`Unknown model class "${w}", attempting to construct from base class.`),await y.from_pretrained(e,_);throw Error(`Unsupported model type: ${w}`)}},pr=class extends Se{static MODEL_CLASS_MAPPINGS=Z0.map(e=>e[0]);static BASE_IF_FAIL=!0},Ua=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_SEQUENCE_CLASSIFICATION_MAPPING_NAMES]},Ql=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_TOKEN_CLASSIFICATION_MAPPING_NAMES]},Zs=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_SEQ_TO_SEQ_CAUSAL_LM_MAPPING_NAMES]},Jl=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_SPEECH_SEQ_2_SEQ_MAPPING_NAMES]},Zl=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_TEXT_TO_SPECTROGRAM_MAPPING_NAMES]},ec=class 
extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_TEXT_TO_WAVEFORM_MAPPING_NAMES]},tc=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_CAUSAL_LM_MAPPING_NAMES]},rc=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_MASKED_LM_MAPPING_NAMES]},sc=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_QUESTION_ANSWERING_MAPPING_NAMES]},nc=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_VISION_2_SEQ_MAPPING_NAMES]},oc=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_IMAGE_CLASSIFICATION_MAPPING_NAMES]},Ba=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_IMAGE_SEGMENTATION_MAPPING_NAMES]},Da=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_SEMANTIC_SEGMENTATION_MAPPING_NAMES]},Fa=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_UNIVERSAL_SEGMENTATION_MAPPING_NAMES]},ac=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_OBJECT_DETECTION_MAPPING_NAMES]},ic=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_ZERO_SHOT_OBJECT_DETECTION_MAPPING_NAMES]},tb=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_MASK_GENERATION_MAPPING_NAMES]},lc=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_CTC_MAPPING_NAMES]},cc=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_AUDIO_CLASSIFICATION_MAPPING_NAMES]},rb=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_AUDIO_XVECTOR_MAPPING_NAMES]},sb=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_AUDIO_FRAME_CLASSIFICATION_MAPPING_NAMES]},uc=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_DOCUMENT_QUESTION_ANSWERING_MAPPING_NAMES]},nb=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_IMAGE_MATTING_MAPPING_NAMES]},pc=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_IMAGE_TO_IMAGE_MAPPING_NAMES]},dc=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_DEPTH_ESTIMATION_MAPPING_NAMES]},ob=class extends Se{static 
MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_NORMAL_ESTIMATION_MAPPING_NAMES]},ab=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_POSE_ESTIMATION_MAPPING_NAMES]},fc=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_IMAGE_FEATURE_EXTRACTION_MAPPING_NAMES]},ib=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_IMAGE_TEXT_TO_TEXT_MAPPING_NAMES]},lb=class extends Se{static MODEL_CLASS_MAPPINGS=[Ce.MODEL_FOR_AUDIO_TEXT_TO_TEXT_MAPPING_NAMES]};async function Ye(t){return Array.isArray(t)||(t=[t]),await Promise.all(t.map(e=>Xe.read(e)))}async function ss(t,e){return Array.isArray(t)||(t=[t]),await Promise.all(t.map(r=>typeof r=="string"||r instanceof URL?kp(r,e):r instanceof Float64Array?new Float32Array(r):r))}function mc(t,e){e&&(t=t.map(a=>a|0));let[r,s,n,o]=t;return{xmin:r,ymin:s,xmax:n,ymax:o}}var pe=class extends Je{constructor({task:e,model:r,tokenizer:s=null,processor:n=null}){super(),this.task=e,this.model=r,this.tokenizer=s,this.processor=n}async dispose(){await this.model.dispose()}};var hc=class extends pe{async _call(e,{top_k:r=1}={}){let s=this.tokenizer(e,{padding:!0,truncation:!0}),n=await this.model(s),{problem_type:o,id2label:a}=this.model.config,i=o==="multi_label_classification"?u=>u.sigmoid():u=>new U("float32",Oe(u.data),u.dims),l=[];for(let u of n.logits){let d=i(u),f=await Gt(d,r),m=f[0].tolist(),w=f[1].tolist().map((x,k)=>({label:a?a[x]:`LABEL_${x}`,score:m[k]}));r===1?l.push(...w):l.push(w)}return Array.isArray(e)||r===1?l:l[0]}};var _c=class extends pe{async _call(e,{ignore_labels:r=["O"]}={}){let s=Array.isArray(e),n=this.tokenizer(s?e:[e],{padding:!0,truncation:!0}),a=(await this.model(n)).logits,i=this.model.config.id2label,l=[];for(let u=0;u<a.dims[0];++u){let d=n.input_ids[u],f=a[u],m=[];for(let _=0;_<f.dims[0];++_){let w=f[_],x=Te(w.data)[1],k=i?i[x]:`LABEL_${x}`;if(r.includes(k))continue;let E=this.tokenizer.decode([d[_].item()],{skip_special_tokens:!0});if(E==="")continue;let 
M=Oe(w.data);m.push({entity:k,score:M[x],index:_,word:E})}l.push(m)}return s?l:l[0]}};var gc=class extends pe{async _call(e,r,{top_k:s=1}={}){let n=this.tokenizer(e,{text_pair:r,padding:!0,truncation:!0}),o=Array.isArray(e),{start_logits:a,end_logits:i}=await this.model(n),l=n.input_ids.tolist(),u=n.attention_mask.tolist(),{all_special_ids:d,sep_token_id:f}=this.tokenizer,m=[];for(let _=0;_<a.dims[0];++_){let w=l[_],x=w.findIndex(C=>C==f),k=a[_].tolist(),E=i[_].tolist();for(let C=1;C<k.length;++C)(u[_]==0||C<=x||d.findIndex(v=>v==w[C])!==-1)&&(k[C]=-1/0,E[C]=-1/0);let M=Oe(k).map((C,v)=>[C,v]),I=Oe(E).map((C,v)=>[C,v]);M[0][0]=0,I[0][0]=0;let T=sk(M,I).filter(C=>C[0][1]<=C[1][1]).map(C=>[C[0][1],C[1][1],C[0][0]*C[1][0]]).sort((C,v)=>v[2]-C[2]),z=[];for(let C=0;C<Math.min(T.length,s);++C){let[v,G,X]=T[C],V=w.slice(v,G+1),Q=this.tokenizer.decode(V,{skip_special_tokens:!0});z.push({answer:Q,score:X})}s===1?m.push(...z):m.push(z)}return o?m:m[0]}};var wc=class extends pe{async _call(e,{top_k:r=5}={}){let{mask_token_id:s,mask_token:n}=this.tokenizer,o=this.tokenizer(e,{padding:!0,truncation:!0}),{logits:a}=await this.model(o),i=[],l=o.input_ids.tolist();for(let u=0;u<l.length;++u){let d=l[u],f=d.findIndex(k=>k==s);if(f===-1)throw Error(`Mask token (${n}) not found in text.`);let m=a[u][f],_=await Gt(new U("float32",Oe(m.data),m.dims),r),w=_[0].tolist(),x=_[1].tolist();i.push(x.map((k,E)=>{let M=d.slice();return M[f]=k,{score:w[E],token:Number(k),token_str:this.tokenizer.decode([k]),sequence:this.tokenizer.decode(M,{skip_special_tokens:!0})}}))}return Array.isArray(e)?i:i[0]}};var Lr=class extends pe{_key="generated_text";async _call(e,r={}){Array.isArray(e)||(e=[e]),this.model.config.prefix&&(e=e.map(l=>this.model.config.prefix+l));let s=this.model.config.task_specific_params;s&&s[this.task]&&s[this.task].prefix&&(e=e.map(l=>s[this.task].prefix+l));let n=this.tokenizer,o={padding:!0,truncation:!0},a;this.task==="translation"&&"_build_translation_inputs"in 
n?a=n._build_translation_inputs(e,o,r):a=n(e,o);let i=await this.model.generate({...a,...r});return n.batch_decode(i,{skip_special_tokens:!0}).map(l=>({[this._key]:l}))}};var xc=class extends Lr{_key="summary_text"};var yc=class extends Lr{_key="translation_text"};function ZA(t){return Array.isArray(t)&&t.every(e=>"role"in e&&"content"in e)}var bc=class extends pe{async _call(e,r={}){let s=!1,n=!1,o=r.add_special_tokens??(this.tokenizer.add_bos_token||this.tokenizer.add_eos_token)??!1,a=r.tokenizer_encode_kwargs,i;if(typeof e=="string")i=e=[e];else if(Array.isArray(e)&&e.every(w=>typeof w=="string"))s=!0,i=e;else{if(ZA(e))e=[e];else if(Array.isArray(e)&&e.every(ZA))s=!0;else throw new Error("Input must be a string, an array of strings, a Chat, or an array of Chats");n=!0,i=e.map(w=>this.tokenizer.apply_chat_template(w,{tokenize:!1,add_generation_prompt:!0,...a})),o=!1,a=void 0}let l=n?!1:r.return_full_text??!0;this.tokenizer.padding_side="left";let u=this.tokenizer(i,{add_special_tokens:o,padding:!0,truncation:!0,...a}),d=await this.model.generate({...u,...r}),f=this.tokenizer.batch_decode(d,{skip_special_tokens:!0}),m;!l&&u.input_ids.dims.at(-1)>0&&(m=this.tokenizer.batch_decode(u.input_ids,{skip_special_tokens:!0}).map(w=>w.length));let _=Array.from({length:e.length},w=>[]);for(let w=0;w<f.length;++w){let x=Math.floor(w/d.dims[0]*e.length);m&&(f[w]=f[w].slice(m[x])),_[x].push({generated_text:n?[...e[x],{role:"assistant",content:f[w]}]:f[w]})}return!s&&_.length===1?_[0]:_}};var vc=class extends pe{constructor(e){super(e),this.label2id=Object.fromEntries(Object.entries(this.model.config.label2id).map(([r,s])=>[r.toLowerCase(),s])),this.entailment_id=this.label2id.entailment,this.entailment_id===void 0&&(console.warn("Could not find 'entailment' in label2id mapping. 
Using 2 as entailment_id."),this.entailment_id=2),this.contradiction_id=this.label2id.contradiction??this.label2id.not_entailment,this.contradiction_id===void 0&&(console.warn("Could not find 'contradiction' in label2id mapping. Using 0 as contradiction_id."),this.contradiction_id=0)}async _call(e,r,{hypothesis_template:s="This example is {}.",multi_label:n=!1}={}){let o=Array.isArray(e);o||(e=[e]),Array.isArray(r)||(r=[r]);let a=r.map(u=>s.replace("{}",u)),i=n||r.length===1,l=[];for(let u of e){let d=[];for(let _ of a){let w=this.tokenizer(u,{text_pair:_,padding:!0,truncation:!0}),x=await this.model(w);i?d.push([x.logits.data[this.contradiction_id],x.logits.data[this.entailment_id]]):d.push(x.logits.data[this.entailment_id])}let m=(i?d.map(_=>Oe(_)[1]):Oe(d)).map((_,w)=>[_,w]).sort((_,w)=>w[0]-_[0]);l.push({sequence:u,labels:m.map(_=>r[_[1]]),scores:m.map(_=>_[0])})}return o?l:l[0]}};var kc=class extends pe{async _call(e,{top_k:r=5}={}){let s=this.processor.feature_extractor.config.sampling_rate,n=await ss(e,s),o=this.model.config.id2label,a=[];for(let i of n){let l=await this.processor(i),d=(await this.model(l)).logits[0],f=await Gt(new U("float32",Oe(d.data),d.dims),r),m=f[0].tolist(),w=f[1].tolist().map((x,k)=>({label:o?o[x]:`LABEL_${x}`,score:m[k]}));a.push(w)}return Array.isArray(e)?a:a[0]}};var Ec=class extends pe{async _call(e,r,{hypothesis_template:s="This is a sound of {}."}={}){let n=!Array.isArray(e);n&&(e=[e]);let o=r.map(d=>s.replace("{}",d)),a=this.tokenizer(o,{padding:!0,truncation:!0}),i=this.processor.feature_extractor.config.sampling_rate,l=await ss(e,i),u=[];for(let d of l){let f=await this.processor(d),m=await this.model({...a,...f}),_=Oe(m.logits_per_audio.data);u.push([..._].map((w,x)=>({score:w,label:r[x]})))}return n?u[0]:u}};var Ac=class extends pe{async _call(e,r={}){switch(this.model.config.model_type){case"whisper":case"lite-whisper":return 
this._call_whisper(e,r);case"wav2vec2":case"wav2vec2-bert":case"unispeech":case"unispeech-sat":case"hubert":case"parakeet_ctc":return this._call_wav2vec2(e,r);case"moonshine":return this._call_moonshine(e,r);default:throw new Error(`AutomaticSpeechRecognitionPipeline does not support model type '${this.model.config.model_type}'.`)}}async _call_wav2vec2(e,r){r.language&&console.warn('`language` parameter is not yet supported for `wav2vec2` models, defaulting to "English".'),r.task&&console.warn('`task` parameter is not yet supported for `wav2vec2` models, defaulting to "transcribe".');let s=!Array.isArray(e),n=s?[e]:e,o=this.processor.feature_extractor.config.sampling_rate,a=await ss(n,o),i=[];for(let l of a){let u=await this.processor(l),f=(await this.model(u)).logits[0],m=[];for(let w of f)m.push(Te(w.data)[1]);let _=this.tokenizer.decode(m,{skip_special_tokens:!0}).trim();i.push({text:_})}return s?i[0]:i}async _call_whisper(e,r){let s=r.return_timestamps??!1,n=r.chunk_length_s??0,o=r.force_full_sequences??!1,a=r.stride_length_s??null,i={...r};s==="word"&&(i.return_token_timestamps=!0,i.return_timestamps=!1);let l=!Array.isArray(e),u=l?[e]:e,d=this.processor.feature_extractor.config,f=d.chunk_length/this.model.config.max_source_positions,m=d.hop_length,_=d.sampling_rate,w=await ss(u,_),x=[];for(let k of w){let E=[];if(n>0){if(a===null)a=n/6;else if(n<=a)throw Error("`chunk_length_s` must be larger than `stride_length_s`.");let T=_*n,z=_*a,C=T-2*z,v=0;for(;;){let G=v+T,X=k.subarray(v,G),V=await this.processor(X),Q=v===0,K=G>=k.length;if(E.push({stride:[X.length,Q?0:z,K?0:z],input_features:V.input_features,is_last:K}),K)break;v+=C}}else E=[{stride:[k.length,0,0],input_features:(await this.processor(k)).input_features,is_last:!0}];for(let T of E){i.num_frames=Math.floor(T.stride[0]/m);let z=await 
this.model.generate({inputs:T.input_features,...i});s==="word"?(T.tokens=z.sequences.tolist()[0],T.token_timestamps=z.token_timestamps.tolist()[0].map(C=>ms(C,2))):T.tokens=z[0].tolist(),T.stride=T.stride.map(C=>C/_)}let[M,I]=this.tokenizer._decode_asr(E,{time_precision:f,return_timestamps:s,force_full_sequences:o});x.push({text:M,...I})}return l?x[0]:x}async _call_moonshine(e,r){let s=!Array.isArray(e),n=s?[e]:e,o=this.processor.feature_extractor.config.sampling_rate,a=await ss(n,o),i=[];for(let l of a){let u=await this.processor(l),d=Math.floor(l.length/o)*6,f=await this.model.generate({max_new_tokens:d,...r,...u}),m=this.processor.batch_decode(f,{skip_special_tokens:!0})[0];i.push({text:m})}return s?i[0]:i}};var Mc=class extends pe{DEFAULT_VOCODER_ID="Xenova/speecht5_hifigan";constructor(e){super(e),this.vocoder=e.vocoder??null}async _prepare_speaker_embeddings(e,r){if((typeof e=="string"||e instanceof URL)&&(e=new Float32Array(await(await fetch(e)).arrayBuffer())),e instanceof Float32Array)e=new U("float32",e,[e.length]);else if(!(e instanceof U))throw new Error("Speaker embeddings must be a `Tensor`, `Float32Array`, `string`, or `URL`.");if(r>1){if(e.dims[0]===1)e=e.repeat(r,1);else if(e.dims[0]!==r)throw new Error(`Expected speaker embeddings batch size to be 1 or ${r}, but got ${e.dims[0]}.`)}return e}_postprocess_waveform(e,r,s,n=null){let o=r.data,[a,i]=r.dims,l=n?n.data:null,u=[];for(let d=0;d<a;++d){let f=l?Math.min(Math.ceil(l[d]),i):i,m=d*i;u.push(new An(o.slice(m,m+f),s))}return Array.isArray(e)?u:u[0]}async _call(e,r){return this.processor?this._call_text_to_spectrogram(e,r):this.model.config.model_type==="supertonic"?this._call_supertonic(e,r):this._call_text_to_waveform(e)}async _call_supertonic(e,{speaker_embeddings:r,num_inference_steps:s,speed:n}){if(!r)throw new Error("Speaker embeddings must be provided for Supertonic 
models.");let{sampling_rate:o,style_dim:a}=this.model.config,i=this.tokenizer(e,{padding:!0,truncation:!0}),l=i.input_ids.dims[0];r=await this._prepare_speaker_embeddings(r,l),r=r.view(l,-1,a);let{waveform:u,durations:d}=await this.model.generate_speech({...i,style:r,num_inference_steps:s,speed:n});return this._postprocess_waveform(e,u,o,d)}async _call_text_to_waveform(e){let r=this.tokenizer(e,{padding:!0,truncation:!0}),{waveform:s}=await this.model(r),n=this.model.config.sampling_rate;return this._postprocess_waveform(e,s,n)}async _call_text_to_spectrogram(e,{speaker_embeddings:r}){this.vocoder||(console.log("No vocoder specified, using default HifiGan vocoder."),this.vocoder=await pr.from_pretrained(this.DEFAULT_VOCODER_ID,{dtype:"fp32"}));let{input_ids:s}=this.tokenizer(e,{padding:!0,truncation:!0}),n=s.dims[0];r=await this._prepare_speaker_embeddings(r,n),r=r.view(n,-1);let{waveform:o}=await this.model.generate_speech(s,r,{vocoder:this.vocoder}),a=this.processor.feature_extractor.config.sampling_rate;return this._postprocess_waveform(e,o,a)}};var Tc=class extends pe{async _call(e,r={}){let s=Array.isArray(e),n=await Ye(e),{pixel_values:o}=await this.processor(n),a=[];for(let i of o){i.dims=[1,...i.dims];let l=await this.model.generate({inputs:i,...r}),u=this.tokenizer.batch_decode(l,{skip_special_tokens:!0}).map(d=>({generated_text:d.trim()}));a.push(u)}return s?a:a[0]}};var Sc=class extends pe{async _call(e,{top_k:r=5}={}){let s=await Ye(e),{pixel_values:n}=await this.processor(s),o=await this.model({pixel_values:n}),{id2label:a}=this.model.config,i=[];for(let l of o.logits){let u=await Gt(new U("float32",Oe(l.data),l.dims),r),d=u[0].tolist(),m=u[1].tolist().map((_,w)=>({label:a?a[_]:`LABEL_${_}`,score:d[w]}));i.push(m)}return Array.isArray(e)?i:i[0]}};var e2={panoptic:"post_process_panoptic_segmentation",instance:"post_process_instance_segmentation",semantic:"post_process_semantic_segmentation"},en=class extends pe{async 
_call(e,{threshold:r=.5,mask_threshold:s=.5,overlap_mask_area_threshold:n=.8,label_ids_to_fuse:o=null,target_sizes:a=null,subtask:i=null}={}){if(Array.isArray(e)&&e.length!==1)throw Error("Image segmentation pipeline currently only supports a batch size of 1.");let u=await Ye(e),d=u.map(M=>[M.height,M.width]),f=await this.processor(u),{inputNames:m,outputNames:_}=this.model.sessions.model;if(!m.includes("pixel_values")){if(m.length!==1)throw Error(`Expected a single input name, but got ${m.length} inputs: ${m}.`);let M=m[0];if(M in f)throw Error(`Input name ${M} already exists in the inputs.`);f[M]=f.pixel_values}let w=await this.model(f),x=null;if(i!==null)x=e2[i];else if(this.processor.image_processor){for(let[M,I]of Object.entries(e2))if(I in this.processor.image_processor){x=this.processor.image_processor[I].bind(this.processor.image_processor),i=M;break}}let k=this.model.config.id2label,E=[];if(i)if(i==="panoptic"||i==="instance"){let M=x(w,r,s,n,o,a??d)[0],I=M.segmentation;for(let T of M.segments_info){let z=new Uint8ClampedArray(I.data.length);for(let v=0;v<I.data.length;++v)I.data[v]===T.id&&(z[v]=255);let C=new Xe(z,I.dims[1],I.dims[0],1);E.push({score:T.score,label:k[T.label_id],mask:C})}}else if(i==="semantic"){let{segmentation:M,labels:I}=x(w,a??d)[0];for(let T of I){let z=new Uint8ClampedArray(M.data.length);for(let v=0;v<M.data.length;++v)M.data[v]===T&&(z[v]=255);let C=new Xe(z,M.dims[1],M.dims[0],1);E.push({score:null,label:k[T],mask:C})}}else throw Error(`Subtask ${i} not supported.`);else{let I=w[_[0]];for(let T=0;T<d.length;++T){let z=d[T],C=I[T];C.data.some(G=>G<-1e-5||G>1+1e-5)&&C.sigmoid_();let v=await Xe.fromTensor(C.mul_(255).to("uint8")).resize(z[1],z[0]);E.push({label:null,score:null,mask:v})}}return E}};var Oc=class extends en{async _call(e,r={}){let s=await Ye(e),n=await super._call(e,r),o=s.map((a,i)=>{let l=a.clone();return l.putAlpha(n[i].mask),l});return Array.isArray(e)?o:o[0]}};var Ic=class extends pe{async 
_call(e,r,{hypothesis_template:s="This is a photo of {}"}={}){let n=Array.isArray(e),o=await Ye(e),a=r.map(m=>s.replace("{}",m)),i=this.tokenizer(a,{padding:this.model.config.model_type==="siglip"?"max_length":!0,truncation:!0}),{pixel_values:l}=await this.processor(o),u=await this.model({...i,pixel_values:l}),d=this.model.config.model_type==="siglip"?m=>m.sigmoid().data:m=>Oe(m.data),f=[];for(let m of u.logits_per_image){let w=[...d(m)].map((x,k)=>({score:x,label:r[k]}));w.sort((x,k)=>k.score-x.score),f.push(w)}return n?f:f[0]}};var Cc=class extends pe{async _call(e,{threshold:r=.9,percentage:s=!1}={}){let n=Array.isArray(e);if(n&&e.length!==1)throw Error("Object detection pipeline currently only supports a batch size of 1.");let o=await Ye(e),a=s?null:o.map(_=>[_.height,_.width]),{pixel_values:i,pixel_mask:l}=await this.processor(o),u=await this.model({pixel_values:i,pixel_mask:l}),d=this.processor.image_processor.post_process_object_detection(u,r,a),{id2label:f}=this.model.config,m=d.map(_=>_.boxes.map((w,x)=>({score:_.scores[x],label:f[_.classes[x]],box:mc(w,!s)})));return n?m:m[0]}};var Pc=class extends pe{async _call(e,r,{threshold:s=.1,top_k:n=null,percentage:o=!1}={}){let a=Array.isArray(e),i=await Ye(e),l=this.tokenizer(r,{padding:!0,truncation:!0}),u=await this.processor(i),d=[];for(let f=0;f<i.length;++f){let m=i[f],_=o?null:[[m.height,m.width]],w=u.pixel_values[f].unsqueeze_(0),x=await this.model({...l,pixel_values:w}),k;if("post_process_grounded_object_detection"in this.processor){let E=this.processor.post_process_grounded_object_detection(x,l.input_ids,{box_threshold:s,text_threshold:s,target_sizes:_})[0];k=E.boxes.map((M,I)=>({score:E.scores[I],label:E.labels[I],box:mc(M,!o)}))}else{let E=this.processor.image_processor.post_process_object_detection(x,s,_,!0)[0];k=E.boxes.map((M,I)=>({score:E.scores[I],label:r[E.classes[I]],box:mc(M,!o)}))}k.sort((E,M)=>M.score-E.score),n!==null&&(k=k.slice(0,n)),d.push(k)}return a?d:d[0]}};var zc=class extends 
pe{async _call(e,r,s={}){if(Array.isArray(e)){if(e.length!==1)throw Error("Document Question Answering pipeline currently only supports a batch size of 1.");e=e[0]}let n=(await Ye(e))[0],{pixel_values:o}=await this.processor(n),a=`<s_docvqa><s_question>${r}</s_question><s_answer>`,i=this.tokenizer(a,{add_special_tokens:!1,padding:!0,truncation:!0}).input_ids,l=await this.model.generate({inputs:o,max_length:this.model.config.decoder.max_position_embeddings,decoder_input_ids:i,...s}),d=this.tokenizer.batch_decode(l)[0].match(/<s_answer>(.*?)<\/s_answer>/),f=null;return d&&d.length>=2&&(f=d[1].trim()),[{answer:f}]}};var Lc=class extends pe{async _call(e){let r=await Ye(e),s=await this.processor(r),n=await this.model(s),o=[];for(let a of n.reconstruction){let i=a.squeeze().clamp_(0,1).mul_(255).round_().to("uint8");o.push(Xe.fromTensor(i))}return Array.isArray(e)?o:o[0]}};var Nc=class extends pe{async _call(e){let r=await Ye(e),s=await this.processor(r),{predicted_depth:n}=await this.model(s),o=[];for(let a=0;a<r.length;++a){let i=n[a],[l,u]=i.dims.slice(-2),[d,f]=r[a].size,m=(await Pt(i.view(1,1,l,u),{size:[f,d],mode:"bilinear"})).view(f,d),_=m.min().item(),w=m.max().item(),x=m.sub(_).div_(w-_).mul_(255).to("uint8").unsqueeze(0),k=Xe.fromTensor(x);o.push({predicted_depth:m,depth:k})}return Array.isArray(e)?o:o[0]}};var $c=class extends pe{async _call(e,{pooling:r="none",normalize:s=!1,quantize:n=!1,precision:o="binary"}={}){let a=this.tokenizer(e,{padding:!0,truncation:!0}),i=await this.model(a),l=i.last_hidden_state??i.logits??i.token_embeddings;switch(r){case"none":break;case"mean":l=C0(l,a.attention_mask);break;case"first_token":case"cls":l=l.slice(null,0);break;case"last_token":case"eos":l=l.slice(null,-1);break;default:throw Error(`Pooling method '${r}' not supported.`)}return s&&(l=l.normalize(2,-1)),n&&(l=L0(l,o)),l}};var Rc=class extends pe{async _call(e,{pool:r=null}={}){let s=await Ye(e),{pixel_values:n}=await this.processor(s),o=await 
this.model({pixel_values:n}),a;if(r){if(!("pooler_output"in o))throw Error("No pooled output was returned. Make sure the model has a 'pooler' layer when using the 'pool' option.");a=o.pooler_output}else a=o.last_hidden_state??o.logits??o.image_embeds;return a}};var t2=Object.freeze({"text-classification":{tokenizer:J,pipeline:hc,model:Ua,default:{model:"Xenova/distilbert-base-uncased-finetuned-sst-2-english"},type:"text"},"token-classification":{tokenizer:J,pipeline:_c,model:Ql,default:{model:"Xenova/bert-base-multilingual-cased-ner-hrl"},type:"text"},"question-answering":{tokenizer:J,pipeline:gc,model:sc,default:{model:"Xenova/distilbert-base-cased-distilled-squad"},type:"text"},"fill-mask":{tokenizer:J,pipeline:wc,model:rc,default:{model:"onnx-community/ettin-encoder-32m-ONNX",dtype:"fp32"},type:"text"},summarization:{tokenizer:J,pipeline:xc,model:Zs,default:{model:"Xenova/distilbart-cnn-6-6"},type:"text"},translation:{tokenizer:J,pipeline:yc,model:Zs,default:{model:"Xenova/t5-small"},type:"text"},"text2text-generation":{tokenizer:J,pipeline:Lr,model:Zs,default:{model:"Xenova/flan-t5-small"},type:"text"},"text-generation":{tokenizer:J,pipeline:bc,model:tc,default:{model:"onnx-community/Qwen3-0.6B-ONNX",dtype:"q4"},type:"text"},"zero-shot-classification":{tokenizer:J,pipeline:vc,model:Ua,default:{model:"Xenova/distilbert-base-uncased-mnli"},type:"text"},"audio-classification":{pipeline:kc,model:cc,processor:lt,default:{model:"Xenova/wav2vec2-base-superb-ks"},type:"audio"},"zero-shot-audio-classification":{tokenizer:J,pipeline:Ec,model:pr,processor:lt,default:{model:"Xenova/clap-htsat-unfused"},type:"multimodal"},"automatic-speech-recognition":{tokenizer:J,pipeline:Ac,model:[Jl,lc],processor:lt,default:{model:"Xenova/whisper-tiny.en"},type:"multimodal"},"text-to-audio":{tokenizer:J,pipeline:Mc,model:[ec,Zl],processor:[lt,null],default:{model:"onnx-community/Supertonic-TTS-ONNX",dtype:"fp32"},type:"text"},"image-to-text":{tokenizer:J,pipeline:Tc,model:nc,processor:lt
,default:{model:"Xenova/vit-gpt2-image-captioning"},type:"multimodal"},"image-classification":{pipeline:Sc,model:oc,processor:lt,default:{model:"Xenova/vit-base-patch16-224"},type:"multimodal"},"image-segmentation":{pipeline:en,model:[Ba,Da,Fa],processor:lt,default:{model:"Xenova/detr-resnet-50-panoptic"},type:"multimodal"},"background-removal":{pipeline:Oc,model:[Ba,Da,Fa],processor:lt,default:{model:"Xenova/modnet"},type:"image"},"zero-shot-image-classification":{tokenizer:J,pipeline:Ic,model:pr,processor:lt,default:{model:"Xenova/clip-vit-base-patch32"},type:"multimodal"},"object-detection":{pipeline:Cc,model:ac,processor:lt,default:{model:"Xenova/detr-resnet-50"},type:"multimodal"},"zero-shot-object-detection":{tokenizer:J,pipeline:Pc,model:ic,processor:lt,default:{model:"Xenova/owlvit-base-patch32"},type:"multimodal"},"document-question-answering":{tokenizer:J,pipeline:zc,model:uc,processor:lt,default:{model:"Xenova/donut-base-finetuned-docvqa"},type:"multimodal"},"image-to-image":{pipeline:Lc,model:pc,processor:lt,default:{model:"Xenova/swin2SR-classical-sr-x2-64"},type:"image"},"depth-estimation":{pipeline:Nc,model:dc,processor:lt,default:{model:"onnx-community/depth-anything-v2-small"},type:"image"},"feature-extraction":{tokenizer:J,pipeline:$c,model:pr,default:{model:"onnx-community/all-MiniLM-L6-v2-ONNX",dtype:"fp32"},type:"text"},"image-feature-extraction":{processor:lt,pipeline:Rc,model:[fc,pr],default:{model:"onnx-community/dinov3-vits16-pretrain-lvd1689m-ONNX",dtype:"fp32"},type:"image"}}),cz=Object.freeze({"sentiment-analysis":"text-classification",ner:"token-classification",asr:"automatic-speech-recognition","text-to-speech":"text-to-audio",embeddings:"feature-extraction"});async function uz(t,e=null,{progress_callback:r=null,config:s=null,cache_dir:n=null,local_files_only:o=!1,revision:a="main",device:i=null,dtype:l=null,subfolder:u="onnx",use_external_data_format:d=null,model_file_name:f=null,session_options:m={}}={}){t=cz[t]??t;let 
_=t2[t.split("_",1)[0]];if(!_)throw Error(`Unsupported pipeline: ${t}. Must be one of [${Object.keys(t2)}]`);e||(e=_.default.model,console.log(`No model specified. Using default model: "${e}".`),!l&&_.default.dtype&&(l=_.default.dtype));let w={progress_callback:r,config:s,cache_dir:n,local_files_only:o,revision:a,device:i,dtype:l,subfolder:u,use_external_data_format:d,model_file_name:f,session_options:m},x=new Map([["tokenizer",_.tokenizer],["model",_.model],["processor",_.processor]]),k=await pz(x,e,w);k.task=t,wr(r,{status:"ready",task:t,model:e});let E=_.pipeline;return new E(k)}async function pz(t,e,r){let s=Object.create(null),n=[];for(let[o,a]of t.entries()){if(!a)continue;let i;Array.isArray(a)?i=new Promise(async(l,u)=>{let d;for(let f of a){if(f===null){l(null);return}try{l(await f.from_pretrained(e,r));return}catch(m){if(m.message?.includes("Unsupported model type"))d=m;else if(m.message?.includes("Could not locate file"))d=m;else{u(m);return}}}u(d)}):i=a.from_pretrained(e,r),s[o]=i,n.push(i)}await Promise.all(n);for(let[o,a]of Object.entries(s))s[o]=await a;return s}var dz=t=>t>=19968&&t<=40959||t>=13312&&t<=19903||t>=131072&&t<=173791||t>=173824&&t<=177983||t>=177984&&t<=178207||t>=178208&&t<=183983||t>=63744&&t<=64255||t>=194560&&t<=195103,Vx=class{put(e){throw Error("Not implemented")}end(){throw Error("Not implemented")}},r2=be.IS_PROCESS_AVAILABLE?t=>process.stdout.write(t):t=>console.log(t),Hx=class extends Vx{constructor(e,{skip_prompt:r=!1,callback_function:s=null,token_callback_function:n=null,skip_special_tokens:o=!0,decode_kwargs:a={},...i}={}){super(),this.tokenizer=e,this.skip_prompt=r,this.callback_function=s??r2,this.token_callback_function=n,this.decode_kwargs={skip_special_tokens:o,...a,...i},this.token_cache=[],this.print_len=0,this.next_tokens_are_prompt=!0,this.special_ids=new Set(this.tokenizer.all_special_ids.map(BigInt))}put(e){if(e.length>1)throw Error("TextStreamer only supports batch size of 1");let 
r=this.next_tokens_are_prompt;if(r&&(this.next_tokens_are_prompt=!1,this.skip_prompt))return;let s=e[0];if(this.token_callback_function?.(s),s.length===1&&this.special_ids.has(s[0])){if(this.decode_kwargs.skip_special_tokens)return;if(this.token_cache.length>0){let l=this.tokenizer.decode(this.token_cache,this.decode_kwargs).slice(this.print_len);this.on_finalized_text(l,!1),this.token_cache=[],this.print_len=0}let a=this.tokenizer.decode(s,this.decode_kwargs);this.on_finalized_text(a,!1);return}this.token_cache=dt(this.token_cache,s);let n=this.tokenizer.decode(this.token_cache,this.decode_kwargs),o;r||n.endsWith(`
|
|
28
28
|
`)?(o=n.slice(this.print_len),this.token_cache=[],this.print_len=0):n.length>0&&dz(n.charCodeAt(n.length-1))?(o=n.slice(this.print_len),this.print_len+=o.length):(o=n.slice(this.print_len,n.lastIndexOf(" ")+1),this.print_len+=o.length),this.on_finalized_text(o,!1)}end(){let e;this.token_cache.length>0?(e=this.tokenizer.decode(this.token_cache,this.decode_kwargs).slice(this.print_len),this.token_cache=[],this.print_len=0):e="",this.next_tokens_are_prompt=!0,this.on_finalized_text(e,!0)}on_finalized_text(e,r){e.length>0&&this.callback_function?.(e),r&&this.callback_function===r2&&be.IS_PROCESS_AVAILABLE&&this.callback_function?.(`
|
|
29
29
|
`)}},cb=class extends Hx{constructor(e,{skip_prompt:r=!1,callback_function:s=null,token_callback_function:n=null,on_chunk_start:o=null,on_chunk_end:a=null,on_finalize:i=null,time_precision:l=.02,skip_special_tokens:u=!0,decode_kwargs:d={}}={}){super(e,{skip_prompt:r,skip_special_tokens:u,callback_function:s,token_callback_function:n,decode_kwargs:d}),this.timestamp_begin=e.timestamp_begin,this.on_chunk_start=o,this.on_chunk_end=a,this.on_finalize=i,this.time_precision=l,this.waiting_for_timestamp=!1}put(e){if(e.length>1)throw Error("WhisperTextStreamer only supports batch size of 1");let r=e[0];if(r.length===1){let s=Number(r[0])-this.timestamp_begin;if(s>=0){let n=s*this.time_precision;this.waiting_for_timestamp?this.on_chunk_end?.(n):this.on_chunk_start?.(n),this.waiting_for_timestamp=!this.waiting_for_timestamp,this.token_callback_function?.(r);return}}return super.put(e)}end(){super.end(),this.on_finalize?.()}};var ja=class{constructor(e,r){this.image=e,this.timestamp=r}},Uc=class{constructor(e,r){e.length>0&&e[0]instanceof Xe&&(e=e.map((s,n)=>new ja(s,(n+1)/(e.length+1)*r))),this.frames=e,this.duration=r}get width(){return this.frames[0].image.width}get height(){return this.frames[0].image.height}get fps(){return this.frames.length/this.duration}};async function s2(t,{num_frames:e=null,fps:r=null}={}){if(!be.IS_BROWSER_ENV)throw new Error("`load_video` is currently only supported in browser environments.");if(e==null&&r==null)throw new Error("Either num_frames or fps must be provided.");let s=[],n=document.createElement("video");if(n.crossOrigin="anonymous",n.muted=!0,typeof t=="string")n.src=t;else if(t instanceof Blob)n.src=URL.createObjectURL(t);else if(t instanceof HTMLVideoElement)n.src=t.src;else throw new Error("Invalid URL or video element provided.");if(await new Promise(f=>n.onloadedmetadata=f),n.seekable.start(0)===n.seekable.end(0)){let m=await(await fetch(n.src)).blob();n.src=URL.createObjectURL(m),await new Promise(_=>n.onloadedmetadata=_)}let 
o=n.duration,a,i;e!=null?(a=e,i=e===1?0:o/(e-1)):(i=1/r,a=Math.floor(o/i));let l=[];for(let f=0;f<a;++f)l.push(e===1?o/2:f*i);let u=document.createElement("canvas");u.width=n.videoWidth,u.height=n.videoHeight;let d=u.getContext("2d",{willReadFrequently:!0});for(let f of l){n.currentTime=f,await new Promise(x=>{n.onseeked=x}),d.drawImage(n,0,0,u.width,u.height);let m=d.getImageData(0,0,u.width,u.height),_=new Xe(m.data,u.width,u.height,4),w=new ja(_,f);s.push(w)}return n.remove(),new Uc(s,o)}0&&(module.exports={ASTFeatureExtractor,ASTForAudioClassification,ASTModel,ASTPreTrainedModel,AlbertForMaskedLM,AlbertForQuestionAnswering,AlbertForSequenceClassification,AlbertModel,AlbertPreTrainedModel,AlbertTokenizer,ApertusForCausalLM,ApertusModel,ApertusPreTrainedModel,ArceeForCausalLM,ArceeModel,ArceePreTrainedModel,AudioClassificationPipeline,AutoConfig,AutoFeatureExtractor,AutoImageProcessor,AutoModel,AutoModelForAudioClassification,AutoModelForAudioFrameClassification,AutoModelForAudioTextToText,AutoModelForCTC,AutoModelForCausalLM,AutoModelForDepthEstimation,AutoModelForDocumentQuestionAnswering,AutoModelForImageClassification,AutoModelForImageFeatureExtraction,AutoModelForImageMatting,AutoModelForImageSegmentation,AutoModelForImageTextToText,AutoModelForImageToImage,AutoModelForMaskGeneration,AutoModelForMaskedLM,AutoModelForNormalEstimation,AutoModelForObjectDetection,AutoModelForPoseEstimation,AutoModelForQuestionAnswering,AutoModelForSemanticSegmentation,AutoModelForSeq2SeqLM,AutoModelForSequenceClassification,AutoModelForSpeechSeq2Seq,AutoModelForTextToSpectrogram,AutoModelForTextToWaveform,AutoModelForTokenClassification,AutoModelForUniversalSegmentation,AutoModelForVision2Seq,AutoModelForXVector,AutoModelForZeroShotObjectDetection,AutoProcessor,AutoTokenizer,AutomaticSpeechRecognitionPipeline,BackgroundRemovalPipeline,BartForConditionalGeneration,BartForSequenceClassification,BartModel,BartPretrainedModel,BartTokenizer,BaseStreamer,BeitFeatureExtractor,BeitForIm
ageClassification,BeitModel,BeitPreTrainedModel,BertForMaskedLM,BertForQuestionAnswering,BertForSequenceClassification,BertForTokenClassification,BertModel,BertPreTrainedModel,BertTokenizer,BitImageProcessor,BlenderbotForConditionalGeneration,BlenderbotModel,BlenderbotPreTrainedModel,BlenderbotSmallForConditionalGeneration,BlenderbotSmallModel,BlenderbotSmallPreTrainedModel,BlenderbotSmallTokenizer,BlenderbotTokenizer,BloomForCausalLM,BloomModel,BloomPreTrainedModel,BloomTokenizer,CLIPFeatureExtractor,CLIPImageProcessor,CLIPModel,CLIPPreTrainedModel,CLIPSegForImageSegmentation,CLIPSegModel,CLIPSegPreTrainedModel,CLIPTextModel,CLIPTextModelWithProjection,CLIPTokenizer,CLIPVisionModel,CLIPVisionModelWithProjection,CamembertForMaskedLM,CamembertForQuestionAnswering,CamembertForSequenceClassification,CamembertForTokenClassification,CamembertModel,CamembertPreTrainedModel,CamembertTokenizer,ChatterboxFeatureExtractor,ChatterboxModel,ChatterboxPreTrainedModel,ChatterboxProcessor,ChineseCLIPFeatureExtractor,ChineseCLIPModel,ChineseCLIPPreTrainedModel,ClapAudioModelWithProjection,ClapFeatureExtractor,ClapModel,ClapPreTrainedModel,ClapTextModelWithProjection,ClassifierFreeGuidanceLogitsProcessor,CodeGenForCausalLM,CodeGenModel,CodeGenPreTrainedModel,CodeGenTokenizer,CodeLlamaTokenizer,CohereForCausalLM,CohereModel,CoherePreTrainedModel,CohereTokenizer,ConvBertForMaskedLM,ConvBertForQuestionAnswering,ConvBertForSequenceClassification,ConvBertForTokenClassification,ConvBertModel,ConvBertPreTrainedModel,ConvBertTokenizer,ConvNextFeatureExtractor,ConvNextForImageClassification,ConvNextImageProcessor,ConvNextModel,ConvNextPreTrainedModel,ConvNextV2ForImageClassification,ConvNextV2Model,ConvNextV2PreTrainedModel,DFineForObjectDetection,DFineModel,DFinePreTrainedModel,DINOv3ConvNextModel,DINOv3ConvNextPreTrainedModel,DINOv3ViTImageProcessor,DINOv3ViTModel,DINOv3ViTPreTrainedModel,DPTFeatureExtractor,DPTForDepthEstimation,DPTImageProcessor,DPTModel,DPTPreTrainedModel,DacDecoderModel
,DacDecoderOutput,DacEncoderModel,DacEncoderOutput,DacFeatureExtractor,DacModel,DacPreTrainedModel,DebertaForMaskedLM,DebertaForQuestionAnswering,DebertaForSequenceClassification,DebertaForTokenClassification,DebertaModel,DebertaPreTrainedModel,DebertaTokenizer,DebertaV2ForMaskedLM,DebertaV2ForQuestionAnswering,DebertaV2ForSequenceClassification,DebertaV2ForTokenClassification,DebertaV2Model,DebertaV2PreTrainedModel,DebertaV2Tokenizer,DecisionTransformerModel,DecisionTransformerPreTrainedModel,DeiTFeatureExtractor,DeiTForImageClassification,DeiTImageProcessor,DeiTModel,DeiTPreTrainedModel,DepthAnythingForDepthEstimation,DepthAnythingPreTrainedModel,DepthEstimationPipeline,DepthProForDepthEstimation,DepthProPreTrainedModel,DetrFeatureExtractor,DetrForObjectDetection,DetrForSegmentation,DetrImageProcessor,DetrModel,DetrObjectDetectionOutput,DetrPreTrainedModel,DetrSegmentationOutput,Dinov2ForImageClassification,Dinov2Model,Dinov2PreTrainedModel,Dinov2WithRegistersForImageClassification,Dinov2WithRegistersModel,Dinov2WithRegistersPreTrainedModel,DistilBertForMaskedLM,DistilBertForQuestionAnswering,DistilBertForSequenceClassification,DistilBertForTokenClassification,DistilBertModel,DistilBertPreTrainedModel,DistilBertTokenizer,DocumentQuestionAnsweringPipeline,DonutFeatureExtractor,DonutImageProcessor,DonutSwinModel,DonutSwinPreTrainedModel,EdgeTamModel,EfficientNetForImageClassification,EfficientNetImageProcessor,EfficientNetModel,EfficientNetPreTrainedModel,ElectraForMaskedLM,ElectraForQuestionAnswering,ElectraForSequenceClassification,ElectraForTokenClassification,ElectraModel,ElectraPreTrainedModel,ElectraTokenizer,EncodecFeatureExtractor,EosTokenCriteria,Ernie4_5ForCausalLM,Ernie4_5Model,Ernie4_5PretrainedModel,EsmForMaskedLM,EsmForSequenceClassification,EsmForTokenClassification,EsmModel,EsmPreTrainedModel,EsmTokenizer,ExaoneForCausalLM,ExaoneModel,ExaonePreTrainedModel,FalconForCausalLM,FalconH1ForCausalLM,FalconH1Model,FalconH1PreTrainedModel,FalconModel,FalconP
reTrainedModel,FalconTokenizer,FastViTForImageClassification,FastViTModel,FastViTPreTrainedModel,FeatureExtractionPipeline,FeatureExtractor,FillMaskPipeline,Florence2ForConditionalGeneration,Florence2PreTrainedModel,Florence2Processor,ForcedBOSTokenLogitsProcessor,ForcedEOSTokenLogitsProcessor,GLPNFeatureExtractor,GLPNForDepthEstimation,GLPNModel,GLPNPreTrainedModel,GPT2LMHeadModel,GPT2Model,GPT2PreTrainedModel,GPT2Tokenizer,GPTBigCodeForCausalLM,GPTBigCodeModel,GPTBigCodePreTrainedModel,GPTJForCausalLM,GPTJModel,GPTJPreTrainedModel,GPTNeoForCausalLM,GPTNeoModel,GPTNeoPreTrainedModel,GPTNeoXForCausalLM,GPTNeoXModel,GPTNeoXPreTrainedModel,GPTNeoXTokenizer,Gemma2ForCausalLM,Gemma2Model,Gemma2PreTrainedModel,Gemma3ForCausalLM,Gemma3Model,Gemma3PreTrainedModel,Gemma3nAudioFeatureExtractor,Gemma3nForConditionalGeneration,Gemma3nPreTrainedModel,Gemma3nProcessor,GemmaForCausalLM,GemmaModel,GemmaPreTrainedModel,GemmaTokenizer,GlmForCausalLM,GlmModel,GlmPreTrainedModel,GptOssForCausalLM,GptOssModel,GptOssPreTrainedModel,GraniteForCausalLM,GraniteModel,GraniteMoeHybridForCausalLM,GraniteMoeHybridModel,GraniteMoeHybridPreTrainedModel,GranitePreTrainedModel,GroundingDinoForObjectDetection,GroundingDinoImageProcessor,GroundingDinoPreTrainedModel,GroundingDinoProcessor,GroupViTModel,GroupViTPreTrainedModel,HeliumForCausalLM,HeliumModel,HeliumPreTrainedModel,HerbertTokenizer,HieraForImageClassification,HieraModel,HieraPreTrainedModel,HubertForCTC,HubertForSequenceClassification,HubertModel,HubertPreTrainedModel,HunYuanDenseV1ForCausalLM,HunYuanDenseV1Model,HunYuanDenseV1PreTrainedModel,IJepaForImageClassification,IJepaModel,IJepaPreTrainedModel,Idefics3ForConditionalGeneration,Idefics3ImageProcessor,Idefics3PreTrainedModel,Idefics3Processor,ImageClassificationPipeline,ImageFeatureExtractionPipeline,ImageFeatureExtractor,ImageProcessor,ImageSegmentationPipeline,ImageToImagePipeline,ImageToTextPipeline,InterruptableStoppingCriteria,JAISLMHeadModel,JAISModel,JAISPreTrainedModel,JinaC
LIPImageProcessor,JinaCLIPModel,JinaCLIPPreTrainedModel,JinaCLIPProcessor,JinaCLIPTextModel,JinaCLIPVisionModel,Lfm2ForCausalLM,Lfm2Model,Lfm2MoeForCausalLM,Lfm2MoeModel,Lfm2MoePreTrainedModel,Lfm2PreTrainedModel,LiteWhisperForConditionalGeneration,Llama4ForCausalLM,Llama4PreTrainedModel,LlamaForCausalLM,LlamaModel,LlamaPreTrainedModel,LlamaTokenizer,LlavaForConditionalGeneration,LlavaOnevisionForConditionalGeneration,LlavaOnevisionImageProcessor,LlavaPreTrainedModel,LlavaProcessor,LlavaQwen2ForCausalLM,LogitsProcessor,LogitsProcessorList,LogitsWarper,LongT5ForConditionalGeneration,LongT5Model,LongT5PreTrainedModel,M2M100ForConditionalGeneration,M2M100Model,M2M100PreTrainedModel,M2M100Tokenizer,MBart50Tokenizer,MBartForCausalLM,MBartForConditionalGeneration,MBartForSequenceClassification,MBartModel,MBartPreTrainedModel,MBartTokenizer,MPNetForMaskedLM,MPNetForQuestionAnswering,MPNetForSequenceClassification,MPNetForTokenClassification,MPNetModel,MPNetPreTrainedModel,MPNetTokenizer,MT5ForConditionalGeneration,MT5Model,MT5PreTrainedModel,MarianMTModel,MarianModel,MarianPreTrainedModel,MarianTokenizer,Mask2FormerImageProcessor,MaskFormerFeatureExtractor,MaskFormerForInstanceSegmentation,MaskFormerImageProcessor,MaskFormerModel,MaskFormerPreTrainedModel,MaxLengthCriteria,Metric3DForDepthEstimation,Metric3DPreTrainedModel,Metric3Dv2ForDepthEstimation,Metric3Dv2PreTrainedModel,MgpstrForSceneTextRecognition,MgpstrModelOutput,MgpstrPreTrainedModel,MgpstrProcessor,MgpstrTokenizer,MimiDecoderModel,MimiDecoderOutput,MimiEncoderModel,MimiEncoderOutput,MimiModel,MimiPreTrainedModel,MinLengthLogitsProcessor,MinNewTokensLengthLogitsProcessor,MistralForCausalLM,MistralModel,MistralPreTrainedModel,MobileBertForMaskedLM,MobileBertForQuestionAnswering,MobileBertForSequenceClassification,MobileBertModel,MobileBertPreTrainedModel,MobileBertTokenizer,MobileLLMForCausalLM,MobileLLMModel,MobileLLMPreTrainedModel,MobileNetV1FeatureExtractor,MobileNetV1ForImageClassification,MobileNetV1ForSem
anticSegmentation,MobileNetV1ImageProcessor,MobileNetV1Model,MobileNetV1PreTrainedModel,MobileNetV2FeatureExtractor,MobileNetV2ForImageClassification,MobileNetV2ForSemanticSegmentation,MobileNetV2ImageProcessor,MobileNetV2Model,MobileNetV2PreTrainedModel,MobileNetV3FeatureExtractor,MobileNetV3ForImageClassification,MobileNetV3ForSemanticSegmentation,MobileNetV3ImageProcessor,MobileNetV3Model,MobileNetV3PreTrainedModel,MobileNetV4FeatureExtractor,MobileNetV4ForImageClassification,MobileNetV4ForSemanticSegmentation,MobileNetV4ImageProcessor,MobileNetV4Model,MobileNetV4PreTrainedModel,MobileViTFeatureExtractor,MobileViTForImageClassification,MobileViTImageProcessor,MobileViTModel,MobileViTPreTrainedModel,MobileViTV2ForImageClassification,MobileViTV2Model,MobileViTV2PreTrainedModel,ModernBertDecoderForCausalLM,ModernBertDecoderModel,ModernBertDecoderPreTrainedModel,ModernBertForMaskedLM,ModernBertForSequenceClassification,ModernBertForTokenClassification,ModernBertModel,ModernBertPreTrainedModel,Moondream1ForConditionalGeneration,MoonshineFeatureExtractor,MoonshineForConditionalGeneration,MoonshineModel,MoonshinePreTrainedModel,MoonshineProcessor,MptForCausalLM,MptModel,MptPreTrainedModel,MultiModalityCausalLM,MultiModalityPreTrainedModel,MusicgenForCausalLM,MusicgenForConditionalGeneration,MusicgenModel,MusicgenPreTrainedModel,NanoChatForCausalLM,NanoChatModel,NanoChatPreTrainedModel,NeoBertForMaskedLM,NeoBertForQuestionAnswering,NeoBertForSequenceClassification,NeoBertForTokenClassification,NeoBertModel,NeoBertPreTrainedModel,NllbTokenizer,NoBadWordsLogitsProcessor,NoRepeatNGramLogitsProcessor,NomicBertModel,NomicBertPreTrainedModel,NougatImageProcessor,NougatTokenizer,OPTForCausalLM,OPTModel,OPTPreTrainedModel,ObjectDetectionPipeline,Olmo2ForCausalLM,Olmo2Model,Olmo2PreTrainedModel,Olmo3ForCausalLM,Olmo3Model,Olmo3PreTrainedModel,OlmoForCausalLM,OlmoModel,OlmoPreTrainedModel,OpenELMForCausalLM,OpenELMModel,OpenELMPreTrainedModel,OwlViTFeatureExtractor,OwlViTForObject
Detection,OwlViTImageProcessor,OwlViTModel,OwlViTPreTrainedModel,OwlViTProcessor,Owlv2ForObjectDetection,Owlv2ImageProcessor,Owlv2Model,Owlv2PreTrainedModel,PaliGemmaForConditionalGeneration,PaliGemmaPreTrainedModel,PaliGemmaProcessor,ParakeetFeatureExtractor,ParakeetForCTC,ParakeetPreTrainedModel,PatchTSMixerForPrediction,PatchTSMixerModel,PatchTSMixerPreTrainedModel,PatchTSTForPrediction,PatchTSTModel,PatchTSTPreTrainedModel,Phi3ForCausalLM,Phi3Model,Phi3PreTrainedModel,Phi3VForCausalLM,Phi3VImageProcessor,Phi3VPreTrainedModel,Phi3VProcessor,PhiForCausalLM,PhiModel,PhiPreTrainedModel,PixtralImageProcessor,PixtralProcessor,PreTrainedModel,PreTrainedTokenizer,PretrainedConfig,Processor,PvtForImageClassification,PvtImageProcessor,PvtModel,PvtPreTrainedModel,PyAnnoteFeatureExtractor,PyAnnoteForAudioFrameClassification,PyAnnoteModel,PyAnnotePreTrainedModel,PyAnnoteProcessor,QuestionAnsweringPipeline,Qwen2ForCausalLM,Qwen2Model,Qwen2PreTrainedModel,Qwen2Tokenizer,Qwen2VLForConditionalGeneration,Qwen2VLImageProcessor,Qwen2VLPreTrainedModel,Qwen2VLProcessor,Qwen3ForCausalLM,Qwen3Model,Qwen3PreTrainedModel,RFDetrForObjectDetection,RFDetrModel,RFDetrObjectDetectionOutput,RFDetrPreTrainedModel,RTDetrForObjectDetection,RTDetrImageProcessor,RTDetrModel,RTDetrObjectDetectionOutput,RTDetrPreTrainedModel,RTDetrV2ForObjectDetection,RTDetrV2Model,RTDetrV2ObjectDetectionOutput,RTDetrV2PreTrainedModel,RawAudio,RawImage,RawVideo,RawVideoFrame,RepetitionPenaltyLogitsProcessor,ResNetForImageClassification,ResNetModel,ResNetPreTrainedModel,RoFormerForMaskedLM,RoFormerForQuestionAnswering,RoFormerForSequenceClassification,RoFormerForTokenClassification,RoFormerModel,RoFormerPreTrainedModel,RoFormerTokenizer,RobertaForMaskedLM,RobertaForQuestionAnswering,RobertaForSequenceClassification,RobertaForTokenClassification,RobertaModel,RobertaPreTrainedModel,RobertaTokenizer,Sam2ImageProcessor,Sam2ImageSegmentationOutput,Sam2Model,Sam2PreTrainedModel,Sam2Processor,Sam2VideoProcessor,Sam3ImageProc
essor,Sam3TrackerModel,SamImageProcessor,SamImageSegmentationOutput,SamModel,SamPreTrainedModel,SamProcessor,SapiensFeatureExtractor,SapiensForDepthEstimation,SapiensForNormalEstimation,SapiensForSemanticSegmentation,SapiensImageProcessor,SapiensPreTrainedModel,SeamlessM4TFeatureExtractor,SegformerFeatureExtractor,SegformerForImageClassification,SegformerForSemanticSegmentation,SegformerImageProcessor,SegformerModel,SegformerPreTrainedModel,SiglipImageProcessor,SiglipModel,SiglipPreTrainedModel,SiglipTextModel,SiglipTokenizer,SiglipVisionModel,SmolLM3ForCausalLM,SmolLM3Model,SmolLM3PreTrainedModel,SmolVLMForConditionalGeneration,SmolVLMImageProcessor,SmolVLMProcessor,SnacDecoderModel,SnacEncoderModel,SnacFeatureExtractor,SnacModel,SnacPreTrainedModel,SpeechT5FeatureExtractor,SpeechT5ForSpeechToText,SpeechT5ForTextToSpeech,SpeechT5HifiGan,SpeechT5Model,SpeechT5PreTrainedModel,SpeechT5Processor,SpeechT5Tokenizer,SqueezeBertForMaskedLM,SqueezeBertForQuestionAnswering,SqueezeBertForSequenceClassification,SqueezeBertModel,SqueezeBertPreTrainedModel,SqueezeBertTokenizer,StableLmForCausalLM,StableLmModel,StableLmPreTrainedModel,Starcoder2ForCausalLM,Starcoder2Model,Starcoder2PreTrainedModel,StoppingCriteria,StoppingCriteriaList,StyleTextToSpeech2Model,StyleTextToSpeech2PreTrainedModel,SummarizationPipeline,SupertonicForConditionalGeneration,SupertonicPreTrainedModel,SuppressTokensAtBeginLogitsProcessor,Swin2SRForImageSuperResolution,Swin2SRImageProcessor,Swin2SRModel,Swin2SRPreTrainedModel,SwinForImageClassification,SwinForSemanticSegmentation,SwinModel,SwinPreTrainedModel,T5ForConditionalGeneration,T5Model,T5PreTrainedModel,T5Tokenizer,TableTransformerForObjectDetection,TableTransformerModel,TableTransformerObjectDetectionOutput,TableTransformerPreTrainedModel,TemperatureLogitsWarper,Tensor,Text2TextGenerationPipeline,TextClassificationPipeline,TextGenerationPipeline,TextStreamer,TextToAudioPipeline,TokenClassificationPipeline,TokenizersBackend,TopKLogitsWarper,TopPLogits
Warper,TrOCRForCausalLM,TrOCRPreTrainedModel,TranslationPipeline,UltravoxModel,UltravoxPreTrainedModel,UltravoxProcessor,UniSpeechForCTC,UniSpeechForSequenceClassification,UniSpeechModel,UniSpeechPreTrainedModel,UniSpeechSatForAudioFrameClassification,UniSpeechSatForCTC,UniSpeechSatForSequenceClassification,UniSpeechSatModel,UniSpeechSatPreTrainedModel,VLChatProcessor,VLMImageProcessor,VaultGemmaForCausalLM,VaultGemmaModel,VaultGemmaPreTrainedModel,ViTFeatureExtractor,ViTForImageClassification,ViTImageProcessor,ViTMAEModel,ViTMAEPreTrainedModel,ViTMSNForImageClassification,ViTMSNModel,ViTMSNPreTrainedModel,ViTModel,ViTPreTrainedModel,VisionEncoderDecoderModel,VitMatteForImageMatting,VitMatteImageProcessor,VitMattePreTrainedModel,VitPoseForPoseEstimation,VitPoseImageProcessor,VitPosePreTrainedModel,VitsModel,VitsModelOutput,VitsPreTrainedModel,VitsTokenizer,VoxtralForConditionalGeneration,VoxtralProcessor,Wav2Vec2BertForCTC,Wav2Vec2BertForSequenceClassification,Wav2Vec2BertModel,Wav2Vec2BertPreTrainedModel,Wav2Vec2CTCTokenizer,Wav2Vec2FeatureExtractor,Wav2Vec2ForAudioFrameClassification,Wav2Vec2ForCTC,Wav2Vec2ForSequenceClassification,Wav2Vec2Model,Wav2Vec2PreTrainedModel,Wav2Vec2Processor,Wav2Vec2ProcessorWithLM,WavLMForAudioFrameClassification,WavLMForCTC,WavLMForSequenceClassification,WavLMForXVector,WavLMModel,WavLMPreTrainedModel,WeSpeakerFeatureExtractor,WeSpeakerResNetModel,WeSpeakerResNetPreTrainedModel,WhisperFeatureExtractor,WhisperForConditionalGeneration,WhisperModel,WhisperPreTrainedModel,WhisperProcessor,WhisperTextStreamer,WhisperTimeStampLogitsProcessor,WhisperTokenizer,XLMForQuestionAnswering,XLMForSequenceClassification,XLMForTokenClassification,XLMModel,XLMPreTrainedModel,XLMRobertaForMaskedLM,XLMRobertaForQuestionAnswering,XLMRobertaForSequenceClassification,XLMRobertaForTokenClassification,XLMRobertaModel,XLMRobertaPreTrainedModel,XLMRobertaTokenizer,XLMTokenizer,XLMWithLMHeadModel,XVectorOutput,YolosFeatureExtractor,YolosForObjectDetection,Yolos
ImageProcessor,YolosModel,YolosObjectDetectionOutput,YolosPreTrainedModel,YoutuForCausalLM,YoutuModel,YoutuPreTrainedModel,ZeroShotAudioClassificationPipeline,ZeroShotClassificationPipeline,ZeroShotImageClassificationPipeline,ZeroShotObjectDetectionPipeline,cat,cos_sim,dot,env,full,full_like,interpolate,interpolate_4d,layer_norm,load_image,load_video,log_softmax,matmul,mean,mean_pooling,ones,ones_like,permute,pipeline,quantize_embeddings,rand,randn,read_audio,rfft,slice,softmax,stack,std_mean,topk,zeros,zeros_like});
|