npm - @huggingface/transformers - Versions diffs - 3.0.2 → 3.1.1 - Mend

@huggingface/transformers 3.0.2 → 3.1.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (258) hide show

package/types/models/janus/processing_janus.d.ts ADDED Viewed

@@ -0,0 +1,77 @@
+export class VLChatProcessor extends Processor {
+    static image_processor_class: typeof AutoImageProcessor;
+    static tokenizer_class: typeof AutoTokenizer;
+    constructor(config: any, components: any);
+    image_tag: any;
+    image_start_tag: any;
+    image_end_tag: any;
+    num_image_tokens: any;
+    /**
+     * @typedef {Object} MultimodalMessageProperties Additional properties for multimodal messages.
+     * @property {(RawImage | string | URL)[]} [images] The images in the message.
+     * @typedef {(import('../../tokenizers.js').Message & MultimodalMessageProperties)[]} MultimodalConversation The conversation possibly containing multimodal inputs.
+     */
+    /**
+     * @typedef {Object} VLChatProcessorResult The processed input.
+     * @property {Tensor} input_ids The input IDs.
+     * @property {Tensor} attention_mask The attention mask.
+     * @property {Tensor} images_seq_mask The image sequence mask.
+     * @property {Tensor} images_emb_mask The image embedding mask.
+     */
+    /**
+     * @param {MultimodalConversation} conversation The chat messages to process.
+     * @param {Object} options Additional options for processing.
+     * @param {RawImage|RawImage[]} [options.images] The images to process, if not set in the conversation.
+     * @param {string} [options.chat_template="default"] The chat template to use.
+     * @returns {Promise<VLChatProcessorResult | VLChatProcessorResult & import('../../base/image_processors_utils.js').ImageProcessorResult>} The processed input.
+     */
+    _call(conversation: (import("../../tokenizers.js").Message & {
+        /**
+         * The images in the message.
+         */
+        images?: (RawImage | string | URL)[];
+    })[], { images, chat_template, }?: {
+        images?: RawImage | RawImage[];
+        chat_template?: string;
+    }): Promise<{
+        /**
+         * The input IDs.
+         */
+        input_ids: Tensor;
+        /**
+         * The attention mask.
+         */
+        attention_mask: Tensor;
+        /**
+         * The image sequence mask.
+         */
+        images_seq_mask: Tensor;
+        /**
+         * The image embedding mask.
+         */
+        images_emb_mask: Tensor;
+    } | ({
+        /**
+         * The input IDs.
+         */
+        input_ids: Tensor;
+        /**
+         * The attention mask.
+         */
+        attention_mask: Tensor;
+        /**
+         * The image sequence mask.
+         */
+        images_seq_mask: Tensor;
+        /**
+         * The image embedding mask.
+         */
+        images_emb_mask: Tensor;
+    } & import("../../base/image_processors_utils.js").ImageProcessorResult)>;
+}
+import { Processor } from "../../base/processing_utils.js";
+import { RawImage } from "../../utils/image.js";
+import { Tensor } from "../../utils/tensor.js";
+import { AutoImageProcessor } from "../auto/image_processing_auto.js";
+import { AutoTokenizer } from "../../tokenizers.js";
+//# sourceMappingURL=processing_janus.d.ts.map

package/types/models/janus/processing_janus.d.ts.map ADDED Viewed

@@ -0,0 +1 @@

+ {"version":3,"file":"processing_janus.d.ts","sourceRoot":"","sources":["../../../src/models/janus/processing_janus.js"],"names":[],"mappings":"AAQA;IACI,wDAAiD;IACjD,6CAAsC;IAGtC,0CAOC;IAJG,eAAsC;IACtC,qBAAkD;IAClD,mBAA8C;IAC9C,sBAAoD;IAGxD;;;;OAIG;IAEH;;;;;;OAMG;IAEH;;;;;;OAMG;IACH;;;;iBAnBc,CAAC,QAAQ,GAAG,MAAM,GAAG,GAAG,CAAC,EAAE;;QAeA,MAAM,GAApC,QAAQ,GAAC,QAAQ,EAAE;QACF,aAAa,GAA9B,MAAM;;;;;mBAVH,MAAM;;;;wBACN,MAAM;;;;yBACN,MAAM;;;;yBACN,MAAM;;;;;mBAHN,MAAM;;;;wBACN,MAAM;;;;yBACN,MAAM;;;;yBACN,MAAM;8EAwFnB;CACJ;0BAzHyB,gCAAgC;yBAKjC,sBAAsB;uBADxB,uBAAuB;mCAHX,kCAAkC;8BACvC,qBAAqB"}

package/types/models/jina_clip/image_processing_jina_clip.d.ts ADDED Viewed

@@ -0,0 +1,5 @@
+export class JinaCLIPImageProcessor extends ImageProcessor {
+    constructor(config: any);
+}
+import { ImageProcessor } from "../../base/image_processors_utils.js";
+//# sourceMappingURL=image_processing_jina_clip.d.ts.map

package/types/models/jina_clip/image_processing_jina_clip.d.ts.map ADDED Viewed

	@@ -0,0 +1 @@
1	+ {"version":3,"file":"image_processing_jina_clip.d.ts","sourceRoot":"","sources":["../../../src/models/jina_clip/image_processing_jina_clip.js"],"names":[],"mappings":"AAIA;IACI,yBAmBC;CACJ;+BAvBM,sCAAsC"}

package/types/models/jina_clip/processing_jina_clip.d.ts ADDED Viewed

@@ -0,0 +1,9 @@
+export class JinaCLIPProcessor extends Processor {
+    static tokenizer_class: typeof AutoTokenizer;
+    static image_processor_class: typeof AutoImageProcessor;
+    _call(text?: any, images?: any, kwargs?: {}): Promise<any>;
+}
+import { Processor } from "../../base/processing_utils.js";
+import { AutoTokenizer } from "../../tokenizers.js";
+import { AutoImageProcessor } from "../auto/image_processing_auto.js";
+//# sourceMappingURL=processing_jina_clip.d.ts.map

package/types/models/jina_clip/processing_jina_clip.d.ts.map ADDED Viewed

	@@ -0,0 +1 @@
1	+ {"version":3,"file":"processing_jina_clip.d.ts","sourceRoot":"","sources":["../../../src/models/jina_clip/processing_jina_clip.js"],"names":[],"mappings":"AAKA;IACI,6CAAsC;IACtC,wDAAiD;IAEjD,2DAaC;CACJ;0BAtByB,gCAAgC;8BAE5B,qBAAqB;mCADhB,kCAAkC"}

package/types/models/llava_onevision/image_processing_llava_onevision.d.ts ADDED Viewed

@@ -0,0 +1,4 @@
+export class LlavaOnevisionImageProcessor extends ImageProcessor {
+}
+import { ImageProcessor } from "../../base/image_processors_utils.js";
+//# sourceMappingURL=image_processing_llava_onevision.d.ts.map

package/types/models/llava_onevision/image_processing_llava_onevision.d.ts.map ADDED Viewed

	@@ -0,0 +1 @@
1	+ {"version":3,"file":"image_processing_llava_onevision.d.ts","sourceRoot":"","sources":["../../../src/models/llava_onevision/image_processing_llava_onevision.js"],"names":[],"mappings":"AAIA;CAAmE;+BAF5D,sCAAsC"}

package/types/models/mask2former/image_processing_mask2former.d.ts ADDED Viewed

@@ -0,0 +1,4 @@
+export class Mask2FormerImageProcessor extends MaskFormerImageProcessor {
+}
+import { MaskFormerImageProcessor } from "../maskformer/image_processing_maskformer.js";
+//# sourceMappingURL=image_processing_mask2former.d.ts.map

package/types/models/mask2former/image_processing_mask2former.d.ts.map ADDED Viewed

	@@ -0,0 +1 @@
1	+ {"version":3,"file":"image_processing_mask2former.d.ts","sourceRoot":"","sources":["../../../src/models/mask2former/image_processing_mask2former.js"],"names":[],"mappings":"AAIA;CAA2E;yCAHlC,8CAA8C"}

package/types/models/maskformer/image_processing_maskformer.d.ts ADDED Viewed

@@ -0,0 +1,22 @@
+export class MaskFormerImageProcessor extends ImageProcessor {
+    post_process_panoptic_segmentation(outputs: any, threshold?: number, mask_threshold?: number, overlap_mask_area_threshold?: number, label_ids_to_fuse?: Set<number>, target_sizes?: [number, number][]): {
+        segmentation: import("../../transformers.js").Tensor;
+        segments_info: {
+            id: number;
+            label_id: number;
+            score: number;
+        }[];
+    }[];
+    post_process_instance_segmentation(outputs: any, threshold?: number, target_sizes?: [number, number][]): {
+        segmentation: import("../../transformers.js").Tensor;
+        segments_info: {
+            id: number;
+            label_id: number;
+            score: number;
+        }[];
+    }[];
+}
+export class MaskFormerFeatureExtractor extends MaskFormerImageProcessor {
+}
+import { ImageProcessor } from "../../base/image_processors_utils.js";
+//# sourceMappingURL=image_processing_maskformer.d.ts.map

package/types/models/maskformer/image_processing_maskformer.d.ts.map ADDED Viewed

	@@ -0,0 +1 @@
1	+ {"version":3,"file":"image_processing_maskformer.d.ts","sourceRoot":"","sources":["../../../src/models/maskformer/image_processing_maskformer.js"],"names":[],"mappings":"AAMA;IAYure;;;;;;;QAA4qG;IAAA;;;;;;;QAAktB;CAFpjmB;AACD;CAA4E;+BAbrE,sCAAsC"}

package/types/models/mgp_str/processing_mgp_str.d.ts ADDED Viewed

@@ -0,0 +1,64 @@
+export class MgpstrProcessor extends Processor {
+    static tokenizer_class: typeof AutoTokenizer;
+    static image_processor_class: typeof AutoImageProcessor;
+    /**
+     * @returns {import('../../tokenizers.js').MgpstrTokenizer} The character tokenizer.
+     */
+    get char_tokenizer(): import("../../tokenizers.js").MgpstrTokenizer;
+    /**
+     * @returns {import('../../tokenizers.js').GPT2Tokenizer} The BPE tokenizer.
+     */
+    get bpe_tokenizer(): import("../../tokenizers.js").GPT2Tokenizer;
+    /**
+     * @returns {import('../../tokenizers.js').BertTokenizer} The WordPiece tokenizer.
+     */
+    get wp_tokenizer(): import("../../tokenizers.js").BertTokenizer;
+    /**
+     * Helper function to decode the model prediction logits.
+     * @param {import('../../utils/tensor.js').Tensor} pred_logits Model prediction logits.
+     * @param {string} format Type of model prediction. Must be one of ['char', 'bpe', 'wp'].
+     * @returns {[string[], number[]]} The decoded sentences and their confidence scores.
+     */
+    _decode_helper(pred_logits: import('../../utils/tensor.js').Tensor, format: string): [string[], number[]];
+    /**
+     * Convert a list of lists of char token ids into a list of strings by calling char tokenizer.
+     * @param {number[][]} sequences List of tokenized input ids.
+     * @returns {string[]} The list of char decoded sentences.
+     */
+    char_decode(sequences: number[][]): string[];
+    /**
+     * Convert a list of lists of BPE token ids into a list of strings by calling BPE tokenizer.
+     * @param {number[][]} sequences List of tokenized input ids.
+     * @returns {string[]} The list of BPE decoded sentences.
+     */
+    bpe_decode(sequences: number[][]): string[];
+    /**
+     * Convert a list of lists of word piece token ids into a list of strings by calling word piece tokenizer.
+     * @param {number[][]} sequences List of tokenized input ids.
+     * @returns {string[]} The list of wp decoded sentences.
+     */
+    wp_decode(sequences: number[][]): string[];
+    /**
+     * Decode the char, BPE, and wp prediction logits into strings and report the fused final results.
+     * @param {import('../../utils/tensor.js').Tensor[]} sequences The `[char_logits, bpe_logits, wp_logits]` tensors, in that order (the signature destructures them positionally).
+     * @returns {{generated_text: string[], scores: number[], char_preds: string[], bpe_preds: string[], wp_preds: string[]}}
+     * Dictionary of all the outputs of the decoded results.
+     * - generated_text: The final results after fusion of char, bpe, and wp.
+     * - scores: The final scores after fusion of char, bpe, and wp.
+     * - char_preds: The list of character decoded sentences.
+     * - bpe_preds: The list of BPE decoded sentences.
+     * - wp_preds: The list of wp decoded sentences.
+     */
+    batch_decode([char_logits, bpe_logits, wp_logits]: import('../../utils/tensor.js').Tensor[]): {
+        generated_text: string[];
+        scores: number[];
+        char_preds: string[];
+        bpe_preds: string[];
+        wp_preds: string[];
+    };
+    _call(images: any, text?: any): Promise<any>;
+}
+import { Processor } from "../../base/processing_utils.js";
+import { AutoTokenizer } from "../../tokenizers.js";
+import { AutoImageProcessor } from "../auto/image_processing_auto.js";
+//# sourceMappingURL=processing_mgp_str.d.ts.map

package/types/models/mgp_str/processing_mgp_str.d.ts.map ADDED Viewed

@@ -0,0 +1 @@

+ {"version":3,"file":"processing_mgp_str.d.ts","sourceRoot":"","sources":["../../../src/models/mgp_str/processing_mgp_str.js"],"names":[],"mappings":"AAUA;IACI,6CAAsC;IACtC,wDAAiD;IAEjD;;OAEG;IACH,oEAEC;IAED;;OAEG;IACH,iEAEC;IAED;;OAEG;IACH,gEAEC;IAED;;;;;OAKG;IACH,4BAJW,OAAO,uBAAuB,EAAE,MAAM,UACtC,MAAM,GACJ,CAAC,MAAM,EAAE,EAAE,MAAM,EAAE,CAAC,CA0ChC;IAED;;;;OAIG;IACH,uBAHW,MAAM,EAAE,EAAE,GACR,MAAM,EAAE,CAIpB;IAED;;;;OAIG;IACH,sBAHW,MAAM,EAAE,EAAE,GACR,MAAM,EAAE,CAIpB;IAED;;;;OAIG;IACH,qBAHW,MAAM,EAAE,EAAE,GACR,MAAM,EAAE,CAIpB;IAED;;;;;;;;;;OAUG;IACH,mDATW,OAAO,uBAAuB,EAAE,MAAM,EAAE;wBACrB,MAAM,EAAE;gBAAU,MAAM,EAAE;oBAAc,MAAM,EAAE;mBAAa,MAAM,EAAE;kBAAY,MAAM,EAAE;MA4BtH;IAmBD,6CAQC;CACJ;0BAzKyB,gCAAgC;8BAE5B,qBAAqB;mCADhB,kCAAkC"}

package/types/models/mobilenet_v1/image_processing_mobilenet_v1.d.ts ADDED Viewed

@@ -0,0 +1,6 @@
+export class MobileNetV1ImageProcessor extends ImageProcessor {
+}
+export class MobileNetV1FeatureExtractor extends MobileNetV1ImageProcessor {
+}
+import { ImageProcessor } from "../../base/image_processors_utils.js";
+//# sourceMappingURL=image_processing_mobilenet_v1.d.ts.map

package/types/models/mobilenet_v1/image_processing_mobilenet_v1.d.ts.map ADDED Viewed

	@@ -0,0 +1 @@
1	+ {"version":3,"file":"image_processing_mobilenet_v1.d.ts","sourceRoot":"","sources":["../../../src/models/mobilenet_v1/image_processing_mobilenet_v1.js"],"names":[],"mappings":"AAKA;CAAiE;AACjE;CAA8E;+BAJvE,sCAAsC"}

package/types/models/mobilenet_v2/image_processing_mobilenet_v2.d.ts ADDED Viewed

@@ -0,0 +1,6 @@
+export class MobileNetV2ImageProcessor extends ImageProcessor {
+}
+export class MobileNetV2FeatureExtractor extends MobileNetV2ImageProcessor {
+}
+import { ImageProcessor } from "../../base/image_processors_utils.js";
+//# sourceMappingURL=image_processing_mobilenet_v2.d.ts.map

package/types/models/mobilenet_v2/image_processing_mobilenet_v2.d.ts.map ADDED Viewed

	@@ -0,0 +1 @@
1	+ {"version":3,"file":"image_processing_mobilenet_v2.d.ts","sourceRoot":"","sources":["../../../src/models/mobilenet_v2/image_processing_mobilenet_v2.js"],"names":[],"mappings":"AAKA;CAAiE;AACjE;CAA8E;+BAJvE,sCAAsC"}

package/types/models/mobilenet_v3/image_processing_mobilenet_v3.d.ts ADDED Viewed

@@ -0,0 +1,6 @@
+export class MobileNetV3ImageProcessor extends ImageProcessor {
+}
+export class MobileNetV3FeatureExtractor extends MobileNetV3ImageProcessor {
+}
+import { ImageProcessor } from "../../base/image_processors_utils.js";
+//# sourceMappingURL=image_processing_mobilenet_v3.d.ts.map

package/types/models/mobilenet_v3/image_processing_mobilenet_v3.d.ts.map ADDED Viewed

	@@ -0,0 +1 @@
1	+ {"version":3,"file":"image_processing_mobilenet_v3.d.ts","sourceRoot":"","sources":["../../../src/models/mobilenet_v3/image_processing_mobilenet_v3.js"],"names":[],"mappings":"AAKA;CAAiE;AACjE;CAA8E;+BAJvE,sCAAsC"}

package/types/models/mobilenet_v4/image_processing_mobilenet_v4.d.ts ADDED Viewed

@@ -0,0 +1,6 @@
+export class MobileNetV4ImageProcessor extends ImageProcessor {
+}
+export class MobileNetV4FeatureExtractor extends MobileNetV4ImageProcessor {
+}
+import { ImageProcessor } from "../../base/image_processors_utils.js";
+//# sourceMappingURL=image_processing_mobilenet_v4.d.ts.map

package/types/models/mobilenet_v4/image_processing_mobilenet_v4.d.ts.map ADDED Viewed

	@@ -0,0 +1 @@
1	+ {"version":3,"file":"image_processing_mobilenet_v4.d.ts","sourceRoot":"","sources":["../../../src/models/mobilenet_v4/image_processing_mobilenet_v4.js"],"names":[],"mappings":"AAKA;CAAiE;AACjE;CAA8E;+BAJvE,sCAAsC"}

package/types/models/mobilevit/image_processing_mobilevit.d.ts ADDED Viewed

@@ -0,0 +1,6 @@
+export class MobileViTImageProcessor extends ImageProcessor {
+}
+export class MobileViTFeatureExtractor extends MobileViTImageProcessor {
+}
+import { ImageProcessor } from "../../base/image_processors_utils.js";
+//# sourceMappingURL=image_processing_mobilevit.d.ts.map

package/types/models/mobilevit/image_processing_mobilevit.d.ts.map ADDED Viewed

	@@ -0,0 +1 @@
1	+ {"version":3,"file":"image_processing_mobilevit.d.ts","sourceRoot":"","sources":["../../../src/models/mobilevit/image_processing_mobilevit.js"],"names":[],"mappings":"AAIA;CAA+D;AAC/D;CAA0E;+BAHnE,sCAAsC"}

package/types/models/nougat/image_processing_nougat.d.ts ADDED Viewed

@@ -0,0 +1,4 @@
+export class NougatImageProcessor extends DonutImageProcessor {
+}
+import { DonutImageProcessor } from "../donut/image_processing_donut.js";
+//# sourceMappingURL=image_processing_nougat.d.ts.map

package/types/models/nougat/image_processing_nougat.d.ts.map ADDED Viewed

	@@ -0,0 +1 @@
1	+ {"version":3,"file":"image_processing_nougat.d.ts","sourceRoot":"","sources":["../../../src/models/nougat/image_processing_nougat.js"],"names":[],"mappings":"AAIA;CAAiE;oCAH7B,oCAAoC"}

package/types/models/owlv2/image_processing_owlv2.d.ts ADDED Viewed

@@ -0,0 +1,4 @@
+export class Owlv2ImageProcessor extends OwlViTImageProcessor {
+}
+import { OwlViTImageProcessor } from "../owlvit/image_processing_owlvit.js";
+//# sourceMappingURL=image_processing_owlv2.d.ts.map

package/types/models/owlv2/image_processing_owlv2.d.ts.map ADDED Viewed

	@@ -0,0 +1 @@
1	+ {"version":3,"file":"image_processing_owlv2.d.ts","sourceRoot":"","sources":["../../../src/models/owlv2/image_processing_owlv2.js"],"names":[],"mappings":"AAIA;CAAiE;qCAH5B,sCAAsC"}

package/types/models/owlvit/image_processing_owlvit.d.ts ADDED Viewed

@@ -0,0 +1,10 @@
+export class OwlViTImageProcessor extends ImageProcessor {
+    post_process_object_detection(outputs: {
+        logits: import("../../transformers.js").Tensor;
+        pred_boxes: import("../../transformers.js").Tensor;
+    }, threshold?: number, target_sizes?: [number, number][], is_zero_shot?: boolean): any[];
+}
+export class OwlViTFeatureExtractor extends OwlViTImageProcessor {
+}
+import { ImageProcessor } from "../../base/image_processors_utils.js";
+//# sourceMappingURL=image_processing_owlvit.d.ts.map

package/types/models/owlvit/image_processing_owlvit.d.ts.map ADDED Viewed

	@@ -0,0 +1 @@
1	+ {"version":3,"file":"image_processing_owlvit.d.ts","sourceRoot":"","sources":["../../../src/models/owlvit/image_processing_owlvit.js"],"names":[],"mappings":"AAKA;IAO4tE;;;6FAAu6F;CAFloK;AACD;CAAoE;+BAR7D,sCAAsC"}

package/types/models/owlvit/processing_owlvit.d.ts ADDED Viewed

@@ -0,0 +1,8 @@
+export class OwlViTProcessor extends Processor {
+    static tokenizer_class: typeof AutoTokenizer;
+    static image_processor_class: typeof AutoImageProcessor;
+}
+import { Processor } from "../../base/processing_utils.js";
+import { AutoTokenizer } from "../../tokenizers.js";
+import { AutoImageProcessor } from "../auto/image_processing_auto.js";
+//# sourceMappingURL=processing_owlvit.d.ts.map

package/types/models/owlvit/processing_owlvit.d.ts.map ADDED Viewed

	@@ -0,0 +1 @@
1	+ {"version":3,"file":"processing_owlvit.d.ts","sourceRoot":"","sources":["../../../src/models/owlvit/processing_owlvit.js"],"names":[],"mappings":"AAGA;IACI,6CAAsC;IACtC,wDAAiD;CACpD;0BANyB,gCAAgC;8BAE5B,qBAAqB;mCADhB,kCAAkC"}

package/types/models/processors.d.ts ADDED Viewed

@@ -0,0 +1,13 @@
+export * from "./florence2/processing_florence2.js";
+export * from "./mgp_str/processing_mgp_str.js";
+export * from "./idefics3/processing_idefics3.js";
+export * from "./janus/processing_janus.js";
+export * from "./jina_clip/processing_jina_clip.js";
+export * from "./owlvit/processing_owlvit.js";
+export * from "./pyannote/processing_pyannote.js";
+export * from "./qwen2_vl/processing_qwen2_vl.js";
+export * from "./sam/processing_sam.js";
+export * from "./speecht5/processing_speecht5.js";
+export * from "./wav2vec2/processing_wav2vec2.js";
+export * from "./whisper/processing_whisper.js";
+//# sourceMappingURL=processors.d.ts.map

package/types/models/processors.d.ts.map ADDED Viewed

	@@ -0,0 +1 @@
1	+ {"version":3,"file":"processors.d.ts","sourceRoot":"","sources":["../../src/models/processors.js"],"names":[],"mappings":""}

package/types/models/pvt/image_processing_pvt.d.ts ADDED Viewed

@@ -0,0 +1,4 @@
+export class PvtImageProcessor extends ImageProcessor {
+}
+import { ImageProcessor } from "../../base/image_processors_utils.js";
+//# sourceMappingURL=image_processing_pvt.d.ts.map

package/types/models/pvt/image_processing_pvt.d.ts.map ADDED Viewed

	@@ -0,0 +1 @@
1	+ {"version":3,"file":"image_processing_pvt.d.ts","sourceRoot":"","sources":["../../../src/models/pvt/image_processing_pvt.js"],"names":[],"mappings":"AAIA;CAAyD;+BAFlD,sCAAsC"}

package/types/models/pyannote/feature_extraction_pyannote.d.ts ADDED Viewed

@@ -0,0 +1,13 @@
+export class PyAnnoteFeatureExtractor extends FeatureExtractor {
+    /**
+     * Asynchronously extracts features from a given audio using the provided configuration.
+     * @param {Float32Array|Float64Array} audio The audio data as a Float32Array/Float64Array.
+     * @returns {Promise<{ input_values: Tensor; }>} The extracted input features.
+     */
+    _call(audio: Float32Array | Float64Array): Promise<{
+        input_values: Tensor;
+    }>;
+}
+import { FeatureExtractor } from '../../base/feature_extraction_utils.js';
+import { Tensor } from '../../utils/tensor.js';
+//# sourceMappingURL=feature_extraction_pyannote.d.ts.map

package/types/models/pyannote/feature_extraction_pyannote.d.ts.map ADDED Viewed

	@@ -0,0 +1 @@
1	+ {"version":3,"file":"feature_extraction_pyannote.d.ts","sourceRoot":"","sources":["../../../src/models/pyannote/feature_extraction_pyannote.js"],"names":[],"mappings":"AAIA;IACI;;;;OAIG;IACH,aAHW,YAAY,GAAC,YAAY,GACvB,QAAQ;QAAE,YAAY,EAAE,MAAM,CAAC;KAAE,CAAC,CAiB9C;CAEJ;iCA3BuD,wCAAwC;uBACzE,uBAAuB"}

package/types/models/pyannote/processing_pyannote.d.ts ADDED Viewed

@@ -0,0 +1,30 @@
+export class PyAnnoteProcessor extends Processor {
+    static feature_extractor_class: typeof AutoFeatureExtractor;
+    /**
+     * Calls the feature_extractor function with the given audio input.
+     * @param {any} audio The audio input to extract features from.
+     * @returns {Promise<any>} A Promise that resolves with the extracted features.
+     */
+    _call(audio: any): Promise<any>;
+    /**
+     * NOTE: Can return fractional values. `Math.ceil` will ensure correct value.
+     * @param {number} samples The number of samples in the audio.
+     * @returns {number} The number of frames in the audio.
+     */
+    samples_to_frames(samples: number): number;
+    /**
+     * Post-processes the speaker diarization logits output by the model.
+     * @param {import('../../utils/tensor.js').Tensor} logits The speaker diarization logits output by the model.
+     * @param {number} num_samples Number of samples in the input audio.
+     * @returns {Array<Array<{ id: number, start: number, end: number, confidence: number }>>} The post-processed speaker diarization results.
+     */
+    post_process_speaker_diarization(logits: import('../../utils/tensor.js').Tensor, num_samples: number): Array<Array<{
+        id: number;
+        start: number;
+        end: number;
+        confidence: number;
+    }>>;
+}
+import { Processor } from '../../base/processing_utils.js';
+import { AutoFeatureExtractor } from '../auto/feature_extraction_auto.js';
+//# sourceMappingURL=processing_pyannote.d.ts.map

package/types/models/pyannote/processing_pyannote.d.ts.map ADDED Viewed

@@ -0,0 +1 @@

+ {"version":3,"file":"processing_pyannote.d.ts","sourceRoot":"","sources":["../../../src/models/pyannote/processing_pyannote.js"],"names":[],"mappings":"AAIA;IACI,4DAAqD;IAErD;;;;OAIG;IACH,aAHW,GAAG,GACD,QAAQ,GAAG,CAAC,CAIxB;IAED;;;;OAIG;IACH,2BAHW,MAAM,GACJ,MAAM,CAIlB;IAED;;;;;OAKG;IACH,yCAJW,OAAO,uBAAuB,EAAE,MAAM,eACtC,MAAM,GACJ,MAAM,MAAM;QAAE,EAAE,EAAE,MAAM,CAAC;QAAC,KAAK,EAAE,MAAM,CAAC;QAAC,GAAG,EAAE,MAAM,CAAC;QAAC,UAAU,EAAE,MAAM,CAAA;KAAE,CAAC,CAAC,CAwCxF;CACJ;0BAtEyB,gCAAgC;qCACrB,oCAAoC"}

package/types/models/qwen2_vl/image_processing_qwen2_vl.d.ts ADDED Viewed

@@ -0,0 +1,11 @@
+export class Qwen2VLImageProcessor extends ImageProcessor {
+    _call(images: any, ...args: any[]): Promise<{
+        pixel_values: Tensor;
+        image_grid_thw: Tensor;
+        original_sizes: import("../../base/image_processors_utils.js").HeightWidth[];
+        reshaped_input_sizes: import("../../base/image_processors_utils.js").HeightWidth[];
+    }>;
+}
+import { ImageProcessor } from "../../base/image_processors_utils.js";
+import { Tensor } from "../../utils/tensor.js";
+//# sourceMappingURL=image_processing_qwen2_vl.d.ts.map

package/types/models/qwen2_vl/image_processing_qwen2_vl.d.ts.map ADDED Viewed

	@@ -0,0 +1 @@
1	+ {"version":3,"file":"image_processing_qwen2_vl.d.ts","sourceRoot":"","sources":["../../../src/models/qwen2_vl/image_processing_qwen2_vl.js"],"names":[],"mappings":"AAKA;IACI;;;;;OA2CC;CACJ;+BAhDM,sCAAsC;uBACjB,uBAAuB"}

package/types/models/qwen2_vl/processing_qwen2_vl.d.ts ADDED Viewed

@@ -0,0 +1,17 @@
+export class Qwen2VLProcessor extends Processor {
+    static image_processor_class: typeof AutoImageProcessor;
+    static tokenizer_class: typeof AutoTokenizer;
+    /**
+     * Processes text together with optional image input (summary inferred from the signature; confirm against the implementation).
+     * @param {string|string[]} text A single string or an array of strings.
+     * @param {RawImage|RawImage[]} [images] A single image or an array of images; optional per the declared signature.
+     * @param  {...any} args Any further arguments accepted by the declared signature.
+     * @returns {Promise<any>} A promise for the processed result; its shape is not declared here.
+     */
+    _call(text: string | string[], images?: RawImage | RawImage[], ...args: any[]): Promise<any>;
+}
+import { Processor } from "../../base/processing_utils.js";
+import { RawImage } from "../../utils/image.js";
+import { AutoImageProcessor } from "../auto/image_processing_auto.js";
+import { AutoTokenizer } from "../../tokenizers.js";
+//# sourceMappingURL=processing_qwen2_vl.d.ts.map

package/types/models/qwen2_vl/processing_qwen2_vl.d.ts.map ADDED Viewed

	@@ -0,0 +1 @@
1	+ {"version":3,"file":"processing_qwen2_vl.d.ts","sourceRoot":"","sources":["../../../src/models/qwen2_vl/processing_qwen2_vl.js"],"names":[],"mappings":"AAKA;IACI,wDAAiD;IACjD,6CAAsC;IAEtC;;;;;;OAMG;IACH,YALW,MAAM,GAAC,MAAM,EAAE,WACf,QAAQ,GAAC,QAAQ,EAAE,WACf,GAAG,KACL,QAAQ,GAAG,CAAC,CAoCxB;CACJ;0BAnDyB,gCAAgC;yBAGjC,sBAAsB;mCAFZ,kCAAkC;8BACvC,qBAAqB"}

package/types/models/rt_detr/image_processing_rt_detr.d.ts ADDED Viewed

@@ -0,0 +1,8 @@
+export class RTDetrImageProcessor extends ImageProcessor {
+    post_process_object_detection(outputs: {
+        logits: import("../../transformers.js").Tensor;
+        pred_boxes: import("../../transformers.js").Tensor;
+    }, threshold?: number, target_sizes?: [number, number][], is_zero_shot?: boolean): any[];
+}
+import { ImageProcessor } from "../../base/image_processors_utils.js";
+//# sourceMappingURL=image_processing_rt_detr.d.ts.map

package/types/models/rt_detr/image_processing_rt_detr.d.ts.map ADDED Viewed

	@@ -0,0 +1 @@
1	+ {"version":3,"file":"image_processing_rt_detr.d.ts","sourceRoot":"","sources":["../../../src/models/rt_detr/image_processing_rt_detr.js"],"names":[],"mappings":"AAMA;IAMgyE;;;6FAAu6F;CADtsK;+BARM,sCAAsC"}

package/types/models/sam/image_processing_sam.d.ts ADDED Viewed

@@ -0,0 +1,103 @@
+/**
+ * @typedef {object} SamImageProcessorResult
+ * @property {Tensor} pixel_values
+ * @property {import("../../base/image_processors_utils.js").HeightWidth[]} original_sizes
+ * @property {import("../../base/image_processors_utils.js").HeightWidth[]} reshaped_input_sizes
+ * @property {Tensor} [input_points]
+ * @property {Tensor} [input_labels]
+ * @property {Tensor} [input_boxes]
+ */
+export class SamImageProcessor extends ImageProcessor {
+    /**
+     *
+     * @param {any} input_points
+     * @param {import("../../base/image_processors_utils.js").HeightWidth[]} original_sizes
+     * @param {import("../../base/image_processors_utils.js").HeightWidth[]} reshaped_input_sizes
+     * @returns {Tensor}
+     */
+    reshape_input_points(input_points: any, original_sizes: import("../../base/image_processors_utils.js").HeightWidth[], reshaped_input_sizes: import("../../base/image_processors_utils.js").HeightWidth[], is_bounding_box?: boolean): Tensor;
+    /**
+     *
+     * @param {any} input_labels
+     * @param {Tensor} input_points
+     * @returns {Tensor}
+     */
+    add_input_labels(input_labels: any, input_points: Tensor): Tensor;
+    /**
+     * @param {any[]} images The URL(s) of the image(s) to extract features from.
+     * @param {Object} [options] Additional options for the processor.
+     * @param {any} [options.input_points=null] A 3D or 4D array, representing the input points provided by the user.
+     * - 3D: `[point_batch_size, nb_points_per_image, 2]`. In this case, `batch_size` is assumed to be 1.
+     * - 4D: `[batch_size, point_batch_size, nb_points_per_image, 2]`.
+     * @param {any} [options.input_labels=null] A 2D or 3D array, representing the input labels for the points, used by the prompt encoder to encode the prompt.
+     * - 2D: `[point_batch_size, nb_points_per_image]`. In this case, `batch_size` is assumed to be 1.
+     * - 3D: `[batch_size, point_batch_size, nb_points_per_image]`.
+     * @param {number[][][]} [options.input_boxes=null] A 3D array of shape `(batch_size, num_boxes, 4)`, representing the input boxes provided by the user.
+     * This is used by the prompt encoder to encode the prompt. Generally yields much better generated masks.
+     * The processor will generate a tensor, with each dimension corresponding respectively to the image batch size,
+     * the number of boxes per image and the coordinates of the top left and bottom right point of the box.
+     * In the order (`x1`, `y1`, `x2`, `y2`):
+     * - `x1`: the x coordinate of the top left point of the input box
+     * - `y1`: the y coordinate of the top left point of the input box
+     * - `x2`: the x coordinate of the bottom right point of the input box
+     * - `y2`: the y coordinate of the bottom right point of the input box
+     * @returns {Promise<SamImageProcessorResult>}
+     */
+    _call(images: any[], { input_points, input_labels, input_boxes }?: {
+        input_points?: any;
+        input_labels?: any;
+        input_boxes?: number[][][];
+    }): Promise<SamImageProcessorResult>;
+    /**
+     * Remove padding and upscale masks to the original image size.
+     * @param {Tensor} masks Batched masks from the mask_decoder in (batch_size, num_channels, height, width) format.
+     * @param {[number, number][]} original_sizes The original sizes of each image before it was resized to the model's expected input shape, in (height, width) format.
+     * @param {[number, number][]} reshaped_input_sizes The size of each image as it is fed to the model, in (height, width) format. Used to remove padding.
+     * @param {Object} options Optional parameters for post-processing.
+     * @param {number} [options.mask_threshold] The threshold to use for binarizing the masks.
+     * @param {boolean} [options.binarize] Whether to binarize the masks.
+     * @param {Object} [options.pad_size] The target size the images were padded to before being passed to the model. If `null`, the target size is assumed to be the processor's `pad_size`.
+     * @param {number} [options.pad_size.height] The height the images were padded to.
+     * @param {number} [options.pad_size.width] The width the images were padded to.
+     * @returns {Promise<Tensor[]>} Batched masks in (batch_size, num_channels, height, width) format, where (height, width) is given by `original_sizes`.
+     */
+    post_process_masks(masks: Tensor, original_sizes: [number, number][], reshaped_input_sizes: [number, number][], { mask_threshold, binarize, pad_size, }?: {
+        mask_threshold?: number;
+        binarize?: boolean;
+        pad_size?: {
+            height?: number;
+            width?: number;
+        };
+    }): Promise<Tensor[]>;
+    /**
+     * Generates a list of crop boxes of different sizes. Each layer has (2**i)**2 boxes for the ith layer.
+     * @param {import("../../utils/image.js").RawImage} image Input original image
+     * @param {number} target_size Target size of the resized image
+     * @param {Object} options Options for generating crop boxes
+     * @param {number} [options.crop_n_layers] If >0, mask prediction will be run again on crops of the image.
+     * Sets the number of layers to run, where each layer has 2**i_layer number of image crops.
+     * @param {number} [options.overlap_ratio] Sets the degree to which crops overlap. In the first crop layer,
+     * crops will overlap by this fraction of the image length. Later layers with more crops scale down this overlap.
+     * @param {number} [options.points_per_crop] Number of points to sample from each crop.
+     * @param {number} [options.crop_n_points_downscale_factor] The number of points-per-side sampled in layer n is
+     * scaled down by crop_n_points_downscale_factor**n.
+     * @returns {Object} An object containing the crop boxes, number of points per crop, cropped images, and input labels.
+     */
+    generate_crop_boxes(image: import("../../utils/image.js").RawImage, target_size: number, { crop_n_layers, overlap_ratio, points_per_crop, crop_n_points_downscale_factor, }?: {
+        crop_n_layers?: number;
+        overlap_ratio?: number;
+        points_per_crop?: number;
+        crop_n_points_downscale_factor?: number;
+    }): any;
+}
+export type SamImageProcessorResult = {
+    pixel_values: Tensor;
+    original_sizes: import("../../base/image_processors_utils.js").HeightWidth[];
+    reshaped_input_sizes: import("../../base/image_processors_utils.js").HeightWidth[];
+    input_points?: Tensor;
+    input_labels?: Tensor;
+    input_boxes?: Tensor;
+};
+import { ImageProcessor } from "../../base/image_processors_utils.js";
+import { Tensor } from "../../utils/tensor.js";
+//# sourceMappingURL=image_processing_sam.d.ts.map

package/types/models/sam/image_processing_sam.d.ts.map ADDED Viewed

@@ -0,0 +1 @@

+ {"version":3,"file":"image_processing_sam.d.ts","sourceRoot":"","sources":["../../../src/models/sam/image_processing_sam.js"],"names":[],"mappings":"AAWA;;;;;;;;GAQG;AAEH;IAEI;;;;;;OAMG;IACH,mCALW,GAAG,kBACH,OAAO,sCAAsC,EAAE,WAAW,EAAE,wBAC5D,OAAO,sCAAsC,EAAE,WAAW,EAAE,8BAC1D,MAAM,CA4ClB;IAED;;;;;OAKG;IACH,+BAJW,GAAG,gBACH,MAAM,GACJ,MAAM,CAoBlB;IACD;;;;;;;;;;;;;;;;;;;OAmBG;IACH,cAnBW,GAAG,EAAE;QAES,YAAY,GAA1B,GAAG;QAGW,YAAY,GAA1B,GAAG;QAGoB,WAAW,GAAlC,MAAM,EAAE,EAAE,EAAE;QASV,QAAQ,uBAAuB,CAAC,CA+B5C;IAED;;;;;;;;;;;;OAYG;IACH,0BAXW,MAAM,kBACN,CAAC,MAAM,EAAE,MAAM,CAAC,EAAE,wBAClB,CAAC,MAAM,EAAE,MAAM,CAAC,EAAE;QAED,cAAc,GAA/B,MAAM;QACY,QAAQ,GAA1B,OAAO;QACU,QAAQ;YACC,MAAM,GAAhC,MAAM;YACoB,KAAK,GAA/B,MAAM;;QACJ,QAAQ,MAAM,EAAE,CAAC,CAsD7B;IAED;;;;;;;;;;;;;OAaG;IACH,2BAZW,OAAO,sBAAsB,EAAE,QAAQ,eACvC,MAAM;QAEW,aAAa,GAA9B,MAAM;QAEW,aAAa,GAA9B,MAAM;QAEW,eAAe,GAAhC,MAAM;QACW,8BAA8B,GAA/C,MAAM;YAYhB;CACJ;;kBAnOa,MAAM;oBACN,OAAO,sCAAsC,EAAE,WAAW,EAAE;0BAC5D,OAAO,sCAAsC,EAAE,WAAW,EAAE;mBAC5D,MAAM;mBACN,MAAM;kBACN,MAAM;;+BAhBb,sCAAsC;uBAMtC,uBAAuB"}

package/types/models/sam/processing_sam.d.ts ADDED Viewed

@@ -0,0 +1,9 @@
+export class SamProcessor extends Processor {
+    static image_processor_class: typeof AutoImageProcessor;
+    _call(...args: any[]): Promise<any>;
+    post_process_masks(...args: any[]): any;
+    reshape_input_points(...args: any[]): any;
+}
+import { Processor } from "../../base/processing_utils.js";
+import { AutoImageProcessor } from "../auto/image_processing_auto.js";
+//# sourceMappingURL=processing_sam.d.ts.map

package/types/models/sam/processing_sam.d.ts.map ADDED Viewed

	@@ -0,0 +1 @@
1	+ {"version":3,"file":"processing_sam.d.ts","sourceRoot":"","sources":["../../../src/models/sam/processing_sam.js"],"names":[],"mappings":"AAGA;IACI,wDAAiD;IAEjD,oCAEC;IAED,wCAGC;IAED,0CAGC;CACJ;0BAnByB,gCAAgC;mCACvB,kCAAkC"}