@huggingface/transformers 4.0.0-next.4 → 4.0.0-next.6
This diff shows the changes between publicly available package versions released to one of the supported registries. It is provided for informational purposes only and reflects the packages as they appear in their respective public registries.
- package/README.md +15 -5
- package/dist/ort-wasm-simd-threaded.jsep.mjs +28 -28
- package/dist/transformers.js +3446 -2296
- package/dist/transformers.min.js +17 -19
- package/dist/transformers.node.cjs +3456 -2263
- package/dist/transformers.node.min.cjs +20 -22
- package/dist/transformers.node.min.mjs +20 -22
- package/dist/transformers.node.mjs +3426 -2258
- package/dist/transformers.web.js +1647 -471
- package/dist/transformers.web.min.js +18 -18
- package/package.json +4 -4
- package/src/backends/onnx.js +128 -53
- package/src/backends/utils/cacheWasm.js +28 -46
- package/src/configs.js +63 -3
- package/src/env.js +93 -11
- package/src/generation/logits_sampler.js +3 -15
- package/src/image_processors_utils.js +2 -6
- package/src/models/afmoe/modeling_afmoe.js +5 -0
- package/src/models/auto/image_processing_auto.js +2 -1
- package/src/models/auto/modeling_auto.js +16 -2
- package/src/models/auto/tokenization_auto.js +2 -1
- package/src/models/clap/feature_extraction_clap.js +2 -1
- package/src/models/marian/tokenization_marian.js +3 -2
- package/src/models/modeling_utils.js +45 -7
- package/src/models/models.js +10 -0
- package/src/models/olmo_hybrid/modeling_olmo_hybrid.js +5 -0
- package/src/models/paligemma/processing_paligemma.js +3 -2
- package/src/models/processors.js +2 -0
- package/src/models/qwen2_5_vl/modeling_qwen2_5_vl.js +5 -0
- package/src/models/qwen2_5_vl/processing_qwen2_5_vl.js +3 -0
- package/src/models/qwen2_moe/modeling_qwen2_moe.js +5 -0
- package/src/models/qwen2_vl/image_processing_qwen2_vl.js +54 -0
- package/src/models/qwen2_vl/modeling_qwen2_vl.js +45 -6
- package/src/models/qwen3_5/modeling_qwen3_5.js +3 -0
- package/src/models/qwen3_5_moe/modeling_qwen3_5_moe.js +3 -0
- package/src/models/qwen3_moe/modeling_qwen3_moe.js +5 -0
- package/src/models/qwen3_next/modeling_qwen3_next.js +5 -0
- package/src/models/qwen3_vl/modeling_qwen3_vl.js +3 -0
- package/src/models/qwen3_vl/processing_qwen3_vl.js +3 -0
- package/src/models/qwen3_vl_moe/modeling_qwen3_vl_moe.js +3 -0
- package/src/models/registry.js +21 -5
- package/src/models/session.js +16 -50
- package/src/models/whisper/feature_extraction_whisper.js +2 -1
- package/src/models/whisper/modeling_whisper.js +6 -5
- package/src/models/xlm/tokenization_xlm.js +2 -1
- package/src/pipelines/automatic-speech-recognition.js +3 -2
- package/src/pipelines/index.js +313 -0
- package/src/pipelines/text-generation.js +4 -0
- package/src/pipelines/text-to-audio.js +4 -2
- package/src/pipelines/zero-shot-classification.js +3 -2
- package/src/pipelines.js +139 -428
- package/src/tokenization_utils.js +42 -21
- package/src/transformers.js +6 -1
- package/src/utils/audio.js +2 -1
- package/src/utils/cache/FileCache.js +128 -0
- package/src/utils/cache.js +7 -4
- package/src/utils/core.js +23 -1
- package/src/utils/devices.js +22 -0
- package/src/utils/dtypes.js +55 -0
- package/src/utils/hub/{files.js → FileResponse.js} +0 -90
- package/src/utils/hub/utils.js +45 -5
- package/src/utils/hub.js +63 -22
- package/src/utils/image.js +14 -14
- package/src/utils/logger.js +67 -0
- package/src/utils/model-loader.js +35 -17
- package/src/utils/model_registry/ModelRegistry.js +346 -0
- package/src/utils/model_registry/clear_cache.js +128 -0
- package/src/utils/model_registry/get_file_metadata.js +149 -0
- package/src/utils/model_registry/get_files.js +42 -0
- package/src/utils/model_registry/get_model_files.js +193 -0
- package/src/utils/model_registry/get_pipeline_files.js +44 -0
- package/src/utils/model_registry/get_processor_files.js +20 -0
- package/src/utils/model_registry/get_tokenizer_files.js +21 -0
- package/src/utils/model_registry/is_cached.js +169 -0
- package/src/utils/random.js +225 -0
- package/src/utils/tensor.js +8 -21
- package/src/utils/video.js +2 -2
- package/types/backends/onnx.d.ts.map +1 -1
- package/types/backends/utils/cacheWasm.d.ts +3 -17
- package/types/backends/utils/cacheWasm.d.ts.map +1 -1
- package/types/configs.d.ts.map +1 -1
- package/types/env.d.ts +52 -27
- package/types/env.d.ts.map +1 -1
- package/types/generation/logits_sampler.d.ts +2 -2
- package/types/generation/logits_sampler.d.ts.map +1 -1
- package/types/image_processors_utils.d.ts.map +1 -1
- package/types/models/afmoe/modeling_afmoe.d.ts +8 -0
- package/types/models/afmoe/modeling_afmoe.d.ts.map +1 -0
- package/types/models/auto/image_processing_auto.d.ts.map +1 -1
- package/types/models/auto/modeling_auto.d.ts +6 -0
- package/types/models/auto/modeling_auto.d.ts.map +1 -1
- package/types/models/auto/tokenization_auto.d.ts.map +1 -1
- package/types/models/clap/feature_extraction_clap.d.ts.map +1 -1
- package/types/models/marian/tokenization_marian.d.ts.map +1 -1
- package/types/models/modeling_utils.d.ts +13 -2
- package/types/models/modeling_utils.d.ts.map +1 -1
- package/types/models/models.d.ts +10 -0
- package/types/models/olmo_hybrid/modeling_olmo_hybrid.d.ts +8 -0
- package/types/models/olmo_hybrid/modeling_olmo_hybrid.d.ts.map +1 -0
- package/types/models/paligemma/processing_paligemma.d.ts.map +1 -1
- package/types/models/processors.d.ts +2 -0
- package/types/models/qwen2_5_vl/modeling_qwen2_5_vl.d.ts +4 -0
- package/types/models/qwen2_5_vl/modeling_qwen2_5_vl.d.ts.map +1 -0
- package/types/models/qwen2_5_vl/processing_qwen2_5_vl.d.ts +4 -0
- package/types/models/qwen2_5_vl/processing_qwen2_5_vl.d.ts.map +1 -0
- package/types/models/qwen2_moe/modeling_qwen2_moe.d.ts +8 -0
- package/types/models/qwen2_moe/modeling_qwen2_moe.d.ts.map +1 -0
- package/types/models/qwen2_vl/image_processing_qwen2_vl.d.ts +3 -0
- package/types/models/qwen2_vl/image_processing_qwen2_vl.d.ts.map +1 -1
- package/types/models/qwen2_vl/modeling_qwen2_vl.d.ts +1 -0
- package/types/models/qwen2_vl/modeling_qwen2_vl.d.ts.map +1 -1
- package/types/models/qwen3_5/modeling_qwen3_5.d.ts +4 -0
- package/types/models/qwen3_5/modeling_qwen3_5.d.ts.map +1 -0
- package/types/models/qwen3_5_moe/modeling_qwen3_5_moe.d.ts +4 -0
- package/types/models/qwen3_5_moe/modeling_qwen3_5_moe.d.ts.map +1 -0
- package/types/models/qwen3_moe/modeling_qwen3_moe.d.ts +8 -0
- package/types/models/qwen3_moe/modeling_qwen3_moe.d.ts.map +1 -0
- package/types/models/qwen3_next/modeling_qwen3_next.d.ts +8 -0
- package/types/models/qwen3_next/modeling_qwen3_next.d.ts.map +1 -0
- package/types/models/qwen3_vl/modeling_qwen3_vl.d.ts +4 -0
- package/types/models/qwen3_vl/modeling_qwen3_vl.d.ts.map +1 -0
- package/types/models/qwen3_vl/processing_qwen3_vl.d.ts +4 -0
- package/types/models/qwen3_vl/processing_qwen3_vl.d.ts.map +1 -0
- package/types/models/qwen3_vl_moe/modeling_qwen3_vl_moe.d.ts +4 -0
- package/types/models/qwen3_vl_moe/modeling_qwen3_vl_moe.d.ts.map +1 -0
- package/types/models/registry.d.ts +2 -1
- package/types/models/registry.d.ts.map +1 -1
- package/types/models/session.d.ts.map +1 -1
- package/types/models/whisper/feature_extraction_whisper.d.ts.map +1 -1
- package/types/models/whisper/modeling_whisper.d.ts.map +1 -1
- package/types/models/xlm/tokenization_xlm.d.ts.map +1 -1
- package/types/pipelines/automatic-speech-recognition.d.ts.map +1 -1
- package/types/pipelines/index.d.ts +265 -0
- package/types/pipelines/index.d.ts.map +1 -0
- package/types/pipelines/text-generation.d.ts +5 -1
- package/types/pipelines/text-generation.d.ts.map +1 -1
- package/types/pipelines/text-to-audio.d.ts.map +1 -1
- package/types/pipelines/zero-shot-classification.d.ts.map +1 -1
- package/types/pipelines.d.ts +50 -291
- package/types/pipelines.d.ts.map +1 -1
- package/types/tokenization_utils.d.ts +44 -26
- package/types/tokenization_utils.d.ts.map +1 -1
- package/types/transformers.d.ts +4 -1
- package/types/transformers.d.ts.map +1 -1
- package/types/utils/audio.d.ts.map +1 -1
- package/types/utils/cache/FileCache.d.ts +39 -0
- package/types/utils/cache/FileCache.d.ts.map +1 -0
- package/types/utils/cache.d.ts +10 -4
- package/types/utils/cache.d.ts.map +1 -1
- package/types/utils/core.d.ts +59 -2
- package/types/utils/core.d.ts.map +1 -1
- package/types/utils/devices.d.ts +15 -0
- package/types/utils/devices.d.ts.map +1 -1
- package/types/utils/dtypes.d.ts +16 -0
- package/types/utils/dtypes.d.ts.map +1 -1
- package/types/utils/hub/{files.d.ts → FileResponse.d.ts} +1 -32
- package/types/utils/hub/FileResponse.d.ts.map +1 -0
- package/types/utils/hub/utils.d.ts +19 -3
- package/types/utils/hub/utils.d.ts.map +1 -1
- package/types/utils/hub.d.ts +36 -7
- package/types/utils/hub.d.ts.map +1 -1
- package/types/utils/logger.d.ts +28 -0
- package/types/utils/logger.d.ts.map +1 -0
- package/types/utils/model-loader.d.ts +15 -0
- package/types/utils/model-loader.d.ts.map +1 -1
- package/types/utils/model_registry/ModelRegistry.d.ts +271 -0
- package/types/utils/model_registry/ModelRegistry.d.ts.map +1 -0
- package/types/utils/model_registry/clear_cache.d.ts +74 -0
- package/types/utils/model_registry/clear_cache.d.ts.map +1 -0
- package/types/utils/model_registry/get_file_metadata.d.ts +20 -0
- package/types/utils/model_registry/get_file_metadata.d.ts.map +1 -0
- package/types/utils/model_registry/get_files.d.ts +23 -0
- package/types/utils/model_registry/get_files.d.ts.map +1 -0
- package/types/utils/model_registry/get_model_files.d.ts +22 -0
- package/types/utils/model_registry/get_model_files.d.ts.map +1 -0
- package/types/utils/model_registry/get_pipeline_files.d.ts +22 -0
- package/types/utils/model_registry/get_pipeline_files.d.ts.map +1 -0
- package/types/utils/model_registry/get_processor_files.d.ts +9 -0
- package/types/utils/model_registry/get_processor_files.d.ts.map +1 -0
- package/types/utils/model_registry/get_tokenizer_files.d.ts +9 -0
- package/types/utils/model_registry/get_tokenizer_files.d.ts.map +1 -0
- package/types/utils/model_registry/is_cached.d.ts +105 -0
- package/types/utils/model_registry/is_cached.d.ts.map +1 -0
- package/types/utils/random.d.ts +86 -0
- package/types/utils/random.d.ts.map +1 -0
- package/types/utils/tensor.d.ts.map +1 -1
- package/types/utils/hub/files.d.ts.map +0 -1
package/src/pipelines/index.js
@@ -0,0 +1,313 @@
+/**
+ * @file Pipeline task configurations and aliases
+ *
+ * Defines which pipeline class and model class(es) each pipeline task needs.
+ * Tokenizer and processor loading is determined automatically from the model's files.
+ */
+
+import {
+    AutoModel,
+    AutoModelForSequenceClassification,
+    AutoModelForAudioClassification,
+    AutoModelForTokenClassification,
+    AutoModelForQuestionAnswering,
+    AutoModelForMaskedLM,
+    AutoModelForSeq2SeqLM,
+    AutoModelForSpeechSeq2Seq,
+    AutoModelForTextToWaveform,
+    AutoModelForTextToSpectrogram,
+    AutoModelForCTC,
+    AutoModelForCausalLM,
+    AutoModelForVision2Seq,
+    AutoModelForImageClassification,
+    AutoModelForImageSegmentation,
+    AutoModelForSemanticSegmentation,
+    AutoModelForUniversalSegmentation,
+    AutoModelForObjectDetection,
+    AutoModelForZeroShotObjectDetection,
+    AutoModelForDocumentQuestionAnswering,
+    AutoModelForImageToImage,
+    AutoModelForDepthEstimation,
+    AutoModelForImageFeatureExtraction,
+} from '../models/auto/modeling_auto.js';
+
+import { TextClassificationPipeline } from './text-classification.js';
+import { TokenClassificationPipeline } from './token-classification.js';
+import { QuestionAnsweringPipeline } from './question-answering.js';
+import { FillMaskPipeline } from './fill-mask.js';
+import { SummarizationPipeline } from './summarization.js';
+import { TranslationPipeline } from './translation.js';
+import { Text2TextGenerationPipeline } from './text2text-generation.js';
+import { TextGenerationPipeline } from './text-generation.js';
+import { ZeroShotClassificationPipeline } from './zero-shot-classification.js';
+import { AudioClassificationPipeline } from './audio-classification.js';
+import { ZeroShotAudioClassificationPipeline } from './zero-shot-audio-classification.js';
+import { AutomaticSpeechRecognitionPipeline } from './automatic-speech-recognition.js';
+import { TextToAudioPipeline } from './text-to-audio.js';
+import { ImageToTextPipeline } from './image-to-text.js';
+import { ImageClassificationPipeline } from './image-classification.js';
+import { ImageSegmentationPipeline } from './image-segmentation.js';
+import { BackgroundRemovalPipeline } from './background-removal.js';
+import { ZeroShotImageClassificationPipeline } from './zero-shot-image-classification.js';
+import { ObjectDetectionPipeline } from './object-detection.js';
+import { ZeroShotObjectDetectionPipeline } from './zero-shot-object-detection.js';
+import { DocumentQuestionAnsweringPipeline } from './document-question-answering.js';
+import { ImageToImagePipeline } from './image-to-image.js';
+import { DepthEstimationPipeline } from './depth-estimation.js';
+import { FeatureExtractionPipeline } from './feature-extraction.js';
+import { ImageFeatureExtractionPipeline } from './image-feature-extraction.js';
+
+export const SUPPORTED_TASKS = Object.freeze({
+    'text-classification': {
+        pipeline: TextClassificationPipeline,
+        model: AutoModelForSequenceClassification,
+        default: {
+            model: 'Xenova/distilbert-base-uncased-finetuned-sst-2-english',
+        },
+        type: 'text',
+    },
+    'token-classification': {
+        pipeline: TokenClassificationPipeline,
+        model: AutoModelForTokenClassification,
+        default: {
+            model: 'Xenova/bert-base-multilingual-cased-ner-hrl',
+        },
+        type: 'text',
+    },
+    'question-answering': {
+        pipeline: QuestionAnsweringPipeline,
+        model: AutoModelForQuestionAnswering,
+        default: {
+            model: 'Xenova/distilbert-base-cased-distilled-squad',
+        },
+        type: 'text',
+    },
+    'fill-mask': {
+        pipeline: FillMaskPipeline,
+        model: AutoModelForMaskedLM,
+        default: {
+            model: 'onnx-community/ettin-encoder-32m-ONNX',
+            dtype: 'fp32',
+        },
+        type: 'text',
+    },
+    summarization: {
+        pipeline: SummarizationPipeline,
+        model: AutoModelForSeq2SeqLM,
+        default: {
+            model: 'Xenova/distilbart-cnn-6-6',
+        },
+        type: 'text',
+    },
+    translation: {
+        pipeline: TranslationPipeline,
+        model: AutoModelForSeq2SeqLM,
+        default: {
+            model: 'Xenova/t5-small',
+        },
+        type: 'text',
+    },
+    'text2text-generation': {
+        pipeline: Text2TextGenerationPipeline,
+        model: AutoModelForSeq2SeqLM,
+        default: {
+            model: 'Xenova/flan-t5-small',
+        },
+        type: 'text',
+    },
+    'text-generation': {
+        pipeline: TextGenerationPipeline,
+        model: AutoModelForCausalLM,
+        default: {
+            model: 'onnx-community/Qwen3-0.6B-ONNX',
+            dtype: 'q4',
+        },
+        type: 'text',
+    },
+    'zero-shot-classification': {
+        pipeline: ZeroShotClassificationPipeline,
+        model: AutoModelForSequenceClassification,
+        default: {
+            model: 'Xenova/distilbert-base-uncased-mnli',
+        },
+        type: 'text',
+    },
+    'audio-classification': {
+        pipeline: AudioClassificationPipeline,
+        model: AutoModelForAudioClassification,
+        default: {
+            model: 'Xenova/wav2vec2-base-superb-ks',
+        },
+        type: 'audio',
+    },
+    'zero-shot-audio-classification': {
+        pipeline: ZeroShotAudioClassificationPipeline,
+        model: AutoModel,
+        default: {
+            model: 'Xenova/clap-htsat-unfused',
+        },
+        type: 'multimodal',
+    },
+    'automatic-speech-recognition': {
+        pipeline: AutomaticSpeechRecognitionPipeline,
+        model: [AutoModelForSpeechSeq2Seq, AutoModelForCTC],
+        default: {
+            model: 'Xenova/whisper-tiny.en',
+        },
+        type: 'multimodal',
+    },
+    'text-to-audio': {
+        pipeline: TextToAudioPipeline,
+        model: [AutoModelForTextToWaveform, AutoModelForTextToSpectrogram],
+        default: {
+            model: 'onnx-community/Supertonic-TTS-ONNX',
+            dtype: 'fp32',
+        },
+        type: 'text',
+    },
+    'image-to-text': {
+        pipeline: ImageToTextPipeline,
+        model: AutoModelForVision2Seq,
+        default: {
+            model: 'Xenova/vit-gpt2-image-captioning',
+        },
+        type: 'multimodal',
+    },
+    'image-classification': {
+        pipeline: ImageClassificationPipeline,
+        model: AutoModelForImageClassification,
+        default: {
+            model: 'Xenova/vit-base-patch16-224',
+        },
+        type: 'multimodal',
+    },
+    'image-segmentation': {
+        pipeline: ImageSegmentationPipeline,
+        model: [AutoModelForImageSegmentation, AutoModelForSemanticSegmentation, AutoModelForUniversalSegmentation],
+        default: {
+            model: 'Xenova/detr-resnet-50-panoptic',
+        },
+        type: 'multimodal',
+    },
+    'background-removal': {
+        pipeline: BackgroundRemovalPipeline,
+        model: [AutoModelForImageSegmentation, AutoModelForSemanticSegmentation, AutoModelForUniversalSegmentation],
+        default: {
+            model: 'Xenova/modnet',
+        },
+        type: 'image',
+    },
+    'zero-shot-image-classification': {
+        pipeline: ZeroShotImageClassificationPipeline,
+        model: AutoModel,
+        default: {
+            model: 'Xenova/clip-vit-base-patch32',
+        },
+        type: 'multimodal',
+    },
+    'object-detection': {
+        pipeline: ObjectDetectionPipeline,
+        model: AutoModelForObjectDetection,
+        default: {
+            model: 'Xenova/detr-resnet-50',
+        },
+        type: 'multimodal',
+    },
+    'zero-shot-object-detection': {
+        pipeline: ZeroShotObjectDetectionPipeline,
+        model: AutoModelForZeroShotObjectDetection,
+        default: {
+            model: 'Xenova/owlvit-base-patch32',
+        },
+        type: 'multimodal',
+    },
+    'document-question-answering': {
+        pipeline: DocumentQuestionAnsweringPipeline,
+        model: AutoModelForDocumentQuestionAnswering,
+        default: {
+            model: 'Xenova/donut-base-finetuned-docvqa',
+        },
+        type: 'multimodal',
+    },
+    'image-to-image': {
+        pipeline: ImageToImagePipeline,
+        model: AutoModelForImageToImage,
+        default: {
+            model: 'Xenova/swin2SR-classical-sr-x2-64',
+        },
+        type: 'image',
+    },
+    'depth-estimation': {
+        pipeline: DepthEstimationPipeline,
+        model: AutoModelForDepthEstimation,
+        default: {
+            model: 'onnx-community/depth-anything-v2-small',
+        },
+        type: 'image',
+    },
+    'feature-extraction': {
+        pipeline: FeatureExtractionPipeline,
+        model: AutoModel,
+        default: {
+            model: 'onnx-community/all-MiniLM-L6-v2-ONNX',
+            dtype: 'fp32',
+        },
+        type: 'text',
+    },
+    'image-feature-extraction': {
+        pipeline: ImageFeatureExtractionPipeline,
+        model: [AutoModelForImageFeatureExtraction, AutoModel],
+        default: {
+            model: 'onnx-community/dinov3-vits16-pretrain-lvd1689m-ONNX',
+            dtype: 'fp32',
+        },
+        type: 'image',
+    },
+});
+
+// TODO: Add types for TASK_ALIASES
+
+export const TASK_ALIASES = Object.freeze({
+    'sentiment-analysis': 'text-classification',
+    ner: 'token-classification',
+    // "vqa": "visual-question-answering", // TODO: Add
+    asr: 'automatic-speech-recognition',
+    'text-to-speech': 'text-to-audio',
+
+    // Add for backwards compatibility
+    embeddings: 'feature-extraction',
+});
+
+export {
+    TextClassificationPipeline,
+    TokenClassificationPipeline,
+    QuestionAnsweringPipeline,
+    FillMaskPipeline,
+    SummarizationPipeline,
+    TranslationPipeline,
+    Text2TextGenerationPipeline,
+    TextGenerationPipeline,
+    ZeroShotClassificationPipeline,
+    AudioClassificationPipeline,
+    ZeroShotAudioClassificationPipeline,
+    AutomaticSpeechRecognitionPipeline,
+    TextToAudioPipeline,
+    ImageToTextPipeline,
+    ImageClassificationPipeline,
+    ImageSegmentationPipeline,
+    BackgroundRemovalPipeline,
+    ZeroShotImageClassificationPipeline,
+    ObjectDetectionPipeline,
+    ZeroShotObjectDetectionPipeline,
+    DocumentQuestionAnsweringPipeline,
+    ImageToImagePipeline,
+    DepthEstimationPipeline,
+    FeatureExtractionPipeline,
+    ImageFeatureExtractionPipeline,
+};
+
+/**
+ * @typedef {keyof typeof SUPPORTED_TASKS} TaskType
+ * @typedef {keyof typeof TASK_ALIASES} AliasType
+ * @typedef {TaskType | AliasType} PipelineType All possible pipeline types.
+ */
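For reference, the task keys and aliases above are the strings accepted by the `pipeline()` factory, and when no model id is passed the `default` entry (including any `dtype`) is used. The following usage sketch is illustrative and not part of this diff; the fallback behaviour is assumed from the `default` entries above.

```js
import { pipeline } from '@huggingface/transformers';

// 'sentiment-analysis' resolves via TASK_ALIASES to 'text-classification',
// which falls back to the default model listed in SUPPORTED_TASKS.
const classifier = await pipeline('sentiment-analysis');
const result = await classifier('I love Transformers.js!');
// e.g. [{ label: 'POSITIVE', score: 0.99 }]
```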
package/src/pipelines/text-generation.js
@@ -100,6 +100,10 @@ function isChat(x) {
 export class TextGenerationPipeline
     extends /** @type {new (options: TextPipelineConstructorArgs) => TextGenerationPipelineType} */ (Pipeline)
 {
+    /**
+     * @param {string | string[] | import('../tokenization_utils.js').Message[] | import('../tokenization_utils.js').Message[][]} texts
+     * @param {Partial<TextGenerationConfig>} generate_kwargs
+     */
     async _call(texts, generate_kwargs = {}) {
         let isBatched = false;
         let isChatInput = false;
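The added JSDoc documents that `_call` accepts plain strings as well as chat-style `Message[]` input. A minimal sketch of the chat form, using the task's default model from the table above (the snippet itself is illustrative, not part of this diff):

```js
import { pipeline } from '@huggingface/transformers';

// Defaults to onnx-community/Qwen3-0.6B-ONNX with dtype: 'q4' (see SUPPORTED_TASKS above).
const generator = await pipeline('text-generation');

const messages = [
    { role: 'system', content: 'You are a helpful assistant.' },
    { role: 'user', content: 'Write a haiku about ONNX.' },
];
const output = await generator(messages, { max_new_tokens: 64 });
```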
package/src/pipelines/text-to-audio.js
@@ -2,8 +2,10 @@ import { Pipeline } from './_base.js';
 
 import { Tensor } from '../utils/tensor.js';
 import { RawAudio } from '../utils/audio.js';
+import { logger } from '../utils/logger.js';
 
 import { AutoModel } from '../models/auto/modeling_auto.js';
+import { env } from '../env.js';
 
 /**
  * @typedef {import('./_base.js').TextAudioPipelineConstructorArgs} TextAudioPipelineConstructorArgs
@@ -92,7 +94,7 @@ export class TextToAudioPipeline
         // Load speaker embeddings as Float32Array from path/URL
         if (typeof speaker_embeddings === 'string' || speaker_embeddings instanceof URL) {
             // Load from URL with fetch
-            speaker_embeddings = new Float32Array(await (await fetch(speaker_embeddings)).arrayBuffer());
+            speaker_embeddings = new Float32Array(await (await env.fetch(speaker_embeddings)).arrayBuffer());
         }
 
         if (speaker_embeddings instanceof Float32Array) {
@@ -194,7 +196,7 @@ export class TextToAudioPipeline
     async _call_text_to_spectrogram(text_inputs, { speaker_embeddings }) {
         // Load vocoder, if not provided
         if (!this.vocoder) {
-            console.log('No vocoder specified, using default HifiGan vocoder.');
+            logger.info('No vocoder specified, using default HifiGan vocoder.');
             this.vocoder = await AutoModel.from_pretrained(this.DEFAULT_VOCODER_ID, { dtype: 'fp32' });
         }
 
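Speaker embeddings are now downloaded through `env.fetch` instead of the global `fetch`, so the request can be routed through a user-supplied function. A minimal sketch, assuming `env.fetch` defaults to the global `fetch` and can be reassigned (this hunk only shows it being read):

```js
import { env, pipeline } from '@huggingface/transformers';

// Hypothetical override: attach an auth header to requests made by the library.
env.fetch = (input, init = {}) =>
    fetch(input, { ...init, headers: { ...init.headers, Authorization: 'Bearer <token>' } });

const tts = await pipeline('text-to-speech'); // alias for 'text-to-audio'
```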
package/src/pipelines/zero-shot-classification.js
@@ -1,6 +1,7 @@
 import { Pipeline } from './_base.js';
 
 import { softmax } from '../utils/maths.js';
+import { logger } from '../utils/logger.js';
 
 /**
  * @typedef {import('./_base.js').TextPipelineConstructorArgs} TextPipelineConstructorArgs
@@ -93,13 +94,13 @@ export class ZeroShotClassificationPipeline
 
         this.entailment_id = this.label2id['entailment'];
         if (this.entailment_id === undefined) {
-            console.warn("Could not find 'entailment' in label2id mapping. Using 2 as entailment_id.");
+            logger.warn("Could not find 'entailment' in label2id mapping. Using 2 as entailment_id.");
             this.entailment_id = 2;
         }
 
         this.contradiction_id = this.label2id['contradiction'] ?? this.label2id['not_entailment'];
         if (this.contradiction_id === undefined) {
-            console.warn("Could not find 'contradiction' in label2id mapping. Using 0 as contradiction_id.");
+            logger.warn("Could not find 'contradiction' in label2id mapping. Using 0 as contradiction_id.");
             this.contradiction_id = 0;
         }
     }