npm - @huggingface/transformers - Versions diffs - 3.2.3 → 3.3.0 - Mend

@huggingface/transformers 3.2.3 → 3.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (105) hide show

package/README.md +5 -3
package/dist/ort-wasm-simd-threaded.jsep.wasm +0 -0
package/dist/ort.bundle.min.mjs +2776 -0
package/dist/transformers.cjs +792 -330
package/dist/transformers.cjs.map +1 -1
package/dist/transformers.js +1150 -656
package/dist/transformers.js.map +1 -1
package/dist/transformers.min.cjs +1 -1
package/dist/transformers.min.cjs.map +1 -1
package/dist/transformers.min.js +1 -1
package/dist/transformers.min.js.map +1 -1
package/dist/transformers.min.mjs +1 -1
package/dist/transformers.min.mjs.map +1 -1
package/dist/transformers.mjs +798 -331
package/dist/transformers.mjs.map +1 -1
package/package.json +3 -3
package/src/base/feature_extraction_utils.js +9 -9
package/src/base/image_processors_utils.js +12 -1
package/src/base/processing_utils.js +24 -3
package/src/configs.js +5 -0
package/src/env.js +1 -2
package/src/generation/streamers.js +5 -2
package/src/models/auto/feature_extraction_auto.js +0 -16
package/src/models/auto/processing_auto.js +0 -16
package/src/models/convnext/image_processing_convnext.js +1 -0
package/src/models/efficientnet/image_processing_efficientnet.js +1 -0
package/src/models/florence2/processing_florence2.js +3 -0
package/src/models/grounding_dino/image_processing_grounding_dino.js +29 -0
package/src/models/grounding_dino/processing_grounding_dino.js +101 -0
package/src/models/idefics3/image_processing_idefics3.js +2 -0
package/src/models/image_processors.js +1 -0
package/src/models/janus/image_processing_janus.js +1 -0
package/src/models/mgp_str/processing_mgp_str.js +2 -0
package/src/models/paligemma/processing_paligemma.js +1 -0
package/src/models/phi3_v/processing_phi3_v.js +1 -1
package/src/models/processors.js +3 -2
package/src/models/pyannote/feature_extraction_pyannote.js +1 -0
package/src/models/qwen2_vl/processing_qwen2_vl.js +1 -0
package/src/models/seamless_m4t/feature_extraction_seamless_m4t.js +2 -2
package/src/models/whisper/feature_extraction_whisper.js +1 -1
package/src/models.js +72 -20
package/src/ops/registry.js +10 -0
package/src/pipelines.js +73 -23
package/src/tokenizers.js +4 -7
package/src/utils/audio.js +113 -1
package/src/utils/core.js +26 -0
package/src/utils/dtypes.js +2 -0
package/src/utils/hub.js +1 -1
package/src/utils/image.js +5 -18
package/src/utils/maths.js +8 -6
package/src/utils/tensor.js +134 -114
package/types/base/feature_extraction_utils.d.ts +7 -7
package/types/base/image_processors_utils.d.ts +7 -0
package/types/base/image_processors_utils.d.ts.map +1 -1
package/types/base/processing_utils.d.ts +25 -19
package/types/base/processing_utils.d.ts.map +1 -1
package/types/configs.d.ts.map +1 -1
package/types/generation/parameters.d.ts +1 -1
package/types/generation/streamers.d.ts +3 -1
package/types/generation/streamers.d.ts.map +1 -1
package/types/models/auto/feature_extraction_auto.d.ts.map +1 -1
package/types/models/auto/image_processing_auto.d.ts.map +1 -1
package/types/models/auto/processing_auto.d.ts.map +1 -1
package/types/models/convnext/image_processing_convnext.d.ts.map +1 -1
package/types/models/efficientnet/image_processing_efficientnet.d.ts.map +1 -1
package/types/models/florence2/processing_florence2.d.ts.map +1 -1
package/types/models/grounding_dino/image_processing_grounding_dino.d.ts +20 -0
package/types/models/grounding_dino/image_processing_grounding_dino.d.ts.map +1 -0
package/types/models/grounding_dino/processing_grounding_dino.d.ts +27 -0
package/types/models/grounding_dino/processing_grounding_dino.d.ts.map +1 -0
package/types/models/idefics3/image_processing_idefics3.d.ts.map +1 -1
package/types/models/image_processors.d.ts +1 -0
package/types/models/janus/image_processing_janus.d.ts.map +1 -1
package/types/models/mgp_str/processing_mgp_str.d.ts.map +1 -1
package/types/models/paligemma/processing_paligemma.d.ts.map +1 -1
package/types/models/phi3_v/processing_phi3_v.d.ts +6 -2
package/types/models/phi3_v/processing_phi3_v.d.ts.map +1 -1
package/types/models/processors.d.ts +3 -2
package/types/models/pyannote/feature_extraction_pyannote.d.ts.map +1 -1
package/types/models/qwen2_vl/processing_qwen2_vl.d.ts.map +1 -1
package/types/models/sapiens/image_processing_sapiens.d.ts +10 -0
package/types/models/sapiens/image_processing_sapiens.d.ts.map +1 -0
package/types/models/whisper/generation_whisper.d.ts +1 -1
package/types/models/whisper/generation_whisper.d.ts.map +1 -1
package/types/models.d.ts +40 -17
package/types/models.d.ts.map +1 -1
package/types/ops/registry.d.ts +1 -0
package/types/ops/registry.d.ts.map +1 -1
package/types/pipelines.d.ts +7 -12
package/types/pipelines.d.ts.map +1 -1
package/types/tokenizers.d.ts.map +1 -1
package/types/tsconfig.tsbuildinfo +1 -0
package/types/utils/audio.d.ts +25 -0
package/types/utils/audio.d.ts.map +1 -1
package/types/utils/core.d.ts +6 -0
package/types/utils/core.d.ts.map +1 -1
package/types/utils/dtypes.d.ts.map +1 -1
package/types/utils/hub.d.ts +1 -1
package/types/utils/hub.d.ts.map +1 -1
package/types/utils/image.d.ts +3 -2
package/types/utils/image.d.ts.map +1 -1
package/types/utils/maths.d.ts +8 -6
package/types/utils/maths.d.ts.map +1 -1
package/types/utils/tensor.d.ts +22 -6
package/types/utils/tensor.d.ts.map +1 -1

package/src/utils/audio.js CHANGED Viewed

@@ -12,8 +12,10 @@ import {
 } from './hub.js';
 import { FFT, max } from './maths.js';
 import {
-    calculateReflectOffset,
+    calculateReflectOffset, saveBlob,
 } from './core.js';
+import { apis } from '../env.js';
+import fs from 'fs';
 import { Tensor, matmul } from './tensor.js';
@@ -702,3 +704,113 @@ export function window_function(window_length, name, {
     return window;
 }
+/**
+ * Encode audio data to a WAV file.
+ * WAV file specs : https://en.wikipedia.org/wiki/WAV#WAV_File_header
+ *
+ * Adapted from https://www.npmjs.com/package/audiobuffer-to-wav
+ * @param {Float32Array} samples The audio samples.
+ * @param {number} rate The sample rate.
+ * @returns {ArrayBuffer} The WAV audio buffer.
+ */
+function encodeWAV(samples, rate) {
+    let offset = 44;
+    const buffer = new ArrayBuffer(offset + samples.length * 4);
+    const view = new DataView(buffer);
+    /* RIFF identifier */
+    writeString(view, 0, "RIFF");
+    /* RIFF chunk length */
+    view.setUint32(4, 36 + samples.length * 4, true);
+    /* RIFF type */
+    writeString(view, 8, "WAVE");
+    /* format chunk identifier */
+    writeString(view, 12, "fmt ");
+    /* format chunk length */
+    view.setUint32(16, 16, true);
+    /* sample format (3 = IEEE float) */
+    view.setUint16(20, 3, true);
+    /* channel count */
+    view.setUint16(22, 1, true);
+    /* sample rate */
+    view.setUint32(24, rate, true);
+    /* byte rate (sample rate * block align) */
+    view.setUint32(28, rate * 4, true);
+    /* block align (channel count * bytes per sample) */
+    view.setUint16(32, 4, true);
+    /* bits per sample */
+    view.setUint16(34, 32, true);
+    /* data chunk identifier */
+    writeString(view, 36, "data");
+    /* data chunk length */
+    view.setUint32(40, samples.length * 4, true);
+    for (let i = 0; i < samples.length; ++i, offset += 4) {
+        view.setFloat32(offset, samples[i], true);
+    }
+    return buffer;
+}
+function writeString(view, offset, string) {
+    for (let i = 0; i < string.length; ++i) {
+        view.setUint8(offset + i, string.charCodeAt(i));
+    }
+}
+export class RawAudio {
+    /**
+     * Create a new `RawAudio` object.
+     * @param {Float32Array} audio Audio data
+     * @param {number} sampling_rate Sampling rate of the audio data
+     */
+    constructor(audio, sampling_rate) {
+        this.audio = audio
+        this.sampling_rate = sampling_rate
+    }
+    /**
+     * Convert the audio to a wav file buffer.
+     * @returns {ArrayBuffer} The WAV file.
+     */
+    toWav() {
+        return encodeWAV(this.audio, this.sampling_rate)
+    }
+    /**
+     * Convert the audio to a blob.
+     * @returns {Blob}
+     */
+    toBlob() {
+        const wav = this.toWav();
+        const blob = new Blob([wav], { type: 'audio/wav' });
+        return blob;
+    }
+    /**
+     * Save the audio to a wav file.
+     * @param {string} path
+     */
+    async save(path) {
+        let fn;
+        if (apis.IS_BROWSER_ENV) {
+            if (apis.IS_WEBWORKER_ENV) {
+                throw new Error('Unable to save a file from a Web Worker.')
+            }
+            fn = saveBlob;
+        } else if (apis.IS_FS_AVAILABLE) {
+            fn = async (/** @type {string} */ path, /** @type {Blob} */ blob) => {
+                let buffer = await blob.arrayBuffer();
+                fs.writeFileSync(path, Buffer.from(buffer));
+            }
+        } else {
+            throw new Error('Unable to save because filesystem is disabled in this environment.')
+        }
+        await fn(path, this.toBlob())
+    }
+}

package/src/utils/core.js CHANGED Viewed

@@ -189,6 +189,32 @@ export function calculateReflectOffset(i, w) {
     return Math.abs((i + w) % (2 * w) - w);
 }
+/**
+ * Save blob file on the web.
+ * @param {string} path The path to save the blob to
+ * @param {Blob} blob The blob to save
+ */
+export function saveBlob(path, blob){
+    // Create a temporary object URL that references the blob
+    const dataURL = URL.createObjectURL(blob);
+    // Create an anchor element with the object URL as the href attribute
+    const downloadLink = document.createElement('a');
+    downloadLink.href = dataURL;
+    // Set the download attribute to specify the desired filename for the downloaded file
+    downloadLink.download = path;
+    // Trigger the download
+    downloadLink.click();
+    // Clean up: discard the anchor element (it was never attached to the DOM)
+    downloadLink.remove();
+    // Revoke the Object URL to free up memory
+    URL.revokeObjectURL(dataURL);
+}
 /**
  *
  * @param {Object} o

package/src/utils/dtypes.js CHANGED Viewed

@@ -1,3 +1,5 @@
+/// <reference types="@webgpu/types" />
 import { apis } from "../env.js";
 import { DEVICE_TYPES } from "./devices.js";

package/src/utils/hub.js CHANGED Viewed

@@ -121,7 +121,7 @@ class FileResponse {
      */
     async arrayBuffer() {
         const data = await fs.promises.readFile(this.filePath);
-        return data.buffer;
+        return /** @type {ArrayBuffer} */ (data.buffer);
     }
     /**

package/src/utils/image.js CHANGED Viewed

@@ -8,9 +8,9 @@
  * @module utils/image
  */
-import { isNullishDimension } from './core.js';
+import { isNullishDimension, saveBlob } from './core.js';
 import { getFile } from './hub.js';
-import { env, apis } from '../env.js';
+import { apis } from '../env.js';
 import { Tensor } from './tensor.js';
 // Will be empty (or not used) if running in browser or web-worker
@@ -793,23 +793,9 @@ export class RawImage {
             // Convert image to Blob
             const blob = await this.toBlob(mime);
-            // Convert the canvas content to a data URL
-            const dataURL = URL.createObjectURL(blob);
+            saveBlob(path, blob)
-            // Create an anchor element with the data URL as the href attribute
-            const downloadLink = document.createElement('a');
-            downloadLink.href = dataURL;
-            // Set the download attribute to specify the desired filename for the downloaded image
-            downloadLink.download = path;
-            // Trigger the download
-            downloadLink.click();
-            // Clean up: remove the anchor element from the DOM
-            downloadLink.remove();
-        } else if (!env.useFS) {
+        } else if (!apis.IS_FS_AVAILABLE) {
             throw new Error('Unable to save the image because filesystem is disabled in this environment.')
         } else {
@@ -837,3 +823,4 @@ export class RawImage {
  * Helper function to load an image from a URL, path, etc.
  */
 export const load_image = RawImage.read.bind(RawImage);

package/src/utils/maths.js CHANGED Viewed

@@ -225,8 +225,9 @@ export function magnitude(arr) {
 /**
  * Returns the value and index of the minimum element in an array.
- * @param {number[]|TypedArray} arr array of numbers.
- * @returns {[number, number]} the value and index of the minimum element, of the form: [valueOfMin, indexOfMin]
+ * @template {number[]|bigint[]|AnyTypedArray} T
+ * @param {T} arr array of numbers.
+ * @returns {T extends bigint[]|BigTypedArray ? [bigint, number] : [number, number]} the value and index of the minimum element, of the form: [valueOfMin, indexOfMin]
  * @throws {Error} If array is empty.
  */
 export function min(arr) {
@@ -239,14 +240,15 @@ export function min(arr) {
             indexOfMin = i;
         }
     }
-    return [min, indexOfMin];
+    return /** @type {T extends bigint[]|BigTypedArray ? [bigint, number] : [number, number]} */([min, indexOfMin]);
 }
 /**
  * Returns the value and index of the maximum element in an array.
- * @param {number[]|AnyTypedArray} arr array of numbers.
- * @returns {[number, number]} the value and index of the maximum element, of the form: [valueOfMax, indexOfMax]
+ * @template {number[]|bigint[]|AnyTypedArray} T
+ * @param {T} arr array of numbers.
+ * @returns {T extends bigint[]|BigTypedArray ? [bigint, number] : [number, number]} the value and index of the maximum element, of the form: [valueOfMax, indexOfMax]
  * @throws {Error} If array is empty.
  */
 export function max(arr) {
@@ -259,7 +261,7 @@ export function max(arr) {
             indexOfMax = i;
         }
     }
-    return [Number(max), indexOfMax];
+    return /** @type {T extends bigint[]|BigTypedArray ? [bigint, number] : [number, number]} */([max, indexOfMax]);
 }
 function isPowerOfTwo(number) {

package/src/utils/tensor.js CHANGED Viewed

@@ -9,6 +9,8 @@
 import {
     interpolate_data,
+    max,
+    min,
     permute_data
 } from './maths.js';
@@ -464,8 +466,6 @@ export class Tensor {
         return this.permute(...dims);
     }
-    // TODO add .max() and .min() methods
     /**
      * Returns the sum of each row of the input tensor in the given dimension dim.
      *
@@ -494,55 +494,22 @@ export class Tensor {
         }
         const this_data = this.data;
+        const fn = (a, b) => a + (b ** p);
         if (dim === null) {
             // @ts-ignore
-            let val = this_data.reduce((a, b) => a + (b ** p), 0) ** (1 / p);
+            const val = this_data.reduce(fn, 0) ** (1 / p);
             return new Tensor(this.type, [val], []);
         }
-        // Negative indexing
-        dim = safeIndex(dim, this.dims.length);
-        // Calculate the shape of the resulting array after summation
-        const resultDims = this.dims.slice(); // Copy the original dimensions
-        resultDims[dim] = 1; // Remove the specified axis
-        // Create a new array to store the accumulated values
-        // @ts-ignore
-        const result = new this_data.constructor(this_data.length / this.dims[dim]);
-        // Iterate over the data array
-        for (let i = 0; i < this_data.length; ++i) {
-            // Calculate the index in the resulting array
-            let resultIndex = 0;
-            for (let j = this.dims.length - 1, num = i, resultMultiplier = 1; j >= 0; --j) {
-                const size = this.dims[j];
-                if (j !== dim) {
-                    const index = num % size;
-                    resultIndex += index * resultMultiplier;
-                    resultMultiplier *= resultDims[j];
-                }
-                num = Math.floor(num / size);
-            }
-            // Accumulate the value at the current index
-            result[resultIndex] += (this_data[i]) ** p;
-        }
+        const [type, result, resultDims] = reduce_helper(fn, this, dim, keepdim);
         if (p !== 1) {
             for (let i = 0; i < result.length; ++i) {
                 result[i] = result[i] ** (1 / p);
             }
         }
-        if (!keepdim) {
-            resultDims.splice(dim, 1);
-        }
-        return new Tensor(this.type, result, resultDims);
+        return new Tensor(type, result, resultDims);
     }
     /**
@@ -605,7 +572,7 @@ export class Tensor {
      * NOTE: The returned tensor shares the storage with the input tensor, so changing the contents of one will change the contents of the other.
      * If you would like a copy, use `tensor.clone()` before squeezing.
      *
-     * @param {number} [dim=null] If given, the input will be squeezed only in the specified dimensions.
+     * @param {number|number[]} [dim=null] If given, the input will be squeezed only in the specified dimensions.
      * @returns {Tensor} The squeezed tensor
      */
     squeeze(dim = null) {
@@ -715,6 +682,34 @@ export class Tensor {
         return this.clone().neg_();
     }
+    /**
+     * Computes input > val element-wise.
+     * @param {number} val The value to compare with.
+     * @returns {Tensor} A boolean tensor that is `true` where input is greater than `val` and `false` elsewhere.
+     */
+    gt(val) {
+        const mask = new Uint8Array(this.data.length);
+        const this_data = this.data;
+        for (let i = 0; i < this_data.length; ++i) {
+            mask[i] = this_data[i] > val ? 1 : 0;
+        }
+        return new Tensor('bool', mask, this.dims);
+    }
+    /**
+     * Computes input < val element-wise.
+     * @param {number} val The value to compare with.
+     * @returns {Tensor} A boolean tensor that is `true` where input is less than `val` and `false` elsewhere.
+     */
+    lt(val) {
+        const mask = new Uint8Array(this.data.length);
+        const this_data = this.data;
+        for (let i = 0; i < this_data.length; ++i) {
+            mask[i] = this_data[i] < val ? 1 : 0;
+        }
+        return new Tensor('bool', mask, this.dims);
+    }
     /**
      * In-place version of @see {@link Tensor.clamp}
      */
@@ -759,6 +754,41 @@ export class Tensor {
         return mean(this, dim, keepdim);
     }
+    min(dim = null, keepdim = false) {
+        if (dim === null) {
+            // None to reduce over all dimensions.
+            const val = min(this.data)[0];
+            return new Tensor(this.type, [val], [/* scalar */]);
+        }
+        const [type, result, resultDims] = reduce_helper((a, b) => Math.min(a, b), this, dim, keepdim, Infinity);
+        return new Tensor(type, result, resultDims);
+    }
+    max(dim = null, keepdim = false) {
+        if (dim === null) {
+            // None to reduce over all dimensions.
+            const val = max(this.data)[0];
+            return new Tensor(this.type, [val], [/* scalar */]);
+        }
+        const [type, result, resultDims] = reduce_helper((a, b) => Math.max(a, b), this, dim, keepdim, -Infinity);
+        return new Tensor(type, result, resultDims);
+    }
+    argmin(dim = null, keepdim = false) {
+        if (dim !== null) {
+            throw new Error("`dim !== null` not yet implemented.");
+        }
+        const index = min(this.data)[1];
+        return new Tensor('int64', [BigInt(index)], []);
+    }
+    argmax(dim = null, keepdim = false) {
+        if (dim !== null) {
+            throw new Error("`dim !== null` not yet implemented.");
+        }
+        const index = max(this.data)[1];
+        return new Tensor('int64', [BigInt(index)], []);
+    }
     /**
      * Performs Tensor dtype conversion.
      * @param {DataType} type The desired data type.
@@ -892,7 +922,7 @@ export function interpolate(input, [out_height, out_width], mode = 'bilinear', a
  * @param {Tensor} input the input tensor
  * @param {Object} options the options for the interpolation
  * @param {[number, number]|[number, number, number]|[number, number, number, number]} [options.size=null] output spatial size.
- * @param {"bilinear"|"bicubic"} [options.mode='bilinear'] algorithm used for upsampling
+ * @param {"nearest"|"bilinear"|"bicubic"} [options.mode='bilinear'] algorithm used for upsampling
  * @returns {Promise<Tensor>} The interpolated tensor.
  */
 export async function interpolate_4d(input, {
@@ -922,7 +952,9 @@ export async function interpolate_4d(input, {
     }
     let op;
-    if (mode === 'bilinear') {
+    if (mode === 'nearest') {
+        op = await TensorOpRegistry.nearest_interpolate_4d;
+    } else if (mode === 'bilinear') {
         op = await TensorOpRegistry.bilinear_interpolate_4d;
     } else if (mode === 'bicubic') {
         op = await TensorOpRegistry.bicubic_interpolate_4d;
@@ -963,13 +995,13 @@ export async function rfft(x, a) {
  * Returns the k largest elements of the given input tensor.
  * Inspired by https://pytorch.org/docs/stable/generated/torch.topk.html
  * @param {Tensor} x the input tensor
- * @param {number} k the k in "top-k"
+ * @param {number} [k] the k in "top-k"
  * @returns {Promise<[Tensor, Tensor]>} the output tuple of (Tensor, LongTensor) of top-k elements and their indices.
  */
 export async function topk(x, k) {
     const op = await TensorOpRegistry.top_k;
-    if (k === null) {
+    if (k == null) {
         k = x.dims.at(-1);
     } else {
         k = Math.min(k, x.dims.at(-1));
@@ -998,10 +1030,10 @@ const arrayToIndexTensor = (array) => new Tensor('int64', array, [array.length])
 export async function slice(data, starts, ends, axes, steps) {
     const op = await TensorOpRegistry.slice;
     return await op({
-        x: data,
-        s: arrayToIndexTensor(starts),
-        e: arrayToIndexTensor(ends),
-        a: arrayToIndexTensor(axes),
+        x: data,
+        s: arrayToIndexTensor(starts),
+        e: arrayToIndexTensor(ends),
+        a: arrayToIndexTensor(axes),
         t: arrayToIndexTensor(steps ?? new Array(axes.length).fill(1)),
     });
 }
@@ -1236,35 +1268,19 @@ export function stack(tensors, dim = 0) {
 /**
- * Calculates the standard deviation and mean over the dimensions specified by dim. dim can be a single dimension or `null` to reduce over all dimensions.
- * @param {Tensor} input the input tenso
- * @param {number|null} dim the dimension to reduce. If None, all dimensions are reduced.
- * @param {number} correction difference between the sample size and sample degrees of freedom. Defaults to Bessel's correction, correction=1.
+ * @param {(previousValue: any, currentValue: any, currentIndex?: number, resultIndex?: number) => any} callbackfn
+ * @param {Tensor} input the input tensor.
+ * @param {number|null} dim the dimension to reduce.
  * @param {boolean} keepdim whether the output tensor has dim retained or not.
- * @returns {Tensor[]} A tuple of (std, mean) tensors.
+ * @returns {[DataType, any, number[]]} The reduced tensor data.
  */
-export function std_mean(input, dim = null, correction = 1, keepdim = false) {
-    const inputData = /** @type {Float32Array} */(input.data);
+function reduce_helper(callbackfn, input, dim = null, keepdim = false, initialValue = null) {
+    const inputData = input.data;
     const inputDims = input.dims;
-    if (dim === null) {
-        // None to reduce over all dimensions.
-        const sum = inputData.reduce((a, b) => a + b, 0);
-        const mean = sum / inputData.length;
-        const std = Math.sqrt(inputData.reduce((a, b) => a + (b - mean) ** 2, 0) / (inputData.length - correction));
-        const meanTensor = new Tensor(input.type, [mean], [/* scalar */]);
-        const stdTensor = new Tensor(input.type, [std], [/* scalar */]);
-        return [stdTensor, meanTensor];
-    }
     // Negative indexing
     dim = safeIndex(dim, inputDims.length);
-    const meanTensor = mean(input, dim, keepdim);
-    const meanTensorData = meanTensor.data;
     // Calculate the shape of the resulting array after summation
     const resultDims = inputDims.slice(); // Copy the original dimensions
     resultDims[dim] = 1; // Remove the specified axis
@@ -1272,6 +1288,9 @@ export function std_mean(input, dim = null, correction = 1, keepdim = false) {
     // Create a new array to store the accumulated values
     // @ts-ignore
     const result = new inputData.constructor(inputData.length / inputDims[dim]);
+    if (initialValue !== null) {
+        result.fill(initialValue);
+    }
     // Iterate over the data array
     for (let i = 0; i < inputData.length; ++i) {
@@ -1290,23 +1309,55 @@ export function std_mean(input, dim = null, correction = 1, keepdim = false) {
         }
         // Accumulate the value at the current index
-        result[resultIndex] += (inputData[i] - meanTensorData[resultIndex]) ** 2;
+        result[resultIndex] = callbackfn(result[resultIndex], inputData[i], i, resultIndex);
     }
-    for (let i = 0; i < result.length; ++i) {
-        result[i] = Math.sqrt(result[i] / (inputDims[dim] - correction));
+    if (!keepdim) resultDims.splice(dim, 1);
+    return [input.type, result, resultDims];
+}
+/**
+ * Calculates the standard deviation and mean over the dimensions specified by dim. dim can be a single dimension or `null` to reduce over all dimensions.
+ * @param {Tensor} input the input tensor
+ * @param {number|null} dim the dimension to reduce. If None, all dimensions are reduced.
+ * @param {number} correction difference between the sample size and sample degrees of freedom. Defaults to Bessel's correction, correction=1.
+ * @param {boolean} keepdim whether the output tensor has dim retained or not.
+ * @returns {Tensor[]} A tuple of (std, mean) tensors.
+ */
+export function std_mean(input, dim = null, correction = 1, keepdim = false) {
+    const inputData = /** @type {Float32Array} */(input.data);
+    const inputDims = input.dims;
+    if (dim === null) {
+        // None to reduce over all dimensions.
+        const sum = inputData.reduce((a, b) => a + b, 0);
+        const mean = sum / inputData.length;
+        const std = Math.sqrt(inputData.reduce((a, b) => a + (b - mean) ** 2, 0) / (inputData.length - correction));
+        const meanTensor = new Tensor(input.type, [mean], [/* scalar */]);
+        const stdTensor = new Tensor(input.type, [std], [/* scalar */]);
+        return [stdTensor, meanTensor];
     }
+    dim = safeIndex(dim, inputDims.length);
+    const meanTensor = mean(input, dim, keepdim);
+    const meanTensorData = meanTensor.data;
+    // Compute squared sum
+    const [type, result, resultDims] = reduce_helper((a, b, i, j) => a + (b - meanTensorData[j]) ** 2, input, dim, keepdim);
-    if (!keepdim) {
-        resultDims.splice(dim, 1);
+    // Square root of the squared sum
+    for (let i = 0; i < result.length; ++i) {
+        result[i] = Math.sqrt(result[i] / (inputDims[dim] - correction));
     }
-    const stdTensor = new Tensor(input.type, result, resultDims);
+    const stdTensor = new Tensor(type, result, resultDims);
     return [stdTensor, meanTensor];
 }
 /**
  * Returns the mean value of each row of the input tensor in the given dimension dim.
  * @param {Tensor} input the input tensor.
@@ -1315,58 +1366,27 @@ export function std_mean(input, dim = null, correction = 1, keepdim = false) {
  * @returns {Tensor} A new tensor with means taken along the specified dimension.
  */
 export function mean(input, dim = null, keepdim = false) {
+    const inputDims = input.dims;
     const inputData = /** @type {Float32Array} */(input.data);
     if (dim === null) {
         // None to reduce over all dimensions.
-        // @ts-ignore
         const val = inputData.reduce((a, b) => a + b, 0);
         return new Tensor(input.type, [val / inputData.length], [/* scalar */]);
     }
-    const inputDims = input.dims;
-    // Negative indexing
     dim = safeIndex(dim, inputDims.length);
-    // Calculate the shape of the resulting array after summation
-    const resultDims = inputDims.slice(); // Copy the original dimensions
-    resultDims[dim] = 1; // Remove the specified axis
-    // Create a new array to store the accumulated values
-    // @ts-ignore
-    const result = new inputData.constructor(inputData.length / inputDims[dim]);
-    // Iterate over the data array
-    for (let i = 0; i < inputData.length; ++i) {
-        // Calculate the index in the resulting array
-        let resultIndex = 0;
-        for (let j = inputDims.length - 1, num = i, resultMultiplier = 1; j >= 0; --j) {
-            const size = inputDims[j];
-            if (j !== dim) {
-                const index = num % size;
-                resultIndex += index * resultMultiplier;
-                resultMultiplier *= resultDims[j];
-            }
-            num = Math.floor(num / size);
-        }
-        // Accumulate the value at the current index
-        result[resultIndex] += inputData[i];
-    }
+    // Compute sum
+    const [type, result, resultDims] = reduce_helper((a, b) => a + b, input, dim, keepdim);
+    // Divide by number of elements in the dimension
     if (inputDims[dim] !== 1) {
         for (let i = 0; i < result.length; ++i) {
-            result[i] = result[i] / inputDims[dim];
+            result[i] /= inputDims[dim];
         }
     }
-    if (!keepdim) {
-        resultDims.splice(dim, 1);
-    }
-    return new Tensor(input.type, result, resultDims);
+    return new Tensor(type, result, resultDims);
 }

package/types/base/feature_extraction_utils.d.ts CHANGED Viewed

@@ -14,19 +14,19 @@ declare const FeatureExtractor_base: new () => {
  */
 export class FeatureExtractor extends FeatureExtractor_base {
     /**
-     * Instantiate one of the processor classes of the library from a pretrained model.
+     * Instantiate one of the feature extractor classes of the library from a pretrained model.
      *
-     * The processor class to instantiate is selected based on the `image_processor_type` (or `feature_extractor_type`; legacy)
-     * property of the config object (either passed as an argument or loaded from `pretrained_model_name_or_path` if possible)
+     * The feature extractor class to instantiate is selected based on the `feature_extractor_type` property of
+     * the config object (either passed as an argument or loaded from `pretrained_model_name_or_path` if possible)
      *
      * @param {string} pretrained_model_name_or_path The name or path of the pretrained model. Can be either:
-     * - A string, the *model id* of a pretrained processor hosted inside a model repo on huggingface.co.
+     * - A string, the *model id* of a pretrained feature_extractor hosted inside a model repo on huggingface.co.
      *   Valid model ids can be located at the root-level, like `bert-base-uncased`, or namespaced under a
      *   user or organization name, like `dbmdz/bert-base-german-cased`.
-     * - A path to a *directory* containing processor files, e.g., `./my_model_directory/`.
-     * @param {import('../utils/hub.js').PretrainedOptions} options Additional options for loading the processor.
+     * - A path to a *directory* containing feature_extractor files, e.g., `./my_model_directory/`.
+     * @param {import('../utils/hub.js').PretrainedOptions} options Additional options for loading the feature_extractor.
      *
-     * @returns {Promise<FeatureExtractor>} A new instance of the Processor class.
+     * @returns {Promise<FeatureExtractor>} A new instance of the Feature Extractor class.
      */
     static from_pretrained(pretrained_model_name_or_path: string, options: import("../utils/hub.js").PretrainedOptions): Promise<FeatureExtractor>;
     /**