catniff 0.6.7 → 0.6.9
This diff shows the changes between publicly released versions of the package, as they appear in its public registry, and is provided for informational purposes only.
- package/dist/core.d.ts +27 -25
- package/dist/core.js +56 -3
- package/dist/optim.js +10 -10
- package/package.json +1 -1
package/dist/core.d.ts
CHANGED
@@ -1,8 +1,8 @@
 import { Backend } from "./backend";
 export type TensorValue = number | TensorValue[];
 export interface TensorOptions {
-    shape?:
-    strides?:
+    shape?: number[];
+    strides?: number[];
     offset?: number;
     numel?: number;
     grad?: Tensor;
@@ -13,8 +13,8 @@ export interface TensorOptions {
 }
 export declare class Tensor {
     value: number[] | number;
-
-
+    shape: number[];
+    strides: number[];
     offset: number;
     numel: number;
     grad?: Tensor;
@@ -24,20 +24,20 @@ export declare class Tensor {
     device: string;
     static training: boolean;
     constructor(value: TensorValue, options?: TensorOptions);
-    static
-    static getShape(tensor: TensorValue):
-    static getStrides(shape:
-    static padShape(stridesA:
-
-
-
-
+    static flattenValue(tensor: TensorValue): number[] | number;
+    static getShape(tensor: TensorValue): number[];
+    static getStrides(shape: number[]): number[];
+    static padShape(stridesA: number[], stridesB: number[], shapeA: number[], shapeB: number[]): [
+        number[],
+        number[],
+        number[],
+        number[]
     ];
-    static broadcastShapes(shapeA:
-    static indexToCoords(index: number, strides:
-    static coordsToUnbroadcastedIndex(coords: number[], shape:
-    static coordsToIndex(coords: number[], strides:
-    static shapeToSize(shape:
+    static broadcastShapes(shapeA: number[], shapeB: number[]): number[];
+    static indexToCoords(index: number, strides: number[]): number[];
+    static coordsToUnbroadcastedIndex(coords: number[], shape: number[], strides: number[]): number;
+    static coordsToIndex(coords: number[], strides: number[]): number;
+    static shapeToSize(shape: number[]): number;
     static elementWiseAB(tA: Tensor, tB: Tensor, op: (tA: number, tB: number) => number): Tensor;
     static elementWiseSelf(tA: Tensor, op: (tA: number) => number): Tensor;
     elementWiseABDAG(other: TensorValue | Tensor, op: (a: number, b: number) => number, thisGrad?: (self: Tensor, other: Tensor, outGrad: Tensor) => Tensor, otherGrad?: (self: Tensor, other: Tensor, outGrad: Tensor) => Tensor): Tensor;
@@ -47,8 +47,9 @@ export declare class Tensor {
     static normalizeDims(dims: number[], numDims: number): number[];
     isContiguous(): boolean;
     contiguous(): Tensor;
-    view(newShape:
-    reshape(newShape:
+    view(newShape: number[]): Tensor;
+    reshape(newShape: number[]): Tensor;
+    flatten(startDim?: number, endDim?: number): Tensor;
     transpose(dim1: number, dim2: number): Tensor;
     swapaxes: (dim1: number, dim2: number) => Tensor;
     swapdims: (dim1: number, dim2: number) => Tensor;
@@ -57,6 +58,7 @@ export declare class Tensor {
     indexWithArray(indices: number[]): Tensor;
     index(indices: Tensor | TensorValue): Tensor;
     slice(ranges: number[][]): Tensor;
+    chunk(chunks: number, dim?: number): Tensor[];
     squeeze(dims?: number[] | number): Tensor;
     unsqueeze(dim: number): Tensor;
     static reduce(tensor: Tensor, dims: number[] | number | undefined, keepDims: boolean, config: {
@@ -185,17 +187,17 @@ export declare class Tensor {
     triu(diagonal?: number): Tensor;
     tril(diagonal?: number): Tensor;
     maskedFill(mask: Tensor | TensorValue, value: number): Tensor;
-    static full(shape:
+    static full(shape: number[], num: number, options?: TensorOptions): Tensor;
     static fullLike(tensor: Tensor, num: number, options?: TensorOptions): Tensor;
-    static ones(shape?:
+    static ones(shape?: number[], options?: TensorOptions): Tensor;
     static onesLike(tensor: Tensor, options?: TensorOptions): Tensor;
-    static zeros(shape?:
+    static zeros(shape?: number[], options?: TensorOptions): Tensor;
     static zerosLike(tensor: Tensor, options?: TensorOptions): Tensor;
-    static rand(shape?:
+    static rand(shape?: number[], options?: TensorOptions): Tensor;
     static randLike(tensor: Tensor, options?: TensorOptions): Tensor;
-    static randn(shape?:
+    static randn(shape?: number[], options?: TensorOptions): Tensor;
     static randnLike(tensor: Tensor, options?: TensorOptions): Tensor;
-    static randint(shape:
+    static randint(shape: number[], low: number, high: number, options?: TensorOptions): Tensor;
     static randintLike(tensor: Tensor, low: number, high: number, options?: TensorOptions): Tensor;
     static randperm(n: number, options?: TensorOptions): Tensor;
     static normal(shape: number[], mean: number, stdDev: number, options?: TensorOptions): Tensor;
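The declarations add two instance methods, `flatten` and `chunk`, and pin shape-related parameters to concrete `number[]` types. A short sketch exercising the updated surface; the `catniff` import path is an assumption, and the comments only restate the signatures shown above:

```ts
import { Tensor } from "catniff"; // assumed package entry point

// Creation ops declare their shape parameters as number[]:
const a = Tensor.zeros([2, 3]);
const r = Tensor.randint([2, 3], 0, 10);
// Methods newly declared in this version range:
const flat: Tensor = a.flatten();      // collapse all dims
const parts: Tensor[] = a.chunk(2, 1); // split dim 1 into two pieces
```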
package/dist/core.js
CHANGED
@@ -16,7 +16,7 @@ class Tensor {
     static training = false;
     constructor(value, options = {}) {
         // Storage
-        this.value = Tensor.
+        this.value = Tensor.flattenValue(value);
         // Tensor metadata
         this.shape = options.shape || Tensor.getShape(value);
         this.strides = options.strides || Tensor.getStrides(this.shape);
@@ -32,7 +32,7 @@ class Tensor {
         this.to_(this.device);
     }
     // Utility to flatten an nD array to be 1D
-    static
+    static flattenValue(tensor) {
         // Handle scalar tensors
         if (typeof tensor === "number")
             return tensor;
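The constructor now routes raw input through `Tensor.flattenValue`, the utility the comment above describes: it flattens an nD nested array into flat 1D storage and passes scalars through unchanged. A minimal standalone sketch of that behavior (a hypothetical re-implementation, not the package's code):

```ts
type TensorValue = number | TensorValue[];

// Flatten an nD nested array to 1D; scalar inputs stay scalar.
function flattenValue(tensor: TensorValue): number[] | number {
    if (typeof tensor === "number") return tensor;
    return tensor.flatMap((v) => {
        const flat = flattenValue(v);
        return typeof flat === "number" ? [flat] : flat;
    });
}

console.log(flattenValue([[1, 2], [3, 4]])); // [1, 2, 3, 4]
console.log(flattenValue(7));                // 7
```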
@@ -377,6 +377,40 @@ class Tensor {
         }
         return out;
     }
+    flatten(startDim = 0, endDim = -1) {
+        // Handle negative indices
+        if (startDim < 0) {
+            startDim += this.shape.length;
+        }
+        if (endDim < 0) {
+            endDim += this.shape.length;
+        }
+        // If dimension out of bound, throw error
+        if (startDim >= this.shape.length || endDim >= this.shape.length || startDim < 0 || endDim < 0) {
+            throw new Error("Dimensions do not exist to flatten");
+        }
+        const newShape = [];
+        let middleSize = 1;
+        for (let index = 0; index < this.shape.length; index++) {
+            // Keep dims before startDim
+            if (index < startDim) {
+                newShape.push(this.shape[index]);
+            }
+            // Multiply dims from startDim to endDim
+            if (index >= startDim && index <= endDim) {
+                middleSize *= this.shape[index];
+            }
+            // Push new flatten middle
+            if (index === endDim) {
+                newShape.push(middleSize);
+            }
+            // Keep dims after endDim
+            if (index > endDim) {
+                newShape.push(this.shape[index]);
+            }
+        }
+        return this.reshape(newShape);
+    }
     // Transpose
     transpose(dim1, dim2) {
         // Handle negative indices
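The new `flatten(startDim, endDim)` collapses the dimensions from `startDim` through `endDim` (inclusive) into a single dimension, leaves the surrounding dimensions untouched, and delegates the data movement to `reshape`. A usage sketch, with the import path again assumed:

```ts
import { Tensor } from "catniff"; // assumed package entry point

const t = Tensor.rand([2, 3, 4, 5]);
console.log(t.flatten().shape);      // [120]       (default: collapse everything)
console.log(t.flatten(1, 2).shape);  // [2, 12, 5]  (3 * 4 merged into 12)
console.log(t.flatten(0, -2).shape); // [24, 5]     (negative endDim counts from the back)
```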
@@ -605,6 +639,25 @@ class Tensor {
         }
         return out;
     }
+    // Tensor chunk
+    chunk(chunks, dim = 0) {
+        // Handle negative indices
+        if (dim < 0) {
+            dim += this.shape.length;
+        }
+        const sliceOpt = new Array(this.shape.length);
+        for (let index = 0; index < sliceOpt.length; index++) {
+            sliceOpt[index] = [];
+        }
+        const dimSize = this.shape[dim];
+        const chunkDimSize = Math.ceil(dimSize / chunks);
+        const results = [];
+        for (let index = 0; index < dimSize; index += chunkDimSize) {
+            sliceOpt[dim] = [index, Math.min(index + chunkDimSize, dimSize)];
+            results.push(this.slice(sliceOpt));
+        }
+        return results;
+    }
     // Tensor squeeze
     squeeze(dims) {
         if (typeof this.value === "number")
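`chunk` splits a tensor into up to `chunks` pieces along `dim` by repeated slicing. Each piece spans `ceil(dimSize / chunks)` elements, so the last piece may be smaller when the dimension does not divide evenly. For example (same assumed import):

```ts
import { Tensor } from "catniff"; // assumed package entry point

const x = Tensor.rand([5, 4]);
const parts = x.chunk(3); // chunk size = ceil(5 / 3) = 2 along dim 0
console.log(parts.map((p) => p.shape)); // [[2, 4], [2, 4], [1, 4]]
```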
@@ -1114,7 +1167,7 @@ class Tensor {
     mish() {
         return this.elementWiseSelfDAG((a) => a * Math.tanh(Math.log1p(Math.exp(a))), (self, outGrad) => {
             const tanhSoftPlus = self.exp().add(1).log().tanh();
-            // tanh(softplus(x)) + x * (1 - tanh
+            // tanh(softplus(x)) + x * (1 - tanh^2(softplus(x))) * sigmoid(x)
             const derivative = tanhSoftPlus.add(self.mul(tanhSoftPlus.square().neg().add(1)).mul(self.sigmoid()));
             return outGrad.mul(derivative);
         });
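The completed comment now states the full derivative that the next line computes. With $\operatorname{softplus}(x) = \ln(1 + e^x)$, $\sigma$ the logistic sigmoid, and using $\operatorname{sech}^2 = 1 - \tanh^2$ and $\frac{d}{dx}\operatorname{softplus}(x) = \sigma(x)$, this is the standard mish derivative:

$$\frac{d}{dx}\,x\tanh(\operatorname{softplus}(x)) = \tanh(\operatorname{softplus}(x)) + x\bigl(1 - \tanh^2(\operatorname{softplus}(x))\bigr)\,\sigma(x)$$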
package/dist/optim.js
CHANGED
@@ -108,17 +108,17 @@ class Adam extends BaseOptimizer {
                velocityBuffer = core_1.Tensor.zerosLike(grad); // Initialize with zeros (same shape as grad)
                this.velocityBuffers.set(param, velocityBuffer);
            }
-           // Update biased first moment estimate: m_t =
+           // Update biased first moment estimate: m_t = beta1 * m_{t-1} + (1 - beta1) * g_t
            momentumBuffer = momentumBuffer.mul(beta1).add(grad.mul(1 - beta1));
            this.momentumBuffers.set(param, momentumBuffer);
-           // Update biased second moment estimate: v_t =
+           // Update biased second moment estimate: v_t = beta2 * v_{t-1} + (1 - beta2) * g_t^2
            velocityBuffer = velocityBuffer.mul(beta2).add(grad.pow(2).mul(1 - beta2));
            this.velocityBuffers.set(param, velocityBuffer);
-           // Compute bias-corrected first moment:
+           // Compute bias-corrected first moment: m_hat_t = m_t / (1 - beta1^t)
            const correctedMomentum = momentumBuffer.div(biasCorrection1);
-           // Compute bias-corrected second moment:
+           // Compute bias-corrected second moment: v_hat_t = v_t / (1 - beta2^t)
            const correctedVelocity = velocityBuffer.div(biasCorrection2);
-           // Update parameters:
+           // Update parameters: theta_t = theta_{t-1} - alpha * m_hat_t / (sqrt(v_hat_t) + epsilon)
            const denom = correctedVelocity.sqrt().add(this.eps);
            const stepSize = correctedMomentum.div(denom).mul(this.lr);
            const newParam = detachedParam.sub(stepSize);
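The filled-in comments spell out the Adam recurrences that the adjacent code implements, in the usual notation (here `biasCorrection1` and `biasCorrection2` correspond to $1-\beta_1^t$ and $1-\beta_2^t$):

$$m_t = \beta_1 m_{t-1} + (1-\beta_1)\,g_t \qquad v_t = \beta_2 v_{t-1} + (1-\beta_2)\,g_t^2$$

$$\hat m_t = \frac{m_t}{1-\beta_1^t} \qquad \hat v_t = \frac{v_t}{1-\beta_2^t} \qquad \theta_t = \theta_{t-1} - \alpha\,\frac{\hat m_t}{\sqrt{\hat v_t}+\epsilon}$$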
@@ -166,17 +166,17 @@ class AdamW extends BaseOptimizer {
                velocityBuffer = core_1.Tensor.zerosLike(grad); // Initialize with zeros (same shape as grad)
                this.velocityBuffers.set(param, velocityBuffer);
            }
-           // Update biased first moment estimate: m_t =
+           // Update biased first moment estimate: m_t = beta1 * m_{t-1} + (1 - beta1) * g_t
            momentumBuffer = momentumBuffer.mul(beta1).add(grad.mul(1 - beta1));
            this.momentumBuffers.set(param, momentumBuffer);
-           // Update biased second moment estimate: v_t =
+           // Update biased second moment estimate: v_t = beta2 * v_{t-1} + (1 - beta2) * g_t^2
            velocityBuffer = velocityBuffer.mul(beta2).add(grad.pow(2).mul(1 - beta2));
            this.velocityBuffers.set(param, velocityBuffer);
-           // Compute bias-corrected first moment:
+           // Compute bias-corrected first moment: m_hat_t = m_t / (1 - beta1^t)
            const correctedMomentum = momentumBuffer.div(biasCorrection1);
-           // Compute bias-corrected second moment:
+           // Compute bias-corrected second moment: v_hat_t = v_t / (1 - beta2^t)
            const correctedVelocity = velocityBuffer.div(biasCorrection2);
-           // Update parameters:
+           // Update parameters: theta_t = theta_{t-1} - alpha * m_hat_t / (sqrt(v_hat_t) + epsilon)
            const denom = correctedVelocity.sqrt().add(this.eps);
            const stepSize = correctedMomentum.div(denom).mul(this.lr);
            const newParam = detachedParam.sub(stepSize);
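The AdamW hunk receives the same comment completions; its moment and bias-correction steps are identical to Adam's. For context, what distinguishes AdamW is decoupled weight decay, applied directly to the parameter rather than folded into the gradient (Loshchilov & Hutter):

$$\theta_t = \theta_{t-1} - \alpha\left(\frac{\hat m_t}{\sqrt{\hat v_t}+\epsilon} + \lambda\,\theta_{t-1}\right)$$

The decay step itself falls outside the lines shown in this diff.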