catniff 0.2.5 → 0.2.7
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/core.d.ts +4 -0
- package/dist/core.js +146 -3
- package/package.json +1 -1
package/dist/core.d.ts CHANGED

@@ -39,6 +39,8 @@ export declare class Tensor {
     squeeze(dims?: number[] | number): Tensor;
     unsqueeze(dim: number): Tensor;
     sum(dims?: number[] | number, keepDims?: boolean): Tensor;
+    prod(dims?: number[] | number, keepDims?: boolean): Tensor;
+    mean(dims?: number[] | number, keepDims?: boolean): Tensor;
     add(other: TensorValue | Tensor): Tensor;
     sub(other: TensorValue | Tensor): Tensor;
     mul(other: TensorValue | Tensor): Tensor;

@@ -89,6 +91,8 @@ export declare class Tensor {
     mv(other: TensorValue | Tensor): Tensor;
     matmul(other: TensorValue | Tensor): Tensor;
     static fullLike(tensor: Tensor, num: number, options?: TensorOptions): Tensor;
+    static onesLike(tensor: Tensor, options?: TensorOptions): Tensor;
+    static zerosLike(tensor: Tensor, options?: TensorOptions): Tensor;
     backward(): void;
     val(): any;
     withGrad(requiresGrad: boolean): Tensor;
package/dist/core.js CHANGED

@@ -351,6 +351,7 @@ class Tensor {
             gradStrides = this.strides;
             gradValue = new Array(originalSize).fill(0);
         }
+        // Calculate new value after sum
         for (let index = 0; index < originalSize; index++) {
             const coords = Tensor.indexToCoords(index, this.shape, this.strides);
             // Force 0 on reduced axes to collapse into size-1 dims

@@ -362,7 +363,7 @@ class Tensor {
             outputValue[outFlatIndex] += this.value[realFlatIndex];
             // Mark for gradient if needed
             if (this.requiresGrad) {
-
+                gradValue[realFlatIndex] = 1;
             }
         }
         const out = new Tensor(outputValue, {
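
The changed line stores a local gradient of 1 for every element feeding a sum, so backward passes the upstream gradient straight through to each contributor. A sketch of the expected behavior, under the same assumptions as the example above:

    import { Tensor } from "catniff";

    const x = new Tensor([1, 2, 3]).withGrad(true);
    const s = x.sum();         // 6
    s.backward();
    console.log(x.grad.val()); // expected: [1, 1, 1]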
@@ -380,6 +381,136 @@ class Tensor {
         }
         return keepDims ? out : out.squeeze(dims);
     }
+    // Tensor product reduction
+    prod(dims, keepDims = false) {
+        if (typeof this.value === "number")
+            return new Tensor(this.value);
+        if (typeof dims === "number") {
+            dims = [dims];
+        }
+        if (typeof dims === "undefined") {
+            dims = Array.from({ length: this.shape.length }, (_, index) => index);
+        }
+        // Dims that are reduced now have size-1
+        const outputShape = this.shape.map((dim, i) => dims.includes(i) ? 1 : dim);
+        const outputStrides = Tensor.getStrides(outputShape);
+        const outputSize = Tensor.shapeToSize(outputShape);
+        const outputValue = new Array(outputSize).fill(1);
+        const originalSize = Tensor.shapeToSize(this.shape);
+        // Gradient data
+        let gradShape, gradStrides, gradValue = [];
+        // Allocate gradient data only when needed
+        if (this.requiresGrad) {
+            gradShape = this.shape;
+            gradStrides = this.strides;
+            gradValue = new Array(originalSize).fill(0);
+        }
+        // Calculate new value after multiplying
+        for (let index = 0; index < originalSize; index++) {
+            const coords = Tensor.indexToCoords(index, this.shape, this.strides);
+            // Force 0 on reduced axes to collapse into size-1 dims
+            const outCoords = coords.map((val, i) => dims.includes(i) ? 0 : val);
+            // Convert output coordinates to flat index
+            const outFlatIndex = Tensor.coordsToIndex(outCoords, outputStrides);
+            // Accumulate, outFlatIndex should match multiple realFlatIndexes
+            const realFlatIndex = Tensor.coordsToIndex(coords, this.strides);
+            outputValue[outFlatIndex] *= this.value[realFlatIndex];
+        }
+        const out = new Tensor(outputValue, {
+            shape: outputShape,
+            strides: outputStrides
+        });
+        // Set up gradient if needed
+        if (this.requiresGrad) {
+            // Grad is the product of the other elements on the same axis, i.e. the product of all elements divided by the current value
+            for (let index = 0; index < originalSize; index++) {
+                const coords = Tensor.indexToCoords(index, this.shape, this.strides);
+                // Force 0 on reduced axes to collapse into size-1 dims
+                const outCoords = coords.map((val, i) => dims.includes(i) ? 0 : val);
+                // Convert output coordinates to flat index
+                const outFlatIndex = Tensor.coordsToIndex(outCoords, outputStrides);
+                // Accumulate, outFlatIndex should match multiple realFlatIndexes
+                const realFlatIndex = Tensor.coordsToIndex(coords, this.strides);
+                // Calculate gradient at position
+                gradValue[realFlatIndex] = outputValue[outFlatIndex] / this.value[realFlatIndex];
+            }
+            out.requiresGrad = true;
+            out.children.push(this);
+            out.gradFn = () => {
+                const localGrad = new Tensor(gradValue, { shape: gradShape, strides: gradStrides });
+                Tensor.addGrad(this, out.grad.withGrad(false).mul(localGrad));
+            };
+        }
+        return keepDims ? out : out.squeeze(dims);
+    }
+    // Tensor mean reduction
+    mean(dims, keepDims = false) {
+        if (typeof this.value === "number")
+            return new Tensor(this.value);
+        if (typeof dims === "number") {
+            dims = [dims];
+        }
+        if (typeof dims === "undefined") {
+            dims = Array.from({ length: this.shape.length }, (_, index) => index);
+        }
+        // Dims that are reduced now have size-1
+        const outputShape = this.shape.map((dim, i) => dims.includes(i) ? 1 : dim);
+        const outputStrides = Tensor.getStrides(outputShape);
+        const outputSize = Tensor.shapeToSize(outputShape);
+        const outputValue = new Array(outputSize).fill(0);
+        const outputFeeders = new Array(outputSize).fill(0);
+        const originalSize = Tensor.shapeToSize(this.shape);
+        // Gradient data
+        let gradShape, gradStrides, gradValue = [];
+        // Allocate gradient data only when needed
+        if (this.requiresGrad) {
+            gradShape = this.shape;
+            gradStrides = this.strides;
+            gradValue = new Array(originalSize).fill(0);
+        }
+        // Calculate sums and how many elements contribute to specific positions
+        for (let index = 0; index < originalSize; index++) {
+            const coords = Tensor.indexToCoords(index, this.shape, this.strides);
+            // Force 0 on reduced axes to collapse into size-1 dims
+            const outCoords = coords.map((val, i) => dims.includes(i) ? 0 : val);
+            // Convert output coordinates to flat index
+            const outFlatIndex = Tensor.coordsToIndex(outCoords, outputStrides);
+            // Accumulate, outFlatIndex should match multiple realFlatIndexes
+            const realFlatIndex = Tensor.coordsToIndex(coords, this.strides);
+            outputValue[outFlatIndex] += this.value[realFlatIndex];
+            outputFeeders[outFlatIndex]++;
+        }
+        // Calculate mean by dividing sum by the number of contributors to the position
+        for (let index = 0; index < outputSize; index++) {
+            outputValue[index] /= outputFeeders[index];
+        }
+        const out = new Tensor(outputValue, {
+            shape: outputShape,
+            strides: outputStrides
+        });
+        // Set up gradient if needed
+        if (this.requiresGrad) {
+            // Calculate grad by assigning 1 divided by the number of contributors to the position
+            for (let index = 0; index < originalSize; index++) {
+                const coords = Tensor.indexToCoords(index, this.shape, this.strides);
+                // Force 0 on reduced axes to collapse into size-1 dims
+                const outCoords = coords.map((val, i) => dims.includes(i) ? 0 : val);
+                // Convert output coordinates to flat index
+                const outFlatIndex = Tensor.coordsToIndex(outCoords, outputStrides);
+                // Accumulate, outFlatIndex should match multiple realFlatIndexes
+                const realFlatIndex = Tensor.coordsToIndex(coords, this.strides);
+                // Mean = 1/n * (el1 + el2 + ... + eln), so grad = 1/n
+                gradValue[realFlatIndex] = 1 / outputFeeders[outFlatIndex];
+            }
+            out.requiresGrad = true;
+            out.children.push(this);
+            out.gradFn = () => {
+                const localGrad = new Tensor(gradValue, { shape: gradShape, strides: gradStrides });
+                Tensor.addGrad(this, out.grad.withGrad(false).mul(localGrad));
+            };
+        }
+        return keepDims ? out : out.squeeze(dims);
+    }
     // Tensor element-wise addition
     add(other) {
         return this.elementWiseABDAG(other, (a, b) => a + b, (self, other, outGrad) => outGrad, (self, other, outGrad) => outGrad);
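
prod's gradient follows the comment in the hunk: each element's partial derivative is the product of its axis siblings, computed as the total product divided by the element (note that this division produces NaN when an element is 0). A worked sketch, same assumptions as the earlier examples:

    import { Tensor } from "catniff";

    const x = new Tensor([2, 3, 4]).withGrad(true);
    x.prod().backward();       // product: 24
    console.log(x.grad.val()); // expected: [12, 8, 6], i.e. 24/2, 24/3, 24/4

Continuing the same snippet: mean divides each position's sum by its outputFeeders count, so every contributor's local gradient is the constant 1/n.

    const m = new Tensor([2, 4, 6]).withGrad(true);
    m.mean().backward();       // mean: 4
    console.log(m.grad.val()); // expected: [1/3, 1/3, 1/3]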
@@ -741,6 +872,18 @@ class Tensor {
             return new Tensor(num, options);
         return new Tensor(new Array(tensor.value.length).fill(num), { shape: tensor.shape, strides: tensor.strides, ...options });
     }
+    // Utility to create a new tensor with shape of another tensor, filled with 1
+    static onesLike(tensor, options = {}) {
+        if (typeof tensor.value === "number")
+            return new Tensor(1, options);
+        return new Tensor(new Array(tensor.value.length).fill(1), { shape: tensor.shape, strides: tensor.strides, ...options });
+    }
+    // Utility to create a new tensor with shape of another tensor, filled with 0
+    static zerosLike(tensor, options = {}) {
+        if (typeof tensor.value === "number")
+            return new Tensor(0, options);
+        return new Tensor(new Array(tensor.value.length).fill(0), { shape: tensor.shape, strides: tensor.strides, ...options });
+    }
     // Reverse-mode autodiff call
     backward() {
         // Build topological order
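
Both helpers are thin specializations of the existing fullLike, so, per the code above, these pairs should be interchangeable:

    import { Tensor } from "catniff";

    const t = new Tensor([[1, 2], [3, 4]]);
    Tensor.onesLike(t);  // equivalent to Tensor.fullLike(t, 1)
    Tensor.zerosLike(t); // equivalent to Tensor.fullLike(t, 0)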
@@ -749,7 +892,7 @@ class Tensor {
         function build(node) {
             if (!visited.has(node) && node.requiresGrad) {
                 visited.add(node);
-                node.grad = Tensor.
+                node.grad = Tensor.zerosLike(node); // Reset grad with 0
                 for (let child of node.children)
                     build(child);
                 topo.push(node);
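
Because every reachable node's gradient is now reset with zerosLike during the topological build, gradients no longer carry over between separate backward() calls. A sketch of the consequence, same assumptions:

    import { Tensor } from "catniff";

    const x = new Tensor([1, 2]).withGrad(true);
    x.sum().backward();
    x.sum().backward();
    console.log(x.grad.val()); // expected: [1, 1], not [2, 2] (grads are reset, not accumulated)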
@@ -757,7 +900,7 @@ class Tensor {
         }
         build(this);
         // Feed backward to calculate gradient
-        this.grad = Tensor.
+        this.grad = Tensor.onesLike(this);
         for (let index = topo.length - 1; index > -1; index--) {
             topo[index].gradFn();
         }
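
Taken together, backward() seeds the root gradient with onesLike and then runs each node's gradFn in reverse topological order. An end-to-end sketch; the expected output assumes mul follows the usual product rule, which this diff only shows for add:

    import { Tensor } from "catniff";

    const x = new Tensor([1, 2, 3]).withGrad(true);
    const y = x.mul(2).sum();
    y.backward();              // y.grad seeded with onesLike(y); x.grad reset with zerosLike(x)
    console.log(x.grad.val()); // expected: [2, 2, 2]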