npm - @jax-js/jax - Versions diffs - 0.0.3 → 0.0.4 - Mend

@jax-js/jax 0.0.3 → 0.0.4

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (10)

package/README.md +50 -19
package/dist/{backend-BqDtPGaR.js → backend-EBRGmEYw.js} +296 -153
package/dist/{backend-D2C4MJRP.cjs → backend-Ss1Mev_-.cjs} +315 -154
package/dist/index.cjs +681 -157
package/dist/index.d.cts +422 -76
package/dist/index.d.ts +422 -76
package/dist/index.js +677 -157
package/dist/{webgpu-fqhx41TC.cjs → webgpu-BVdMaO9T.cjs} +9 -3
package/dist/{webgpu-CNg9JGva.js → webgpu-ow0Pn_6q.js} +9 -3
package/package.json +15 -4

package/dist/index.js CHANGED Viewed

@@ -1,5 +1,5 @@
 import { __export } from "./chunk-Cl8Af3a2.js";
-import { AluExp, AluGroup, AluOp, AluVar, DEBUG, DType, FpHash, Kernel, PPrint, Reduction, ShapeTracker, accessorAluExp, accessorGlobal, byteWidth, checkAxis, deepEqual, devices, dtypedArray, dtypedJsArray, getBackend, init, invertPermutation, isFloatDtype, isNumberPair, isPermutation, partitionList, prod, range, recursiveFlatten, rep, runWithCache, setDevice, toposort, unravelAlu, unzip2, zip, zipn } from "./backend-BqDtPGaR.js";
+import { AluExp, AluGroup, AluOp, AluVar, DEBUG, DType, FpHash, Kernel, PPrint, Reduction, ShapeTracker, accessorAluExp, accessorGlobal, byteWidth, checkAxis, deepEqual, defaultDevice, devices, dtypedArray, dtypedJsArray, getBackend, init, invertPermutation, isFloatDtype, isNumberPair, isPermutation, normalizeAxis, partitionList, prod, promoteTypes, range, recursiveFlatten, rep, runWithCache, setDebug, toposort, unravelAlu, unzip2, zip, zipn } from "./backend-EBRGmEYw.js";
 //#region src/tree.ts
 var tree_exports = {};
@@ -323,6 +323,8 @@ let Primitive = /* @__PURE__ */ function(Primitive$1) {
 	Primitive$1["RandomBits"] = "random_bits";
 	Primitive$1["Sin"] = "sin";
 	Primitive$1["Cos"] = "cos";
+	Primitive$1["Asin"] = "asin";
+	Primitive$1["Atan"] = "atan";
 	Primitive$1["Exp"] = "exp";
 	Primitive$1["Log"] = "log";
 	Primitive$1["Sqrt"] = "sqrt";
@@ -390,6 +392,12 @@ function sin$1(x) {
 function cos$1(x) {
 	return bind1(Primitive.Cos, [x]);
 }
+function asin$1(x) {
+	return bind1(Primitive.Asin, [x]);
+}
+function atan$1(x) {
+	return bind1(Primitive.Atan, [x]);
+}
 function exp$1(x) {
 	return bind1(Primitive.Exp, [x]);
 }
@@ -405,18 +413,16 @@ function min$1(x, y) {
 function max$1(x, y) {
 	return bind1(Primitive.Max, [x, y]);
 }
-function reduce(x, op, axis, opts) {
+function reduce(x, op, axis = null, opts) {
 	if (!AluGroup.Reduce.has(op)) throw new TypeError(`Invalid reduce operation: ${op}`);
-	if (axis === void 0) if (x instanceof Tracer) axis = range(x.shape.length);
-	else axis = [];
-	else if (typeof axis === "number") axis = [checkAxis(axis, ndim$1(x))];
-	else axis = axis.map((a) => checkAxis(a, ndim$1(x)));
+	axis = normalizeAxis(axis, ndim$1(x));
 	const originalShape = getShape(x);
-	const result = bind1(Primitive.Reduce, [x], {
+	let result = bind1(Primitive.Reduce, [x], {
 		op,
 		axis
 	});
-	return opts?.keepDims ? broadcast(result, originalShape, axis) : result;
+	if (opts?.keepdims) result = result.reshape(originalShape.map((dim, i) => axis.includes(i) ? 1 : dim));
+	return result;
 }
 function dot$1(x, y) {
 	return bind1(Primitive.Dot, [x, y]);
@@ -462,10 +468,11 @@ function where$1(cond, x, y) {
 }
 function transpose$1(x, perm) {
 	perm = perm ? perm.map((a) => checkAxis(a, ndim$1(x))) : range(ndim$1(x)).reverse();
+	if (!isPermutation(perm, ndim$1(x))) throw new Error(`Invalid transpose permutation for ${ndim$1(x)} axes: ${JSON.stringify(perm)}`);
 	return bind1(Primitive.Transpose, [x], { perm });
 }
 function broadcast(x, shape$1, axis) {
-	axis = axis.map((a) => checkAxis(a, shape$1.length));
+	axis = normalizeAxis(axis, shape$1.length);
 	return bind1(Primitive.Broadcast, [x], {
 		shape: shape$1,
 		axis
@@ -484,7 +491,7 @@ function reshape$1(x, shape$1) {
 	return bind1(Primitive.Reshape, [x], { shape: shape$1 });
 }
 function flip$1(x, axis) {
-	axis = axis.map((a) => checkAxis(a, ndim$1(x)));
+	axis = normalizeAxis(axis, ndim$1(x));
 	return bind1(Primitive.Flip, [x], { axis });
 }
 function shrink(x, slice) {
@@ -564,15 +571,19 @@ var Tracer = class Tracer {
 	constructor(trace) {
 		this._trace = trace;
 	}
+	/** The shape of the array. */
 	get shape() {
 		return this.aval.shape;
 	}
+	/** The total number of elements in the array. */
 	get size() {
 		return prod(this.shape);
 	}
+	/** The dtype of the array. */
 	get dtype() {
 		return this.aval.dtype;
 	}
+	/** The number of dimensions of the array. */
 	get ndim() {
 		return this.shape.length;
 	}
@@ -608,22 +619,20 @@ var Tracer = class Tracer {
 		return lessEqual$1(this, other);
 	}
 	/** Sum of the elements of the array over a given axis, or axes. */
-	sum(axis, opts) {
+	sum(axis = null, opts) {
 		return reduce(this, AluOp.Add, axis, opts);
 	}
 	/** Product of the array elements over a given axis. */
-	prod(axis, opts) {
+	prod(axis = null, opts) {
 		return reduce(this, AluOp.Mul, axis, opts);
 	}
 	/** Compute the average of the array elements along the specified axis. */
-	mean(axis, opts) {
-		if (axis === void 0) axis = range(this.ndim);
-		else if (typeof axis === "number") axis = [checkAxis(axis, this.ndim)];
-		else axis = axis.map((a) => checkAxis(a, this.ndim));
-		let result = reduce(this, AluOp.Add, axis);
-		result = result.mul(result.size / this.size);
-		if (opts?.keepDims) result = broadcast(result, this.shape, axis);
-		return result;
+	mean(axis = null, opts) {
+		axis = normalizeAxis(axis, this.ndim);
+		const n = axis.reduce((acc, a) => acc * this.shape[a], 1);
+		if (n === 0) throw new Error("mean: cannot compute mean over zero-length axis");
+		const result = reduce(this, AluOp.Add, axis, opts);
+		return result.mul(1 / n);
 	}
 	/** Permute the dimensions of an array. Defaults to reversing the axis order. */
 	transpose(perm) {
@@ -1156,6 +1165,8 @@ const jitRules = {
 	},
 	[Primitive.Sin]: unopJit(AluExp.sin),
 	[Primitive.Cos]: unopJit(AluExp.cos),
+	[Primitive.Asin]: unopJit(AluExp.asin),
+	[Primitive.Atan]: unopJit(AluExp.atan),
 	[Primitive.Exp]: unopJit(AluExp.exp),
 	[Primitive.Log]: unopJit(AluExp.log),
 	[Primitive.Sqrt]: unopJit(AluExp.sqrt),
@@ -1397,7 +1408,7 @@ var Array$1 = class Array$1 extends Tracer {
 	* is a backend `Slot`, this constructor _takes ownership_ of the slot. It
 	* will be freed when the array is disposed.
 	*/
-	constructor(source, st, dtype, backend, pending = null) {
+	constructor(source, st, dtype, backend, { pending = null } = {}) {
 		super(baseArrayTrace);
 		this.id = Array$1.#nextId++;
 		this.#dtype = dtype;
@@ -1406,6 +1417,8 @@ var Array$1 = class Array$1 extends Tracer {
 		this.#backend = backend;
 		this.#rc = 1;
 		this.#pendingSet = new Set(pending);
+		if (this.#pendingSet.size === 0) this.#pendingSet = null;
+		else if (source instanceof AluExp) throw new Error("internal: AluExp source cannot have pending executes");
 	}
 	/** @ignore */
 	get aval() {
@@ -1460,7 +1473,7 @@ var Array$1 = class Array$1 extends Tracer {
 		const pending = this.#pending;
 		for (const exe of pending) exe.updateRc(1);
 		if (typeof this.#source === "number") this.#backend.incRef(this.#source);
-		const ar = new Array$1(this.#source, st, this.#dtype, this.#backend, pending);
+		const ar = new Array$1(this.#source, st, this.#dtype, this.#backend, { pending });
 		this.dispose();
 		return ar;
 	}
@@ -1509,7 +1522,7 @@ var Array$1 = class Array$1 extends Tracer {
 		pending.push(new PendingExecute(this.#backend, kernel, inputs, [output]));
 		this.dispose();
 		for (const ar of indices) ar.dispose();
-		return new Array$1(output, ShapeTracker.fromShape(finalShape), this.#dtype, this.#backend, pending);
+		return new Array$1(output, ShapeTracker.fromShape(finalShape), this.#dtype, this.#backend, { pending });
 	}
 	/** Move axes to the rightmost dimension of the shape. */
 	#moveAxesDown(axis) {
@@ -1546,7 +1559,7 @@ var Array$1 = class Array$1 extends Tracer {
 		for (const exe of pending) exe.updateRc(1);
 		pending.push(new PendingExecute(this.#backend, kernel, [this.#source], [output]));
 		this.dispose();
-		return new Array$1(output, ShapeTracker.fromShape(this.shape), dtypeOutput, this.#backend, pending);
+		return new Array$1(output, ShapeTracker.fromShape(this.shape), dtypeOutput, this.#backend, { pending });
 	}
 	#binary(op, other) {
 		const custom = (src) => new AluExp(op, this.#dtype, src);
@@ -1611,7 +1624,7 @@ var Array$1 = class Array$1 extends Tracer {
 		for (const exe of pending) exe.updateRc(1);
 		pending.add(new PendingExecute(backend, kernel, inputs, [output]));
 		for (const ar of arrays) ar.dispose();
-		return new Array$1(output, ShapeTracker.fromShape(newShape), dtypeOutput, backend, pending);
+		return new Array$1(output, ShapeTracker.fromShape(newShape), dtypeOutput, backend, { pending });
 	}
 	/** Reduce the last dimension of the array by an operation. */
 	#reduce(op) {
@@ -1635,7 +1648,7 @@ var Array$1 = class Array$1 extends Tracer {
 		for (const exe of pending) exe.updateRc(1);
 		pending.push(new PendingExecute(this.#backend, kernel, inputs, [output]));
 		this.dispose();
-		return new Array$1(output, ShapeTracker.fromShape(newShape), this.#dtype, this.#backend, pending);
+		return new Array$1(output, ShapeTracker.fromShape(newShape), this.#dtype, this.#backend, { pending });
 	}
 	/**
 	* Normalizes this array into one backed by a `Slot`.
@@ -1708,8 +1721,11 @@ var Array$1 = class Array$1 extends Tracer {
 	*
 	* If you are mapping from `data()` or `dataSync()`, it will also trigger
 	* dispatch of operations as well.
+	*
+	* **Note:** `jax.blockUntilReady()` is a higher-level API, it calls this
+	* asynchronously for multiple arrays.
 	*/
-	async wait() {
+	async blockUntilReady() {
 		this.#check();
 		if (this.#source instanceof AluExp) return this;
 		const pending = this.#pending;
@@ -1775,7 +1791,7 @@ var Array$1 = class Array$1 extends Tracer {
 				return [x.#binary(AluOp.Idiv, y)];
 			},
 			[Primitive.Neg]([x]) {
-				return [zerosLike(x.ref).#binary(AluOp.Sub, x)];
+				return [zerosLike$1(x.ref).#binary(AluOp.Sub, x)];
 			},
 			[Primitive.Reciprocal]([x]) {
 				return [x.#unary(AluOp.Reciprocal)];
@@ -1795,7 +1811,7 @@ var Array$1 = class Array$1 extends Tracer {
 					x.#backend.incRef(x.#source);
 					const pending = x.#pending;
 					for (const exe of pending) exe.updateRc(1);
-					const y = new Array$1(x.#source, x.#st, dtype, x.#backend, pending);
+					const y = new Array$1(x.#source, x.#st, dtype, x.#backend, { pending });
 					x.dispose();
 					return [y];
 				}
@@ -1825,6 +1841,12 @@ var Array$1 = class Array$1 extends Tracer {
 			[Primitive.Cos]([x]) {
 				return [x.#unary(AluOp.Cos)];
 			},
+			[Primitive.Asin]([x]) {
+				return [x.#unary(AluOp.Asin)];
+			},
+			[Primitive.Atan]([x]) {
+				return [x.#unary(AluOp.Atan)];
+			},
 			[Primitive.Exp]([x]) {
 				return [x.#unary(AluOp.Exp)];
 			},
@@ -1910,7 +1932,7 @@ var Array$1 = class Array$1 extends Tracer {
 				pending.splice(0, 0, ...prevPending);
 				args.forEach((x) => x.dispose());
 				return outputs.map((source, i) => {
-					return new Array$1(source, ShapeTracker.fromShape(jaxpr.outs[i].aval.shape), jaxpr.outs[i].aval.dtype, backend, pending);
+					return new Array$1(source, ShapeTracker.fromShape(jaxpr.outs[i].aval.shape), jaxpr.outs[i].aval.dtype, backend, { pending });
 				});
 			}
 		};
@@ -2042,12 +2064,12 @@ var EvalTrace = class extends Trace {
 };
 const baseArrayTrace = new EvalTrace(newMain(EvalTrace, null));
 const implRules = Array$1._implRules();
-function zerosLike(val, dtype) {
+function zerosLike$1(val, dtype) {
 	const aval = getAval(val);
 	if (val instanceof Tracer) val.dispose();
 	return zeros(aval.shape, { dtype: dtype ?? aval.dtype });
 }
-function onesLike(val, dtype) {
+function onesLike$1(val, dtype) {
 	const aval = getAval(val);
 	if (val instanceof Tracer) val.dispose();
 	return ones(aval.shape, { dtype: dtype ?? aval.dtype });
@@ -2110,7 +2132,7 @@ function eye(numRows, numCols, { dtype, device } = {}) {
 	const exp$2 = AluExp.cmplt(AluExp.mod(AluVar.idx, AluExp.i32(numCols + 1)), AluExp.i32(1));
 	return new Array$1(AluExp.cast(dtype, exp$2), ShapeTracker.fromShape([numRows, numCols]), dtype, getBackend(device));
 }
-/** Return the identity array, with ones on the main diagonal. */
+/** Return the identity matrix, with ones on the main diagonal. */
 function identity$1(n, { dtype, device } = {}) {
 	return eye(n, n, {
 		dtype,
@@ -2386,16 +2408,19 @@ var Jaxpr = class Jaxpr {
 			varIds.set(v, FpHash.hash(id, v.aval.dtype, ...v.aval.shape));
 			return id;
 		};
-		hasher.update(this.inBinders.length, ...this.inBinders.map(vi));
-		hasher.update(this.eqns.length, ...this.eqns.flatMap((eqn) => [
-			eqn.primitive,
-			eqn.inputs.length,
-			...eqn.inputs.map((x) => x instanceof Var ? vi(x) : x.value),
-			JSON.stringify(eqn.params),
-			eqn.outBinders.length,
-			...eqn.outBinders.map(vi)
-		]));
-		hasher.update(this.outs.length, ...this.outs.map((x) => x instanceof Var ? vi(x) : x.value));
+		hasher.update(this.inBinders.length);
+		for (const x of this.inBinders) hasher.update(vi(x));
+		hasher.update(this.eqns.length);
+		for (const eqn of this.eqns) {
+			hasher.update(eqn.primitive);
+			hasher.update(eqn.inputs.length);
+			for (const x of eqn.inputs) hasher.update(x instanceof Var ? vi(x) : x.value);
+			hasher.update(JSON.stringify(eqn.params));
+			hasher.update(eqn.outBinders.length);
+			for (const x of eqn.outBinders) hasher.update(vi(x));
+		}
+		hasher.update(this.outs.length);
+		for (const x of this.outs) hasher.update(x instanceof Var ? vi(x) : x.value);
 		return this.#hash = hasher.value;
 	}
 	hash(state) {
@@ -2432,7 +2457,7 @@ var Jaxpr = class Jaxpr {
 				const c = eqn.outBinders[0];
 				if (atomIsLit(b, 1)) context.set(c, a);
 				else newEqns.push(eqn);
-			} else if ((eqn.primitive === Primitive.Broadcast || eqn.primitive === Primitive.Reshape) && deepEqual(eqn.params.shape, eqn.inputs[0].aval.shape)) context.set(eqn.outBinders[0], eqn.inputs[0]);
+			} else if ((eqn.primitive === Primitive.Broadcast || eqn.primitive === Primitive.Reshape) && deepEqual(eqn.params.shape, eqn.inputs[0].aval.shape) || eqn.primitive === Primitive.Transpose && eqn.params.perm.every((p, i) => p === i) || eqn.primitive === Primitive.Flip && eqn.params.axis.length === 0 || eqn.primitive === Primitive.Shrink && eqn.params.slice.every(([s, e$2], i) => s === 0 && e$2 === eqn.inputs[0].aval.shape[i]) || eqn.primitive === Primitive.Pad && eqn.params.width.every(([w0, w1]) => w0 === 0 && w1 === 0)) context.set(eqn.outBinders[0], eqn.inputs[0]);
 			else newEqns.push(eqn);
 		}
 		const outs = this.outs.map((x) => x instanceof Var ? context.get(x) ?? x : x);
@@ -2698,6 +2723,8 @@ const abstractEvalRules = {
 	},
 	[Primitive.Sin]: vectorizedUnopAbstractEval,
 	[Primitive.Cos]: vectorizedUnopAbstractEval,
+	[Primitive.Asin]: vectorizedUnopAbstractEval,
+	[Primitive.Atan]: vectorizedUnopAbstractEval,
 	[Primitive.Exp]: vectorizedUnopAbstractEval,
 	[Primitive.Log]: vectorizedUnopAbstractEval,
 	[Primitive.Sqrt]: vectorizedUnopAbstractEval,
@@ -2825,7 +2852,7 @@ function makeJaxpr$1(f, opts) {
 function jit$1(f, opts) {
 	const cache = /* @__PURE__ */ new Map();
 	const staticArgnums = new Set(opts?.staticArgnums ?? []);
-	return ((...args) => {
+	const result = ((...args) => {
 		const [staticArgs, dynamicArgs] = splitIdx(args, staticArgnums);
 		const [argsFlat, inTree] = flatten(dynamicArgs);
 		const avalsInFlat = argsFlat.map((x) => ShapedArray.fromAval(getAval(x)));
@@ -2839,6 +2866,10 @@ function jit$1(f, opts) {
 		});
 		return unflatten(outTree, outs);
 	});
+	result.dispose = () => {
+		for (const { consts } of cache.values()) for (const c of consts) c.dispose();
+	};
+	return result;
 }
 //#endregion
@@ -2869,7 +2900,7 @@ var JVPTrace = class extends Trace {
 		return this.lift(pureArray(val));
 	}
 	lift(val) {
-		return new JVPTracer(this, val, zerosLike(val.ref));
+		return new JVPTracer(this, val, zerosLike$1(val.ref));
 	}
 	processPrimitive(primitive, tracers, params) {
 		const [primalsIn, tangentsIn] = unzip2(tracers.map((x) => [x.primal, x.tangent]));
@@ -2900,7 +2931,7 @@ function zeroTangentsJvp(primitive) {
 	return (primals, tangents, params) => {
 		for (const t of tangents) t.dispose();
 		const ys = bind(primitive, primals, params);
-		return [ys, ys.map((y) => zerosLike(y.ref))];
+		return [ys, ys.map((y) => zerosLike$1(y.ref))];
 	};
 }
 const jvpRules = {
@@ -2918,13 +2949,13 @@ const jvpRules = {
 		if (isFloatDtype(dtype) && isFloatDtype(x.dtype)) return [[cast(x, dtype)], [cast(dx, dtype)]];
 		else {
 			dx.dispose();
-			return [[cast(x.ref, dtype)], [zerosLike(x)]];
+			return [[cast(x.ref, dtype)], [zerosLike$1(x)]];
 		}
 	},
 	[Primitive.Bitcast]([x], [dx], { dtype }) {
 		if (x.dtype === dtype) return [[x], [dx]];
 		dx.dispose();
-		return [[bitcast(x.ref, dtype)], [zerosLike(x)]];
+		return [[bitcast(x.ref, dtype)], [zerosLike$1(x)]];
 	},
 	[Primitive.RandomBits]: zeroTangentsJvp(Primitive.RandomBits),
 	[Primitive.Sin]([x], [dx]) {
@@ -2933,6 +2964,14 @@ const jvpRules = {
 	[Primitive.Cos]([x], [dx]) {
 		return [[cos$1(x.ref)], [neg(sin$1(x)).mul(dx)]];
 	},
+	[Primitive.Asin]([x], [dx]) {
+		const denom = sqrt$1(reciprocal$1(cast(1, x.dtype).sub(x.ref.mul(x.ref))));
+		return [[asin$1(x)], [denom.mul(dx)]];
+	},
+	[Primitive.Atan]([x], [dx]) {
+		const denom = cast(1, x.dtype).add(x.ref.mul(x.ref));
+		return [[atan$1(x)], [dx.div(denom)]];
+	},
 	[Primitive.Exp]([x], [dx]) {
 		const z = exp$1(x);
 		return [[z.ref], [z.mul(dx)]];
@@ -3048,7 +3087,10 @@ function mappedAval(batchDim, aval) {
 /** Move one axis to a different index. */
 function moveaxis$1(x, src, dst) {
 	const t = pureArray(x);
-	const perm = range(t.shape.length);
+	src = checkAxis(src, t.ndim);
+	dst = checkAxis(dst, t.ndim);
+	if (src === dst) return t;
+	const perm = range(t.ndim);
 	perm.splice(src, 1);
 	perm.splice(dst, 0, src);
 	return transpose$1(t, perm);
@@ -3141,6 +3183,8 @@ const vmapRules = {
 	[Primitive.Bitcast]: unopBatcher((x, { dtype }) => bitcast(x, dtype)),
 	[Primitive.Sin]: unopBatcher(sin$1),
 	[Primitive.Cos]: unopBatcher(cos$1),
+	[Primitive.Asin]: unopBatcher(asin$1),
+	[Primitive.Atan]: unopBatcher(atan$1),
 	[Primitive.Exp]: unopBatcher(exp$1),
 	[Primitive.Log]: unopBatcher(log$1),
 	[Primitive.Sqrt]: unopBatcher(sqrt$1),
@@ -3326,20 +3370,28 @@ function linearizeFlatUtil(f, primalsIn) {
 function linearizeFlat(f, primalsIn) {
 	const { primalsOut, jaxpr, consts } = linearizeFlatUtil(f, primalsIn);
 	const fLin = (...tangents) => evalJaxpr(jaxpr, [...consts.map((c) => c.ref), ...tangents]);
-	return [primalsOut, fLin];
+	const dispose$1 = () => {
+		for (const c of consts) c.dispose();
+	};
+	return [
+		primalsOut,
+		fLin,
+		dispose$1
+	];
 }
 function linearize$1(f, ...primalsIn) {
 	const [primalsInFlat, inTree] = flatten(primalsIn);
 	const [fFlat, outTree] = flattenFun(f, inTree);
-	const [primalsOutFlat, fLinFlat] = linearizeFlat(fFlat, primalsInFlat.map(pureArray));
+	const [primalsOutFlat, fLinFlat, dispose$1] = linearizeFlat(fFlat, primalsInFlat.map(pureArray));
 	if (outTree.value === void 0) throw new Error("outTree was not set in linearize");
 	const primalsOut = unflatten(outTree.value, primalsOutFlat);
-	const fLin = (...tangentsIn) => {
+	const fLin = ((...tangentsIn) => {
 		const [tangentsInFlat, inTree2] = flatten(tangentsIn);
 		if (!inTree.equals(inTree2)) throw new TreeMismatchError("linearize", inTree, inTree2);
 		const tangentsOutFlat = fLinFlat(...tangentsInFlat.map(pureArray));
 		return unflatten(outTree.value, tangentsOutFlat);
-	};
+	});
+	fLin.dispose = dispose$1;
 	return [primalsOut, fLin];
 }
 var PartialEvalTracer = class extends Tracer {
@@ -3455,7 +3507,10 @@ var PartialEvalTrace = class extends Trace {
 			avalsOut: jaxpr2.outs.map((x) => x.aval),
 			tracerRefsOut: []
 		};
-		const outs2 = jaxpr2.outs.map((x) => new PartialEvalTracer(this, PartialVal.unknown(x.aval), recipe));
+		const outs2 = jaxpr2.outs.map((x, i$1) => {
+			if (i$1 > 0) recipe.tracersIn.forEach((t) => t.ref);
+			return new PartialEvalTracer(this, PartialVal.unknown(x.aval), recipe);
+		});
 		recipe.tracerRefsOut = outs2.map((t) => new WeakRef(t));
 		let i = 0;
 		let j = 0;
@@ -3539,13 +3594,15 @@ function partialEvalGraphToJaxpr(tracersIn, tracersOut) {
 	const [consts, constvars] = unzip2(constToVar.entries());
 	const inBinders = [...constvars, ...tracersIn.map((t) => tracerToVar.get(t))];
 	const outVars = tracersOut.map((t) => tracerToVar.get(t));
-	const jaxpr = new Jaxpr(inBinders, eqns, outVars);
+	let jaxpr = new Jaxpr(inBinders, eqns, outVars);
 	typecheckJaxpr(jaxpr);
 	for (const t of consts) t.ref;
 	for (const t of tracersIn) t.dispose();
 	for (const t of tracersOut) t.dispose();
+	jaxpr = jaxpr.simplify();
+	if (DEBUG >= 5) console.log("jaxpr from partial evaluation:\n" + jaxpr.toString());
 	return {
-		jaxpr: jaxpr.simplify(),
+		jaxpr,
 		consts
 	};
 }
@@ -3811,20 +3868,28 @@ function vjpFlat(f, primalsIn) {
 		const transposeInputs = [...consts.map((c) => c.ref), ...primalsIn.map((t) => new UndefPrimal(t.aval))];
 		return evalJaxprTransposed(jaxpr, transposeInputs, cotangents);
 	};
-	return [primalsOut, fVjp];
+	const dispose$1 = () => {
+		for (const c of consts) c.dispose();
+	};
+	return [
+		primalsOut,
+		fVjp,
+		dispose$1
+	];
 }
 function vjp$1(f, ...primalsIn) {
 	const [primalsInFlat, inTree] = flatten(primalsIn);
 	const [fFlat, outTree] = flattenFun(f, inTree);
-	const [primalsOutFlat, fVjpFlat] = vjpFlat(fFlat, primalsInFlat.map(pureArray));
+	const [primalsOutFlat, fVjpFlat, dispose$1] = vjpFlat(fFlat, primalsInFlat.map(pureArray));
 	if (outTree.value === void 0) throw new Error("outTree was not set in vjp");
 	const primalsOut = unflatten(outTree.value, primalsOutFlat);
-	const fVjp = (cotangentsOut) => {
+	const fVjp = ((cotangentsOut) => {
 		const [cotangentsOutFlat, outTree2] = flatten(cotangentsOut);
 		if (!outTree.value.equals(outTree2)) throw new TreeMismatchError("vjp", outTree.value, outTree2);
 		const cotangentsInFlat = fVjpFlat(...cotangentsOutFlat.map(pureArray));
 		return unflatten(inTree, cotangentsInFlat);
-	};
+	});
+	fVjp.dispose = dispose$1;
 	return [primalsOut, fVjp];
 }
 function grad$1(f) {
@@ -3842,7 +3907,8 @@ function valueAndGrad$1(f) {
 		if (!(y instanceof Tracer) || ndim$1(y) !== 0) throw new TypeError("grad requires a scalar output");
 		if (!isFloatDtype(y.dtype)) throw new TypeError("grad only supports floating-point dtypes");
 		const [ct, ...rest] = fVjp(scalar(1, { dtype: y.dtype }));
-		for (const r of rest) r.dispose();
+		for (const r of rest) dispose(r);
+		fVjp.dispose();
 		return [y, ct];
 	};
 }
@@ -3850,7 +3916,13 @@ function jacrev$1(f) {
 	return function jacobianReverse(x) {
 		if (x.shape.length !== 1) throw new TypeError("jacrev only supports 1D inputs");
 		const [size$1] = x.shape;
-		const pullback = (ct) => vjp$1(f, x)[1](ct)[0];
+		const pullback = (ct) => {
+			const [y, fVjp] = vjp$1(f, x);
+			y.dispose();
+			const [ret] = fVjp(ct);
+			fVjp.dispose();
+			return ret;
+		};
 		return vmap$1(pullback, [1])(eye(size$1, void 0, { dtype: x.dtype }));
 	};
 }
@@ -3930,19 +4002,38 @@ __export(numpy_exports, {
 	DType: () => DType,
 	abs: () => abs,
 	absolute: () => absolute,
+	acos: () => acos,
+	acosh: () => acosh,
 	add: () => add,
 	allclose: () => allclose,
 	arange: () => arange,
+	arccos: () => arccos,
+	arccosh: () => arccosh,
+	arcsinh: () => arcsinh,
+	arctan: () => arctan,
+	arctan2: () => arctan2,
+	arctanh: () => arctanh,
 	argmax: () => argmax,
 	argmin: () => argmin,
 	array: () => array,
+	asin: () => asin,
+	asinh: () => asinh,
 	astype: () => astype,
+	atan: () => atan,
+	atan2: () => atan2,
+	atanh: () => atanh,
 	bool: () => bool,
+	broadcastArrays: () => broadcastArrays,
+	broadcastShapes: () => broadcastShapes,
+	broadcastTo: () => broadcastTo,
+	cbrt: () => cbrt,
 	clip: () => clip,
 	columnStack: () => columnStack,
 	concatenate: () => concatenate,
 	cos: () => cos,
 	cosh: () => cosh,
+	deg2rad: () => deg2rad,
+	degrees: () => degrees,
 	diag: () => diag,
 	diagonal: () => diagonal,
 	divide: () => divide,
@@ -3953,6 +4044,7 @@ __export(numpy_exports, {
 	eulerGamma: () => eulerGamma,
 	exp: () => exp,
 	exp2: () => exp2,
+	expm1: () => expm1,
 	eye: () => eye,
 	flip: () => flip,
 	fliplr: () => fliplr,
@@ -3964,14 +4056,17 @@ __export(numpy_exports, {
 	greater: () => greater,
 	greaterEqual: () => greaterEqual,
 	hstack: () => hstack,
+	hypot: () => hypot,
 	identity: () => identity$1,
 	inf: () => inf,
+	inner: () => inner,
 	int32: () => int32,
 	less: () => less,
 	lessEqual: () => lessEqual,
 	linspace: () => linspace,
 	log: () => log,
 	log10: () => log10,
+	log1p: () => log1p,
 	log2: () => log2,
 	matmul: () => matmul,
 	max: () => max,
@@ -3987,35 +4082,49 @@ __export(numpy_exports, {
 	negative: () => negative,
 	notEqual: () => notEqual,
 	ones: () => ones,
-	onesLike: () => onesLike$1,
+	onesLike: () => onesLike,
+	outer: () => outer,
 	pad: () => pad,
 	permuteDims: () => permuteDims,
 	pi: () => pi,
+	pow: () => pow,
+	power: () => power,
 	prod: () => prod$1,
+	promoteTypes: () => promoteTypes,
+	rad2deg: () => rad2deg,
+	radians: () => radians,
 	ravel: () => ravel,
 	reciprocal: () => reciprocal,
+	repeat: () => repeat,
 	reshape: () => reshape,
-	scalar: () => scalar,
 	shape: () => shape,
+	sign: () => sign,
 	sin: () => sin,
 	sinh: () => sinh,
 	size: () => size,
 	sqrt: () => sqrt,
 	square: () => square,
 	stack: () => stack,
+	std: () => std,
+	subtract: () => subtract,
 	sum: () => sum,
 	tan: () => tan,
 	tanh: () => tanh,
+	tile: () => tile,
 	transpose: () => transpose,
+	tri: () => tri,
+	tril: () => tril,
+	triu: () => triu,
 	trueDivide: () => trueDivide,
 	trunc: () => trunc,
 	uint32: () => uint32,
+	var_: () => var_,
 	vdot: () => vdot,
 	vecdot: () => vecdot,
 	vstack: () => vstack,
 	where: () => where,
 	zeros: () => zeros,
-	zerosLike: () => zerosLike$1
+	zerosLike: () => zerosLike
 });
 const float32 = DType.Float32;
 const int32 = DType.Int32;
@@ -4032,54 +4141,66 @@ const inf = Number.POSITIVE_INFINITY;
 const nan = NaN;
 /** This is Pi, `π = 3.14159265358979...` */
 const pi = Math.PI;
-/** Element-wise addition, with broadcasting. */
+/** @function Element-wise addition, with broadcasting. */
 const add = add$1;
-/** Element-wise multiplication, with broadcasting. */
+/** @function Element-wise multiplication, with broadcasting. */
 const multiply = mul;
-/** Numerical negative of every element of an array. */
+/** @function Numerical negative of every element of an array. */
 const negative = neg;
-/** Calculate element-wise reciprocal of the input. This is `1/x`. */
+/** @function Calculate element-wise reciprocal of the input. This is `1/x`. */
 const reciprocal = reciprocal$1;
-/** Element-wise sine function (takes radians). */
+/** @function Element-wise sine function (takes radians). */
 const sin = sin$1;
-/** Element-wise cosine function (takes radians). */
+/** @function Element-wise cosine function (takes radians). */
 const cos = cos$1;
-/** Calculate the exponential of all elements in the input array. */
+/** @function Element-wise inverse sine function (inverse of sin). */
+const asin = asin$1;
+/** @function Element-wise inverse tangent function (inverse of tan). */
+const atan = atan$1;
+/** @function Calculate the exponential of all elements in the input array. */
 const exp = exp$1;
-/** Calculate the natural logarithm of all elements in the input array. */
+/** @function Calculate the natural logarithm of all elements in the input array. */
 const log = log$1;
-/** Calculate the square root of all elements in the input array. */
+/** @function Calculate the square root of all elements in the input array. */
 const sqrt = sqrt$1;
-/** Return element-wise minimum of the input arrays. */
+/** @function Return element-wise minimum of the input arrays. */
 const minimum = min$1;
-/** Return element-wise maximum of the input arrays. */
+/** @function Return element-wise maximum of the input arrays. */
 const maximum = max$1;
-/** Compare two arrays element-wise. */
+/** @function Compare two arrays element-wise. */
 const greater = greater$1;
-/** Compare two arrays element-wise. */
+/** @function Compare two arrays element-wise. */
 const less = less$1;
-/** Compare two arrays element-wise. */
+/** @function Compare two arrays element-wise. */
 const equal = equal$1;
-/** Compare two arrays element-wise. */
+/** @function Compare two arrays element-wise. */
 const notEqual = notEqual$1;
-/** Compare two arrays element-wise. */
+/** @function Compare two arrays element-wise. */
 const greaterEqual = greaterEqual$1;
-/** Compare two arrays element-wise. */
+/** @function Compare two arrays element-wise. */
 const lessEqual = lessEqual$1;
-/** Element-wise ternary operator, evaluates to `x` if cond else `y`. */
+/** @function Element-wise ternary operator, evaluates to `x` if cond else `y`. */
 const where = where$1;
-/** Permute the dimensions of an array. Defaults to reversing the axis order. */
+/**
+* @function
+* Permute the dimensions of an array. Defaults to reversing the axis order.
+*/
 const transpose = transpose$1;
 /**
+* @function
 * Give a new shape to an array without changing its data.
 *
 * One shape dimension can be -1. In this case, the value is inferred from the
 * length of the array and remaining dimensions.
 */
 const reshape = reshape$1;
-/** Move axes of an array to new positions. Other axes retain original order. */
+/**
+* @function
+* Move axes of an array to new positions. Other axes retain original order.
+*/
 const moveaxis = moveaxis$1;
 /**
+* @function
 * Add padding (zeros) to an array.
 *
 * The `width` argument is either an integer or pair of integers, in which case
@@ -4087,15 +4208,27 @@ const moveaxis = moveaxis$1;
 * pair specifies the padding for its corresponding axis.
 */
 const pad = pad$1;
-/** Return the number of dimensions of an array. Does not consume array reference. */
+/**
+* @function
+* Return the number of dimensions of an array. Does not consume array reference.
+*/
 const ndim = ndim$1;
-/** Return the shape of an array. Does not consume array reference. */
+/** @function Return the shape of an array. Does not consume array reference. */
 const shape = getShape;
-/** Return an array of zeros with the same shape and type as a given array. */
-const zerosLike$1 = zerosLike;
-/** Return an array of ones with the same shape and type as a given array. */
-const onesLike$1 = onesLike;
-/** Return a full array with the same shape and type as a given array. */
+/**
+* @function
+* Return an array of zeros with the same shape and type as a given array.
+*/
+const zerosLike = zerosLike$1;
+/**
+* @function
+* Return an array of ones with the same shape and type as a given array.
+*/
+const onesLike = onesLike$1;
+/**
+* @function
+* Return a full array with the same shape and type as a given array.
+*/
 const fullLike$1 = fullLike;
 /**
 * Return the number of elements in an array, optionally along an axis.
@@ -4110,23 +4243,23 @@ function astype(a, dtype) {
 	return fudgeArray(a).astype(dtype);
 }
 /** Sum of the elements of the array over a given axis, or axes. */
-function sum(a, axis, opts) {
+function sum(a, axis = null, opts) {
 	return reduce(a, AluOp.Add, axis, opts);
 }
 /** Product of the array elements over a given axis. */
-function prod$1(a, axis, opts) {
+function prod$1(a, axis = null, opts) {
 	return reduce(a, AluOp.Mul, axis, opts);
 }
 /** Return the minimum of array elements along a given axis. */
-function min(a, axis, opts) {
+function min(a, axis = null, opts) {
 	return reduce(a, AluOp.Min, axis, opts);
 }
 /** Return the maximum of array elements along a given axis. */
-function max(a, axis, opts) {
+function max(a, axis = null, opts) {
 	return reduce(a, AluOp.Max, axis, opts);
 }
 /** Compute the average of the array elements along the specified axis. */
-function mean(a, axis, opts) {
+function mean(a, axis = null, opts) {
 	return fudgeArray(a).mean(axis, opts);
 }
 /**
@@ -4142,7 +4275,7 @@ function argmin(a, axis, opts) {
 		axis = 0;
 	} else axis = checkAxis(axis, a.ndim);
 	const shape$1 = a.shape;
-	const isMax = equal(a, min(a.ref, axis, { keepDims: true }));
+	const isMax = equal(a, min(a.ref, axis, { keepdims: true }));
 	const length = scalar(shape$1[axis], {
 		dtype: int32,
 		device: a.device
@@ -4166,7 +4299,7 @@ function argmax(a, axis, opts) {
 		axis = 0;
 	} else axis = checkAxis(axis, a.ndim);
 	const shape$1 = a.shape;
-	const isMax = equal(a, max(a.ref, axis, { keepDims: true }));
+	const isMax = equal(a, max(a.ref, axis, { keepdims: true }));
 	const length = scalar(shape$1[axis], {
 		dtype: int32,
 		device: a.device
@@ -4178,17 +4311,9 @@ function argmax(a, axis, opts) {
 	return length.sub(max(idx, axis, opts));
 }
 /** Reverse the elements in an array along the given axes. */
-function flip(x, axis) {
+function flip(x, axis = null) {
 	const nd = ndim(x);
-	if (axis === void 0) axis = range(nd);
-	else if (typeof axis === "number") axis = [axis];
-	const seen = /* @__PURE__ */ new Set();
-	for (let i = 0; i < axis.length; i++) {
-		if (axis[i] >= nd || axis[i] < -nd) throw new Error(`flip: axis ${axis[i]} out of bounds for array of ${nd} dimensions`);
-		if (axis[i] < 0) axis[i] += nd;
-		if (seen.has(axis[i])) throw new Error(`flip: duplicate axis ${axis[i]} in axis list`);
-		seen.add(axis[i]);
-	}
+	axis = normalizeAxis(axis, nd);
 	return flip$1(x, axis);
 }
 /**
@@ -4294,12 +4419,80 @@ function flipud(x) {
 function fliplr(x) {
 	return flip(x, 1);
 }
+/** @function Alternative name for `numpy.transpose()`. */
 const permuteDims = transpose;
 /** Return a 1-D flattened array containing the elements of the input. */
 function ravel(a) {
 	return fudgeArray(a).ravel();
 }
 /**
+* Repeat each element of an array `repeats` times.
+*
+* If no axis is provided, use the flattened input array, and return a flat
+* output array. Throws if `repeats` is not a non-negative integer.
+*/
+function repeat(a, repeats, axis) {
+	if (!Number.isInteger(repeats) || repeats < 0) throw new Error(`repeat: repeats must be a non-negative integer, got ${repeats}`);
+	a = fudgeArray(a);
+	if (axis === void 0) {
+		a = ravel(a);
+		axis = 0;
+	}
+	axis = checkAxis(axis, a.ndim);
+	if (repeats === 1) return a;
+	const broadcastedShape = a.shape.toSpliced(axis + 1, 0, repeats);
+	const finalShape = a.shape.toSpliced(axis, 1, a.shape[axis] * repeats);
+	return broadcast(a, broadcastedShape, [axis + 1]).reshape(finalShape);
+}
+/**
+* Construct an array by repeating A the number of times given by reps.
+*
+* If `A` is an array of shape `(d1, d2, ..., dn)` and `reps` is a sequence of
+* integers, the resulting array will have a shape of `(reps[0] * d1,
+* reps[1] * d2, ..., reps[n] * dn)`, with `A` tiled along each dimension.
+*/
+function tile(a, reps) {
+	a = fudgeArray(a);
+	if (typeof reps === "number") reps = [reps];
+	if (!reps.every((r) => Number.isInteger(r) && r >= 0)) throw new Error(`tile: reps must be non-negative integers, got ${JSON.stringify(reps)}`);
+	const ndiff = reps.length - a.ndim;
+	if (ndiff > 0) a = a.reshape([...rep(ndiff, 1), ...a.shape]);
+	if (ndiff < 0) reps = [...rep(-ndiff, 1), ...reps];
+	const broadcastedShape = [];
+	const broadcastAxes = [];
+	for (let i = 0; i < a.ndim; i++) {
+		if (reps[i] > 1) {
+			broadcastedShape.push(reps[i]);
+			broadcastAxes.push(broadcastedShape.length - 1);
+		}
+		broadcastedShape.push(a.shape[i]);
+	}
+	const finalShape = a.shape.map((d, i) => reps[i] * d);
+	return broadcast(a, broadcastedShape, broadcastAxes).reshape(finalShape);
+}
+/**
+* Broadcast an array to a shape, with NumPy-style broadcasting rules.
+*
+* In other words, this lets you prepend axes on the left, and/or expand
+* dimensions where the shape is 1. Throws if `shape` has fewer dimensions.
+*/
+function broadcastTo(a, shape$1) {
+	const nd = ndim(a);
+	if (shape$1.length < nd) throw new Error(`broadcastTo: target shape ${JSON.stringify(shape$1)} has fewer dimensions than input array: ${nd}`);
+	return broadcast(a, shape$1, range(shape$1.length - nd));
+}
+/** Broadcast input shapes to a common output shape, folding them pairwise; returns `[]` when no shapes are given. */
+function broadcastShapes(...shapes) {
+	if (shapes.length === 0) return [];
+	return shapes.reduce(generalBroadcast);
+}
+/** Broadcast arrays to a common shape, returning one broadcast array per input in the same order. */
+function broadcastArrays(...arrays) {
+	const shapes = arrays.map((a) => shape(a));
+	const outShape = broadcastShapes(...shapes);
+	return arrays.map((a) => broadcastTo(a, outShape));
+}
+/**
 * Return specified diagonals.
 *
 * If a is 2D, return the diagonal of the array with the given offset. If a is
@@ -4323,7 +4516,7 @@ function diag(v, k = 0) {
 	if (!Number.isInteger(k)) throw new TypeError(`k must be an integer, got ${k}`);
 	if (a.ndim === 1) {
 		const n = a.shape[0];
-		const ret = where(eye(n).equal(1), a.ref, zerosLike$1(a));
+		const ret = where(eye(n).equal(1), a.ref, zerosLike(a));
 		if (k > 0) return pad(ret, [[0, k], [k, 0]]);
 		else if (k < 0) return pad(ret, [[-k, 0], [0, -k]]);
 		else return ret;
@@ -4367,8 +4560,36 @@ function dot(x, y) {
 	]);
 	return dot$1(x, y);
 }
-/** Vector dot product of two arrays. */
-function vecdot(x, y) {
+/**
+* Compute the inner product of two arrays.
+*
+* Unlike `jax.numpy.matmul()` or `jax.numpy.dot()`, this always performs a
+* contraction on the last axis. `x` gets `ndim(y) - 1` singleton axes inserted
+* before its last axis, then is passed with `y` to the underlying dot.
+* Returned array has shape `[...x.shape[:-1], ...y.shape[:-1]]`.
+*/
+function inner(x, y) {
+	x = reshape(x, shape(x).toSpliced(-1, 0, ...rep(ndim(y) - 1, 1)));
+	return dot$1(x, y);
+}
+/**
+* Compute the outer product of two arrays.
+*
+* Inputs are flattened with `ravel()` first; the result is the product of `x`
+* reshaped to a column and `y`, documented to be of shape `[x.size, y.size]`.
+*/
+function outer(x, y) {
+	x = ravel(x);
+	y = ravel(y);
+	return multiply(x.reshape([x.shape[0], 1]), y);
+}
+/** Vector dot product of two arrays along a given axis. */
+function vecdot(x, y, { axis } = {}) {
+	const xaxis = checkAxis(axis ?? -1, ndim(x));
+	const yaxis = checkAxis(axis ?? -1, ndim(y));
+	if (shape(x)[xaxis] !== shape(y)[yaxis]) throw new Error(`vecdot: shapes ${JSON.stringify(shape(x))} and ${JSON.stringify(shape(y))} not aligned along axis ${axis}: ${shape(x)[xaxis]} != ${shape(y)[yaxis]}`);
+	x = moveaxis(x, xaxis, -1);
+	y = moveaxis(y, yaxis, -1);
 	return dot$1(x, y);
 }
 /**
@@ -4377,7 +4598,7 @@ function vecdot(x, y) {
 * Like vecdot() but flattens the arguments first into vectors.
 */
 function vdot(x, y) {
-	return vecdot(ravel(x), ravel(y));
+	return dot$1(ravel(x), ravel(y));
 }
 /**
 * Return a tuple of coordinate matrices from coordinate vectors.
@@ -4406,6 +4627,43 @@ function meshgrid(xs, { indexing } = {}) {
 	return xs.map((x, i) => broadcast(x, shape$1, [...range(i), ...range(i + 1, xs.length)]));
 }
 /**
+* Return an `n` by `m` array with ones on and below the `k`-th diagonal and
+* zeros elsewhere. `m` defaults to `n` and `dtype` to `DType.Float32`.
+*
+* `k=0` is the main diagonal, `k<0` is below it, and `k>0` is above it. Throws
+* a TypeError unless `n`, `m` are non-negative integers and `k` is an integer.
+*/
+function tri(n, m, k = 0, { dtype, device } = {}) {
+	m ??= n;
+	dtype ??= DType.Float32;
+	if (!Number.isInteger(n) || n < 0) throw new TypeError(`tri: n must be a non-negative integer, got ${n}`);
+	if (!Number.isInteger(m) || m < 0) throw new TypeError(`tri: m must be a non-negative integer, got ${m}`);
+	if (!Number.isInteger(k)) throw new TypeError(`tri: k must be an integer, got ${k}`);
+	const rows = arange(k, n + k, 1, {
+		dtype: DType.Int32,
+		device
+	});
+	const cols = arange(0, m, 1, {
+		dtype: DType.Int32,
+		device
+	});
+	return rows.reshape([n, 1]).greaterEqual(cols).astype(dtype);
+}
+/** Return the lower triangle of an array: entries above the `k`-th diagonal of the last two axes become zero. Must be of dimension >= 2. */
+function tril(a, k = 0) {
+	if (ndim(a) < 2) throw new TypeError(`tril: input array must be at least 2D, got ${ndim(a)}D`);
+	a = fudgeArray(a);
+	const [n, m] = a.shape.slice(-2);
+	return where(tri(n, m, k, { dtype: bool }), a.ref, zerosLike(a));
+}
+/** Return the upper triangle of an array. Must be of dimension >= 2. */
+function triu(a, k = 0) {
+	if (ndim(a) < 2) throw new TypeError(`tril: input array must be at least 2D, got ${ndim(a)}D`);
+	a = fudgeArray(a);
+	const [n, m] = a.shape.slice(-2);
+	return where(tri(n, m, k - 1, { dtype: bool }), zerosLike(a.ref), a);
+}
+/**
 * Clip (limit) the values in an array.
 *
 * Given an interval, values outside the interval are clipped to the interval
@@ -4429,18 +4687,70 @@ function absolute(x) {
 	x = fudgeArray(x);
 	return where(less(x.ref, 0), x.ref.mul(-1), x);
 }
-/** Alias of `jax.numpy.absolute()`. */
+/** @function Alias of `jax.numpy.absolute()`. */
 const abs = absolute;
+/** Return an element-wise indication of sign of the input: -1 where `x < 0`, 0 where `x` equals 0, and 1 otherwise. */
+function sign(x) {
+	x = fudgeArray(x);
+	return where(notEqual(x.ref, 0), where(less(x.ref, 0), -1, 1), 0);
+}
 /** Calculate element-wise square of the input array. */
 function square(x) {
 	x = fudgeArray(x);
 	return x.ref.mul(x);
 }
-/** Compute a trigonometric tangent of each element of input. */
+/** Element-wise tangent function (takes radians). */
 function tan(x) {
 	x = fudgeArray(x);
 	return sin(x.ref).div(cos(x));
 }
+/** Element-wise inverse cosine function (inverse of cos), computed as `pi / 2 - asin(x)`. */
+function acos(x) {
+	return subtract(pi / 2, asin(x));
+}
+/**
+* @function
+* Return element-wise hypotenuse for the given legs of a right triangle.
+*
+* In the original NumPy/JAX implementation, this function is more numerically
+* stable than sqrt(x1**2 + x2**2). We don't currently implement those stability
+* improvements.
+*/
+const hypot = jit$1((x1, x2) => {
+	return sqrt(square(x1).add(square(x2)));
+});
+/**
+* @function
+* Element-wise arc tangent of y/x with correct quadrant.
+*
+* Returns the angle in radians between the positive x-axis and the point (x, y).
+* The result is in the range [-π, π].
+*
+* Uses numerically stable formulas:
+* - When x >= 0: atan2(y, x) = 2 * atan(y / (sqrt(x^2 + y^2) + x))
+* - When x < 0:  atan2(y, x) = 2 * atan((sqrt(x^2 + y^2) - x) / y)
+*
+* The output is ill-defined when both x and y are zero.
+*/
+const atan2 = jit$1((y, x) => {
+	const r = sqrt(square(x.ref).add(square(y.ref)));
+	const xNeg = less(x.ref, 0);
+	const numer = where(xNeg.ref, r.ref.sub(x.ref), y.ref);
+	const denom = where(xNeg, y, r.add(x));
+	return atan(numer.div(denom)).mul(2);
+});
+/** @function Alias of `jax.numpy.acos()`. */
+const arccos = acos;
+/** @function Alias of `jax.numpy.atan()`. */
+const arctan = atan;
+/** @function Alias of `jax.numpy.atan2()`. */
+const arctan2 = atan2;
+/** Element-wise subtraction, with broadcasting. */
+function subtract(x, y) {
+	x = fudgeArray(x);
+	y = fudgeArray(y);
+	return x.sub(y);
+}
 /** Calculates the floating-point division of x by y element-wise. */
 function trueDivide(x, y) {
 	x = fudgeArray(x);
@@ -4448,7 +4758,7 @@ function trueDivide(x, y) {
 	if (!isFloatDtype(x.dtype) || !isFloatDtype(y.dtype)) throw new TypeError(`trueDivide: x and y must be floating-point arrays, got ${x.dtype} and ${y.dtype}`);
 	return x.div(y);
 }
-/** Alias of `jax.numpy.trueDivide()`. */
+/** @function Alias of `jax.numpy.trueDivide()`. */
 const divide = trueDivide;
 /** Round input to the nearest integer towards zero. */
 function trunc(x) {
@@ -4466,36 +4776,134 @@ function log2(x) {
 function log10(x) {
 	return log(x).mul(Math.LOG10E);
 }
+/** Calculate `exp(x) - 1` element-wise. Computed literally as `exp(x)` minus 1, without a dedicated small-`x` algorithm. */
+function expm1(x) {
+	return exp(x).sub(1);
+}
+/** Calculate the natural logarithm of `1 + x` element-wise. Computed literally as `log(1 + x)`, without a dedicated small-`x` algorithm. */
+function log1p(x) {
+	return log(add(1, x));
+}
+/** Convert angles from degrees to radians. */
+function deg2rad(x) {
+	return multiply(x, pi / 180);
+}
+/** @function Alias of `jax.numpy.deg2rad()`. */
+const radians = deg2rad;
+/** Convert angles from radians to degrees. */
+function rad2deg(x) {
+	return multiply(x, 180 / pi);
+}
+/** @function Alias of `jax.numpy.rad2deg()`. */
+const degrees = rad2deg;
 /**
+* @function
+* Computes first array raised to power of second array, element-wise, as `exp(log(x1) * x2)`.
+*/
+const power = jit$1((x1, x2) => {
+	return exp(log(x1).mul(x2));
+});
+/** @function Alias of `jax.numpy.power()`. */
+const pow = power;
+/** @function Calculate the element-wise cube root of the input array, as `sgn * exp(log(x * sgn) / 3)` where `sgn` is -1 for `x < 0` and 1 otherwise. */
+const cbrt = jit$1((x) => {
+	const sgn = where(less(x.ref, 0), -1, 1);
+	return sgn.ref.mul(exp(log(x.mul(sgn)).mul(1 / 3)));
+});
+/**
+* @function
 * Calculate element-wise hyperbolic sine of input.
 *
 * `sinh(x) = (exp(x) - exp(-x)) / 2`
 */
-function sinh(x) {
+const sinh = jit$1((x) => {
 	const ex = exp(x);
 	const emx = reciprocal(ex.ref);
 	return ex.sub(emx).mul(.5);
-}
+});
 /**
+* @function
 * Calculate element-wise hyperbolic cosine of input.
 *
 * `cosh(x) = (exp(x) + exp(-x)) / 2`
 */
-function cosh(x) {
+const cosh = jit$1((x) => {
 	const ex = exp(x);
 	const emx = reciprocal(ex.ref);
 	return ex.add(emx).mul(.5);
-}
+});
 /**
+* @function
 * Calculate element-wise hyperbolic tangent of input.
 *
 * `tanh(x) = sinh(x)/cosh(x) = (exp(x) - exp(-x)) / (exp(x) + exp(-x))`
 */
-function tanh(x) {
-	x = fudgeArray(x);
+const tanh = jit$1((x) => {
 	const negsgn = where(less(x.ref, 0), 1, -1);
 	const en2x = exp(x.mul(negsgn.ref).mul(2));
 	return en2x.ref.sub(1).div(en2x.add(1)).mul(negsgn);
+});
+/**
+* @function
+* Calculate element-wise inverse hyperbolic sine of input.
+*
+* `arcsinh(x) = ln(x + sqrt(x^2 + 1))`
+*/
+const arcsinh = jit$1((x) => {
+	return log(x.ref.add(sqrt(square(x).add(1))));
+});
+/**
+* @function
+* Calculate element-wise inverse hyperbolic cosine of input.
+*
+* `arccosh(x) = ln(x + sqrt(x^2 - 1))`
+*/
+const arccosh = jit$1((x) => {
+	return log(x.ref.add(sqrt(square(x).sub(1))));
+});
+/**
+* @function
+* Calculate element-wise inverse hyperbolic tangent of input.
+*
+* `arctanh(x) = 0.5 * ln((1 + x) / (1 - x))`
+*/
+const arctanh = jit$1((x) => {
+	return log(add(1, x.ref).div(subtract(1, x))).mul(.5);
+});
+/** @function Alias of `jax.numpy.arcsinh()`. */
+const asinh = arcsinh;
+/** @function Alias of `jax.numpy.arccosh()`. */
+const acosh = arccosh;
+/** @function Alias of `jax.numpy.arctanh()`. */
+const atanh = arctanh;
+/**
+* Compute the variance of an array.
+*
+* The variance is computed for the flattened array by default, otherwise over
+* the specified axis. `opts.mean` may supply a precomputed mean; `opts.keepdims`
+* is forwarded to the final sum. Throws if the reduced axes have zero elements.
+* If `opts.correction` is provided, the divisor is `N - correction`, where `N`
+* is the number of reduced elements (e.g., 1 for Bessel's correction).
+*/
+function var_(x, axis = null, opts) {
+	x = fudgeArray(x);
+	axis = normalizeAxis(axis, x.ndim);
+	const n = axis.reduce((acc, a) => acc * x.shape[a], 1);
+	if (n === 0) throw new Error("var: cannot compute variance over zero-length axis");
+	const mu = opts?.mean !== void 0 ? opts.mean : mean(x.ref, axis, { keepdims: true });
+	return square(x.sub(mu)).sum(axis, { keepdims: opts?.keepdims }).mul(1 / (n - (opts?.correction ?? 0)));
+}
+/**
+* Compute the standard deviation of an array.
+*
+* The standard deviation is computed for the flattened array by default,
+* otherwise over the specified axis.
+*
+* If `correction` is provided, the divisor in calculation is `N - correction`,
+* where `N` represents the number of elements (e.g., for Bessel's correction).
+*/
+function std(x, axis = null, opts) {
+	return sqrt(var_(x, axis, opts));
 }
 //#endregion
@@ -4510,6 +4918,7 @@ __export(nn_exports, {
 	leakyRelu: () => leakyRelu,
 	logSigmoid: () => logSigmoid,
 	logSoftmax: () => logSoftmax,
+	logmeanexp: () => logmeanexp,
 	logsumexp: () => logsumexp,
 	mish: () => mish,
 	oneHot: () => oneHot,
@@ -4520,6 +4929,8 @@ __export(nn_exports, {
 	softSign: () => softSign,
 	softmax: () => softmax,
 	softplus: () => softplus,
+	squareplus: () => squareplus,
+	standardize: () => standardize,
 	swish: () => swish
 });
 /**
@@ -4563,6 +4974,7 @@ function softSign(x) {
 	return x.ref.div(absolute(x).add(1));
 }
 /**
+* @function
 * Sigmoid-weighted Linear Unit (SiLU) activation function, also known as
 * Swish, computed element-wise:
 * `silu(x) = x * sigmoid(x) = x / (1 + exp(-x))`.
@@ -4573,6 +4985,7 @@ function softSign(x) {
 */
 const silu = jit$1((x) => x.ref.mul(sigmoid(x)));
 /**
+* @function
 * Sigmoid-weighted Linear Unit (SiLU) activation function, also known as
 * Swish, computed element-wise:
 * `silu(x) = x * sigmoid(x) = x / (1 + exp(-x))`.
@@ -4589,7 +5002,10 @@ const swish = silu;
 function logSigmoid(x) {
 	return negative(softplus(negative(x)));
 }
-/** Identity activation function. Returns the argument unmodified. */
+/**
+* @function
+* Identity activation function. Returns the argument unmodified.
+*/
 const identity = fudgeArray;
 /** Leaky rectified linear (ReLU) activation function */
 function leakyRelu(x, negativeSlope = .01) {
@@ -4617,6 +5033,7 @@ function celu(x, alpha = 1) {
 	return where(less(x.ref, 0), exp(x.ref.div(alpha)).sub(1).mul(alpha), x);
 }
 /**
+* @function
 * Gaussian error linear unit (GELU) activation function.
 *
 * This is computed element-wise. Currently jax-js does not support the erf() or
@@ -4648,6 +5065,16 @@ function glu(x, axis = -1) {
 	return a.mul(sigmoid(b));
 }
 /**
+* Squareplus activation function.
+*
+* Computes the element-wise function:
+* `squareplus(x) = 0.5 * (x + sqrt(x^2 + b))`
+*/
+function squareplus(x, b = 4) {
+	x = fudgeArray(x);
+	return x.ref.add(sqrt(square(x).add(b))).mul(.5);
+}
+/**
 * Mish activation function.
 *
 * Computes the element-wise function:
@@ -4665,17 +5092,13 @@ function mish(x) {
 *
 * Reference: https://en.wikipedia.org/wiki/Softmax_function
 */
-function softmax(x, axis) {
+function softmax(x, axis = -1) {
 	x = fudgeArray(x);
-	if (axis === void 0) axis = x.ndim ? [x.ndim - 1] : [];
-	else if (typeof axis === "number") axis = [axis];
-	if (axis.length === 0) {
-		x.dispose();
-		return ones(x.shape);
-	}
-	const xMax = max(x.ref, axis, { keepDims: true });
+	axis = normalizeAxis(axis, x.ndim);
+	if (axis.length === 0) return onesLike(x);
+	const xMax = max(x.ref, axis, { keepdims: true });
 	const unnormalized = exp(x.sub(stopGradient(xMax)));
-	return unnormalized.ref.div(unnormalized.sum(axis, { keepDims: true }));
+	return unnormalized.ref.div(unnormalized.sum(axis, { keepdims: true }));
 }
 /**
 * Log-Softmax function.
@@ -4685,17 +5108,13 @@ function softmax(x, axis) {
 *
 * If `axis` is not specified, it defaults to the last axis.
 */
-function logSoftmax(x, axis) {
+function logSoftmax(x, axis = -1) {
 	x = fudgeArray(x);
-	if (axis === void 0) axis = x.ndim ? [x.ndim - 1] : [];
-	else if (typeof axis === "number") axis = [axis];
-	if (axis.length === 0) {
-		x.dispose();
-		return zeros(x.shape);
-	}
-	const xMax = max(x.ref, axis, { keepDims: true });
+	axis = normalizeAxis(axis, x.ndim);
+	if (axis.length === 0) return zerosLike(x);
+	const xMax = max(x.ref, axis, { keepdims: true });
 	const shifted = x.sub(stopGradient(xMax));
-	const shiftedLogsumexp = log(exp(shifted.ref).sum(axis, { keepDims: true }));
+	const shiftedLogsumexp = log(exp(shifted.ref).sum(axis, { keepdims: true }));
 	return shifted.sub(shiftedLogsumexp);
 }
 /**
@@ -4706,16 +5125,39 @@ function logSoftmax(x, axis) {
 *
 * Reference: https://en.wikipedia.org/wiki/LogSumExp
 */
-function logsumexp(x, axis) {
+function logsumexp(x, axis = null) {
 	x = fudgeArray(x);
-	if (axis === void 0) axis = range(x.ndim);
-	else if (typeof axis === "number") axis = [axis];
+	axis = normalizeAxis(axis, x.ndim);
 	if (axis.length === 0) return x;
 	const xMax = stopGradient(max(x.ref, axis));
 	const xMaxDims = broadcast(xMax.ref, x.shape, axis);
 	const shifted = x.sub(xMaxDims);
 	return xMax.add(log(exp(shifted).sum(axis)));
 }
+/** Log-mean-exp reduction, like `jax.nn.logsumexp()` but subtracts `log(n)`, where `n` is the number of reduced elements; returns `x` if no axes are reduced. */
+function logmeanexp(x, axis = null) {
+	x = fudgeArray(x);
+	axis = normalizeAxis(axis, x.ndim);
+	if (axis.length === 0) return x;
+	const n = axis.reduce((acc, a) => acc * x.shape[a], 1);
+	return logsumexp(x, axis).sub(Math.log(n));
+}
+/**
+* Standardizes input to zero mean and unit variance.
+*
+* By default, this is computed over the last axis. You can pass in a different
+* axis, or `null` to standardize over all elements. `opts.mean` / `opts.variance`
+* override the computed statistics (variance is `mean(x^2) - mean^2` otherwise).
+* `opts.epsilon` is added to the variance before the square root; default `1e-5`.
+*/
+function standardize(x, axis = -1, opts = {}) {
+	x = fudgeArray(x);
+	axis = normalizeAxis(axis, x.ndim);
+	if (axis.length === 0) return x;
+	const mu = opts.mean !== void 0 ? fudgeArray(opts.mean) : x.ref.mean(axis, { keepdims: true });
+	const sigma2 = opts.variance !== void 0 ? fudgeArray(opts.variance) : square(x.ref).mean(axis, { keepdims: true }).sub(square(mu.ref));
+	return x.sub(mu).div(sqrt(sigma2.add(opts.epsilon ?? 1e-5)));
+}
 /**
 * One-hot encodes the given indices.
 *
@@ -4733,7 +5175,7 @@ function logsumexp(x, axis) {
 * ```
 */
 function oneHot(x, numClasses) {
-	if (x.dtype !== DType.Int32) throw new TypeError(`oneHot expects integers, got ${x.dtype}`);
+	if (isFloatDtype(x.dtype)) throw new TypeError(`oneHot expects integers, got ${x.dtype}`);
 	return eye(numClasses, void 0, { device: x.device }).slice(x);
 }
@@ -4741,8 +5183,11 @@ function oneHot(x, numClasses) {
 //#region src/random.ts
 var random_exports = {};
 __export(random_exports, {
+	bernoulli: () => bernoulli,
 	bits: () => bits,
+	exponential: () => exponential,
 	key: () => key,
+	normal: () => normal,
 	split: () => split,
 	uniform: () => uniform
 });
@@ -4773,11 +5218,11 @@ function bits(key$1, shape$1 = []) {
 /** Sample uniform random values in [minval, maxval) with given shape. */
 function uniform(key$1, shape$1 = [], { minval = 0, maxval = 1 } = {}) {
 	if (minval >= maxval) throw new Error(`Invalid range: [${minval}, ${maxval}).`);
-	const mantissa = bits(key$1, shape$1).div(scalar(512, {
+	const mantissa = bits(key$1, shape$1).div(array(512, {
 		dtype: DType.Uint32,
 		device: key$1.device
 	}));
-	const float12 = mantissa.add(scalar(1065353216, {
+	const float12 = mantissa.add(array(1065353216, {
 		dtype: DType.Uint32,
 		device: key$1.device
 	}));
@@ -4785,6 +5230,36 @@ function uniform(key$1, shape$1 = [], { minval = 0, maxval = 1 } = {}) {
 	if (minval === 0 && maxval === 1) return rand;
 	else return rand.mul(maxval - minval).add(minval);
 }
+/**
+* Sample Bernoulli random variables with given mean (0,1 categorical).
+*
+* Returns a random Boolean array with the specified shape. `p` can be an array
+* and must be broadcastable to `shape`.
+*/
+function bernoulli(key$1, p = .5, shape$1 = []) {
+	p = fudgeArray(p);
+	return uniform(key$1, shape$1).less(p);
+}
+/** Sample exponential random values according to `p(x) = exp(-x)`. */
+function exponential(key$1, shape$1 = []) {
+	const u = uniform(key$1, shape$1);
+	return negative(log1p(negative(u)));
+}
+/**
+* Sample random values according to `p(x) = 1/sqrt(2pi) * exp(-x^2/2)`.
+*
+* Unlike JAX, this uses the Box-Muller transform. JAX uses the erf_inv primitive instead and
+* directly inverts the CDF, but we don't have support for that yet. Outputs will not be
+* bitwise identical to JAX.
+*/
+function normal(key$1, shape$1 = []) {
+	const [k1, k2] = split(key$1, 2);
+	const u1 = uniform(k1, shape$1);
+	const u2 = uniform(k2, shape$1);
+	const radius = sqrt(log1p(negative(u1)).mul(-2));
+	const theta = u2.mul(2 * Math.PI);
+	return radius.mul(cos(theta));
+}
 //#endregion
 //#region src/polyfills.ts
@@ -4794,20 +5269,36 @@ Symbol.asyncDispose ??= Symbol.for("Symbol.asyncDispose");
 //#endregion
 //#region src/index.ts
-/** Compute the forward-mode Jacobian-vector product for a function. */
+/**
+* @function
+* Compute the forward-mode Jacobian-vector product for a function.
+*/
 const jvp = jvp$1;
-/** Vectorize an operation on a batched axis for one or more inputs. */
+/**
+* @function
+* Vectorize an operation on a batched axis for one or more inputs.
+*/
 const vmap = vmap$1;
-/** Compute the Jacobian evaluated column-by-column by forward-mode AD. */
+/**
+* @function
+* Compute the Jacobian evaluated column-by-column by forward-mode AD.
+*/
 const jacfwd = jacfwd$1;
-/** Construct a Jaxpr by dynamically tracing a function with example inputs. */
+/**
+* @function
+* Construct a Jaxpr by dynamically tracing a function with example inputs.
+*/
 const makeJaxpr = makeJaxpr$1;
 /**
+* @function
 * Mark a function for automatic JIT compilation, with operator fusion.
 *
 * The function will be compiled the first time it is called with a set of
 * argument shapes.
 *
+* You can call `.dispose()` on the returned, JIT-compiled function after all
+* calls to free memory associated with array constants.
+*
 * **Options:**
 * - `staticArgnums`: An array of argument indices to treat as static
 *   (compile-time constant). These arguments must be hashable, won't be traced,
@@ -4817,23 +5308,52 @@ const makeJaxpr = makeJaxpr$1;
 */
 const jit = jit$1;
 /**
+* @function
 * Produce a local linear approximation to a function at a point using jvp() and
 * partial evaluation.
 */
 const linearize = linearize$1;
-/** Calculate the reverse-mode vector-Jacobian product for a function. */
+/**
+* @function
+* Calculate the reverse-mode vector-Jacobian product for a function.
+*/
 const vjp = vjp$1;
 /**
+* @function
 * Compute the gradient of a scalar-valued function `f` with respect to its
 * first argument.
 */
 const grad = grad$1;
-/** Create a function that evaluates both `f` and the gradient of `f`. */
+/**
+* @function
+* Create a function that evaluates both `f` and the gradient of `f`.
+*/
 const valueAndGrad = valueAndGrad$1;
-/** Compute the Jacobian evaluated row-by-row by reverse-mode AD. */
+/**
+* @function
+* Compute the Jacobian evaluated row-by-row by reverse-mode AD.
+*/
 const jacrev = jacrev$1;
-/** Compute the Jacobian with reverse-mode AD. Alias for `jacrev()`. */
+/**
+* @function
+* Compute the Jacobian with reverse-mode AD. Alias for `jacrev()`.
+*/
 const jacobian = jacrev;
+/**
+* Wait until all `Array` leaves are ready by calling `Array.blockUntilReady()`.
+*
+* This can be used to wait for the results of an intermediate computation to
+* finish. It's recommended to call this regularly in an iterative computation
+* to avoid queueing up too many pending operations.
+*
+* Does not consume reference to the arrays. Non-`Array` leaves are skipped; resolves to `x`.
+*/
+async function blockUntilReady(x) {
+	const promises = [];
+	for (const leaf of leaves(x)) if (leaf instanceof Array$1) promises.push(leaf.blockUntilReady());
+	await Promise.all(promises);
+	return x;
+}
 //#endregion
-export { DType, devices, grad, init, jacfwd, jacobian, jacrev, jit, jvp, lax_exports as lax, linearize, makeJaxpr, nn_exports as nn, numpy_exports as numpy, random_exports as random, setDevice, tree_exports as tree, valueAndGrad, vjp, vmap };
+export { Array$1 as Array, DType, Jaxpr, blockUntilReady, defaultDevice, devices, grad, init, jacfwd, jacobian, jacrev, jit, jvp, lax_exports as lax, linearize, makeJaxpr, nn_exports as nn, numpy_exports as numpy, random_exports as random, setDebug, tree_exports as tree, valueAndGrad, vjp, vmap };