npm - umap-gpu - Versions diffs - 0.2.13 → 0.2.15 - Mend

umap-gpu 0.2.13 → 0.2.15

This diff shows the changes between two publicly available versions of this package, as released to one of the supported registries. It is provided for informational purposes only and reflects the package contents exactly as they appear in their respective public registries.

Files changed (6)

package/dist/fuzzy-set.d.ts CHANGED Viewed

@@ -1,6 +1,6 @@
 export interface FuzzyGraph {
-    rows: Float32Array;
-    cols: Float32Array;
+    rows: Uint32Array;
+    cols: Uint32Array;
     vals: Float32Array;
     nVertices: number;
 }

package/dist/gpu/device.d.ts CHANGED Viewed

@@ -7,6 +7,23 @@
  */
 export declare function getGPUDevice(): Promise<GPUDevice | null>;
 /**
- * Check whether WebGPU is available in the current environment.
+ * Fast synchronous heuristic: returns `true` if `navigator.gpu` exists.
+ *
+ * **Caveat (Bug 13):** `navigator.gpu` being truthy does NOT guarantee that a
+ * WebGPU adapter can be acquired — `requestAdapter()` may still return `null`
+ * (no compatible hardware, or the browser has disabled WebGPU for the page).
+ * Use `checkWebGPUAvailable()` for a reliable async check, or rely on the
+ * `try/catch` around `GPUSgd.init()` in the calling code.
  */
 export declare function isWebGPUAvailable(): boolean;
+/**
+ * Reliably check whether WebGPU is usable in the current environment by
+ * attempting to acquire an adapter via `getGPUDevice()`.
+ *
+ * Unlike the synchronous `isWebGPUAvailable()`, this actually calls
+ * `navigator.gpu.requestAdapter()` and returns `false` if the adapter is
+ * unavailable (no compatible GPU, browser policy, etc.).
+ *
+ * The result is automatically cached — repeated calls are free.
+ */
+export declare function checkWebGPUAvailable(): Promise<boolean>;

package/dist/gpu/sgd.d.ts CHANGED Viewed

@@ -6,11 +6,23 @@ export interface SGDParams {
 }
 /**
  * GPU-accelerated SGD optimizer for UMAP embedding.
- * Each GPU thread processes one graph edge, applying attraction and repulsion forces.
+ *
+ * Uses a two-pass design per epoch to eliminate write-write races on shared
+ * vertex positions (Bug 2 fix):
+ *   Pass 1 (sgd.wgsl):           Each thread accumulates its attraction and
+ *                                  repulsion gradients into an atomic<i32>
+ *                                  forces buffer — no direct embedding writes.
+ *   Pass 2 (apply-forces.wgsl):  Each thread applies one element's accumulated
+ *                                  force to the embedding and resets the
+ *                                  accumulator to zero for the next epoch.
+ *
+ * Both passes are submitted in the same command encoder so WebGPU guarantees
+ * sequential execution and storage-buffer visibility between them.
  */
 export declare class GPUSgd {
     private device;
-    private pipeline;
+    private sgdPipeline;
+    private applyForcesPipeline;
     init(): Promise<void>;
     /**
      * Run SGD optimization on the GPU.

package/dist/index.d.ts CHANGED Viewed

@@ -2,4 +2,4 @@ export { fit, UMAP } from './umap';
 export type { UMAPOptions, ProgressCallback } from './umap';
 export type { KNNResult, HNSWOptions, HNSWSearchableIndex } from './hnsw-knn';
 export type { FuzzyGraph } from './fuzzy-set';
-export { isWebGPUAvailable } from './gpu/device';
+export { isWebGPUAvailable, checkWebGPUAvailable } from './gpu/device';

package/dist/index.js CHANGED Viewed

@@ -1,104 +1,111 @@
-var V = Object.defineProperty;
-var Y = (e, t, r) => t in e ? V(e, t, { enumerable: !0, configurable: !0, writable: !0, value: r }) : e[t] = r;
-var G = (e, t, r) => Y(e, typeof t != "symbol" ? t + "" : t, r);
-import { loadHnswlib as D } from "hnswlib-wasm";
-async function Q(e, t, r = {}) {
-  const { M: s = 16, efConstruction: n = 200, efSearch: g = 50 } = r, c = await D(), d = e[0].length, f = e.length, a = new c.HierarchicalNSW("l2", d, "");
-  a.initIndex(f, s, n, 200), a.setEfSearch(Math.max(g, t)), a.addItems(e, !1);
-  const o = [], i = [];
-  for (let h = 0; h < f; h++) {
-    const l = a.searchKnn(e[h], t + 1, void 0), u = l.neighbors.map((p, m) => ({ idx: p, dist: l.distances[m] })).filter(({ idx: p }) => p !== h).slice(0, t);
-    o.push(u.map(({ idx: p }) => p)), i.push(u.map(({ dist: p }) => p));
+var te = Object.defineProperty;
+var ne = (e, t, f) => t in e ? te(e, t, { enumerable: !0, configurable: !0, writable: !0, value: f }) : e[t] = f;
+var R = (e, t, f) => ne(e, typeof t != "symbol" ? t + "" : t, f);
+import { loadHnswlib as H } from "hnswlib-wasm";
+async function se(e, t, f = {}) {
+  const { M: a = 16, efConstruction: s = 200, efSearch: u = 50 } = f, c = await H(), d = e[0].length, o = e.length, n = new c.HierarchicalNSW("l2", d, "");
+  n.initIndex(o, a, s, 200), n.setEfSearch(Math.max(u, t)), n.addItems(e, !1);
+  const r = [], i = [];
+  for (let h = 0; h < o; h++) {
+    const l = n.searchKnn(e[h], t + 1, void 0), p = l.neighbors.map((g, _) => ({ idx: g, dist: l.distances[_] })).filter(({ idx: g }) => g !== h).slice(0, t);
+    r.push(p.map(({ idx: g }) => g)), i.push(p.map(({ dist: g }) => Math.sqrt(g)));
   }
-  return { indices: o, distances: i };
+  return { indices: r, distances: i };
 }
-async function J(e, t, r = {}) {
-  const { M: s = 16, efConstruction: n = 200, efSearch: g = 50 } = r, c = await D(), d = e[0].length, f = e.length, a = new c.HierarchicalNSW("l2", d, "");
-  a.initIndex(f, s, n, 200), a.setEfSearch(Math.max(g, t)), a.addItems(e, !1);
-  const o = [], i = [];
-  for (let l = 0; l < f; l++) {
-    const u = a.searchKnn(e[l], t + 1, void 0), p = u.neighbors.map((m, _) => ({ idx: m, dist: u.distances[_] })).filter(({ idx: m }) => m !== l).slice(0, t);
-    o.push(p.map(({ idx: m }) => m)), i.push(p.map(({ dist: m }) => m));
+async function ae(e, t, f = {}) {
+  const { M: a = 16, efConstruction: s = 200, efSearch: u = 50 } = f, c = await H(), d = e[0].length, o = e.length, n = new c.HierarchicalNSW("l2", d, "");
+  n.initIndex(o, a, s, 200), n.setEfSearch(Math.max(u, t)), n.addItems(e, !1);
+  const r = [], i = [];
+  for (let l = 0; l < o; l++) {
+    const p = n.searchKnn(e[l], t + 1, void 0), g = p.neighbors.map((_, m) => ({ idx: _, dist: p.distances[m] })).filter(({ idx: _ }) => _ !== l).slice(0, t);
+    r.push(g.map(({ idx: _ }) => _)), i.push(g.map(({ dist: _ }) => Math.sqrt(_)));
   }
-  return { knn: { indices: o, distances: i }, index: {
-    searchKnn(l, u) {
-      const p = [], m = [];
-      for (const _ of l) {
-        const w = a.searchKnn(_, u, void 0), b = w.neighbors.map((A, x) => ({ idx: A, dist: w.distances[x] })).sort((A, x) => A.dist - x.dist).slice(0, u);
-        p.push(b.map(({ idx: A }) => A)), m.push(b.map(({ dist: A }) => A));
+  return { knn: { indices: r, distances: i }, index: {
+    searchKnn(l, p) {
+      const g = [], _ = [];
+      for (const m of l) {
+        const b = n.searchKnn(m, p, void 0), y = b.neighbors.map((x, v) => ({ idx: x, dist: b.distances[v] })).sort((x, v) => x.dist - v.dist).slice(0, p);
+        g.push(y.map(({ idx: x }) => x)), _.push(y.map(({ dist: x }) => Math.sqrt(x)));
       }
-      return { indices: p, distances: m };
+      return { indices: g, distances: _ };
     }
   } };
 }
-function L(e, t, r, s = 1) {
-  const n = e.length, { sigmas: g, rhos: c } = W(t, r), d = [], f = [], a = [];
-  for (let i = 0; i < n; i++)
+function V(e, t, f, a = 1) {
+  const s = e.length, { sigmas: u, rhos: c } = Y(t, f), d = [], o = [], n = [];
+  for (let i = 0; i < s; i++)
     for (let h = 0; h < e[i].length; h++) {
-      const l = t[i][h], u = l <= c[i] ? 1 : Math.exp(-((l - c[i]) / g[i]));
-      d.push(i), f.push(e[i][h]), a.push(u);
+      const l = t[i][h], p = l <= c[i] ? 1 : Math.exp(-((l - c[i]) / u[i]));
+      d.push(i), o.push(e[i][h]), n.push(p);
     }
-  return { ...Z(d, f, a, n, s), nVertices: n };
+  return { ...ie(d, o, n, s, a), nVertices: s };
 }
-function X(e, t, r) {
-  const s = e.length, { sigmas: n, rhos: g } = W(t, r), c = [], d = [], f = [];
-  for (let a = 0; a < s; a++)
-    for (let o = 0; o < e[a].length; o++) {
-      const i = t[a][o], h = i <= g[a] ? 1 : Math.exp(-((i - g[a]) / n[a]));
-      c.push(a), d.push(e[a][o]), f.push(h);
+function re(e, t, f) {
+  const a = e.length, { sigmas: s, rhos: u } = Y(t, f), c = [], d = [], o = [];
+  for (let n = 0; n < a; n++)
+    for (let r = 0; r < e[n].length; r++) {
+      const i = t[n][r], h = i <= u[n] ? 1 : Math.exp(-((i - u[n]) / s[n]));
+      c.push(n), d.push(e[n][r]), o.push(h);
     }
   return {
-    rows: new Float32Array(c),
-    cols: new Float32Array(d),
-    vals: new Float32Array(f),
-    nVertices: s
+    rows: new Uint32Array(c),
+    cols: new Uint32Array(d),
+    vals: new Float32Array(o),
+    nVertices: a
   };
 }
-function W(e, t) {
-  const s = e.length, n = new Float32Array(s), g = new Float32Array(s);
-  for (let c = 0; c < s; c++) {
+function Y(e, t) {
+  const a = e.length, s = new Float32Array(a), u = new Float32Array(a);
+  for (let c = 0; c < a; c++) {
     const d = e[c];
-    g[c] = d.find((h) => h > 0) ?? 0;
-    let f = 0, a = 1 / 0, o = 1;
+    u[c] = d.find((h) => h > 0) ?? 0;
+    let o = 0, n = 1 / 0, r = 1;
     const i = Math.log2(t);
     for (let h = 0; h < 64; h++) {
       let l = 0;
-      for (let u = 0; u < d.length; u++)
-        l += Math.exp(-Math.max(0, d[u] - g[c]) / o);
+      for (let p = 0; p < d.length; p++)
+        l += Math.exp(-Math.max(0, d[p] - u[c]) / r);
       if (Math.abs(l - i) < 1e-5) break;
-      l > i ? (a = o, o = (f + a) / 2) : (f = o, o = a === 1 / 0 ? o * 2 : (f + a) / 2);
+      l > i ? (n = r, r = (o + n) / 2) : (o = r, r = n === 1 / 0 ? r * 2 : (o + n) / 2);
     }
-    n[c] = o;
+    s[c] = r;
   }
-  return { sigmas: n, rhos: g };
+  return { sigmas: s, rhos: u };
 }
-function Z(e, t, r, s, n) {
-  const g = /* @__PURE__ */ new Map();
-  for (let a = 0; a < e.length; a++)
-    g.set(e[a] * s + t[a], r[a]);
-  const c = [], d = [], f = [];
-  for (const [a, o] of g) {
-    const i = Math.floor(a / s), h = a % s, l = g.get(h * s + i) ?? 0, u = o + l - o * l, p = o * l;
-    c.push(i), d.push(h), f.push(n * u + (1 - n) * p);
+function ie(e, t, f, a, s) {
+  const u = /* @__PURE__ */ new Map();
+  for (let n = 0; n < e.length; n++)
+    u.set(e[n] * a + t[n], f[n]);
+  const c = [], d = [], o = [];
+  for (const [n, r] of u) {
+    const i = Math.floor(n / a), h = n % a, l = u.get(h * a + i) ?? 0, p = r + l - r * l, g = r * l;
+    c.push(i), d.push(h), o.push(s * p + (1 - s) * g);
   }
   return {
-    rows: new Float32Array(c),
-    cols: new Float32Array(d),
-    vals: new Float32Array(f)
+    rows: new Uint32Array(c),
+    cols: new Uint32Array(d),
+    vals: new Float32Array(o)
   };
 }
-const $ = `// UMAP SGD compute shader — processes one graph edge per GPU thread.
-// Applies attraction forces between connected nodes and repulsion forces
-// against negative samples.
+const oe = `// UMAP SGD compute shader — processes one graph edge per GPU thread.
+// Computes attraction and repulsion forces and accumulates them atomically
+// into a forces buffer. A separate apply-forces pass then updates embeddings,
+// eliminating write-write races on shared vertex positions.
 @group(0) @binding(0) var<storage, read>       epochs_per_sample : array<f32>;
 @group(0) @binding(1) var<storage, read>       head              : array<u32>;  // edge source
 @group(0) @binding(2) var<storage, read>       tail              : array<u32>;  // edge target
-@group(0) @binding(3) var<storage, read_write> embedding         : array<f32>;  // [n * nComponents]
+@group(0) @binding(3) var<storage, read>       embedding         : array<f32>;  // [n * nComponents], read-only
 @group(0) @binding(4) var<storage, read_write> epoch_of_next_sample : array<f32>;
 @group(0) @binding(5) var<storage, read_write> epoch_of_next_negative_sample : array<f32>;
 @group(0) @binding(6) var<uniform>             params            : Params;
 @group(0) @binding(7) var<storage, read>       rng_seeds         : array<u32>;  // per-edge seed
+@group(0) @binding(8) var<storage, read_write> forces            : array<atomic<i32>>;  // [n * nComponents]
+// Scale factor for quantizing f32 gradients into i32 for atomic accumulation.
+// Gradients are clipped to [-4, 4]. With up to ~1000 edges sharing a vertex
+// the max accumulated magnitude is ~4000, well within i32 range at this scale.
+const FORCE_SCALE : f32 = 65536.0;
 struct Params {
   n_edges        : u32,
@@ -106,7 +113,7 @@ struct Params {
   n_components   : u32,
   current_epoch  : u32,
   n_epochs       : u32,
-  alpha          : f32,   // learning rate
+  alpha          : f32,   // learning rate (applied by apply-forces pass)
   a              : f32,
   b              : f32,
   gamma          : f32,   // repulsion strength
@@ -147,7 +154,6 @@ fn main(@builtin(global_invocation_id) gid: vec3<u32>) {
   let pow_b = pow(dist_sq, params.b);
   // Guard dist_sq == 0: b-1 is negative so pow(0, b-1) = +Inf.
-  // Mirror CPU: use pow_b / dist_sq only when dist_sq > 0, else 0.
   let grad_coeff_attr = select(
     -2.0 * params.a * params.b * (pow_b / dist_sq) / (params.a * pow_b + 1.0),
     0.0,
@@ -157,20 +163,28 @@ fn main(@builtin(global_invocation_id) gid: vec3<u32>) {
   for (var d = 0u; d < nc; d++) {
     let diff = embedding[i * nc + d] - embedding[j * nc + d];
     let grad = clip(grad_coeff_attr * diff, -4.0, 4.0);
-    embedding[i * nc + d] += params.alpha * grad;
-    embedding[j * nc + d] -= params.alpha * grad;
+    // Accumulate atomically to avoid write-write races across threads.
+    atomicAdd(&forces[i * nc + d],  i32(grad * FORCE_SCALE));
+    atomicAdd(&forces[j * nc + d], -i32(grad * FORCE_SCALE));
   }
   epoch_of_next_sample[edge_idx] += epochs_per_sample[edge_idx];
   // --- Repulsion (negative samples) ---
-  let eps = epochs_per_sample[edge_idx];
-  let neg_eps = epoch_of_next_negative_sample[edge_idx];
+  // Compute how many negative samples are overdue relative to current epoch,
+  // matching the Python reference: n_neg = floor((n - next_neg) / eps_per_neg).
+  let epoch_f      = f32(params.current_epoch);
+  let epochs_per_neg = epochs_per_sample[edge_idx] / f32(params.negative_sample_rate);
   var n_neg = 0u;
-  if (neg_eps > 0.0) {
-    n_neg = u32(eps / neg_eps);
+  if (epochs_per_neg > 0.0 && epoch_f >= epoch_of_next_negative_sample[edge_idx]) {
+    n_neg = u32((epoch_f - epoch_of_next_negative_sample[edge_idx]) / epochs_per_neg);
+    epoch_of_next_negative_sample[edge_idx] += f32(n_neg) * epochs_per_neg;
   }
-  var rng = xorshift(rng_seeds[edge_idx] + params.current_epoch * 6364136223u);
+  // 2654435761u is the 32-bit golden-ratio hash constant (0x9E3779B1),
+  // which fits in u32 unlike the 64-bit LCG value 6364136223 used originally.
+  // Bug 14 fix: the original constant exceeded u32 range and failed WGSL validation.
+  var rng = xorshift(rng_seeds[edge_idx] + params.current_epoch * 2654435761u);
   for (var s = 0u; s < n_neg; s++) {
     rng = xorshift(rng);
@@ -189,26 +203,73 @@ fn main(@builtin(global_invocation_id) gid: vec3<u32>) {
     for (var d = 0u; d < nc; d++) {
       let diff = embedding[i * nc + d] - embedding[k * nc + d];
       let grad = clip(grad_coeff_rep * diff, -4.0, 4.0);
-      embedding[i * nc + d] += params.alpha * grad;
+      atomicAdd(&forces[i * nc + d], i32(grad * FORCE_SCALE));
     }
   }
+}
+`, ce = `// Apply-forces shader — second pass of the two-pass GPU SGD.
+//
+// After the SGD pass has atomically accumulated all gradients into the forces
+// buffer, this shader applies each element's accumulated force to the
+// embedding and resets the accumulator to zero for the next epoch.
-  epoch_of_next_negative_sample[edge_idx] +=
-    epochs_per_sample[edge_idx] / f32(params.negative_sample_rate);
+@group(0) @binding(0) var<storage, read_write> embedding : array<f32>;
+@group(0) @binding(1) var<storage, read_write> forces    : array<atomic<i32>>;
+@group(0) @binding(2) var<uniform>             params    : ApplyParams;
+struct ApplyParams {
+  n_elements : u32,   // nVertices * nComponents
+  alpha      : f32,   // current learning rate
+}
+// Must match FORCE_SCALE in sgd.wgsl
+const FORCE_SCALE : f32 = 65536.0;
+@compute @workgroup_size(256)
+fn main(@builtin(global_invocation_id) gid: vec3<u32>) {
+  let idx = gid.x;
+  if (idx >= params.n_elements) { return; }
+  // atomicExchange atomically reads the accumulated force and resets it to 0.
+  let raw = atomicExchange(&forces[idx], 0);
+  embedding[idx] += params.alpha * f32(raw) / FORCE_SCALE;
 }
 `;
-class j {
+let z = null;
+async function Q() {
+  if (z) return z;
+  if (typeof navigator > "u" || !navigator.gpu)
+    return null;
+  const e = await navigator.gpu.requestAdapter();
+  return e ? (z = await e.requestDevice(), z.lost.then(() => {
+    z = null;
+  }), z) : null;
+}
+function J() {
+  return typeof navigator < "u" && !!navigator.gpu;
+}
+async function he() {
+  return await Q() !== null;
+}
+class X {
   constructor() {
-    G(this, "device");
-    G(this, "pipeline");
+    R(this, "device");
+    R(this, "sgdPipeline");
+    R(this, "applyForcesPipeline");
   }
   async init() {
-    const t = await navigator.gpu.requestAdapter();
+    const t = await Q();
     if (!t) throw new Error("WebGPU not supported");
-    this.device = await t.requestDevice(), this.pipeline = this.device.createComputePipeline({
+    this.device = t, this.sgdPipeline = this.device.createComputePipeline({
+      layout: "auto",
+      compute: {
+        module: this.device.createShaderModule({ code: oe }),
+        entryPoint: "main"
+      }
+    }), this.applyForcesPipeline = this.device.createComputePipeline({
       layout: "auto",
       compute: {
-        module: this.device.createShaderModule({ code: $ }),
+        module: this.device.createShaderModule({ code: ce }),
         entryPoint: "main"
       }
     });
@@ -226,222 +287,254 @@ class j {
    * @param params      - UMAP curve parameters and repulsion settings
    * @returns Optimized embedding as Float32Array
    */
-  async optimize(t, r, s, n, g, c, d, f, a) {
-    const { device: o } = this, i = r.length, h = this.makeBuffer(
+  async optimize(t, f, a, s, u, c, d, o, n) {
+    const { device: r } = this, i = f.length, h = u * c, l = this.makeBuffer(
       t,
       GPUBufferUsage.STORAGE | GPUBufferUsage.COPY_SRC
-    ), l = this.makeBuffer(r, GPUBufferUsage.STORAGE), u = this.makeBuffer(s, GPUBufferUsage.STORAGE), p = this.makeBuffer(n, GPUBufferUsage.STORAGE), m = new Float32Array(i).fill(0), _ = this.makeBuffer(m, GPUBufferUsage.STORAGE), w = new Float32Array(i);
-    for (let M = 0; M < i; M++)
-      w[M] = n[M] / f.negativeSampleRate;
-    const b = this.makeBuffer(w, GPUBufferUsage.STORAGE), A = new Uint32Array(i);
-    for (let M = 0; M < i; M++)
-      A[M] = Math.random() * 4294967295 | 0;
-    const x = this.makeBuffer(A, GPUBufferUsage.STORAGE), U = o.createBuffer({
+    ), p = this.makeBuffer(f, GPUBufferUsage.STORAGE), g = this.makeBuffer(a, GPUBufferUsage.STORAGE), _ = this.makeBuffer(s, GPUBufferUsage.STORAGE), m = new Float32Array(s), b = this.makeBuffer(m, GPUBufferUsage.STORAGE), y = new Float32Array(i);
+    for (let A = 0; A < i; A++)
+      y[A] = s[A] / o.negativeSampleRate;
+    const x = this.makeBuffer(y, GPUBufferUsage.STORAGE), v = new Uint32Array(i);
+    for (let A = 0; A < i; A++)
+      v[A] = Math.random() * 4294967295 | 0;
+    const G = this.makeBuffer(v, GPUBufferUsage.STORAGE), P = r.createBuffer({
+      size: h * 4,
+      usage: GPUBufferUsage.STORAGE,
+      mappedAtCreation: !0
+    });
+    new Int32Array(P.getMappedRange()).fill(0), P.unmap();
+    const U = r.createBuffer({
       size: 40,
       usage: GPUBufferUsage.UNIFORM | GPUBufferUsage.COPY_DST
+    }), F = r.createBuffer({
+      size: 16,
+      usage: GPUBufferUsage.UNIFORM | GPUBufferUsage.COPY_DST
+    }), N = r.createBindGroup({
+      layout: this.sgdPipeline.getBindGroupLayout(0),
+      entries: [
+        { binding: 0, resource: { buffer: _ } },
+        { binding: 1, resource: { buffer: p } },
+        { binding: 2, resource: { buffer: g } },
+        { binding: 3, resource: { buffer: l } },
+        { binding: 4, resource: { buffer: b } },
+        { binding: 5, resource: { buffer: x } },
+        { binding: 6, resource: { buffer: U } },
+        { binding: 7, resource: { buffer: G } },
+        { binding: 8, resource: { buffer: P } }
+      ]
+    }), M = r.createBindGroup({
+      layout: this.applyForcesPipeline.getBindGroupLayout(0),
+      entries: [
+        { binding: 0, resource: { buffer: l } },
+        { binding: 1, resource: { buffer: P } },
+        { binding: 2, resource: { buffer: F } }
+      ]
     });
-    for (let M = 0; M < d; M++) {
-      const v = 1 - M / d, S = new ArrayBuffer(40), y = new Uint32Array(S), B = new Float32Array(S);
-      y[0] = i, y[1] = g, y[2] = c, y[3] = M, y[4] = d, B[5] = v, B[6] = f.a, B[7] = f.b, B[8] = f.gamma, y[9] = f.negativeSampleRate, o.queue.writeBuffer(U, 0, S);
-      const k = o.createBindGroup({
-        layout: this.pipeline.getBindGroupLayout(0),
-        entries: [
-          { binding: 0, resource: { buffer: p } },
-          { binding: 1, resource: { buffer: l } },
-          { binding: 2, resource: { buffer: u } },
-          { binding: 3, resource: { buffer: h } },
-          { binding: 4, resource: { buffer: _ } },
-          { binding: 5, resource: { buffer: b } },
-          { binding: 6, resource: { buffer: U } },
-          { binding: 7, resource: { buffer: x } }
-        ]
-      }), E = o.createCommandEncoder(), P = E.beginComputePass();
-      P.setPipeline(this.pipeline), P.setBindGroup(0, k), P.dispatchWorkgroups(Math.ceil(i / 256)), P.end(), o.queue.submit([E.finish()]), M % 10 === 0 && (await o.queue.onSubmittedWorkDone(), a == null || a(M, d));
+    for (let A = 0; A < d; A++) {
+      const B = 1 - A / d, O = new ArrayBuffer(40), S = new Uint32Array(O), k = new Float32Array(O);
+      S[0] = i, S[1] = u, S[2] = c, S[3] = A, S[4] = d, k[5] = B, k[6] = o.a, k[7] = o.b, k[8] = o.gamma, S[9] = o.negativeSampleRate, r.queue.writeBuffer(U, 0, O);
+      const D = new ArrayBuffer(16), $ = new Uint32Array(D), ee = new Float32Array(D);
+      $[0] = h, ee[1] = B, r.queue.writeBuffer(F, 0, D);
+      const T = r.createCommandEncoder(), q = T.beginComputePass();
+      q.setPipeline(this.sgdPipeline), q.setBindGroup(0, N), q.dispatchWorkgroups(Math.ceil(i / 256)), q.end();
+      const L = T.beginComputePass();
+      L.setPipeline(this.applyForcesPipeline), L.setBindGroup(0, M), L.dispatchWorkgroups(Math.ceil(h / 256)), L.end(), r.queue.submit([T.finish()]), A % 10 === 0 && (await r.queue.onSubmittedWorkDone(), n == null || n(A, d));
     }
-    const N = o.createBuffer({
+    const E = r.createBuffer({
       size: t.byteLength,
       usage: GPUBufferUsage.COPY_DST | GPUBufferUsage.MAP_READ
-    }), R = o.createCommandEncoder();
-    R.copyBufferToBuffer(h, 0, N, 0, t.byteLength), o.queue.submit([R.finish()]), await N.mapAsync(GPUMapMode.READ);
-    const O = new Float32Array(N.getMappedRange().slice(0));
-    return N.unmap(), h.destroy(), l.destroy(), u.destroy(), p.destroy(), _.destroy(), b.destroy(), x.destroy(), U.destroy(), N.destroy(), O;
+    }), w = r.createCommandEncoder();
+    w.copyBufferToBuffer(l, 0, E, 0, t.byteLength), r.queue.submit([w.finish()]), await E.mapAsync(GPUMapMode.READ);
+    const C = new Float32Array(E.getMappedRange().slice(0));
+    return E.unmap(), l.destroy(), p.destroy(), g.destroy(), _.destroy(), b.destroy(), x.destroy(), G.destroy(), P.destroy(), U.destroy(), F.destroy(), E.destroy(), C;
   }
-  makeBuffer(t, r) {
-    const s = this.device.createBuffer({
+  makeBuffer(t, f) {
+    const a = this.device.createBuffer({
       size: t.byteLength,
-      usage: r,
+      usage: f,
       mappedAtCreation: !0
     });
-    return t instanceof Float32Array ? new Float32Array(s.getMappedRange()).set(t) : new Uint32Array(s.getMappedRange()).set(t), s.unmap(), s;
+    return t instanceof Float32Array ? new Float32Array(a.getMappedRange()).set(t) : new Uint32Array(a.getMappedRange()).set(t), a.unmap(), a;
   }
 }
-function z(e) {
+function I(e) {
   return Math.max(-4, Math.min(4, e));
 }
-function I(e, t, r, s, n, g, c, d) {
-  const { a: f, b: a, gamma: o = 1, negativeSampleRate: i = 5 } = c, h = t.rows.length, l = new Uint32Array(t.rows), u = new Uint32Array(t.cols), p = new Float32Array(h).fill(0), m = new Float32Array(h);
-  for (let _ = 0; _ < h; _++)
-    m[_] = r[_] / i;
-  for (let _ = 0; _ < g; _++) {
-    d == null || d(_, g);
-    const w = 1 - _ / g;
-    for (let b = 0; b < h; b++) {
-      if (p[b] > _) continue;
-      const A = l[b], x = u[b];
-      let U = 0;
-      for (let v = 0; v < n; v++) {
-        const S = e[A * n + v] - e[x * n + v];
-        U += S * S;
+function j(e, t, f, a, s, u, c, d) {
+  const { a: o, b: n, gamma: r = 1, negativeSampleRate: i = 5 } = c, h = t.rows.length, l = new Uint32Array(t.rows), p = new Uint32Array(t.cols), g = new Float32Array(f), _ = new Float32Array(h);
+  for (let m = 0; m < h; m++)
+    _[m] = f[m] / i;
+  for (let m = 0; m < u; m++) {
+    d == null || d(m, u);
+    const b = 1 - m / u;
+    for (let y = 0; y < h; y++) {
+      if (g[y] > m) continue;
+      const x = l[y], v = p[y];
+      let G = 0;
+      for (let M = 0; M < s; M++) {
+        const E = e[x * s + M] - e[v * s + M];
+        G += E * E;
       }
-      const N = Math.pow(U, a), R = -2 * f * a * (U > 0 ? N / U : 0) / (f * N + 1);
-      for (let v = 0; v < n; v++) {
-        const S = e[A * n + v] - e[x * n + v], y = z(R * S);
-        e[A * n + v] += w * y, e[x * n + v] -= w * y;
+      const P = Math.pow(G, n), U = -2 * o * n * (G > 0 ? P / G : 0) / (o * P + 1);
+      for (let M = 0; M < s; M++) {
+        const E = e[x * s + M] - e[v * s + M], w = I(U * E);
+        e[x * s + M] += b * w, e[v * s + M] -= b * w;
       }
-      p[b] += r[b];
-      const O = r[b] / i, M = Math.max(0, Math.floor(
-        (_ - m[b]) / O
+      g[y] += f[y];
+      const F = f[y] / i, N = Math.max(0, Math.floor(
+        (m - _[y]) / F
       ));
-      m[b] += M * O;
-      for (let v = 0; v < M; v++) {
-        const S = Math.floor(Math.random() * s);
-        if (S === A) continue;
-        let y = 0;
-        for (let E = 0; E < n; E++) {
-          const P = e[A * n + E] - e[S * n + E];
-          y += P * P;
+      _[y] += N * F;
+      for (let M = 0; M < N; M++) {
+        const E = Math.floor(Math.random() * a);
+        if (E === x) continue;
+        let w = 0;
+        for (let B = 0; B < s; B++) {
+          const O = e[x * s + B] - e[E * s + B];
+          w += O * O;
         }
-        const B = Math.pow(y, a), k = 2 * o * a / ((1e-3 + y) * (f * B + 1));
-        for (let E = 0; E < n; E++) {
-          const P = e[A * n + E] - e[S * n + E], F = z(k * P);
-          e[A * n + E] += w * F;
+        const C = Math.pow(w, n), A = 2 * r * n / ((1e-3 + w) * (o * C + 1));
+        for (let B = 0; B < s; B++) {
+          const O = e[x * s + B] - e[E * s + B], S = I(A * O);
+          e[x * s + B] += b * S;
         }
       }
     }
   }
   return e;
 }
-function ee(e, t, r, s, n, g, c, d, f, a) {
-  const { a: o, b: i, gamma: h = 1, negativeSampleRate: l = 5 } = f, u = r.rows.length, p = new Uint32Array(r.rows), m = new Uint32Array(r.cols), _ = new Float32Array(u).fill(0), w = new Float32Array(u);
-  for (let b = 0; b < u; b++)
-    w[b] = s[b] / l;
-  for (let b = 0; b < d; b++) {
-    const A = 1 - b / d;
-    for (let x = 0; x < u; x++) {
-      if (_[x] > b) continue;
-      const U = p[x], N = m[x];
-      let R = 0;
-      for (let y = 0; y < c; y++) {
-        const B = e[U * c + y] - t[N * c + y];
-        R += B * B;
+function fe(e, t, f, a, s, u, c, d, o, n) {
+  const { a: r, b: i, gamma: h = 1, negativeSampleRate: l = 5 } = o, p = f.rows.length, g = new Uint32Array(f.rows), _ = new Uint32Array(f.cols), m = new Float32Array(a), b = new Float32Array(p);
+  for (let y = 0; y < p; y++)
+    b[y] = a[y] / l;
+  for (let y = 0; y < d; y++) {
+    const x = 1 - y / d;
+    for (let v = 0; v < p; v++) {
+      if (m[v] > y) continue;
+      const G = g[v], P = _[v];
+      let U = 0;
+      for (let w = 0; w < c; w++) {
+        const C = e[G * c + w] - t[P * c + w];
+        U += C * C;
       }
-      const O = Math.pow(R, i), M = -2 * o * i * (R > 0 ? O / R : 0) / (o * O + 1);
-      for (let y = 0; y < c; y++) {
-        const B = e[U * c + y] - t[N * c + y];
-        e[U * c + y] += A * z(M * B);
+      const F = Math.pow(U, i), N = -2 * r * i * (U > 0 ? F / U : 0) / (r * F + 1);
+      for (let w = 0; w < c; w++) {
+        const C = e[G * c + w] - t[P * c + w];
+        e[G * c + w] += x * I(N * C);
       }
-      _[x] += s[x];
-      const v = s[x] / l, S = Math.max(0, Math.floor(
-        (b - w[x]) / v
+      m[v] += a[v];
+      const M = a[v] / l, E = Math.max(0, Math.floor(
+        (y - b[v]) / M
       ));
-      w[x] += S * v;
-      for (let y = 0; y < S; y++) {
-        const B = Math.floor(Math.random() * g);
-        if (B === N) continue;
-        let k = 0;
-        for (let F = 0; F < c; F++) {
-          const q = e[U * c + F] - t[B * c + F];
-          k += q * q;
+      b[v] += E * M;
+      for (let w = 0; w < E; w++) {
+        const C = Math.floor(Math.random() * u);
+        if (C === P) continue;
+        let A = 0;
+        for (let S = 0; S < c; S++) {
+          const k = e[G * c + S] - t[C * c + S];
+          A += k * k;
         }
-        const E = Math.pow(k, i), P = 2 * h * i / ((1e-3 + k) * (o * E + 1));
-        for (let F = 0; F < c; F++) {
-          const q = e[U * c + F] - t[B * c + F];
-          e[U * c + F] += A * z(P * q);
+        const B = Math.pow(A, i), O = 2 * h * i / ((1e-3 + A) * (r * B + 1));
+        for (let S = 0; S < c; S++) {
+          const k = e[G * c + S] - t[C * c + S];
+          e[G * c + S] += x * I(O * k);
         }
       }
     }
   }
   return e;
 }
-function K() {
-  return typeof navigator < "u" && !!navigator.gpu;
-}
-async function re(e, t = {}, r) {
+async function pe(e, t = {}, f) {
   const {
-    nComponents: s = 2,
-    nNeighbors: n = 15,
-    minDist: g = 0.1,
+    nComponents: a = 2,
+    nNeighbors: s = 15,
+    minDist: u = 0.1,
     spread: c = 1,
     hnsw: d = {}
-  } = t, f = t.nEpochs ?? (e.length > 1e4 ? 200 : 500);
+  } = t, o = t.nEpochs ?? (e.length > 1e4 ? 200 : 500);
   console.time("knn");
-  const { indices: a, distances: o } = await Q(e, n, {
+  const { indices: n, distances: r } = await se(e, s, {
     M: d.M ?? 16,
     efConstruction: d.efConstruction ?? 200,
     efSearch: d.efSearch ?? 50
   });
   console.timeEnd("knn"), console.time("fuzzy-set");
-  const i = L(a, o, n);
+  const i = V(n, r, s);
   console.timeEnd("fuzzy-set");
-  const { a: h, b: l } = H(g, c), u = T(i.vals), p = e.length, m = new Float32Array(p * s);
-  for (let w = 0; w < m.length; w++)
-    m[w] = Math.random() * 20 - 10;
+  const { a: h, b: l } = Z(u, c), p = W(i.vals), g = e.length, _ = new Float32Array(g * a);
+  for (let b = 0; b < _.length; b++)
+    _[b] = Math.random() * 20 - 10;
   console.time("sgd");
-  let _;
-  if (K())
+  let m;
+  if (J())
     try {
-      const w = new j();
-      await w.init(), _ = await w.optimize(
-        m,
+      const b = new X();
+      await b.init(), m = await b.optimize(
+        _,
         new Uint32Array(i.rows),
         new Uint32Array(i.cols),
-        u,
         p,
-        s,
-        f,
+        g,
+        a,
+        o,
         { a: h, b: l, gamma: 1, negativeSampleRate: 5 },
-        r
+        f
       );
-    } catch (w) {
-      console.warn("WebGPU SGD failed, falling back to CPU:", w), _ = I(m, i, u, p, s, f, { a: h, b: l }, r);
+    } catch (b) {
+      console.warn("WebGPU SGD failed, falling back to CPU:", b), m = j(_, i, p, g, a, o, { a: h, b: l }, f);
     }
   else
-    _ = I(m, i, u, p, s, f, { a: h, b: l }, r);
-  return console.timeEnd("sgd"), _;
+    m = j(_, i, p, g, a, o, { a: h, b: l }, f);
+  return console.timeEnd("sgd"), m;
 }
-function H(e, t) {
-  if (Math.abs(t - 1) < 1e-6 && Math.abs(e - 0.1) < 1e-6)
-    return { a: 1.9292, b: 0.7915 };
-  if (Math.abs(t - 1) < 1e-6 && Math.abs(e - 0) < 1e-6)
-    return { a: 1.8956, b: 0.8006 };
-  if (Math.abs(t - 1) < 1e-6 && Math.abs(e - 0.5) < 1e-6)
-    return { a: 1.5769, b: 0.8951 };
-  const r = te(e, t);
-  return { a: ne(e, t, r), b: r };
+function Z(e, t) {
+  return Math.abs(t - 1) < 1e-6 && Math.abs(e - 0.1) < 1e-6 ? { a: 1.9292, b: 0.7915 } : Math.abs(t - 1) < 1e-6 && Math.abs(e - 0) < 1e-6 ? { a: 1.8956, b: 0.8006 } : Math.abs(t - 1) < 1e-6 && Math.abs(e - 0.5) < 1e-6 ? { a: 1.5769, b: 0.8951 } : de(e, t);
 }
-function te(e, t) {
-  return 1 / (t * 1.2);
-}
-function ne(e, t, r) {
-  return e < 1e-6 ? 1.8956 : (1 / (1 + 1e-3) - 1) / -Math.pow(e, 2 * r);
+function de(e, t) {
+  const a = [], s = [];
+  for (let o = 0; o < 299; o++) {
+    const n = (o + 1) / 299 * t * 3;
+    a.push(n), s.push(n < e ? 1 : Math.exp(-(n - e) / t));
+  }
+  let u = 1, c = 1, d = 1e-3;
+  for (let o = 0; o < 500; o++) {
+    let n = 0, r = 0, i = 0, h = 0, l = 0, p = 0;
+    for (let U = 0; U < 299; U++) {
+      const F = a[U], N = Math.pow(F, 2 * c), M = 1 + u * N, w = 1 / M - s[U];
+      p += w * w;
+      const C = M * M, A = -N / C, B = F > 0 ? -2 * Math.log(F) * u * N / C : 0;
+      n += A * w, r += B * w, i += A * A, h += B * B, l += A * B;
+    }
+    const g = i + d, _ = h + d, m = l, b = g * _ - m * m;
+    if (Math.abs(b) < 1e-20) break;
+    const y = -(_ * n - m * r) / b, x = -(g * r - m * n) / b, v = Math.max(1e-4, u + y), G = Math.max(1e-4, c + x);
+    let P = 0;
+    for (let U = 0; U < 299; U++) {
+      const F = Math.pow(a[U], 2 * G), N = 1 / (1 + v * F) - s[U];
+      P += N * N;
+    }
+    if (P < p ? (u = v, c = G, d = Math.max(1e-10, d / 10)) : d = Math.min(1e10, d * 10), Math.abs(y) < 1e-8 && Math.abs(x) < 1e-8) break;
+  }
+  return { a: u, b: c };
 }
-class ie {
+class ge {
   constructor(t = {}) {
-    G(this, "_nComponents");
-    G(this, "_nNeighbors");
-    G(this, "_minDist");
-    G(this, "_spread");
-    G(this, "_nEpochs");
-    G(this, "_hnswOpts");
-    G(this, "_a");
-    G(this, "_b");
+    R(this, "_nComponents");
+    R(this, "_nNeighbors");
+    R(this, "_minDist");
+    R(this, "_spread");
+    R(this, "_nEpochs");
+    R(this, "_hnswOpts");
+    R(this, "_a");
+    R(this, "_b");
     /** The low-dimensional embedding produced by the last fit() call. */
-    G(this, "embedding", null);
-    G(this, "_hnswIndex", null);
-    G(this, "_nTrain", 0);
+    R(this, "embedding", null);
+    R(this, "_hnswIndex", null);
+    R(this, "_nTrain", 0);
     this._nComponents = t.nComponents ?? 2, this._nNeighbors = t.nNeighbors ?? 15, this._minDist = t.minDist ?? 0.1, this._spread = t.spread ?? 1, this._nEpochs = t.nEpochs, this._hnswOpts = t.hnsw ?? {};
-    const { a: r, b: s } = H(this._minDist, this._spread);
-    this._a = r, this._b = s;
+    const { a: f, b: a } = Z(this._minDist, this._spread);
+    this._a = f, this._b = a;
   }
   /**
    * Train UMAP on `vectors`.
@@ -449,45 +542,45 @@ class ie {
    * index so that transform() can project new points later.
    * Returns `this` for chaining.
    */
-  async fit(t, r) {
-    const s = t.length, n = this._nEpochs ?? (s > 1e4 ? 200 : 500), { M: g = 16, efConstruction: c = 200, efSearch: d = 50 } = this._hnswOpts;
+  async fit(t, f) {
+    const a = t.length, s = this._nEpochs ?? (a > 1e4 ? 200 : 500), { M: u = 16, efConstruction: c = 200, efSearch: d = 50 } = this._hnswOpts;
     console.time("knn");
-    const { knn: f, index: a } = await J(t, this._nNeighbors, {
-      M: g,
+    const { knn: o, index: n } = await ae(t, this._nNeighbors, {
+      M: u,
       efConstruction: c,
       efSearch: d
     });
-    this._hnswIndex = a, this._nTrain = s, console.timeEnd("knn"), console.time("fuzzy-set");
-    const o = L(f.indices, f.distances, this._nNeighbors);
+    this._hnswIndex = n, this._nTrain = a, console.timeEnd("knn"), console.time("fuzzy-set");
+    const r = V(o.indices, o.distances, this._nNeighbors);
     console.timeEnd("fuzzy-set");
-    const i = T(o.vals), h = new Float32Array(s * this._nComponents);
+    const i = W(r.vals), h = new Float32Array(a * this._nComponents);
     for (let l = 0; l < h.length; l++)
       h[l] = Math.random() * 20 - 10;
-    if (console.time("sgd"), K())
+    if (console.time("sgd"), J())
       try {
-        const l = new j();
+        const l = new X();
         await l.init(), this.embedding = await l.optimize(
           h,
-          new Uint32Array(o.rows),
-          new Uint32Array(o.cols),
+          new Uint32Array(r.rows),
+          new Uint32Array(r.cols),
           i,
-          s,
+          a,
           this._nComponents,
-          n,
+          s,
           { a: this._a, b: this._b, gamma: 1, negativeSampleRate: 5 },
-          r
+          f
         );
       } catch (l) {
-        console.warn("WebGPU SGD failed, falling back to CPU:", l), this.embedding = I(h, o, i, s, this._nComponents, n, {
+        console.warn("WebGPU SGD failed, falling back to CPU:", l), this.embedding = j(h, r, i, a, this._nComponents, s, {
           a: this._a,
           b: this._b
-        }, r);
+        }, f);
       }
     else
-      this.embedding = I(h, o, i, s, this._nComponents, n, {
+      this.embedding = j(h, r, i, a, this._nComponents, s, {
         a: this._a,
         b: this._b
-      }, r);
+      }, f);
     return console.timeEnd("sgd"), this;
   }
   /**
@@ -501,35 +594,35 @@ class ie {
    *   returned embedding to [0, 1].  The stored training embedding is never
    *   mutated.  Defaults to `false`.
    */
-  async transform(t, r = !1) {
+  async transform(t, f = !1) {
     if (!this._hnswIndex || !this.embedding)
       throw new Error("UMAP.transform() must be called after fit()");
-    const s = t.length, n = this._nEpochs ?? (this._nTrain > 1e4 ? 200 : 500), g = Math.max(100, Math.floor(n / 4)), c = this._hnswIndex.searchKnn(t, this._nNeighbors), d = X(c.indices, c.distances, this._nNeighbors), f = new Uint32Array(d.rows), a = new Uint32Array(d.cols), o = new Float32Array(s), i = new Float32Array(s * this._nComponents);
-    for (let u = 0; u < f.length; u++) {
-      const p = f[u], m = a[u], _ = d.vals[u];
-      o[p] += _;
-      for (let w = 0; w < this._nComponents; w++)
-        i[p * this._nComponents + w] += _ * this.embedding[m * this._nComponents + w];
+    const a = t.length, s = this._nEpochs ?? (this._nTrain > 1e4 ? 200 : 500), u = Math.max(100, Math.floor(s / 4)), c = this._hnswIndex.searchKnn(t, this._nNeighbors), d = re(c.indices, c.distances, this._nNeighbors), o = new Uint32Array(d.rows), n = new Uint32Array(d.cols), r = new Float32Array(a), i = new Float32Array(a * this._nComponents);
+    for (let p = 0; p < o.length; p++) {
+      const g = o[p], _ = n[p], m = d.vals[p];
+      r[g] += m;
+      for (let b = 0; b < this._nComponents; b++)
+        i[g * this._nComponents + b] += m * this.embedding[_ * this._nComponents + b];
     }
-    for (let u = 0; u < s; u++)
-      if (o[u] > 0)
-        for (let p = 0; p < this._nComponents; p++)
-          i[u * this._nComponents + p] /= o[u];
+    for (let p = 0; p < a; p++)
+      if (r[p] > 0)
+        for (let g = 0; g < this._nComponents; g++)
+          i[p * this._nComponents + g] /= r[p];
       else
-        for (let p = 0; p < this._nComponents; p++)
-          i[u * this._nComponents + p] = Math.random() * 20 - 10;
-    const h = T(d.vals), l = ee(
+        for (let g = 0; g < this._nComponents; g++)
+          i[p * this._nComponents + g] = Math.random() * 20 - 10;
+    const h = W(d.vals), l = fe(
       i,
       this.embedding,
       d,
       h,
-      s,
+      a,
       this._nTrain,
       this._nComponents,
-      g,
+      u,
       { a: this._a, b: this._b }
     );
-    return r ? C(l, s, this._nComponents) : l;
+    return f ? K(l, a, this._nComponents) : l;
   }
   /**
    * Convenience method equivalent to `fit(vectors)` followed by
@@ -540,37 +633,38 @@ class ie {
    *   returned embedding to [0, 1].  `this.embedding` is never mutated.
    *   Defaults to `false`.
    */
-  async fit_transform(t, r, s = !1) {
-    return await this.fit(t, r), s ? C(this.embedding, t.length, this._nComponents) : this.embedding;
+  async fit_transform(t, f, a = !1) {
+    return await this.fit(t, f), a ? K(this.embedding, t.length, this._nComponents) : this.embedding;
   }
 }
-function C(e, t, r) {
-  const s = new Float32Array(e.length);
-  for (let n = 0; n < r; n++) {
-    let g = 1 / 0, c = -1 / 0;
-    for (let f = 0; f < t; f++) {
-      const a = e[f * r + n];
-      a < g && (g = a), a > c && (c = a);
+function K(e, t, f) {
+  const a = new Float32Array(e.length);
+  for (let s = 0; s < f; s++) {
+    let u = 1 / 0, c = -1 / 0;
+    for (let o = 0; o < t; o++) {
+      const n = e[o * f + s];
+      n < u && (u = n), n > c && (c = n);
     }
-    const d = c - g;
-    for (let f = 0; f < t; f++)
-      s[f * r + n] = d > 0 ? (e[f * r + n] - g) / d : 0;
+    const d = c - u;
+    for (let o = 0; o < t; o++)
+      a[o * f + s] = d > 0 ? (e[o * f + s] - u) / d : 0;
   }
-  return s;
+  return a;
 }
-function T(e, t) {
-  let r = -1 / 0;
-  for (let n = 0; n < e.length; n++)
-    e[n] > r && (r = e[n]);
-  const s = new Float32Array(e.length);
-  for (let n = 0; n < e.length; n++) {
-    const g = e[n] / r;
-    s[n] = g > 0 ? 1 / g : -1;
+function W(e, t) {
+  let f = -1 / 0;
+  for (let s = 0; s < e.length; s++)
+    e[s] > f && (f = e[s]);
+  const a = new Float32Array(e.length);
+  for (let s = 0; s < e.length; s++) {
+    const u = e[s] / f;
+    a[s] = u > 0 ? 1 / u : -1;
   }
-  return s;
+  return a;
 }
 export {
-  ie as UMAP,
-  re as fit,
-  K as isWebGPUAvailable
+  ge as UMAP,
+  he as checkWebGPUAvailable,
+  pe as fit,
+  J as isWebGPUAvailable
 };

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "umap-gpu",
-  "version": "0.2.13",
+  "version": "0.2.15",
   "description": "UMAP with HNSW kNN and WebGPU-accelerated SGD",
   "type": "module",
   "main": "dist/index.js",
@@ -55,7 +55,8 @@
     "vite": "^5.0.0",
     "vitepress": "^1.6.4",
     "vitepress-plugin-llms": "^1.11.0",
-    "vitest": "^4.0.18"
+    "vitest": "^4.0.18",
+    "webgpu": "^0.3.8"
   },
   "license": "MIT"
 }