@softerist/heuristic-mcp 3.0.15 → 3.0.16
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +104 -104
- package/config.jsonc +173 -173
- package/features/ann-config.js +131 -0
- package/features/clear-cache.js +84 -0
- package/features/find-similar-code.js +291 -0
- package/features/hybrid-search.js +544 -0
- package/features/index-codebase.js +3268 -0
- package/features/lifecycle.js +1189 -0
- package/features/package-version.js +302 -0
- package/features/register.js +408 -0
- package/features/resources.js +156 -0
- package/features/set-workspace.js +265 -0
- package/index.js +96 -96
- package/lib/cache-ops.js +22 -22
- package/lib/cache-utils.js +565 -565
- package/lib/cache.js +1870 -1870
- package/lib/call-graph.js +396 -396
- package/lib/cli.js +1 -1
- package/lib/config.js +517 -517
- package/lib/constants.js +39 -39
- package/lib/embed-query-process.js +7 -7
- package/lib/embedding-process.js +7 -7
- package/lib/embedding-worker.js +299 -299
- package/lib/ignore-patterns.js +316 -316
- package/lib/json-worker.js +14 -14
- package/lib/json-writer.js +337 -337
- package/lib/logging.js +164 -164
- package/lib/memory-logger.js +13 -13
- package/lib/onnx-backend.js +193 -193
- package/lib/project-detector.js +84 -84
- package/lib/server-lifecycle.js +165 -165
- package/lib/settings-editor.js +754 -754
- package/lib/tokenizer.js +256 -256
- package/lib/utils.js +428 -428
- package/lib/vector-store-binary.js +627 -627
- package/lib/vector-store-sqlite.js +95 -95
- package/lib/workspace-env.js +28 -28
- package/mcp_config.json +9 -9
- package/package.json +86 -75
- package/scripts/clear-cache.js +20 -0
- package/scripts/download-model.js +43 -0
- package/scripts/mcp-launcher.js +49 -0
- package/scripts/postinstall.js +12 -0
- package/search-configs.js +36 -36
- package/.prettierrc +0 -7
- package/debug-pids.js +0 -30
- package/eslint.config.js +0 -36
- package/specs/plan.md +0 -23
- package/vitest.config.js +0 -39
package/lib/embedding-worker.js
CHANGED
@@ -24,51 +24,51 @@ console.info = (...args) => console.error('[INFO]', ...args);
 console.warn = (...args) => console.error('[WARN]', ...args);
 
 import { RESULT_BATCH_SIZE, DEFAULT_INFERENCE_BATCH_SIZE } from './constants.js';
-const workerId = Number.isInteger(workerData.workerId) ? workerData.workerId : null;
-const workerLabel = workerId === null ? '[Worker]' : `[Worker ${workerId}]`;
-const workerThreads = Number.isFinite(workerData.numThreads) ? workerData.numThreads : 1;
-const explicitGcEnabled = workerData.enableExplicitGc !== false;
-const failFastEmbeddingErrors = workerData.failFastEmbeddingErrors === true;
-const FAIL_FAST_CONSECUTIVE_ERROR_LIMIT = 8;
-const logInfo = (...args) => {
-  console.info(...args);
-};
-let nativeBackendConfigured = false;
-
-function maybeRunGc() {
-  if (!explicitGcEnabled || typeof global.gc !== 'function') return;
-  global.gc();
-}
-
-function createFailFastState(scope) {
-  if (!failFastEmbeddingErrors) return null;
-  return { scope, consecutiveFailures: 0 };
-}
-
-function noteEmbeddingSuccess(failFastState) {
-  if (!failFastState) return;
-  failFastState.consecutiveFailures = 0;
-}
-
-function noteEmbeddingFailure(failFastState, err) {
-  if (!failFastState) return;
-  failFastState.consecutiveFailures += 1;
-
-  if (failFastState.consecutiveFailures >= FAIL_FAST_CONSECUTIVE_ERROR_LIMIT) {
-    const message =
-      `${failFastState.scope}: fail-fast breaker tripped after ` +
-      `${failFastState.consecutiveFailures} consecutive embedding failures (${err?.message || err})`;
-    console.warn(`${workerLabel} ${message}`);
-    throw new Error(message);
-  }
-
-  if (workerData.verbose) {
-    console.warn(
-      `${workerLabel} ${failFastState.scope}: embedding failure ` +
-      `${failFastState.consecutiveFailures}/${FAIL_FAST_CONSECUTIVE_ERROR_LIMIT}`
-    );
-  }
-}
+const workerId = Number.isInteger(workerData.workerId) ? workerData.workerId : null;
+const workerLabel = workerId === null ? '[Worker]' : `[Worker ${workerId}]`;
+const workerThreads = Number.isFinite(workerData.numThreads) ? workerData.numThreads : 1;
+const explicitGcEnabled = workerData.enableExplicitGc !== false;
+const failFastEmbeddingErrors = workerData.failFastEmbeddingErrors === true;
+const FAIL_FAST_CONSECUTIVE_ERROR_LIMIT = 8;
+const logInfo = (...args) => {
+  console.info(...args);
+};
+let nativeBackendConfigured = false;
+
+function maybeRunGc() {
+  if (!explicitGcEnabled || typeof global.gc !== 'function') return;
+  global.gc();
+}
+
+function createFailFastState(scope) {
+  if (!failFastEmbeddingErrors) return null;
+  return { scope, consecutiveFailures: 0 };
+}
+
+function noteEmbeddingSuccess(failFastState) {
+  if (!failFastState) return;
+  failFastState.consecutiveFailures = 0;
+}
+
+function noteEmbeddingFailure(failFastState, err) {
+  if (!failFastState) return;
+  failFastState.consecutiveFailures += 1;
+
+  if (failFastState.consecutiveFailures >= FAIL_FAST_CONSECUTIVE_ERROR_LIMIT) {
+    const message =
+      `${failFastState.scope}: fail-fast breaker tripped after ` +
+      `${failFastState.consecutiveFailures} consecutive embedding failures (${err?.message || err})`;
+    console.warn(`${workerLabel} ${message}`);
+    throw new Error(message);
+  }
+
+  if (workerData.verbose) {
+    console.warn(
+      `${workerLabel} ${failFastState.scope}: embedding failure ` +
+      `${failFastState.consecutiveFailures}/${FAIL_FAST_CONSECUTIVE_ERROR_LIMIT}`
+    );
+  }
+}
 
 function ensureNativeBackend() {
   if (nativeBackendConfigured) return;
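The hunk above carries the worker's fail-fast circuit breaker: failures are counted per scope, any success resets the count, and the eighth consecutive failure aborts the task instead of silently skipping every remaining chunk. A minimal standalone sketch of that pattern (all names here are illustrative, not the package's API):

```js
// Consecutive-failure breaker sketch; `makeBreaker` etc. are hypothetical.
const LIMIT = 8;

const makeBreaker = (scope) => ({ scope, consecutiveFailures: 0 });
const recordSuccess = (b) => { b.consecutiveFailures = 0; };
const recordFailure = (b, err) => {
  if (++b.consecutiveFailures >= LIMIT) {
    // Trip: abort the whole task rather than skip every item one by one.
    throw new Error(`${b.scope}: ${b.consecutiveFailures} consecutive failures (${err.message})`);
  }
};

const breaker = makeBreaker('demo embedding');
const flakyEmbed = () => { throw new Error('runtime exception'); };

try {
  for (let i = 0; i < 20; i++) {
    try {
      flakyEmbed();
      recordSuccess(breaker); // reset: only an unbroken run of failures trips it
    } catch (err) {
      recordFailure(breaker, err);
    }
  }
} catch (tripped) {
  console.warn(tripped.message); // fires on the 8th consecutive failure
}
```

Resetting on success is the important detail: a codebase with a few isolated bad inputs still indexes, while a wedged ONNX runtime fails the task quickly.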
@@ -172,7 +172,7 @@ const embeddingDimension = workerData.embeddingDimension || null;
 // Use a promise to handle concurrent calls to initializeEmbedder safely
 let embedderPromise = null;
 
-async function initializeEmbedder() {
+async function initializeEmbedder() {
   if (!embedderPromise) {
     const modelLoadStart = Date.now();
 
@@ -183,16 +183,16 @@ async function initializeEmbedder() {
 
     embedderPromise = (async () => {
       try {
-        ensureNativeBackend();
-        const model = await pipeline('feature-extraction', workerData.embeddingModel, {
-          quantized: true,
-          dtype: 'fp32',
-          session_options: {
-            numThreads: workerThreads,
-            intraOpNumThreads: workerThreads,
-            interOpNumThreads: 1,
-          },
-        });
+        ensureNativeBackend();
+        const model = await pipeline('feature-extraction', workerData.embeddingModel, {
+          quantized: true,
+          dtype: 'fp32',
+          session_options: {
+            numThreads: workerThreads,
+            intraOpNumThreads: workerThreads,
+            interOpNumThreads: 1,
+          },
+        });
         const loadSeconds = ((Date.now() - modelLoadStart) / 1000).toFixed(1);
         logInfo(
           `${workerLabel} Embedding model ready: ${workerData.embeddingModel} (${loadSeconds}s)`
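`initializeEmbedder`, reformatted above, caches a single in-flight promise so concurrent callers share one model load. A runnable sketch of that pattern, with a stand-in for the real `pipeline('feature-extraction', ...)` call:

```js
// Share-one-promise initialization sketch (ESM, so top-level await works).
// loadModel body is a made-up placeholder for the expensive pipeline() call.
let modelPromise = null;

function getModel() {
  if (!modelPromise) {
    modelPromise = (async () => {
      await new Promise((r) => setTimeout(r, 50)); // simulated one-time load
      return { embed: (text) => text.length };
    })();
  }
  return modelPromise; // every caller awaits the same promise
}

// Two "concurrent" callers trigger exactly one load.
const [a, b] = await Promise.all([getModel(), getModel()]);
console.log(a === b); // true
```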
@@ -204,48 +204,48 @@ async function initializeEmbedder() {
       }
     })();
   }
-  return embedderPromise;
-}
-
-function isFatalRuntimeEmbeddingError(err) {
-  const message = String(err?.message || err || '').toLowerCase();
-  return (
-    message.includes('exception is pending') ||
-    message.includes('invalid embedding output') ||
-    message.includes("cannot read properties of undefined (reading 'data')") ||
-    message.includes("cannot read properties of null (reading 'data')")
-  );
-}
-
-function getEmbeddingTensor(output, { requireDimsForBatch = false, batchSize = null } = {}) {
-  const data = output?.data;
-  if (!data || typeof data.length !== 'number') {
-    throw new Error('Invalid embedding output: missing tensor data');
-  }
-  if (!requireDimsForBatch) {
-    return { data };
-  }
-
-  const dims = Array.isArray(output?.dims) ? output.dims : null;
-  const hiddenSize = Number.isInteger(dims?.[dims.length - 1]) ? dims[dims.length - 1] : null;
-  if (!hiddenSize || hiddenSize <= 0) {
-    throw new Error('Invalid embedding output: missing tensor dims');
-  }
-  if (Number.isInteger(batchSize) && batchSize > 0 && data.length < hiddenSize * batchSize) {
-    throw new Error('Invalid embedding output: tensor length mismatch');
-  }
-  return { data, hiddenSize };
-}
-
-/**
- * Legacy Protocol: Process chunks with optimized single-text embedding
- * Streams results in batches.
- */
-async function processChunks(chunks, batchId) {
-  const embedder = await initializeEmbedder();
-  let results = [];
-  let transferList = [];
-  const failFastState = createFailFastState('legacy chunk embedding');
+  return embedderPromise;
+}
+
+function isFatalRuntimeEmbeddingError(err) {
+  const message = String(err?.message || err || '').toLowerCase();
+  return (
+    message.includes('exception is pending') ||
+    message.includes('invalid embedding output') ||
+    message.includes("cannot read properties of undefined (reading 'data')") ||
+    message.includes("cannot read properties of null (reading 'data')")
+  );
+}
+
+function getEmbeddingTensor(output, { requireDimsForBatch = false, batchSize = null } = {}) {
+  const data = output?.data;
+  if (!data || typeof data.length !== 'number') {
+    throw new Error('Invalid embedding output: missing tensor data');
+  }
+  if (!requireDimsForBatch) {
+    return { data };
+  }
+
+  const dims = Array.isArray(output?.dims) ? output.dims : null;
+  const hiddenSize = Number.isInteger(dims?.[dims.length - 1]) ? dims[dims.length - 1] : null;
+  if (!hiddenSize || hiddenSize <= 0) {
+    throw new Error('Invalid embedding output: missing tensor dims');
+  }
+  if (Number.isInteger(batchSize) && batchSize > 0 && data.length < hiddenSize * batchSize) {
+    throw new Error('Invalid embedding output: tensor length mismatch');
+  }
+  return { data, hiddenSize };
+}
+
+/**
+ * Legacy Protocol: Process chunks with optimized single-text embedding
+ * Streams results in batches.
+ */
+async function processChunks(chunks, batchId) {
+  const embedder = await initializeEmbedder();
+  let results = [];
+  let transferList = [];
+  const failFastState = createFailFastState('legacy chunk embedding');
 
   const flush = (done = false) => {
     // Only flush intermediate results when we have enough for a batch
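This hunk also reflows `isFatalRuntimeEmbeddingError`, which classifies errors by message text: certain ONNX/transformers.js failures leave the runtime unusable, so they are rethrown instead of being treated as per-chunk errors. A sketch of that classification (the patterns are copied from the diff above; the helper name is made up):

```js
// Message-sniffing sketch; FATAL_PATTERNS mirrors the hunk, looksFatal is hypothetical.
const FATAL_PATTERNS = [
  'exception is pending',
  'invalid embedding output',
  "cannot read properties of undefined (reading 'data')",
  "cannot read properties of null (reading 'data')",
];

function looksFatal(err) {
  const message = String(err?.message || err || '').toLowerCase();
  return FATAL_PATTERNS.some((p) => message.includes(p));
}

console.log(looksFatal(new Error('Exception is pending'))); // true: rethrow
console.log(looksFatal(new Error('tokenizer warning')));    // false: skip the chunk
```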
@@ -270,16 +270,16 @@ async function processChunks(chunks, batchId) {
   };
 
   for (const chunk of chunks) {
-    try {
-      const output = await embedder(chunk.text, {
-        pooling: 'mean',
-        normalize: true,
-      });
-      // CRITICAL: Deep copy to release ONNX tensor memory
-      const { data } = getEmbeddingTensor(output);
-      let vector = new Float32Array(data);
-      // Apply MRL dimension slicing if configured
-      vector = sliceAndNormalize(vector, embeddingDimension);
+    try {
+      const output = await embedder(chunk.text, {
+        pooling: 'mean',
+        normalize: true,
+      });
+      // CRITICAL: Deep copy to release ONNX tensor memory
+      const { data } = getEmbeddingTensor(output);
+      let vector = new Float32Array(data);
+      // Apply MRL dimension slicing if configured
+      vector = sliceAndNormalize(vector, embeddingDimension);
       // Properly dispose tensor to release ONNX runtime memory
       if (typeof output.dispose === 'function')
         try {
@@ -289,37 +289,37 @@ async function processChunks(chunks, batchId) {
             console.warn(`${workerLabel} Failed to dispose tensor: ${disposeErr.message}`);
          }
        }
-      results.push({
-        file: chunk.file,
-        startLine: chunk.startLine,
-        endLine: chunk.endLine,
-        content: chunk.text,
-        vector,
-        success: true,
-      });
-      transferList.push(vector.buffer);
-      noteEmbeddingSuccess(failFastState);
-    } catch (error) {
-      results.push({
-        file: chunk.file,
-        startLine: chunk.startLine,
-        endLine: chunk.endLine,
-        error: error.message,
-        success: false,
-      });
-      noteEmbeddingFailure(failFastState, error);
-      if (isFatalRuntimeEmbeddingError(error)) {
-        throw error;
-      }
-    }
-    flush();
-  }
-
-  flush(true);
-
-  // Force GC if available to free massive tensor buffers immediately
-  maybeRunGc();
-}
+      results.push({
+        file: chunk.file,
+        startLine: chunk.startLine,
+        endLine: chunk.endLine,
+        content: chunk.text,
+        vector,
+        success: true,
+      });
+      transferList.push(vector.buffer);
+      noteEmbeddingSuccess(failFastState);
+    } catch (error) {
+      results.push({
+        file: chunk.file,
+        startLine: chunk.startLine,
+        endLine: chunk.endLine,
+        error: error.message,
+        success: false,
+      });
+      noteEmbeddingFailure(failFastState, error);
+      if (isFatalRuntimeEmbeddingError(error)) {
+        throw error;
+      }
+    }
+    flush();
+  }
+
+  flush(true);
+
+  // Force GC if available to free massive tensor buffers immediately
+  maybeRunGc();
+}
 
 // =====================================================================
 // SHARED HELPER FUNCTIONS
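The legacy path above accumulates `vector.buffer` in a `transferList` so the buffers can be moved, not cloned, when posted back to the main thread. A self-contained `worker_threads` demo of buffer transfer (a standalone illustration, not the package's actual message protocol):

```js
// Zero-copy transfer sketch: the second postMessage argument is the transfer
// list; the buffer is detached from the sender and owned by the receiver.
import { Worker, isMainThread, parentPort } from 'node:worker_threads';

if (isMainThread) {
  const worker = new Worker(new URL(import.meta.url));
  worker.on('message', ({ vector }) => {
    console.log('received', vector.length, 'floats'); // 384
    worker.terminate();
  });
} else {
  const vector = new Float32Array(384).fill(0.5);
  parentPort.postMessage({ vector }, [vector.buffer]);
  // After the transfer the local buffer is detached and unusable here.
  console.log('detached:', vector.buffer.byteLength === 0); // true
}
```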
@@ -434,9 +434,9 @@ function processFileMetadata(file, content, options) {
  * New Protocol: Process entire file (read, chunk, embed) in worker.
  * Returns results once processing is complete.
  */
-async function processFileTask(message) {
-  const embedder = await initializeEmbedder();
-  const failFastState = createFailFastState(`file-task ${path.basename(message.file || '')}`);
+async function processFileTask(message) {
+  const embedder = await initializeEmbedder();
+  const failFastState = createFailFastState(`file-task ${path.basename(message.file || '')}`);
 
   const file = message.file;
   const force = !!message.force;
@@ -488,38 +488,38 @@ async function processFileTask(message) {
 
   // Batch size for inference (balance between speed and memory)
   // Configurable via workerData, default 4 balances memory and throughput
-  const INFERENCE_BATCH_SIZE = Number.isInteger(workerData.inferenceBatchSize)
-    ? workerData.inferenceBatchSize
-    : DEFAULT_INFERENCE_BATCH_SIZE;
-  let processedSinceGc = 0;
-
-  for (let i = 0; i < chunks.length; i += INFERENCE_BATCH_SIZE) {
+  const INFERENCE_BATCH_SIZE = Number.isInteger(workerData.inferenceBatchSize)
+    ? workerData.inferenceBatchSize
+    : DEFAULT_INFERENCE_BATCH_SIZE;
+  let processedSinceGc = 0;
+
+  for (let i = 0; i < chunks.length; i += INFERENCE_BATCH_SIZE) {
     const batchChunks = chunks.slice(i, i + INFERENCE_BATCH_SIZE);
     const batchTexts = batchChunks.map((c) => c.text);
 
-    try {
-      // Run inference on the batch
-      const output = await embedder(batchTexts, {
-        pooling: 'mean',
-        normalize: true,
-      });
-
-      // Output is a Tensor with shape [batch_size, hidden_size]
-      // data is a flat Float32Array
-      const { data, hiddenSize } = getEmbeddingTensor(output, {
-        requireDimsForBatch: true,
-        batchSize: batchChunks.length,
-      });
-
-      for (let j = 0; j < batchChunks.length; j++) {
-        const c = batchChunks[j];
-
-        // Slice the flat buffer to get this chunk's vector
-        // specific slice for this element
-        const start = j * hiddenSize;
-        const end = start + hiddenSize;
-        const vectorView =
-          typeof data.subarray === 'function' ? data.subarray(start, end) : data.slice(start, end);
+    try {
+      // Run inference on the batch
+      const output = await embedder(batchTexts, {
+        pooling: 'mean',
+        normalize: true,
+      });
+
+      // Output is a Tensor with shape [batch_size, hidden_size]
+      // data is a flat Float32Array
+      const { data, hiddenSize } = getEmbeddingTensor(output, {
+        requireDimsForBatch: true,
+        batchSize: batchChunks.length,
+      });
+
+      for (let j = 0; j < batchChunks.length; j++) {
+        const c = batchChunks[j];
+
+        // Slice the flat buffer to get this chunk's vector
+        // specific slice for this element
+        const start = j * hiddenSize;
+        const end = start + hiddenSize;
+        const vectorView =
+          typeof data.subarray === 'function' ? data.subarray(start, end) : data.slice(start, end);
 
         // Deep copy to ensure independent buffer for transfer
         let vector = new Float32Array(vectorView);
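Batched inference above returns one flat `Float32Array` of shape `[batch_size, hidden_size]`; each chunk's vector is carved out with `subarray` and then deep-copied so its buffer can be transferred independently. A sketch of the arithmetic with made-up shapes:

```js
// Flat-tensor slicing sketch: batch of 3 vectors, 4 floats each.
const batchSize = 3;
const hiddenSize = 4;
const flat = Float32Array.from({ length: batchSize * hiddenSize }, (_, i) => i);

const vectors = [];
for (let j = 0; j < batchSize; j++) {
  const view = flat.subarray(j * hiddenSize, (j + 1) * hiddenSize); // no copy yet
  vectors.push(new Float32Array(view)); // deep copy: independent buffer
}

console.log(vectors[1]);                        // Float32Array [4, 5, 6, 7]
console.log(vectors[1].buffer === flat.buffer); // false: safe to transfer
```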
@@ -535,29 +535,29 @@ async function processFileTask(message) {
         transferList.push(vector.buffer);
       }
       // Properly dispose tensor to release ONNX runtime memory
-      if (typeof output.dispose === 'function')
-        try {
-          output.dispose();
-        } catch (disposeErr) {
-          if (workerData.verbose) {
-            console.warn(`${workerLabel} Failed to dispose tensor: ${disposeErr.message}`);
-          }
-        }
-      noteEmbeddingSuccess(failFastState);
-    } catch (err) {
-      if (isFatalRuntimeEmbeddingError(err)) {
-        noteEmbeddingFailure(failFastState, err);
-        throw err;
-      }
-      // Fallback: if batch fails (e.g. OOM), try one by one for this batch
-      console.warn(`${workerLabel} Batch inference failed (${err.name}), retrying individually: ${err.message}`);
-      noteEmbeddingFailure(failFastState, err);
-
-      for (const c of batchChunks) {
-        try {
-          const output = await embedder(c.text, { pooling: 'mean', normalize: true });
-          const { data } = getEmbeddingTensor(output);
-          let vector = new Float32Array(data);
+      if (typeof output.dispose === 'function')
+        try {
+          output.dispose();
+        } catch (disposeErr) {
+          if (workerData.verbose) {
+            console.warn(`${workerLabel} Failed to dispose tensor: ${disposeErr.message}`);
+          }
+        }
+      noteEmbeddingSuccess(failFastState);
+    } catch (err) {
+      if (isFatalRuntimeEmbeddingError(err)) {
+        noteEmbeddingFailure(failFastState, err);
+        throw err;
+      }
+      // Fallback: if batch fails (e.g. OOM), try one by one for this batch
+      console.warn(`${workerLabel} Batch inference failed (${err.name}), retrying individually: ${err.message}`);
+      noteEmbeddingFailure(failFastState, err);
+
+      for (const c of batchChunks) {
+        try {
+          const output = await embedder(c.text, { pooling: 'mean', normalize: true });
+          const { data } = getEmbeddingTensor(output);
+          let vector = new Float32Array(data);
           // Apply MRL dimension slicing if configured
           vector = sliceAndNormalize(vector, embeddingDimension);
           // Properly dispose tensor to release ONNX runtime memory
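The catch block above implements the batch fallback: when whole-batch inference fails (for example a transient OOM), each text is retried individually so one bad input costs only its own chunk. A condensed sketch of the strategy (`embedBatch` and `embedOne` are hypothetical stand-ins for the embedder calls):

```js
// Batch-with-individual-fallback sketch.
async function embedAll(texts, embedBatch, embedOne) {
  try {
    return await embedBatch(texts); // fast path: one inference call
  } catch (err) {
    console.warn(`batch failed (${err.message}), retrying individually`);
    const results = [];
    for (const text of texts) {
      try {
        results.push(await embedOne(text));
      } catch (innerErr) {
        // Skip just this item, mirroring how the worker omits failed chunks.
        console.warn(`item failed: ${innerErr.message}`);
      }
    }
    return results;
  }
}

// Demo: the batch call always fails, the per-item call succeeds.
const out = await embedAll(
  ['a', 'bb'],
  async () => { throw new Error('OOM'); },
  async (t) => new Float32Array([t.length])
);
console.log(out.length); // 2
```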
@@ -569,36 +569,36 @@ async function processFileTask(message) {
                console.warn(`${workerLabel} Failed to dispose tensor: ${disposeErr.message}`);
              }
            }
-          results.push({
-            startLine: c.startLine,
-            endLine: c.endLine,
-            text: c.text,
-            vectorBuffer: vector.buffer,
-          });
-          transferList.push(vector.buffer);
-          noteEmbeddingSuccess(failFastState);
-        } catch (innerErr) {
-          // Note: No tensor disposal needed - embedder() threw before returning a tensor
-          console.warn(`${workerLabel} Chunk embedding failed: ${innerErr.message}`);
-          // We omit this chunk from results, effectively skipping it
-          noteEmbeddingFailure(failFastState, innerErr);
-          if (isFatalRuntimeEmbeddingError(innerErr)) {
-            throw innerErr;
-          }
-        }
-      }
-    }
-
-    // Yield to event loop briefly between batches and trigger GC
-    processedSinceGc += batchChunks.length;
-    if (chunks.length > INFERENCE_BATCH_SIZE) {
-      if (processedSinceGc >= 100) {
-        maybeRunGc();
-        processedSinceGc = 0;
-      }
-      await new Promise((resolve) => setTimeout(resolve, 0));
-    }
-  }
+          results.push({
+            startLine: c.startLine,
+            endLine: c.endLine,
+            text: c.text,
+            vectorBuffer: vector.buffer,
+          });
+          transferList.push(vector.buffer);
+          noteEmbeddingSuccess(failFastState);
+        } catch (innerErr) {
+          // Note: No tensor disposal needed - embedder() threw before returning a tensor
+          console.warn(`${workerLabel} Chunk embedding failed: ${innerErr.message}`);
+          // We omit this chunk from results, effectively skipping it
+          noteEmbeddingFailure(failFastState, innerErr);
+          if (isFatalRuntimeEmbeddingError(innerErr)) {
+            throw innerErr;
+          }
+        }
+      }
+    }
+
+    // Yield to event loop briefly between batches and trigger GC
+    processedSinceGc += batchChunks.length;
+    if (chunks.length > INFERENCE_BATCH_SIZE) {
+      if (processedSinceGc >= 100) {
+        maybeRunGc();
+        processedSinceGc = 0;
+      }
+      await new Promise((resolve) => setTimeout(resolve, 0));
+    }
+  }
 
   return { status: 'indexed', hash, mtimeMs, size, callData, results, transferList };
 }
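`processFileTask` above ends each batch iteration by counting processed chunks toward a GC threshold and yielding to the event loop so pending messages can be handled between inference batches. A sketch of that pacing; the 100-chunk threshold is the one visible in the diff, the loop body is a placeholder, and `global.gc` only exists when Node is started with `--expose-gc`:

```js
// GC-and-yield pacing sketch (ESM, top-level await).
const GC_EVERY = 100;
let processedSinceGc = 0;

const maybeRunGc = () => {
  if (typeof global.gc === 'function') global.gc(); // no-op without --expose-gc
};

for (let i = 0; i < 500; i += 4) {
  // ...one inference batch of 4 would run here...
  processedSinceGc += 4;
  if (processedSinceGc >= GC_EVERY) {
    maybeRunGc();          // reclaim tensor buffers in bulk, not per batch
    processedSinceGc = 0;
  }
  await new Promise((resolve) => setTimeout(resolve, 0)); // yield to event loop
}
```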
@@ -635,13 +635,13 @@ parentPort.on('message', async (message) => {
 
     // Clear references
     embedderPromise = null;
-  }
-
-  // Trigger garbage collection if available
-  if (explicitGcEnabled && typeof global.gc === 'function') {
-    const before = process.memoryUsage();
-    global.gc();
-    const after = process.memoryUsage();
+  }
+
+  // Trigger garbage collection if available
+  if (explicitGcEnabled && typeof global.gc === 'function') {
+    const before = process.memoryUsage();
+    global.gc();
+    const after = process.memoryUsage();
     logInfo(
       `${workerLabel} Post-unload GC: rss ${(before.rss / 1024 / 1024).toFixed(1)}MB -> ${(after.rss / 1024 / 1024).toFixed(1)}MB`
     );
@@ -672,10 +672,10 @@ parentPort.on('message', async (message) => {
   }
 
   // ---- Batch file processing ----
-  if (message.type === 'processFiles') {
-    const { files, batchId } = message;
-    const batchTransfer = [];
-    const failFastState = createFailFastState('cross-file batch embedding');
+  if (message.type === 'processFiles') {
+    const { files, batchId } = message;
+    const batchTransfer = [];
+    const failFastState = createFailFastState('cross-file batch embedding');
 
     // 1. Pre-process all files: Read, Stat, and Chunk
     // We do this first to gather a massive list of chunks for batched inference
@@ -760,13 +760,13 @@ parentPort.on('message', async (message) => {
         continue;
       }
 
-      const { hash, callData, chunks } = meta;
-      const chunkCount = chunks.length;
-
-      // Trigger GC every 100 files
-      if ((i + 1) % 100 === 0) {
-        maybeRunGc();
-      }
+      const { hash, callData, chunks } = meta;
+      const chunkCount = chunks.length;
+
+      // Trigger GC every 100 files
+      if ((i + 1) % 100 === 0) {
+        maybeRunGc();
+      }
 
       // Register chunks for batching
       if (chunks.length > 0) {
@@ -814,52 +814,52 @@ parentPort.on('message', async (message) => {
       const batchSlice = allPendingChunks.slice(i, i + INFERENCE_BATCH_SIZE);
       const batchTexts = batchSlice.map((c) => c.text);
 
-      try {
-        const output = await embedder(batchTexts, { pooling: 'mean', normalize: true });
-        const { data, hiddenSize } = getEmbeddingTensor(output, {
-          requireDimsForBatch: true,
-          batchSize: batchSlice.length,
-        });
-
-        for (let j = 0; j < batchSlice.length; j++) {
-          const start = j * hiddenSize;
-          const end = start + hiddenSize;
-          const vectorView =
-            typeof data.subarray === 'function'
-              ? data.subarray(start, end)
-              : data.slice(start, end);
-          // Deep copy the view to avoid WASM memory issues, then apply MRL slicing
-          const vector = sliceAndNormalize(new Float32Array(vectorView), embeddingDimension);
+      try {
+        const output = await embedder(batchTexts, { pooling: 'mean', normalize: true });
+        const { data, hiddenSize } = getEmbeddingTensor(output, {
+          requireDimsForBatch: true,
+          batchSize: batchSlice.length,
+        });
+
+        for (let j = 0; j < batchSlice.length; j++) {
+          const start = j * hiddenSize;
+          const end = start + hiddenSize;
+          const vectorView =
+            typeof data.subarray === 'function'
+              ? data.subarray(start, end)
+              : data.slice(start, end);
+          // Deep copy the view to avoid WASM memory issues, then apply MRL slicing
+          const vector = sliceAndNormalize(new Float32Array(vectorView), embeddingDimension);
 
           batchSlice[j].vectorBuffer = vector.buffer;
           batchTransfer.push(vector.buffer);
         }
         // Properly dispose tensor to release ONNX runtime memory
-        if (typeof output.dispose === 'function')
-          try {
-            output.dispose();
-          } catch (disposeErr) {
-            if (workerData.verbose) {
-              console.warn(`${workerLabel} Failed to dispose tensor: ${disposeErr.message}`);
-            }
-          }
-        noteEmbeddingSuccess(failFastState);
-      } catch (err) {
-        if (isFatalRuntimeEmbeddingError(err)) {
-          noteEmbeddingFailure(failFastState, err);
-          throw err;
-        }
-        console.warn(
-          `${workerLabel} Cross-file batch inference failed, retrying individually: ${err.message}`
-        );
-        noteEmbeddingFailure(failFastState, err);
-        // Fallback: individual embedding for this failed batch
-        for (const item of batchSlice) {
-          try {
-            const output = await embedder(item.text, { pooling: 'mean', normalize: true });
-            const { data } = getEmbeddingTensor(output);
-            // Deep copy and apply MRL slicing
-            const vector = sliceAndNormalize(new Float32Array(data), embeddingDimension);
+        if (typeof output.dispose === 'function')
+          try {
+            output.dispose();
+          } catch (disposeErr) {
+            if (workerData.verbose) {
+              console.warn(`${workerLabel} Failed to dispose tensor: ${disposeErr.message}`);
+            }
+          }
+        noteEmbeddingSuccess(failFastState);
+      } catch (err) {
+        if (isFatalRuntimeEmbeddingError(err)) {
+          noteEmbeddingFailure(failFastState, err);
+          throw err;
+        }
+        console.warn(
+          `${workerLabel} Cross-file batch inference failed, retrying individually: ${err.message}`
+        );
+        noteEmbeddingFailure(failFastState, err);
+        // Fallback: individual embedding for this failed batch
+        for (const item of batchSlice) {
+          try {
+            const output = await embedder(item.text, { pooling: 'mean', normalize: true });
+            const { data } = getEmbeddingTensor(output);
+            // Deep copy and apply MRL slicing
+            const vector = sliceAndNormalize(new Float32Array(data), embeddingDimension);
             // Properly dispose tensor to release ONNX runtime memory
             if (typeof output.dispose === 'function')
               try {
@@ -869,18 +869,18 @@ parentPort.on('message', async (message) => {
                  console.warn(`${workerLabel} Failed to dispose tensor: ${disposeErr.message}`);
                }
              }
-            item.vectorBuffer = vector.buffer;
-            batchTransfer.push(vector.buffer);
-            noteEmbeddingSuccess(failFastState);
-          } catch (innerErr) {
-            console.warn(`${workerLabel} Chunk embedding failed: ${innerErr.message}`);
-            noteEmbeddingFailure(failFastState, innerErr);
-            if (isFatalRuntimeEmbeddingError(innerErr)) {
-              throw innerErr;
-            }
-          }
-        }
-      }
+            item.vectorBuffer = vector.buffer;
+            batchTransfer.push(vector.buffer);
+            noteEmbeddingSuccess(failFastState);
+          } catch (innerErr) {
+            console.warn(`${workerLabel} Chunk embedding failed: ${innerErr.message}`);
+            noteEmbeddingFailure(failFastState, innerErr);
+            if (isFatalRuntimeEmbeddingError(innerErr)) {
+              throw innerErr;
+            }
+          }
+        }
+      }
 
       // Minimal yield to keep event loop breathing (optional, can be removed for max throughput)
       if (allPendingChunks.length > 50 && i % 50 === 0) {
@@ -944,10 +944,10 @@ parentPort.on('message', async (message) => {
       batchTransfer
     );
 
-    // Explicitly clear references and trigger GC
-    batchTransfer.length = 0;
-    maybeRunGc();
-    return;
+    // Explicitly clear references and trigger GC
+    batchTransfer.length = 0;
+    maybeRunGc();
+    return;
   }
 
   // ---- Legacy protocol: batch of chunks prepared by main thread ----