npm - @softerist/heuristic-mcp - Versions diffs - 3.0.15 → 3.0.16 - Mend

@softerist/heuristic-mcp 3.0.15 → 3.0.16

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (49)

package/README.md +104 -104
package/config.jsonc +173 -173
package/features/ann-config.js +131 -0
package/features/clear-cache.js +84 -0
package/features/find-similar-code.js +291 -0
package/features/hybrid-search.js +544 -0
package/features/index-codebase.js +3268 -0
package/features/lifecycle.js +1189 -0
package/features/package-version.js +302 -0
package/features/register.js +408 -0
package/features/resources.js +156 -0
package/features/set-workspace.js +265 -0
package/index.js +96 -96
package/lib/cache-ops.js +22 -22
package/lib/cache-utils.js +565 -565
package/lib/cache.js +1870 -1870
package/lib/call-graph.js +396 -396
package/lib/cli.js +1 -1
package/lib/config.js +517 -517
package/lib/constants.js +39 -39
package/lib/embed-query-process.js +7 -7
package/lib/embedding-process.js +7 -7
package/lib/embedding-worker.js +299 -299
package/lib/ignore-patterns.js +316 -316
package/lib/json-worker.js +14 -14
package/lib/json-writer.js +337 -337
package/lib/logging.js +164 -164
package/lib/memory-logger.js +13 -13
package/lib/onnx-backend.js +193 -193
package/lib/project-detector.js +84 -84
package/lib/server-lifecycle.js +165 -165
package/lib/settings-editor.js +754 -754
package/lib/tokenizer.js +256 -256
package/lib/utils.js +428 -428
package/lib/vector-store-binary.js +627 -627
package/lib/vector-store-sqlite.js +95 -95
package/lib/workspace-env.js +28 -28
package/mcp_config.json +9 -9
package/package.json +86 -75
package/scripts/clear-cache.js +20 -0
package/scripts/download-model.js +43 -0
package/scripts/mcp-launcher.js +49 -0
package/scripts/postinstall.js +12 -0
package/search-configs.js +36 -36
package/.prettierrc +0 -7
package/debug-pids.js +0 -30
package/eslint.config.js +0 -36
package/specs/plan.md +0 -23
package/vitest.config.js +0 -39

package/features/hybrid-search.js (added)

@@ -0,0 +1,544 @@
+import path from 'path';
+import fs from 'fs/promises';
+import { dotSimilarity } from '../lib/utils.js';
+import { extractSymbolsFromContent } from '../lib/call-graph.js';
+import { embedQueryInChildProcess } from '../lib/embed-query-process.js';
+import {
+  STAT_CONCURRENCY_LIMIT,
+  SEARCH_BATCH_SIZE,
+  PARTIAL_MATCH_BOOST,
+} from '../lib/constants.js';
+export class HybridSearch {
+  constructor(embedder, cache, config) {
+    this.embedder = embedder;
+    this.cache = cache;
+    this.config = config;
+    this.fileModTimes = new Map(); // Cache for file modification times
+    this._lastAccess = new Map(); // Track last access time for LRU eviction
+  }
+  async getChunkContent(chunkOrIndex) {
+    return await this.cache.getChunkContent(chunkOrIndex);
+  }
+  getChunkVector(chunk) {
+    return this.cache.getChunkVector(chunk);
+  }
+  getAnnCandidateCount(maxResults, totalChunks) {
+    const minCandidates = this.config.annMinCandidates ?? 0;
+    const maxCandidates = this.config.annMaxCandidates ?? totalChunks;
+    const multiplier = this.config.annCandidateMultiplier ?? 1;
+    const desired = Math.max(minCandidates, Math.ceil(maxResults * multiplier));
+    const capped = Math.min(maxCandidates, desired);
+    return Math.min(totalChunks, Math.max(maxResults, capped));
+  }
+  async populateFileModTimes(files) {
+    const uniqueFiles = new Set(files);
+    const missing = [];
+    for (const file of uniqueFiles) {
+      if (!this.fileModTimes.has(file)) {
+        // Try to get from cache metadata first (fast)
+        const meta = this.cache.getFileMeta(file);
+        if (meta && typeof meta.mtimeMs === 'number') {
+          this.fileModTimes.set(file, meta.mtimeMs);
+          this._lastAccess.set(file, Date.now()); // Track for LRU
+        } else {
+          missing.push(file);
+        }
+      } else {
+        this._lastAccess.set(file, Date.now()); // Track access for LRU
+      }
+    }
+    if (missing.length === 0) {
+      return;
+    }
+    // Concurrency-limited execution to avoid EMFILE
+    // Pre-distribute files to workers (no shared mutable state - avoids race condition)
+    const workerCount = Math.min(STAT_CONCURRENCY_LIMIT, missing.length);
+    const worker = async (startIdx) => {
+      for (let i = startIdx; i < missing.length; i += workerCount) {
+        const file = missing[i];
+        try {
+          const stats = await fs.stat(file);
+          this.fileModTimes.set(file, stats.mtimeMs);
+          this._lastAccess.set(file, Date.now());
+        } catch {
+          this.fileModTimes.set(file, null);
+        }
+      }
+    };
+    await Promise.all(Array.from({ length: workerCount }, (_, i) => worker(i)));
+    // Prevent unbounded growth (LRU-style eviction based on access time)
+    const lruMaxEntries = this.config.lruMaxEntries ?? 5000;
+    const lruTargetEntries = this.config.lruTargetEntries ?? 4000;
+    if (this.fileModTimes.size > lruMaxEntries) {
+      // Convert to array with last-access info, sort by oldest access
+      const entries = [...this.fileModTimes.keys()].map((k) => ({
+        key: k,
+        lastAccess: this._lastAccess?.get(k) ?? 0,
+      }));
+      entries.sort((a, b) => a.lastAccess - b.lastAccess); // Oldest first
+      const toEvict = entries.slice(0, entries.length - lruTargetEntries);
+      for (const { key } of toEvict) {
+        this.fileModTimes.delete(key);
+        this._lastAccess?.delete(key);
+      }
+    }
+  }
+  // Cache invalidation helper
+  clearFileModTime(file) {
+    this.fileModTimes.delete(file);
+  }
+  /**
+   * Search the indexed codebase for relevant code snippets.
+   * Uses a hybrid approach combining semantic similarity (via embeddings) with
+   * keyword matching for optimal results.
+   * @param {string} query - Natural language or keyword search query
+   * @param {number} maxResults - Maximum number of results to return (default: 15)
+   * @returns {Promise<{results: Array<{file: string, startLine: number, endLine: number, content: string, score: number}>, message?: string}>}
+   * @throws {Error} If embedder is not initialized
+   */
+  async search(query, maxResults) {
+    try {
+      if (typeof this.cache.ensureLoaded === 'function') {
+        await this.cache.ensureLoaded();
+      }
+      this.cache.startRead();
+      const storeSize = this.cache.getStoreSize();
+      if (storeSize === 0) {
+        return {
+          results: [],
+          message: 'No code has been indexed yet. Please wait for initial indexing to complete.',
+        };
+      }
+      // Generate query embedding
+      if (this.config.verbose) {
+        console.info(`[Search] Query: "${query}"`);
+      }
+      let queryVector;
+      // Use child process for embedding when unloadModelAfterSearch is enabled
+      // This ensures the OS completely reclaims memory when the child exits
+      if (this.config.unloadModelAfterSearch) {
+        queryVector = await embedQueryInChildProcess(query, this.config);
+      } else {
+        // Use main process embedder (faster for consecutive searches)
+        const queryEmbed = await this.embedder(query, {
+          pooling: 'mean',
+          normalize: true,
+        });
+        try {
+          queryVector = new Float32Array(queryEmbed.data);
+        } finally {
+          if (typeof queryEmbed.dispose === 'function') {
+            try {
+              queryEmbed.dispose();
+            } catch {
+              /* ignore */
+            }
+          }
+        }
+      }
+      let candidateIndices = null; // null implies full scan of all chunks
+      let usedAnn = false;
+      if (this.config.annEnabled) {
+        const candidateCount = this.getAnnCandidateCount(maxResults, storeSize);
+        const annLabels = await this.cache.queryAnn(queryVector, candidateCount);
+        if (annLabels && annLabels.length >= maxResults) {
+          usedAnn = true;
+          if (this.config.verbose) {
+            console.info(`[Search] Using ANN index (${annLabels.length} candidates)`);
+          }
+          candidateIndices = Array.from(new Set(annLabels)); // dedupe
+        }
+      }
+      if (!usedAnn) {
+        if (this.config.verbose) {
+          console.info(`[Search] Using full scan (${storeSize} chunks)`);
+        }
+      }
+      if (usedAnn && candidateIndices && candidateIndices.length < maxResults) {
+        if (this.config.verbose) {
+          console.info(
+            `[Search] ANN returned fewer results (${candidateIndices.length}) than requested (${maxResults}), augmenting with full scan...`
+          );
+        }
+        candidateIndices = null; // Fallback to full scan to ensure we don't miss anything relevant
+        usedAnn = false;
+      }
+      const lowerQuery = query.toLowerCase();
+      const queryWords =
+        lowerQuery.length > 1 ? lowerQuery.split(/\s+/).filter((word) => word.length > 2) : [];
+      const queryWordCount = queryWords.length;
+      if (usedAnn && candidateIndices && lowerQuery.length > 1) {
+        let exactMatchCount = 0;
+        for (const index of candidateIndices) {
+          const content = await this.getChunkContent(index);
+          if (content && content.toLowerCase().includes(lowerQuery)) {
+            exactMatchCount++;
+          }
+        }
+        if (exactMatchCount < maxResults) {
+          // Fallback to full scan if keyword constraint isn't met in candidates
+          // Note: This is expensive as it iterates everything.
+          // Optimization: Only do this for small-ish codebases to avoid UI freeze
+          const MAX_FULL_SCAN_SIZE = this.config.fullScanThreshold ?? 2000;
+          if (storeSize <= MAX_FULL_SCAN_SIZE) {
+            const seen = new Set(candidateIndices);
+            // Full scan logic for keyword augmentation
+            // Batch content loading to reduce async overhead
+            const FALLBACK_BATCH = 100;
+            let additionalMatches = 0;
+            const targetMatches = maxResults - exactMatchCount;
+            outerLoop:
+            for (let i = 0; i < storeSize; i += FALLBACK_BATCH) {
+              if (i > 0) await new Promise((r) => setTimeout(r, 0)); // Yield
+              const limit = Math.min(storeSize, i + FALLBACK_BATCH);
+              // Build batch of indices to check (excluding already seen)
+              const batchIndices = [];
+              for (let j = i; j < limit; j++) {
+                if (!seen.has(j)) batchIndices.push(j);
+              }
+              // Batch load content in parallel
+              const contents = await Promise.all(
+                batchIndices.map(idx => this.getChunkContent(idx))
+              );
+              // Check each loaded content
+              for (let k = 0; k < batchIndices.length; k++) {
+                const content = contents[k];
+                if (content && content.toLowerCase().includes(lowerQuery)) {
+                  const idx = batchIndices[k];
+                  seen.add(idx);
+                  candidateIndices.push(idx);
+                  additionalMatches++;
+                  // Early exit once we have enough additional matches
+                  if (additionalMatches >= targetMatches) break outerLoop;
+                }
+              }
+            }
+          } else {
+            console.info(
+              `[Search] Skipping full scan fallback (store size ${storeSize} > ${MAX_FULL_SCAN_SIZE})`
+            );
+          }
+        }
+      }
+      // Recency pre-processing
+      let recencyBoostEnabled = this.config.recencyBoost > 0;
+      let now = Date.now();
+      let recencyDecayMs = (this.config.recencyDecayDays || 30) * 24 * 60 * 60 * 1000;
+      let semanticWeight = this.config.semanticWeight;
+      let exactMatchBoost = this.config.exactMatchBoost;
+      let recencyBoost = this.config.recencyBoost;
+      if (recencyBoostEnabled) {
+        const candidates = candidateIndices
+          ? candidateIndices.map((idx) => this.cache.getChunk(idx)).filter(Boolean)
+          : Array.from({ length: storeSize }, (_, i) => this.cache.getChunk(i)).filter(Boolean);
+        // optimization: avoid IO storm during full scan fallbacks
+        // For large candidate sets, we strictly rely on cached metadata
+        // For small sets, we allow best-effort fs.stat
+        if (candidates.length <= 1000) {
+          await this.populateFileModTimes(candidates.map((chunk) => chunk.file));
+        } else {
+          // Bulk pre-populate from cache only (no syscalls)
+          for (const chunk of candidates) {
+            if (!this.fileModTimes.has(chunk.file)) {
+              const meta = this.cache.getFileMeta(chunk.file);
+              if (meta && typeof meta.mtimeMs === 'number') {
+                this.fileModTimes.set(chunk.file, meta.mtimeMs);
+              }
+            }
+          }
+        }
+      }
+      // Score all chunks (batched to prevent blocking event loop)
+      const scoredChunks = [];
+      // Process in batches
+      // Candidates is now implicitly range 0..storeSize OR candidateIndices
+      const totalCandidates = candidateIndices ? candidateIndices.length : storeSize;
+      const textMatchMaxCandidates = Number.isInteger(this.config.textMatchMaxCandidates)
+        ? this.config.textMatchMaxCandidates
+        : 2000;
+      const shouldApplyTextMatch = lowerQuery.length > 1;
+      const deferTextMatch = shouldApplyTextMatch && totalCandidates > textMatchMaxCandidates;
+      for (let i = 0; i < totalCandidates; i += SEARCH_BATCH_SIZE) {
+        // Allow event loop to tick between batches
+        if (i > 0) {
+          await new Promise((resolve) => setTimeout(resolve, 0));
+        }
+        const limit = Math.min(totalCandidates, i + SEARCH_BATCH_SIZE);
+        for (let j = i; j < limit; j++) {
+          const idx = candidateIndices ? candidateIndices[j] : j;
+          // CRITICAL: Fetch chunk info FIRST to ensure atomicity with index.
+          // If we fetch vector and chunk separately, the store could be modified
+          // between calls (e.g., by removeFileFromStore compacting the array).
+          const chunkInfo = this.cache.getChunk(idx);
+          if (!chunkInfo) {
+            // Chunk was removed or index is stale - skip silently
+            continue;
+          }
+          // Get vector from chunk or via index (now safe since we have valid chunkInfo)
+          const vector = this.cache.getChunkVector(chunkInfo, idx);
+          if (!vector) continue;
+          // Ensure vector compatibility with try-catch for dimension mismatch
+          let score;
+          try {
+            score = dotSimilarity(queryVector, vector) * semanticWeight;
+          } catch (err) {
+            // Dimension mismatch indicates config change - log and skip this chunk
+            if (this.config.verbose) {
+              console.warn(`[Search] ${err.message} at index ${idx}`);
+            }
+            continue;
+          }
+          let content;
+          if (shouldApplyTextMatch && !deferTextMatch) {
+            content = await this.getChunkContent(idx);
+            const lowerContent = content ? content.toLowerCase() : '';
+            if (lowerContent && lowerContent.includes(lowerQuery)) {
+              score += exactMatchBoost;
+            } else if (lowerContent && queryWordCount > 0) {
+              // Partial word matching (optimized)
+              let matchedWords = 0;
+              for (let k = 0; k < queryWordCount; k++) {
+                if (lowerContent.includes(queryWords[k])) matchedWords++;
+              }
+              score += (matchedWords / queryWordCount) * PARTIAL_MATCH_BOOST;
+            }
+          }
+          // Recency boost
+          if (recencyBoostEnabled) {
+            const mtime = this.fileModTimes.get(chunkInfo.file);
+            if (typeof mtime === 'number') {
+              const ageMs = now - mtime;
+              const recencyFactor = Math.max(0, 1 - ageMs / recencyDecayMs);
+              score += recencyFactor * recencyBoost;
+            }
+          }
+          const scoredChunk = { ...chunkInfo, score };
+          if (content !== undefined) {
+            scoredChunk.content = content;
+          }
+          scoredChunks.push(scoredChunk);
+        }
+      }
+      // Sort by initial score
+      scoredChunks.sort((a, b) => b.score - a.score);
+      // Defer expensive text matching for large candidate sets
+      if (deferTextMatch) {
+        const textMatchCount = Math.min(textMatchMaxCandidates, scoredChunks.length);
+        for (let i = 0; i < textMatchCount; i++) {
+          const chunk = scoredChunks[i];
+          const content = chunk.content ?? (await this.getChunkContent(chunk));
+          const lowerContent = content ? content.toLowerCase() : '';
+          if (lowerContent && lowerContent.includes(lowerQuery)) {
+            chunk.score += exactMatchBoost;
+          } else if (lowerContent && queryWordCount > 0) {
+            let matchedWords = 0;
+            for (let k = 0; k < queryWordCount; k++) {
+              if (lowerContent.includes(queryWords[k])) matchedWords++;
+            }
+            chunk.score += (matchedWords / queryWordCount) * 0.3;
+          }
+          if (chunk.content === undefined) {
+            chunk.content = content;
+          }
+        }
+        scoredChunks.sort((a, b) => b.score - a.score);
+      }
+      // Apply call graph proximity boost if enabled
+      if (this.config.callGraphEnabled && this.config.callGraphBoost > 0) {
+        // Extract symbols from top initial results
+        const topN = Math.min(5, scoredChunks.length);
+        const symbolsFromTop = new Set();
+        for (let i = 0; i < topN; i++) {
+          const content = await this.getChunkContent(scoredChunks[i]);
+          const symbols = extractSymbolsFromContent(content || '');
+          for (const sym of symbols) {
+            symbolsFromTop.add(sym);
+          }
+        }
+        if (symbolsFromTop.size > 0) {
+          // Get related files from call graph
+          const relatedFiles = await this.cache.getRelatedFiles(Array.from(symbolsFromTop));
+          // Apply boost to chunks from related files
+          for (const chunk of scoredChunks) {
+            const proximity = relatedFiles.get(chunk.file);
+            if (proximity) {
+              chunk.score += proximity * this.config.callGraphBoost;
+            }
+          }
+          // Re-sort after applying call graph boost
+          scoredChunks.sort((a, b) => b.score - a.score);
+        }
+      }
+      // Get top results
+      const results = await Promise.all(
+        scoredChunks.slice(0, maxResults).map(async (chunk) => {
+          if (chunk.content === undefined || chunk.content === null) {
+            return { ...chunk, content: await this.getChunkContent(chunk) };
+          }
+          return chunk;
+        })
+      );
+      if (results.length > 0) {
+        console.info(
+          `[Search] Found ${results.length} results. Top score: ${results[0].score.toFixed(4)}`
+        );
+      } else {
+        console.info('[Search] No results found.');
+      }
+      return { results, message: null };
+    } finally {
+      this.cache.endRead();
+    }
+  }
+  async formatResults(results) {
+    if (results.length === 0) {
+      return 'No matching code found for your query.';
+    }
+    const formatted = await Promise.all(
+      results.map(async (r, idx) => {
+        if (!r.file) {
+          return `## Result ${idx + 1} (Relevance: ${(r.score * 100).toFixed(1)}%)\n**Error:** Missing file path\n`;
+        }
+        const relPath = path.relative(this.config.searchDirectory, r.file);
+        const content = r.content ?? (await this.getChunkContent(r));
+        return (
+          `## Result ${idx + 1} (Relevance: ${(r.score * 100).toFixed(1)}%)\n` +
+          `**File:** \`${relPath}\`\n` +
+          `**Lines:** ${r.startLine}-${r.endLine}\n\n` +
+          '```' +
+          path.extname(r.file).slice(1) +
+          '\n' +
+          content +
+          '\n' +
+          '```\n'
+        );
+      })
+    );
+    return formatted.join('\n');
+  }
+}
+// MCP Tool definition for this feature
+export function getToolDefinition(config) {
+  return {
+    name: 'a_semantic_search',
+    description:
+      "Performs intelligent hybrid code search combining semantic understanding with exact text matching. Ideal for finding code by meaning (e.g., 'authentication logic', 'database queries') even with typos or variations. Returns the most relevant code snippets with file locations and line numbers.",
+    inputSchema: {
+      type: 'object',
+      properties: {
+        query: {
+          type: 'string',
+          description:
+            "Search query - can be natural language (e.g., 'where do we handle user login') or specific terms",
+        },
+        maxResults: {
+          type: 'number',
+          description: 'Maximum number of results to return (default: from config)',
+          default: config.maxResults,
+        },
+      },
+      required: ['query'],
+    },
+    annotations: {
+      title: 'Semantic Code Search',
+      readOnlyHint: true,
+      destructiveHint: false,
+      idempotentHint: true,
+      openWorldHint: false,
+    },
+  };
+}
+// Tool handler
+export async function handleToolCall(request, hybridSearch) {
+  const args = request.params?.arguments || {};
+  const query = args.query;
+  // Input validation
+  if (typeof query !== 'string' || query.trim().length === 0) {
+    return {
+      content: [{ type: 'text', text: 'Error: A non-empty query string is required.' }],
+      isError: true,
+    };
+  }
+  const maxResults =
+    typeof args.maxResults === 'number' && args.maxResults > 0
+      ? args.maxResults
+      : hybridSearch.config.maxResults;
+  const { results, message } = await hybridSearch.search(query, maxResults);
+  if (message) {
+    return {
+      content: [{ type: 'text', text: message }],
+    };
+  }
+  const formattedText = await hybridSearch.formatResults(results);
+  return {
+    content: [{ type: 'text', text: formattedText }],
+  };
+}