npm - sweet-search - Versions diffs - 2.4.2 → 2.5.1 - Mend

sweet-search 2.4.2 → 2.5.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (43) hide show

package/core/cli.js +19 -5
package/core/embedding/embedding-cache.js +177 -15
package/core/embedding/embedding-service.js +18 -4
package/core/graph/graph-expansion.js +52 -12
package/core/graph/graph-extractor.js +30 -1
package/core/indexing/ast-chunker.js +331 -16
package/core/indexing/chunking/chunk-builder.js +34 -1
package/core/indexing/index.js +6 -3
package/core/indexing/indexer-ann.js +45 -6
package/core/indexing/indexer-build.js +9 -1
package/core/indexing/indexer-phases.js +6 -4
package/core/indexing/indexing-file-policy.js +140 -0
package/core/indexing/li-skip-policy.js +11 -220
package/core/infrastructure/codebase-repository.js +21 -0
package/core/infrastructure/config/embedding.js +20 -1
package/core/infrastructure/config/graph.js +2 -2
package/core/infrastructure/config/ranking.js +10 -0
package/core/infrastructure/config/vector-store.js +1 -1
package/core/infrastructure/coreml-cascade.js +236 -30
package/core/infrastructure/coreml-cascade.json +25 -0
package/core/infrastructure/index.js +15 -0
package/core/infrastructure/init-config.js +78 -0
package/core/infrastructure/language-patterns/registry-core.js +18 -0
package/core/infrastructure/model-registry.js +12 -0
package/core/infrastructure/native-inference.js +143 -51
package/core/infrastructure/tree-sitter-provider.js +92 -2
package/core/ranking/cascaded-scorer.js +6 -2
package/core/ranking/file-kind-ranking.js +264 -0
package/core/ranking/late-interaction-index.js +10 -4
package/core/ranking/late-interaction-policy.js +304 -0
package/core/search/context-expander.js +267 -28
package/core/search/index.js +4 -0
package/core/search/search-cli.js +3 -1
package/core/search/search-pattern.js +4 -3
package/core/search/search-postprocess.js +189 -8
package/core/search/search-read-semantic.js +717 -0
package/core/search/search-read.js +481 -0
package/core/search/search-server.js +6 -4
package/core/search/sweet-search.js +119 -15
package/mcp/server.js +41 -0
package/mcp/tool-handlers.js +117 -6
package/package.json +9 -7
package/scripts/init.js +386 -5

package/core/search/search-postprocess.js CHANGED Viewed

@@ -14,6 +14,7 @@ import { expandResults } from '../graph/graph-expansion.js';
 import { int8CosineSimilarity } from '../embedding/embedding-service.js';
 import { QualityScorer } from '../ranking/quality-scorer.js';
 import { classifyIntent, getIntentPolicy } from '../query/intent-router.js';
+import { applyFileKindRanking, classifyFileKindIntent } from '../ranking/file-kind-ranking.js';
 import { recordQueryTelemetry } from '../embedding/embedding-cache.js';
 import { expandAliases } from './dedup/sibling-expander.js';
@@ -175,10 +176,20 @@ export async function applyPostRetrieval(results, query, options, searchContext)
           ...(intentEdgeTypes && !graphExpandOptions.edgeTypes ? { edgeTypes: intentEdgeTypes } : {}),
           ...graphExpandOptions,
         });
+        // Attach LI chunk ids to expanded entities so they can participate
+        // in the post-expansion MaxSim rerank pool. The graph stores entities
+        // (entity_id keyed by code-graph.db) while LI is keyed by chunk id;
+        // without this bridge expanded entries fall through hasTokens() and
+        // are appended to the result tail without ever competing for top-K.
+        const expandedAttached = attachChunkIdsToExpanded(results, this.codebaseRepo);
         stats.graphExpansion = {
           mode: effectiveGraphExpand,
           latency_ms: Date.now() - expandStart,
           total: results.length,
+          expanded: results.filter(r => r.is_expanded).length,
+          expandedWithLiChunk: expandedAttached,
         };
       }
     } catch (err) {
@@ -255,8 +266,22 @@ export async function applyPostRetrieval(results, query, options, searchContext)
     if (shouldRunLateInteraction) {
       try {
         const liStart = performance.now();
-        const liCandidateCount = this.stage3Candidates || 20;
-        const topCandidates = results.slice(0, liCandidateCount);
+        // Pool size and original/expanded split are overridable per call so
+        // the graph-2hop sweep can compare allocations without forking the
+        // pipeline. Defaults preserve production behaviour.
+        const liCandidateCount =
+          options.liPoolSize ?? this.stage3Candidates ?? 20;
+        const liExpandedFraction = options.liExpandedFraction;  // undefined → builder default
+        // Build a bounded MIXED rerank pool: top originals + top expanded.
+        // Without this, expanded entries always sit behind the originals'
+        // tail and the LI rerank only re-orders the original head — graph
+        // expansion has zero effect on top-K. Reserve a slice of the rerank
+        // pool for the highest-scoring expanded candidates so they actually
+        // compete for top-K positions.
+        const { topCandidates, expandedQuotaUsed } = buildMixedRerankPool(
+          results, liCandidateCount, liExpandedFraction,
+        );
         const { encodeQuery } = await import('../ranking/late-interaction-model.js');
         const queryTokens = await encodeQuery(query);
@@ -276,20 +301,21 @@ export async function applyPostRetrieval(results, query, options, searchContext)
           scored.sort((a, b) => b.score - a.score);
-          results = [
-            ...scored,
-            ...results.slice(liCandidateCount),
-          ];
+          // Anything not in the rerank pool keeps original ordering at the tail.
+          const pickedKeys = new Set(topCandidates.map(c => c.id || c.entity_id));
+          const tail = results.filter(r => !pickedKeys.has(r.id || r.entity_id));
+          results = [...scored, ...tail];
         }
         stats.lateInteraction = {
           position: 'post-expansion',
-          mode: 'pure-reranker',
+          mode: 'pure-reranker-mixed-pool',
           latency_us: Math.round((performance.now() - liStart) * 1000),
           candidates: topCandidates.length,
+          expandedInPool: expandedQuotaUsed,
           queryTokens: queryTokens?.length || 0,
         };
-        this.log(`LateInteraction (pure reranker): ${stats.lateInteraction.latency_us}us for ${topCandidates.length} candidates (${queryTokens?.length || 0} query tokens)`);
+        this.log(`LateInteraction (mixed-pool): ${stats.lateInteraction.latency_us}us for ${topCandidates.length} candidates (${expandedQuotaUsed} expanded, ${queryTokens?.length || 0} query tokens)`);
       } catch (err) {
         this.log(`LateInteraction rerank failed: ${err.message}`);
         stats.lateInteraction = { position: 'post-expansion', error: err.message };
@@ -374,6 +400,32 @@ export async function applyPostRetrieval(results, query, options, searchContext)
     }
   }
+  // =========================================================================
+  // Intent-aware file-kind ranking
+  // =========================================================================
+  // Soft-demote docs/tests/types files when the query is confidently
+  // implementation-seeking AND the top-N window contains both docs/tests/
+  // types and implementation candidates. No-op otherwise. Disable with
+  // SWEET_SEARCH_FILE_KIND_RANKING=0; tune SWEET_SEARCH_FILE_KIND_FACTOR.
+  if (Array.isArray(results) && results.length > 0) {
+    const fileKindIntent = classifyFileKindIntent(query);
+    const beforeTop = results[0];
+    const afterFK = applyFileKindRanking(results, { intent: fileKindIntent });
+    if (afterFK !== results) {
+      results = afterFK;
+      stats.fileKindRanking = {
+        intent: fileKindIntent,
+        applied: true,
+        top1Changed: !!beforeTop && results[0] && (beforeTop !== results[0]),
+      };
+    } else {
+      stats.fileKindRanking = {
+        intent: fileKindIntent,
+        applied: false,
+      };
+    }
+  }
   stats.total_ms = Date.now() - start;
   stats.results_count = Array.isArray(results) ? results.length : 0;
@@ -450,3 +502,132 @@ export function computeCacheHit(mode, {
   return { lexSubLatency, lexHit, semHit, cacheHit };
 }
+// =============================================================================
+// Mixed rerank pool helpers (post-expansion LI / cascade)
+// =============================================================================
+/**
+ * For each `is_expanded` result with a known file_path + line range, find the
+ * codebase chunk that best covers it and stash its id under `_liChunkId`.
+ *
+ * Why: graph expansion produces results keyed by entity_id (from code-graph.db)
+ * but the LI index is keyed by chunk id (from codebase.db). Without bridging
+ * the two ID spaces, expanded results can never participate in MaxSim rerank.
+ *
+ * Best-effort: missing/zero-overlap entries are left as-is and will fall
+ * through to the unscored path.
+ *
+ * Behaviour notes:
+ * - Mutates the matching entries of `results` in place (sets `_liChunkId`);
+ *   the array itself is neither reordered nor resized.
+ * - Results that are not expanded, or that already carry a truthy
+ *   `_liChunkId`, are skipped and are NOT included in the returned count.
+ * - The file path and line range are read from several aliases, top-level
+ *   first and `metadata.*` second. A missing end line defaults to the start
+ *   line, i.e. the entity is treated as a single line.
+ * - `codebaseRepo.getChunksByFilePath(path)` is called at most once per
+ *   distinct path per invocation. A throwing lookup is swallowed and handled
+ *   like a file with no chunks.
+ * - A chunk's line range comes from its `metadata` (an object, or a JSON
+ *   string that is parsed here), falling back to a `:<start>-<end>` pattern
+ *   in a string chunk id. Chunks with no resolvable range are ignored.
+ * - Overlap is counted in inclusive lines. The largest overlap wins, ties go
+ *   to the chunk spanning fewer lines, and remaining ties keep the first
+ *   chunk encountered.
+ *
+ * @param {Array} results - Result list; only `is_expanded` entries are touched.
+ * @param {import('../infrastructure/codebase-repository.js').CodebaseRepository} codebaseRepo
+ * @returns {number} count of expanded results that received a _liChunkId
+ *   during this call; 0 when `results` is not a non-empty array or
+ *   `codebaseRepo` is falsy.
+ */
+export function attachChunkIdsToExpanded(results, codebaseRepo) {
+  if (!Array.isArray(results) || results.length === 0 || !codebaseRepo) return 0;
+  const fileChunkCache = new Map(); // file_path -> Array<{ id, file_path, text, metadata }>
+  let attached = 0;
+  for (const r of results) {
+    if (!r.is_expanded || r._liChunkId) continue; // originals and already-bridged entries are skipped
+    const fp = r.file_path || r.file || r.metadata?.file || r.metadata?.path;
+    const sl = r.start_line ?? r.startLine ?? r.metadata?.start_line ?? r.metadata?.startLine;
+    if (!fp || sl == null) continue;
+    const el = r.end_line ?? r.endLine ?? r.metadata?.end_line ?? r.metadata?.endLine ?? sl;
+    let chunks = fileChunkCache.get(fp);
+    if (!chunks) {
+      try { chunks = codebaseRepo.getChunksByFilePath(fp) || []; }
+      catch { chunks = []; } // best-effort: a failed lookup is treated as "no chunks"
+      fileChunkCache.set(fp, chunks); // empty results are cached too, so the lookup is not retried
+    }
+    if (chunks.length === 0) continue;
+    // Greatest line-range overlap with the entity wins; ties broken by smaller
+    // chunk (tighter match). Chunk metadata is the primary signal; chunk id
+    // pattern `<path>:<start>-<end>:<n>` is a fallback when metadata is sparse.
+    let bestId = null;
+    let bestOverlap = 0;
+    let bestSize = Infinity;
+    for (const c of chunks) {
+      let cs, ce;
+      let meta = c.metadata; // handled as either an object or a JSON string
+      if (typeof meta === 'string') { try { meta = JSON.parse(meta); } catch { meta = null; } }
+      if (meta) {
+        cs = meta.start_line ?? meta.startLine;
+        ce = meta.end_line ?? meta.endLine;
+      }
+      if (cs == null || ce == null) {
+        const m = typeof c.id === 'string' ? c.id.match(/:(\d+)-(\d+)(?::|$)/) : null;
+        if (m) { cs = parseInt(m[1], 10); ce = parseInt(m[2], 10); }
+      }
+      if (cs == null || ce == null) continue;
+      const overlap = Math.max(0, Math.min(el, ce) - Math.max(sl, cs) + 1); // inclusive line count
+      if (overlap <= 0) continue;
+      const size = ce - cs + 1;
+      if (overlap > bestOverlap || (overlap === bestOverlap && size < bestSize)) {
+        bestOverlap = overlap;
+        bestSize = size;
+        bestId = c.id;
+      }
+    }
+    if (bestId) {
+      r._liChunkId = bestId;
+      attached++;
+    }
+  }
+  return attached;
+}
+/**
+ * Build a bounded LI rerank pool that mixes top originals and top expanded.
+ *
+ * Reserves `expandedQuota = floor(slot * expandedFraction)` of the rerank
+ * slots for the highest-scoring expanded candidates (so adaptive 2-hop's
+ * scoring choices actually influence the top-K), with the remainder going
+ * to the highest-scoring originals (preserving lexical/HNSW lead).
+ *
+ * If there are fewer expanded (or fewer originals) than the quota, the
+ * unused slots flow to the other side.
+ *
+ * Behaviour notes:
+ * - `expandedFraction` is clamped to the range [0, 1] before use.
+ * - When `results` contains no expanded entries, the pool is simply the
+ *   first `slot` originals in their incoming order; no score sort happens
+ *   on that path. Otherwise both groups are sorted by score, descending.
+ * - Expanded entries are ranked by `expansion.adaptiveScore`, falling back
+ *   to `score`, then 0. Originals are ranked by `score`, falling back to
+ *   `int8Score`, then `hybridScore`, then 0.
+ * - The returned pool lists the chosen originals first, followed by the
+ *   chosen expanded entries.
+ * - `results` is not mutated: filtering and sorting work on copies.
+ *
+ * NOTE(review): neither argument is validated here. Only `undefined`
+ * triggers the 0.4 default, so an explicit `null` fraction coerces to 0,
+ * and a NaN fraction or `slot` propagates into the quota arithmetic.
+ * Confirm that callers always pass finite numbers.
+ *
+ * @param {Array} results - Combined original + expanded result list
+ * @param {number} slot   - Total rerank slots (e.g. stage3Candidates)
+ * @param {number} [expandedFraction=0.4] - Fraction of pool reserved for expanded
+ * @returns {{ topCandidates: Array, expandedQuotaUsed: number }}
+ *   `topCandidates` is the rerank pool; `expandedQuotaUsed` is the number of
+ *   expanded entries actually placed in it.
+ */
+export function buildMixedRerankPool(results, slot, expandedFraction = 0.4) {
+  const EXPANDED_FRACTION = Math.max(0, Math.min(1, expandedFraction));
+  const originals = results.filter(r => !r.is_expanded);
+  const expanded = results.filter(r => r.is_expanded);
+  if (expanded.length === 0) {
+    return { topCandidates: originals.slice(0, slot), expandedQuotaUsed: 0 }; // incoming order kept; no score sort here
+  }
+  const expandedScore = (r) =>
+    r.expansion?.adaptiveScore ?? r.score ?? 0;
+  const originalScore = (r) =>
+    r.score ?? r.int8Score ?? r.hybridScore ?? 0;
+  const sortedOriginals = [...originals].sort((a, b) => originalScore(b) - originalScore(a));
+  const sortedExpanded  = [...expanded].sort((a, b) => expandedScore(b)  - expandedScore(a));
+  const expandedQuota = Math.min(
+    Math.floor(slot * EXPANDED_FRACTION),
+    sortedExpanded.length,
+  );
+  const originalQuota = Math.min(slot - expandedQuota, sortedOriginals.length);
+  // If originals can't fill their quota, redirect the surplus to expanded.
+  const originalShort = (slot - expandedQuota) - originalQuota;
+  const finalExpandedQuota = Math.min(expandedQuota + originalShort, sortedExpanded.length);
+  const topOriginals = sortedOriginals.slice(0, originalQuota);
+  const topExpanded  = sortedExpanded.slice(0, finalExpandedQuota);
+  return {
+    topCandidates: [...topOriginals, ...topExpanded], // originals first, then expanded
+    expandedQuotaUsed: topExpanded.length,
+  };
+}