npm - @softerist/heuristic-mcp - Versions diffs - 3.0.14 → 3.0.16 - Mend

@softerist/heuristic-mcp 3.0.14 → 3.0.16

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (49)

package/README.md +90 -82
package/config.jsonc +173 -173
package/features/ann-config.js +131 -0
package/features/clear-cache.js +84 -0
package/features/find-similar-code.js +291 -0
package/features/hybrid-search.js +544 -0
package/features/index-codebase.js +3268 -0
package/features/lifecycle.js +1189 -0
package/features/package-version.js +302 -0
package/features/register.js +408 -0
package/features/resources.js +156 -0
package/features/set-workspace.js +265 -0
package/index.js +136 -69
package/lib/cache-ops.js +22 -22
package/lib/cache-utils.js +565 -565
package/lib/cache.js +1870 -1870
package/lib/call-graph.js +396 -396
package/lib/cli.js +1 -1
package/lib/config.js +487 -427
package/lib/constants.js +31 -0
package/lib/embed-query-process.js +7 -7
package/lib/embedding-process.js +7 -7
package/lib/embedding-worker.js +299 -299
package/lib/ignore-patterns.js +316 -316
package/lib/json-worker.js +14 -14
package/lib/json-writer.js +337 -337
package/lib/logging.js +164 -164
package/lib/memory-logger.js +13 -13
package/lib/onnx-backend.js +193 -193
package/lib/project-detector.js +84 -84
package/lib/server-lifecycle.js +165 -165
package/lib/settings-editor.js +754 -638
package/lib/tokenizer.js +256 -256
package/lib/utils.js +428 -428
package/lib/vector-store-binary.js +627 -627
package/lib/vector-store-sqlite.js +95 -95
package/lib/workspace-env.js +28 -0
package/mcp_config.json +9 -9
package/package.json +86 -75
package/scripts/clear-cache.js +20 -0
package/scripts/download-model.js +43 -0
package/scripts/mcp-launcher.js +49 -0
package/scripts/postinstall.js +12 -0
package/search-configs.js +36 -36
package/.prettierrc +0 -7
package/debug-pids.js +0 -30
package/eslint.config.js +0 -36
package/specs/plan.md +0 -23
package/vitest.config.js +0 -39

package/lib/config.js CHANGED

@@ -5,127 +5,128 @@ import crypto from 'crypto';
 import { fileURLToPath } from 'url';
 import { ProjectDetector } from './project-detector.js';
 import { parseJsonc } from './settings-editor.js';
-import {
-  EMBEDDING_PROCESS_DEFAULT_GC_MAX_REQUESTS_WITHOUT_COLLECTION,
-  EMBEDDING_PROCESS_DEFAULT_GC_MIN_INTERVAL_MS,
-  EMBEDDING_PROCESS_DEFAULT_GC_RSS_THRESHOLD_MB,
-} from './constants.js';
-const DEFAULT_MEMORY_CLEANUP_CONFIG = {
-  enableExplicitGc: true, // Require --expose-gc for more aggressive memory cleanup
-  clearCacheAfterIndex: true, // Drop in-memory vectors after indexing completes
-  unloadModelAfterIndex: true, // Unload embedding model from memory after indexing completes to free RAM
-  shutdownQueryEmbeddingPoolAfterIndex: true, // Force shutdown search embedding child pool after index operations
-  unloadModelAfterSearch: true, // Unload embedding model after search queries to keep memory low (trades speed for RAM)
-  embeddingPoolIdleTimeoutMs: 2000, // Idle timeout before killing persistent embedding child process (ms)
-  incrementalGcThresholdMb: 512, // RSS threshold for optional incremental GC
-  incrementalMemoryProfile: false, // Enable phase-level incremental indexing memory traces (diagnostics)
-  recycleServerOnHighRssAfterIncremental: false, // Recycle server process after incremental cleanup if RSS remains high
-  recycleServerOnHighRssThresholdMb: 4096, // RSS threshold (MB) that triggers incremental recycle
-  recycleServerOnHighRssCooldownMs: 300000, // Minimum interval between recycle attempts
-  recycleServerOnHighRssDelayMs: 2000, // Delay before recycle to allow logs/responses to flush
-};
-const DEFAULT_INDEXING_CONFIG = {
-  smartIndexing: true, // Enable automatic project type detection and smart ignore patterns
-  chunkSize: 16, // Lines per chunk (tuned for speed/memory balance)
-  chunkOverlap: 4, // Overlap between chunks for context continuity
-  batchSize: 50, // Number of files to process in a single indexing batch
-  maxFileSize: 1048576, // 1MB - skip files larger than this
-  prefilterContentMaxBytes: 512 * 1024, // 512KB - cache content during prefilter to avoid double reads
-  maxResults: 5, // Maximum number of semantic search results to return
-  watchFiles: true, // Enable file system watcher to re-index changed files in real-time
-};
-const DEFAULT_LOGGING_CONFIG = {
-  verbose: false, // Enable detailed logging for debugging and progress tracking
-  memoryLogIntervalMs: 5000, // Verbose memory log cadence during indexing (ms)
-};
-const DEFAULT_CACHE_CONFIG = {
-  enableCache: true, // Whether to persist and reload embeddings between sessions
-  saveReaderWaitTimeoutMs: 5000, // Max wait for active reads before saving binary cache
-  cacheVectorAssumeFinite: true, // Assume vectors are finite (skip validation)
-  cacheVectorFloatDigits: null, // Decimal precision for cached vectors (null = default)
-  cacheWriteHighWaterMark: 262144, // Write stream highWaterMark for cache files
-  cacheVectorFlushChars: 262144, // Flush threshold (chars) for JSON writer
-  cacheVectorCheckFinite: true, // Validate vectors contain only finite numbers
-  cacheVectorNoMutation: false, // Avoid mutating vectors during serialization
-  cacheVectorJoinThreshold: 8192, // Join threshold for JSON array chunks
-  cacheVectorJoinChunkSize: 2048, // Chunk size for JSON join optimization
-};
-const DEFAULT_WORKER_CONFIG = {
-  workerThreads: 'auto', // 0 = run in main thread (no workers), "auto" = CPU cores - 1, or set a number
-  workerBatchTimeoutMs: 120000, // Timeout per worker batch before fallback (ms)
-  workerFailureThreshold: 1, // Open circuit after N worker failures
-  workerFailureCooldownMs: 10 * 60 * 1000, // Cooldown before retrying workers
-  workerMaxChunksPerBatch: 100, // Cap chunks per worker batch to reduce hang risk
-  allowSingleThreadFallback: false, // Allow fallback to main-thread embeddings if workers fail
-  failFastEmbeddingErrors: false, // Abort worker embedding batch after repeated consecutive embed failures
-};
-const DEFAULT_EMBEDDING_CONFIG = {
-  embeddingModel: 'jinaai/jina-embeddings-v2-base-code', // AI model ID used for semantic search
-  embeddingDimension: null, // null = full dimensions, or 64/128/256/512/768 for MRL-trained models
-  preloadEmbeddingModel: true, // Preload the embedding model at startup (server mode)
-  embeddingProcessPerBatch: false, // Use child process per batch for memory isolation
-  autoEmbeddingProcessPerBatch: true, // Auto-enable child process embedding in single-threaded mode for heavy models
-  embeddingBatchSize: null, // Override embedding batch size (null = auto)
-  embeddingProcessNumThreads: 8, // ONNX threads used by embedding child process
-  embeddingProcessGcRssThresholdMb: EMBEDDING_PROCESS_DEFAULT_GC_RSS_THRESHOLD_MB, // RSS threshold for embedding-child adaptive GC
-  embeddingProcessGcMinIntervalMs: EMBEDDING_PROCESS_DEFAULT_GC_MIN_INTERVAL_MS, // Minimum interval between embedding-child GC runs
-  embeddingProcessGcMaxRequestsWithoutCollection:
-    EMBEDDING_PROCESS_DEFAULT_GC_MAX_REQUESTS_WITHOUT_COLLECTION, // Backstop GC cadence for embedding child
-};
-const DEFAULT_VECTOR_STORE_CONFIG = {
-  vectorStoreFormat: 'binary', // json | binary | sqlite (binary uses mmap-friendly on-disk store)
-  vectorStoreContentMode: 'external', // external = content loaded on-demand for binary store
-  contentCacheEntries: 256, // In-memory content cache entries for binary store
-  vectorStoreLoadMode: 'memory', // memory | disk (disk streams vectors from disk / memory is faster but requires more RAM)
-  vectorCacheEntries: 0, // In-memory vector cache entries for disk-backed loads
-};
-const DEFAULT_SEARCH_CONFIG = {
-  semanticWeight: 0.7, // Balance between semantic and keyword scores (0.0 to 1.0)
-  exactMatchBoost: 1.5, // Multiplier applied when an exact string match is found
-  recencyBoost: 0.1, // Boost for recently modified files (max 0.1 added to score)
-  recencyDecayDays: 30, // After this many days, recency boost is 0
-  textMatchMaxCandidates: 2000, // Max candidates for full text matching before deferring
-};
-const DEFAULT_CALL_GRAPH_CONFIG = {
-  callGraphEnabled: true, // Enable call graph extraction for proximity boosting
-  callGraphBoost: 0.15, // Boost for files related via call graph (0-1)
-  callGraphMaxHops: 1, // How many levels of calls to follow (1 = direct only)
-};
-const DEFAULT_ANN_CONFIG = {
-  annEnabled: true, // Enable Approximate Nearest Neighbor (ANN) index for large codebases
-  annMinChunks: 5000, // Minimum number of chunks required to trigger ANN indexing
-  annMinCandidates: 50, // Minimum initial candidates to pull from ANN before refinement
-  annMaxCandidates: 200, // Hard limit on the number of ANN candidates to process
-  annCandidateMultiplier: 20, // Scale initial search depth based on requested maxResults
-  annEfConstruction: 200, // HNSW index construction quality (higher = better index, slower build)
-  annEfSearch: 64, // HNSW search parameter (higher = more accurate, slower search)
-  annM: 16, // Number of connections per element in HNSW index
-  annIndexCache: true, // Whether to cache the built HNSW index on disk
-  annMetric: 'cosine', // Distance metric for similarity (currently locked to cosine)
-};
-const MEMORY_CLEANUP_KEYS = Object.freeze(Object.keys(DEFAULT_MEMORY_CLEANUP_CONFIG));
-const INDEXING_KEYS = Object.freeze(Object.keys(DEFAULT_INDEXING_CONFIG));
-const LOGGING_KEYS = Object.freeze(Object.keys(DEFAULT_LOGGING_CONFIG));
-const CACHE_KEYS = Object.freeze(Object.keys(DEFAULT_CACHE_CONFIG));
-const WORKER_KEYS = Object.freeze(Object.keys(DEFAULT_WORKER_CONFIG));
-const EMBEDDING_KEYS = Object.freeze(Object.keys(DEFAULT_EMBEDDING_CONFIG));
-const VECTOR_STORE_KEYS = Object.freeze(Object.keys(DEFAULT_VECTOR_STORE_CONFIG));
-const SEARCH_KEYS = Object.freeze(Object.keys(DEFAULT_SEARCH_CONFIG));
-const CALL_GRAPH_KEYS = Object.freeze(Object.keys(DEFAULT_CALL_GRAPH_CONFIG));
-const ANN_KEYS = Object.freeze(Object.keys(DEFAULT_ANN_CONFIG));
-const DEFAULT_CONFIG = {
+import {
+  EMBEDDING_PROCESS_DEFAULT_GC_MAX_REQUESTS_WITHOUT_COLLECTION,
+  EMBEDDING_PROCESS_DEFAULT_GC_MIN_INTERVAL_MS,
+  EMBEDDING_PROCESS_DEFAULT_GC_RSS_THRESHOLD_MB,
+} from './constants.js';
+import { getWorkspaceEnvKeys } from './workspace-env.js';
+const DEFAULT_MEMORY_CLEANUP_CONFIG = {
+  enableExplicitGc: true, // Require --expose-gc for more aggressive memory cleanup
+  clearCacheAfterIndex: true, // Drop in-memory vectors after indexing completes
+  unloadModelAfterIndex: true, // Unload embedding model from memory after indexing completes to free RAM
+  shutdownQueryEmbeddingPoolAfterIndex: true, // Force shutdown search embedding child pool after index operations
+  unloadModelAfterSearch: true, // Unload embedding model after search queries to keep memory low (trades speed for RAM)
+  embeddingPoolIdleTimeoutMs: 2000, // Idle timeout before killing persistent embedding child process (ms)
+  incrementalGcThresholdMb: 512, // RSS threshold for optional incremental GC
+  incrementalMemoryProfile: false, // Enable phase-level incremental indexing memory traces (diagnostics)
+  recycleServerOnHighRssAfterIncremental: false, // Recycle server process after incremental cleanup if RSS remains high
+  recycleServerOnHighRssThresholdMb: 4096, // RSS threshold (MB) that triggers incremental recycle
+  recycleServerOnHighRssCooldownMs: 300000, // Minimum interval between recycle attempts
+  recycleServerOnHighRssDelayMs: 2000, // Delay before recycle to allow logs/responses to flush
+};
+const DEFAULT_INDEXING_CONFIG = {
+  smartIndexing: true, // Enable automatic project type detection and smart ignore patterns
+  chunkSize: 16, // Lines per chunk (tuned for speed/memory balance)
+  chunkOverlap: 4, // Overlap between chunks for context continuity
+  batchSize: 50, // Number of files to process in a single indexing batch
+  maxFileSize: 1048576, // 1MB - skip files larger than this
+  prefilterContentMaxBytes: 512 * 1024, // 512KB - cache content during prefilter to avoid double reads
+  maxResults: 5, // Maximum number of semantic search results to return
+  watchFiles: true, // Enable file system watcher to re-index changed files in real-time
+};
+const DEFAULT_LOGGING_CONFIG = {
+  verbose: false, // Enable detailed logging for debugging and progress tracking
+  memoryLogIntervalMs: 5000, // Verbose memory log cadence during indexing (ms)
+};
+const DEFAULT_CACHE_CONFIG = {
+  enableCache: true, // Whether to persist and reload embeddings between sessions
+  saveReaderWaitTimeoutMs: 5000, // Max wait for active reads before saving binary cache
+  cacheVectorAssumeFinite: true, // Assume vectors are finite (skip validation)
+  cacheVectorFloatDigits: null, // Decimal precision for cached vectors (null = default)
+  cacheWriteHighWaterMark: 262144, // Write stream highWaterMark for cache files
+  cacheVectorFlushChars: 262144, // Flush threshold (chars) for JSON writer
+  cacheVectorCheckFinite: true, // Validate vectors contain only finite numbers
+  cacheVectorNoMutation: false, // Avoid mutating vectors during serialization
+  cacheVectorJoinThreshold: 8192, // Join threshold for JSON array chunks
+  cacheVectorJoinChunkSize: 2048, // Chunk size for JSON join optimization
+};
+const DEFAULT_WORKER_CONFIG = {
+  workerThreads: 'auto', // 0 = run in main thread (no workers), "auto" = CPU cores - 1, or set a number
+  workerBatchTimeoutMs: 120000, // Timeout per worker batch before fallback (ms)
+  workerFailureThreshold: 1, // Open circuit after N worker failures
+  workerFailureCooldownMs: 10 * 60 * 1000, // Cooldown before retrying workers
+  workerMaxChunksPerBatch: 100, // Cap chunks per worker batch to reduce hang risk
+  allowSingleThreadFallback: false, // Allow fallback to main-thread embeddings if workers fail
+  failFastEmbeddingErrors: false, // Abort worker embedding batch after repeated consecutive embed failures
+};
+const DEFAULT_EMBEDDING_CONFIG = {
+  embeddingModel: 'jinaai/jina-embeddings-v2-base-code', // AI model ID used for semantic search
+  embeddingDimension: null, // null = full dimensions, or 64/128/256/512/768 for MRL-trained models
+  preloadEmbeddingModel: true, // Preload the embedding model at startup (server mode)
+  embeddingProcessPerBatch: false, // Use child process per batch for memory isolation
+  autoEmbeddingProcessPerBatch: true, // Auto-enable child process embedding in single-threaded mode for heavy models
+  embeddingBatchSize: null, // Override embedding batch size (null = auto)
+  embeddingProcessNumThreads: 8, // ONNX threads used by embedding child process
+  embeddingProcessGcRssThresholdMb: EMBEDDING_PROCESS_DEFAULT_GC_RSS_THRESHOLD_MB, // RSS threshold for embedding-child adaptive GC
+  embeddingProcessGcMinIntervalMs: EMBEDDING_PROCESS_DEFAULT_GC_MIN_INTERVAL_MS, // Minimum interval between embedding-child GC runs
+  embeddingProcessGcMaxRequestsWithoutCollection:
+    EMBEDDING_PROCESS_DEFAULT_GC_MAX_REQUESTS_WITHOUT_COLLECTION, // Backstop GC cadence for embedding child
+};
+const DEFAULT_VECTOR_STORE_CONFIG = {
+  vectorStoreFormat: 'binary', // json | binary | sqlite (binary uses mmap-friendly on-disk store)
+  vectorStoreContentMode: 'external', // external = content loaded on-demand for binary store
+  contentCacheEntries: 256, // In-memory content cache entries for binary store
+  vectorStoreLoadMode: 'memory', // memory | disk (disk streams vectors from disk / memory is faster but requires more RAM)
+  vectorCacheEntries: 0, // In-memory vector cache entries for disk-backed loads
+};
+const DEFAULT_SEARCH_CONFIG = {
+  semanticWeight: 0.7, // Balance between semantic and keyword scores (0.0 to 1.0)
+  exactMatchBoost: 1.5, // Multiplier applied when an exact string match is found
+  recencyBoost: 0.1, // Boost for recently modified files (max 0.1 added to score)
+  recencyDecayDays: 30, // After this many days, recency boost is 0
+  textMatchMaxCandidates: 2000, // Max candidates for full text matching before deferring
+};
+const DEFAULT_CALL_GRAPH_CONFIG = {
+  callGraphEnabled: true, // Enable call graph extraction for proximity boosting
+  callGraphBoost: 0.15, // Boost for files related via call graph (0-1)
+  callGraphMaxHops: 1, // How many levels of calls to follow (1 = direct only)
+};
+const DEFAULT_ANN_CONFIG = {
+  annEnabled: true, // Enable Approximate Nearest Neighbor (ANN) index for large codebases
+  annMinChunks: 5000, // Minimum number of chunks required to trigger ANN indexing
+  annMinCandidates: 50, // Minimum initial candidates to pull from ANN before refinement
+  annMaxCandidates: 200, // Hard limit on the number of ANN candidates to process
+  annCandidateMultiplier: 20, // Scale initial search depth based on requested maxResults
+  annEfConstruction: 200, // HNSW index construction quality (higher = better index, slower build)
+  annEfSearch: 64, // HNSW search parameter (higher = more accurate, slower search)
+  annM: 16, // Number of connections per element in HNSW index
+  annIndexCache: true, // Whether to cache the built HNSW index on disk
+  annMetric: 'cosine', // Distance metric for similarity (currently locked to cosine)
+};
+const MEMORY_CLEANUP_KEYS = Object.freeze(Object.keys(DEFAULT_MEMORY_CLEANUP_CONFIG));
+const INDEXING_KEYS = Object.freeze(Object.keys(DEFAULT_INDEXING_CONFIG));
+const LOGGING_KEYS = Object.freeze(Object.keys(DEFAULT_LOGGING_CONFIG));
+const CACHE_KEYS = Object.freeze(Object.keys(DEFAULT_CACHE_CONFIG));
+const WORKER_KEYS = Object.freeze(Object.keys(DEFAULT_WORKER_CONFIG));
+const EMBEDDING_KEYS = Object.freeze(Object.keys(DEFAULT_EMBEDDING_CONFIG));
+const VECTOR_STORE_KEYS = Object.freeze(Object.keys(DEFAULT_VECTOR_STORE_CONFIG));
+const SEARCH_KEYS = Object.freeze(Object.keys(DEFAULT_SEARCH_CONFIG));
+const CALL_GRAPH_KEYS = Object.freeze(Object.keys(DEFAULT_CALL_GRAPH_CONFIG));
+const ANN_KEYS = Object.freeze(Object.keys(DEFAULT_ANN_CONFIG));
+const DEFAULT_CONFIG = {
   searchDirectory: '.',
   fileExtensions: [
     // JavaScript/TypeScript
@@ -361,16 +362,16 @@ const DEFAULT_CONFIG = {
     '**/scripts/**',
     '**/tools/**',
   ],
-  chunkSize: DEFAULT_INDEXING_CONFIG.chunkSize,
-  chunkOverlap: DEFAULT_INDEXING_CONFIG.chunkOverlap,
-  batchSize: DEFAULT_INDEXING_CONFIG.batchSize,
-  maxFileSize: DEFAULT_INDEXING_CONFIG.maxFileSize,
-  prefilterContentMaxBytes: DEFAULT_INDEXING_CONFIG.prefilterContentMaxBytes,
-  maxResults: DEFAULT_INDEXING_CONFIG.maxResults,
-  enableCache: DEFAULT_CACHE_CONFIG.enableCache,
-  cacheDirectory: null, // Will be set dynamically by loadConfig()
-  // Cache cleanup behavior (consolidated namespace)
-  cacheCleanup: {
+  chunkSize: DEFAULT_INDEXING_CONFIG.chunkSize,
+  chunkOverlap: DEFAULT_INDEXING_CONFIG.chunkOverlap,
+  batchSize: DEFAULT_INDEXING_CONFIG.batchSize,
+  maxFileSize: DEFAULT_INDEXING_CONFIG.maxFileSize,
+  prefilterContentMaxBytes: DEFAULT_INDEXING_CONFIG.prefilterContentMaxBytes,
+  maxResults: DEFAULT_INDEXING_CONFIG.maxResults,
+  enableCache: DEFAULT_CACHE_CONFIG.enableCache,
+  cacheDirectory: null, // Will be set dynamically by loadConfig()
+  // Cache cleanup behavior (consolidated namespace)
+  cacheCleanup: {
     autoCleanup: true, // Automatically remove stale caches on startup
     staleNoMetaHours: 6, // Hours before incomplete cache (no meta.json) is considered stale
     emptyThresholdHours: 24, // Hours before empty cache (0 files/chunks) is removed
@@ -378,97 +379,86 @@ const DEFAULT_CONFIG = {
     maxUnusedDays: 30, // Days before unused cache is removed
     tempThresholdHours: 24, // Hours before temp workspace cache is removed
     staleProgressHours: 6, // Hours before stuck indexing is considered stale
-    safetyWindowMinutes: 10, // Minutes of recent activity to never delete
-    removeDuplicates: true, // Remove duplicate workspace caches
-  },
-  watchFiles: DEFAULT_INDEXING_CONFIG.watchFiles,
-  verbose: DEFAULT_LOGGING_CONFIG.verbose,
-  memoryLogIntervalMs: DEFAULT_LOGGING_CONFIG.memoryLogIntervalMs,
-  saveReaderWaitTimeoutMs: DEFAULT_CACHE_CONFIG.saveReaderWaitTimeoutMs,
-  workerThreads: DEFAULT_WORKER_CONFIG.workerThreads,
-  workerBatchTimeoutMs: DEFAULT_WORKER_CONFIG.workerBatchTimeoutMs,
-  workerFailureThreshold: DEFAULT_WORKER_CONFIG.workerFailureThreshold,
-  workerFailureCooldownMs: DEFAULT_WORKER_CONFIG.workerFailureCooldownMs,
-  workerMaxChunksPerBatch: DEFAULT_WORKER_CONFIG.workerMaxChunksPerBatch,
-  allowSingleThreadFallback: DEFAULT_WORKER_CONFIG.allowSingleThreadFallback,
-  failFastEmbeddingErrors: DEFAULT_WORKER_CONFIG.failFastEmbeddingErrors,
-  embeddingProcessPerBatch: DEFAULT_EMBEDDING_CONFIG.embeddingProcessPerBatch,
-  autoEmbeddingProcessPerBatch: DEFAULT_EMBEDDING_CONFIG.autoEmbeddingProcessPerBatch,
-  embeddingBatchSize: DEFAULT_EMBEDDING_CONFIG.embeddingBatchSize,
-  embeddingProcessNumThreads: DEFAULT_EMBEDDING_CONFIG.embeddingProcessNumThreads,
-  embeddingProcessGcRssThresholdMb: DEFAULT_EMBEDDING_CONFIG.embeddingProcessGcRssThresholdMb,
-  embeddingProcessGcMinIntervalMs: DEFAULT_EMBEDDING_CONFIG.embeddingProcessGcMinIntervalMs,
-  embeddingProcessGcMaxRequestsWithoutCollection:
-    DEFAULT_EMBEDDING_CONFIG.embeddingProcessGcMaxRequestsWithoutCollection,
-  enableExplicitGc: DEFAULT_MEMORY_CLEANUP_CONFIG.enableExplicitGc,
-  embeddingModel: DEFAULT_EMBEDDING_CONFIG.embeddingModel,
-  embeddingDimension: DEFAULT_EMBEDDING_CONFIG.embeddingDimension,
-  preloadEmbeddingModel: DEFAULT_EMBEDDING_CONFIG.preloadEmbeddingModel,
-  vectorStoreFormat: DEFAULT_VECTOR_STORE_CONFIG.vectorStoreFormat,
-  vectorStoreContentMode: DEFAULT_VECTOR_STORE_CONFIG.vectorStoreContentMode,
-  contentCacheEntries: DEFAULT_VECTOR_STORE_CONFIG.contentCacheEntries,
-  vectorStoreLoadMode: DEFAULT_VECTOR_STORE_CONFIG.vectorStoreLoadMode,
-  vectorCacheEntries: DEFAULT_VECTOR_STORE_CONFIG.vectorCacheEntries,
-  clearCacheAfterIndex: DEFAULT_MEMORY_CLEANUP_CONFIG.clearCacheAfterIndex,
-  unloadModelAfterIndex: DEFAULT_MEMORY_CLEANUP_CONFIG.unloadModelAfterIndex,
-  shutdownQueryEmbeddingPoolAfterIndex:
-    DEFAULT_MEMORY_CLEANUP_CONFIG.shutdownQueryEmbeddingPoolAfterIndex,
-  unloadModelAfterSearch: DEFAULT_MEMORY_CLEANUP_CONFIG.unloadModelAfterSearch,
-  embeddingPoolIdleTimeoutMs: DEFAULT_MEMORY_CLEANUP_CONFIG.embeddingPoolIdleTimeoutMs,
-  incrementalGcThresholdMb: DEFAULT_MEMORY_CLEANUP_CONFIG.incrementalGcThresholdMb,
-  incrementalMemoryProfile: DEFAULT_MEMORY_CLEANUP_CONFIG.incrementalMemoryProfile,
-  recycleServerOnHighRssAfterIncremental:
-    DEFAULT_MEMORY_CLEANUP_CONFIG.recycleServerOnHighRssAfterIncremental,
-  recycleServerOnHighRssThresholdMb:
-    DEFAULT_MEMORY_CLEANUP_CONFIG.recycleServerOnHighRssThresholdMb,
-  recycleServerOnHighRssCooldownMs:
-    DEFAULT_MEMORY_CLEANUP_CONFIG.recycleServerOnHighRssCooldownMs,
-  recycleServerOnHighRssDelayMs: DEFAULT_MEMORY_CLEANUP_CONFIG.recycleServerOnHighRssDelayMs,
-  memoryCleanup: { ...DEFAULT_MEMORY_CLEANUP_CONFIG },
-  semanticWeight: DEFAULT_SEARCH_CONFIG.semanticWeight,
-  exactMatchBoost: DEFAULT_SEARCH_CONFIG.exactMatchBoost,
-  recencyBoost: DEFAULT_SEARCH_CONFIG.recencyBoost,
-  recencyDecayDays: DEFAULT_SEARCH_CONFIG.recencyDecayDays,
-  textMatchMaxCandidates: DEFAULT_SEARCH_CONFIG.textMatchMaxCandidates,
-  smartIndexing: DEFAULT_INDEXING_CONFIG.smartIndexing,
-  callGraphEnabled: DEFAULT_CALL_GRAPH_CONFIG.callGraphEnabled,
-  callGraphBoost: DEFAULT_CALL_GRAPH_CONFIG.callGraphBoost,
-  callGraphMaxHops: DEFAULT_CALL_GRAPH_CONFIG.callGraphMaxHops,
-  annEnabled: DEFAULT_ANN_CONFIG.annEnabled,
-  annMinChunks: DEFAULT_ANN_CONFIG.annMinChunks,
-  annMinCandidates: DEFAULT_ANN_CONFIG.annMinCandidates,
-  annMaxCandidates: DEFAULT_ANN_CONFIG.annMaxCandidates,
-  annCandidateMultiplier: DEFAULT_ANN_CONFIG.annCandidateMultiplier,
-  annEfConstruction: DEFAULT_ANN_CONFIG.annEfConstruction,
-  annEfSearch: DEFAULT_ANN_CONFIG.annEfSearch,
-  annM: DEFAULT_ANN_CONFIG.annM,
-  annIndexCache: DEFAULT_ANN_CONFIG.annIndexCache,
-  annMetric: DEFAULT_ANN_CONFIG.annMetric,
-  indexing: { ...DEFAULT_INDEXING_CONFIG },
-  logging: { ...DEFAULT_LOGGING_CONFIG },
-  cache: { ...DEFAULT_CACHE_CONFIG },
-  worker: { ...DEFAULT_WORKER_CONFIG },
-  embedding: { ...DEFAULT_EMBEDDING_CONFIG },
-  vectorStore: { ...DEFAULT_VECTOR_STORE_CONFIG },
-  search: { ...DEFAULT_SEARCH_CONFIG },
-  callGraph: { ...DEFAULT_CALL_GRAPH_CONFIG },
-  ann: { ...DEFAULT_ANN_CONFIG },
-};
+    safetyWindowMinutes: 10, // Minutes of recent activity to never delete
+    removeDuplicates: true, // Remove duplicate workspace caches
+  },
+  watchFiles: DEFAULT_INDEXING_CONFIG.watchFiles,
+  verbose: DEFAULT_LOGGING_CONFIG.verbose,
+  memoryLogIntervalMs: DEFAULT_LOGGING_CONFIG.memoryLogIntervalMs,
+  saveReaderWaitTimeoutMs: DEFAULT_CACHE_CONFIG.saveReaderWaitTimeoutMs,
+  workerThreads: DEFAULT_WORKER_CONFIG.workerThreads,
+  workerBatchTimeoutMs: DEFAULT_WORKER_CONFIG.workerBatchTimeoutMs,
+  workerFailureThreshold: DEFAULT_WORKER_CONFIG.workerFailureThreshold,
+  workerFailureCooldownMs: DEFAULT_WORKER_CONFIG.workerFailureCooldownMs,
+  workerMaxChunksPerBatch: DEFAULT_WORKER_CONFIG.workerMaxChunksPerBatch,
+  allowSingleThreadFallback: DEFAULT_WORKER_CONFIG.allowSingleThreadFallback,
+  failFastEmbeddingErrors: DEFAULT_WORKER_CONFIG.failFastEmbeddingErrors,
+  embeddingProcessPerBatch: DEFAULT_EMBEDDING_CONFIG.embeddingProcessPerBatch,
+  autoEmbeddingProcessPerBatch: DEFAULT_EMBEDDING_CONFIG.autoEmbeddingProcessPerBatch,
+  embeddingBatchSize: DEFAULT_EMBEDDING_CONFIG.embeddingBatchSize,
+  embeddingProcessNumThreads: DEFAULT_EMBEDDING_CONFIG.embeddingProcessNumThreads,
+  embeddingProcessGcRssThresholdMb: DEFAULT_EMBEDDING_CONFIG.embeddingProcessGcRssThresholdMb,
+  embeddingProcessGcMinIntervalMs: DEFAULT_EMBEDDING_CONFIG.embeddingProcessGcMinIntervalMs,
+  embeddingProcessGcMaxRequestsWithoutCollection:
+    DEFAULT_EMBEDDING_CONFIG.embeddingProcessGcMaxRequestsWithoutCollection,
+  enableExplicitGc: DEFAULT_MEMORY_CLEANUP_CONFIG.enableExplicitGc,
+  embeddingModel: DEFAULT_EMBEDDING_CONFIG.embeddingModel,
+  embeddingDimension: DEFAULT_EMBEDDING_CONFIG.embeddingDimension,
+  preloadEmbeddingModel: DEFAULT_EMBEDDING_CONFIG.preloadEmbeddingModel,
+  vectorStoreFormat: DEFAULT_VECTOR_STORE_CONFIG.vectorStoreFormat,
+  vectorStoreContentMode: DEFAULT_VECTOR_STORE_CONFIG.vectorStoreContentMode,
+  contentCacheEntries: DEFAULT_VECTOR_STORE_CONFIG.contentCacheEntries,
+  vectorStoreLoadMode: DEFAULT_VECTOR_STORE_CONFIG.vectorStoreLoadMode,
+  vectorCacheEntries: DEFAULT_VECTOR_STORE_CONFIG.vectorCacheEntries,
+  clearCacheAfterIndex: DEFAULT_MEMORY_CLEANUP_CONFIG.clearCacheAfterIndex,
+  unloadModelAfterIndex: DEFAULT_MEMORY_CLEANUP_CONFIG.unloadModelAfterIndex,
+  shutdownQueryEmbeddingPoolAfterIndex:
+    DEFAULT_MEMORY_CLEANUP_CONFIG.shutdownQueryEmbeddingPoolAfterIndex,
+  unloadModelAfterSearch: DEFAULT_MEMORY_CLEANUP_CONFIG.unloadModelAfterSearch,
+  embeddingPoolIdleTimeoutMs: DEFAULT_MEMORY_CLEANUP_CONFIG.embeddingPoolIdleTimeoutMs,
+  incrementalGcThresholdMb: DEFAULT_MEMORY_CLEANUP_CONFIG.incrementalGcThresholdMb,
+  incrementalMemoryProfile: DEFAULT_MEMORY_CLEANUP_CONFIG.incrementalMemoryProfile,
+  recycleServerOnHighRssAfterIncremental:
+    DEFAULT_MEMORY_CLEANUP_CONFIG.recycleServerOnHighRssAfterIncremental,
+  recycleServerOnHighRssThresholdMb:
+    DEFAULT_MEMORY_CLEANUP_CONFIG.recycleServerOnHighRssThresholdMb,
+  recycleServerOnHighRssCooldownMs:
+    DEFAULT_MEMORY_CLEANUP_CONFIG.recycleServerOnHighRssCooldownMs,
+  recycleServerOnHighRssDelayMs: DEFAULT_MEMORY_CLEANUP_CONFIG.recycleServerOnHighRssDelayMs,
+  memoryCleanup: { ...DEFAULT_MEMORY_CLEANUP_CONFIG },
+  semanticWeight: DEFAULT_SEARCH_CONFIG.semanticWeight,
+  exactMatchBoost: DEFAULT_SEARCH_CONFIG.exactMatchBoost,
+  recencyBoost: DEFAULT_SEARCH_CONFIG.recencyBoost,
+  recencyDecayDays: DEFAULT_SEARCH_CONFIG.recencyDecayDays,
+  textMatchMaxCandidates: DEFAULT_SEARCH_CONFIG.textMatchMaxCandidates,
+  smartIndexing: DEFAULT_INDEXING_CONFIG.smartIndexing,
+  callGraphEnabled: DEFAULT_CALL_GRAPH_CONFIG.callGraphEnabled,
+  callGraphBoost: DEFAULT_CALL_GRAPH_CONFIG.callGraphBoost,
+  callGraphMaxHops: DEFAULT_CALL_GRAPH_CONFIG.callGraphMaxHops,
+  annEnabled: DEFAULT_ANN_CONFIG.annEnabled,
+  annMinChunks: DEFAULT_ANN_CONFIG.annMinChunks,
+  annMinCandidates: DEFAULT_ANN_CONFIG.annMinCandidates,
+  annMaxCandidates: DEFAULT_ANN_CONFIG.annMaxCandidates,
+  annCandidateMultiplier: DEFAULT_ANN_CONFIG.annCandidateMultiplier,
+  annEfConstruction: DEFAULT_ANN_CONFIG.annEfConstruction,
+  annEfSearch: DEFAULT_ANN_CONFIG.annEfSearch,
+  annM: DEFAULT_ANN_CONFIG.annM,
+  annIndexCache: DEFAULT_ANN_CONFIG.annIndexCache,
+  annMetric: DEFAULT_ANN_CONFIG.annMetric,
+  indexing: { ...DEFAULT_INDEXING_CONFIG },
+  logging: { ...DEFAULT_LOGGING_CONFIG },
+  cache: { ...DEFAULT_CACHE_CONFIG },
+  worker: { ...DEFAULT_WORKER_CONFIG },
+  embedding: { ...DEFAULT_EMBEDDING_CONFIG },
+  vectorStore: { ...DEFAULT_VECTOR_STORE_CONFIG },
+  search: { ...DEFAULT_SEARCH_CONFIG },
+  callGraph: { ...DEFAULT_CALL_GRAPH_CONFIG },
+  ann: { ...DEFAULT_ANN_CONFIG },
+};
 let config = { ...DEFAULT_CONFIG };
-const WORKSPACE_ENV_VARS = [
-  'HEURISTIC_MCP_WORKSPACE',
-  'MCP_WORKSPACE',
-  'WORKSPACE_FOLDER',
-  'WORKSPACE_ROOT',
-  'CURSOR_WORKSPACE',
-  'CLAUDE_WORKSPACE',
-  'ANTIGRAVITY_WORKSPACE',
-  'INIT_CWD',
-];
-const WORKSPACE_MARKERS = [
+const WORKSPACE_MARKERS = [
   '.git',
   'package.json',
   'pyproject.toml',
@@ -480,118 +470,118 @@ const WORKSPACE_MARKERS = [
   'requirements.txt',
   'Gemfile',
   'Makefile',
-  'CMakeLists.txt',
-];
-function hasOwn(obj, key) {
-  return Object.prototype.hasOwnProperty.call(obj, key);
-}
-const CONFIG_NAMESPACES = Object.freeze([
-  {
-    name: 'memoryCleanup',
-    keys: MEMORY_CLEANUP_KEYS,
-    defaults: DEFAULT_MEMORY_CLEANUP_CONFIG,
-  },
-  {
-    name: 'indexing',
-    keys: INDEXING_KEYS,
-    defaults: DEFAULT_INDEXING_CONFIG,
-  },
-  {
-    name: 'logging',
-    keys: LOGGING_KEYS,
-    defaults: DEFAULT_LOGGING_CONFIG,
-  },
-  {
-    name: 'cache',
-    keys: CACHE_KEYS,
-    defaults: DEFAULT_CACHE_CONFIG,
-  },
-  {
-    name: 'worker',
-    keys: WORKER_KEYS,
-    defaults: DEFAULT_WORKER_CONFIG,
-  },
-  {
-    name: 'embedding',
-    keys: EMBEDDING_KEYS,
-    defaults: DEFAULT_EMBEDDING_CONFIG,
-  },
-  {
-    name: 'vectorStore',
-    keys: VECTOR_STORE_KEYS,
-    defaults: DEFAULT_VECTOR_STORE_CONFIG,
-  },
-  {
-    name: 'search',
-    keys: SEARCH_KEYS,
-    defaults: DEFAULT_SEARCH_CONFIG,
-  },
-  {
-    name: 'callGraph',
-    keys: CALL_GRAPH_KEYS,
-    defaults: DEFAULT_CALL_GRAPH_CONFIG,
-  },
-  {
-    name: 'ann',
-    keys: ANN_KEYS,
-    defaults: DEFAULT_ANN_CONFIG,
-  },
-]);
-function applyNamespace(targetConfig, sourceConfig, namespaceName, keys, defaults) {
-  const sourceNamespace =
-    sourceConfig && typeof sourceConfig[namespaceName] === 'object'
-      ? sourceConfig[namespaceName]
-      : {};
-  const mergedNamespace = {
-    ...defaults,
-    ...(targetConfig[namespaceName] && typeof targetConfig[namespaceName] === 'object'
-      ? targetConfig[namespaceName]
-      : {}),
-  };
-  for (const key of keys) {
-    if (hasOwn(sourceNamespace, key)) {
-      targetConfig[key] = mergedNamespace[key];
-    } else {
-      mergedNamespace[key] = targetConfig[key];
-    }
-  }
-  targetConfig[namespaceName] = mergedNamespace;
-}
-function syncNamespace(targetConfig, namespaceName, keys, defaults) {
-  const currentNamespace =
-    targetConfig[namespaceName] && typeof targetConfig[namespaceName] === 'object'
-      ? targetConfig[namespaceName]
-      : {};
-  const mergedNamespace = { ...defaults, ...currentNamespace };
-  for (const key of keys) {
-    mergedNamespace[key] = targetConfig[key];
-  }
-  targetConfig[namespaceName] = mergedNamespace;
-}
-function applyAllNamespaces(targetConfig, sourceConfig) {
-  for (const namespace of CONFIG_NAMESPACES) {
-    applyNamespace(
-      targetConfig,
-      sourceConfig,
-      namespace.name,
-      namespace.keys,
-      namespace.defaults
-    );
-  }
-}
-function syncAllNamespaces(targetConfig) {
-  for (const namespace of CONFIG_NAMESPACES) {
-    syncNamespace(targetConfig, namespace.name, namespace.keys, namespace.defaults);
-  }
-}
+  'CMakeLists.txt',
+];
+/**
+ * Reports whether `key` is an own (non-inherited) property of `obj`.
+ * The lookup goes through Object.prototype, so it does not rely on `obj`
+ * providing its own `hasOwnProperty` method.
+ * @param {object} obj - Object to inspect.
+ * @param {string} key - Property name to look for.
+ * @returns {boolean} True when `obj` itself defines `key`.
+ */
+function hasOwn(obj, key) {
+  return Object.prototype.hasOwnProperty.call(obj, key);
+}
+/**
+ * Descriptors for the nested config namespaces, consumed by applyAllNamespaces()
+ * and syncAllNamespaces(). Each entry provides:
+ *   - name:     property on the config object that holds the nested namespace object
+ *   - keys:     key names that exist both at the top level of the config and inside the namespace
+ *   - defaults: default values used to seed the namespace object
+ * Object.freeze() is shallow: the array cannot be modified, the entries themselves are not frozen.
+ */
+const CONFIG_NAMESPACES = Object.freeze([
+  {
+    name: 'memoryCleanup',
+    keys: MEMORY_CLEANUP_KEYS,
+    defaults: DEFAULT_MEMORY_CLEANUP_CONFIG,
+  },
+  {
+    name: 'indexing',
+    keys: INDEXING_KEYS,
+    defaults: DEFAULT_INDEXING_CONFIG,
+  },
+  {
+    name: 'logging',
+    keys: LOGGING_KEYS,
+    defaults: DEFAULT_LOGGING_CONFIG,
+  },
+  {
+    name: 'cache',
+    keys: CACHE_KEYS,
+    defaults: DEFAULT_CACHE_CONFIG,
+  },
+  {
+    name: 'worker',
+    keys: WORKER_KEYS,
+    defaults: DEFAULT_WORKER_CONFIG,
+  },
+  {
+    name: 'embedding',
+    keys: EMBEDDING_KEYS,
+    defaults: DEFAULT_EMBEDDING_CONFIG,
+  },
+  {
+    name: 'vectorStore',
+    keys: VECTOR_STORE_KEYS,
+    defaults: DEFAULT_VECTOR_STORE_CONFIG,
+  },
+  {
+    name: 'search',
+    keys: SEARCH_KEYS,
+    defaults: DEFAULT_SEARCH_CONFIG,
+  },
+  {
+    name: 'callGraph',
+    keys: CALL_GRAPH_KEYS,
+    defaults: DEFAULT_CALL_GRAPH_CONFIG,
+  },
+  {
+    name: 'ann',
+    keys: ANN_KEYS,
+    defaults: DEFAULT_ANN_CONFIG,
+  },
+]);
+/**
+ * Reconciles one namespaced config section with its flat top-level keys.
+ * Mutates `targetConfig` in place.
+ *
+ * The namespace object is rebuilt as `defaults` overlaid with whatever
+ * `targetConfig[namespaceName]` already holds. Then, for every key in `keys`:
+ *   - if `sourceConfig[namespaceName]` defines the key itself, the merged
+ *     namespace value is copied onto the flat key `targetConfig[key]`;
+ *   - otherwise the flat value `targetConfig[key]` is copied into the namespace.
+ *
+ * @param {object} targetConfig - Config object to update.
+ * @param {object} sourceConfig - Config whose namespace decides which side wins per key; may be falsy.
+ * @param {string} namespaceName - Property name of the namespace object.
+ * @param {string[]} keys - Key names shared by the flat config and the namespace.
+ * @param {object} defaults - Default values for the namespace.
+ * @returns {void}
+ */
+function applyNamespace(targetConfig, sourceConfig, namespaceName, keys, defaults) {
+  // typeof null is 'object', so null has to be rejected explicitly: hasOwn() throws
+  // on a null receiver, which made a source config such as { search: null } crash here.
+  const rawSourceNamespace = sourceConfig ? sourceConfig[namespaceName] : undefined;
+  const sourceNamespace =
+    rawSourceNamespace && typeof rawSourceNamespace === 'object' ? rawSourceNamespace : {};
+  const mergedNamespace = {
+    ...defaults,
+    ...(targetConfig[namespaceName] && typeof targetConfig[namespaceName] === 'object'
+      ? targetConfig[namespaceName]
+      : {}),
+  };
+  for (const key of keys) {
+    if (hasOwn(sourceNamespace, key)) {
+      // Key was set inside the source namespace: the namespaced value overrides the flat key.
+      targetConfig[key] = mergedNamespace[key];
+    } else {
+      // Key was not set inside the source namespace: mirror the flat value into the namespace.
+      mergedNamespace[key] = targetConfig[key];
+    }
+  }
+  targetConfig[namespaceName] = mergedNamespace;
+}
+/**
+ * Rebuilds one namespace object so that it mirrors the flat top-level keys.
+ * Mutates `targetConfig` in place.
+ *
+ * The new namespace is `defaults` overlaid with the existing namespace object
+ * (when it is a non-null object), and then every key in `keys` is overwritten
+ * with the flat value `targetConfig[key]`, so the flat value always wins.
+ *
+ * @param {object} targetConfig - Config object to update.
+ * @param {string} namespaceName - Property name of the namespace object.
+ * @param {string[]} keys - Key names shared by the flat config and the namespace.
+ * @param {object} defaults - Default values for the namespace.
+ * @returns {void}
+ */
+function syncNamespace(targetConfig, namespaceName, keys, defaults) {
+  const currentNamespace =
+    targetConfig[namespaceName] && typeof targetConfig[namespaceName] === 'object'
+      ? targetConfig[namespaceName]
+      : {};
+  const mergedNamespace = { ...defaults, ...currentNamespace };
+  for (const key of keys) {
+    mergedNamespace[key] = targetConfig[key];
+  }
+  targetConfig[namespaceName] = mergedNamespace;
+}
+/**
+ * Runs applyNamespace() for every entry of CONFIG_NAMESPACES, in list order.
+ * Mutates `targetConfig` in place.
+ * @param {object} targetConfig - Config object to update.
+ * @param {object} sourceConfig - Config passed through to applyNamespace() as the source.
+ * @returns {void}
+ */
+function applyAllNamespaces(targetConfig, sourceConfig) {
+  for (const namespace of CONFIG_NAMESPACES) {
+    applyNamespace(
+      targetConfig,
+      sourceConfig,
+      namespace.name,
+      namespace.keys,
+      namespace.defaults
+    );
+  }
+}
+/**
+ * Runs syncNamespace() for every entry of CONFIG_NAMESPACES, in list order,
+ * so each namespace object reflects the current flat top-level values.
+ * Mutates `targetConfig` in place.
+ * @param {object} targetConfig - Config object to update.
+ * @returns {void}
+ */
+function syncAllNamespaces(targetConfig) {
+  for (const namespace of CONFIG_NAMESPACES) {
+    syncNamespace(targetConfig, namespace.name, namespace.keys, namespace.defaults);
+  }
+}
 async function pathExists(filePath) {
   try {
@@ -627,20 +617,86 @@ async function findWorkspaceRoot(startDir) {
   return path.resolve(startDir);
 }
+/**
+ * Turns a raw workspace value into an absolute directory path, or null when it is unusable.
+ * Returns null for an empty value, a value containing the literal `${`
+ * (presumably an unexpanded placeholder — confirm), a path that does not exist,
+ * a path that is not a directory, or a path whose stat() call fails.
+ * @param {string|undefined} rawValue - Candidate value; resolveWorkspaceDir() passes process.env entries.
+ * @returns {Promise<string|null>} The resolved absolute directory path, or null.
+ */
+async function resolveWorkspaceCandidate(rawValue) {
+  if (!rawValue || rawValue.includes('${')) return null;
+  const candidate = path.resolve(rawValue);
+  // NOTE(review): the guarded fs.stat() below also rejects missing paths, so this
+  // probe may be redundant — confirm against pathExists() before removing it.
+  if (!(await pathExists(candidate))) return null;
+  try {
+    const stats = await fs.stat(candidate);
+    if (!stats.isDirectory()) return null;
+  } catch {
+    // Any stat failure is treated as "not a usable workspace".
+    return null;
+  }
+  return candidate;
+}
+/**
+ * Logs, via console.info, how the workspace path was chosen.
+ * Does nothing when `resolution` or `resolution.path` is falsy.
+ *
+ * Handled `resolution.source` values:
+ *   - 'workspace-arg':   path came from an explicit workspace argument
+ *   - 'env':             path came from the environment variable named by `resolution.envKey`
+ *   - 'test-cwd':        process.cwd() used in test mode
+ *   - 'cwd-root-search': workspace root found starting from `resolution.fromPath`
+ * Any other source, including 'env' without an `envKey`, falls through to the
+ * generic process.cwd() message.
+ *
+ * @param {{path: string, source: string, envKey?: string, fromPath?: string}} resolution
+ * @returns {void}
+ */
+function logWorkspaceResolution(resolution) {
+  if (!resolution || !resolution.path) return;
+  if (resolution.source === 'workspace-arg') {
+    console.info(`[Config] Workspace resolution: --workspace -> ${resolution.path}`);
+    return;
+  }
+  if (resolution.source === 'env' && resolution.envKey) {
+    console.info(`[Config] Workspace resolution: env ${resolution.envKey} -> ${resolution.path}`);
+    return;
+  }
+  if (resolution.source === 'test-cwd') {
+    console.info(`[Config] Workspace resolution: process.cwd() (test mode) -> ${resolution.path}`);
+    return;
+  }
+  if (resolution.source === 'cwd-root-search') {
+    // fromPath is optional; fall back to the current working directory for the message.
+    const from = resolution.fromPath || process.cwd();
+    console.info(
+      `[Config] Workspace resolution: workspace root from cwd (${from}) -> ${resolution.path}`
+    );
+    return;
+  }
+  console.info(`[Config] Workspace resolution: process.cwd() -> ${resolution.path}`);
+}
+/**
+ * Determines the workspace directory and reports where it came from.
+ * The first match wins, in this order:
+ *   1. an explicit `workspaceDir` argument                       -> source 'workspace-arg'
+ *   2. test mode (VITEST === 'true' or NODE_ENV === 'test')       -> source 'test-cwd'
+ *   3. the first environment variable, among the keys returned by
+ *      getWorkspaceEnvKeys() (defined outside this section), that
+ *      resolveWorkspaceCandidate() accepts                         -> source 'env' plus `envKey`
+ *   4. a result from findWorkspaceRoot() that differs from the
+ *      resolved cwd                                                -> source 'cwd-root-search' plus `fromPath`
+ *   5. the resolved current working directory                     -> source 'cwd'
+ * @param {string|null} workspaceDir - Explicit workspace directory, or a falsy value to auto-detect.
+ * @returns {Promise<{path: string, source: string, envKey?: string, fromPath?: string}>}
+ */
 async function resolveWorkspaceDir(workspaceDir) {
-  if (workspaceDir) return path.resolve(workspaceDir);
+  if (workspaceDir) {
+    return {
+      path: path.resolve(workspaceDir),
+      source: 'workspace-arg',
+    };
+  }
   if (process.env.VITEST === 'true' || process.env.NODE_ENV === 'test') {
-    return path.resolve(process.cwd());
+    return {
+      path: path.resolve(process.cwd()),
+      source: 'test-cwd',
+    };
   }
-  for (const key of WORKSPACE_ENV_VARS) {
-    const value = process.env[key];
-    if (!value || value.includes('${')) continue;
-    const candidate = path.resolve(value);
-    if (await pathExists(candidate)) return candidate;
+  for (const key of getWorkspaceEnvKeys()) {
+    const candidate = await resolveWorkspaceCandidate(process.env[key]);
+    if (candidate) {
+      return {
+        path: candidate,
+        source: 'env',
+        envKey: key,
+      };
+    }
   }
-  return await findWorkspaceRoot(process.cwd());
+  const cwd = path.resolve(process.cwd());
+  const root = await findWorkspaceRoot(cwd);
+  if (root !== cwd) {
+    return {
+      path: root,
+      source: 'cwd-root-search',
+      fromPath: cwd,
+    };
+  }
+  return {
+    path: cwd,
+    source: 'cwd',
+  };
 }
 export async function loadConfig(workspaceDir = null) {
@@ -652,14 +708,18 @@ export async function loadConfig(workspaceDir = null) {
     let serverDir = null;
     if (workspaceDir) {
       // Workspace mode: load config from workspace root
-      baseDir = path.resolve(workspaceDir);
+      const workspaceResolution = await resolveWorkspaceDir(workspaceDir);
+      baseDir = workspaceResolution.path;
       console.info(`[Config] Workspace mode: ${baseDir}`);
+      logWorkspaceResolution(workspaceResolution);
     } else {
       // Server mode: load config from server directory for global settings,
       // but use process.cwd() as base for searching if not specified otherwise
       const scriptDir = path.dirname(fileURLToPath(import.meta.url));
       serverDir = path.resolve(scriptDir, '..');
-      baseDir = await resolveWorkspaceDir(null);
+      const workspaceResolution = await resolveWorkspaceDir(null);
+      baseDir = workspaceResolution.path;
+      logWorkspaceResolution(workspaceResolution);
     }
     let userConfig = {};
@@ -699,16 +759,16 @@ export async function loadConfig(workspaceDir = null) {
       }
     }
-    config = { ...DEFAULT_CONFIG, ...userConfig };
-    applyAllNamespaces(config, userConfig);
-    // Backward compatibility for legacy top-level cache cleanup toggle.
-    if (
-      hasOwn(userConfig, 'autoCleanStaleCaches') &&
-      !(userConfig.cacheCleanup && hasOwn(userConfig.cacheCleanup, 'autoCleanup'))
-    ) {
-      config.cacheCleanup.autoCleanup = Boolean(userConfig.autoCleanStaleCaches);
-    }
+    config = { ...DEFAULT_CONFIG, ...userConfig };
+    applyAllNamespaces(config, userConfig);
+    // Backward compatibility for legacy top-level cache cleanup toggle.
+    if (
+      hasOwn(userConfig, 'autoCleanStaleCaches') &&
+      !(userConfig.cacheCleanup && hasOwn(userConfig.cacheCleanup, 'autoCleanup'))
+    ) {
+      config.cacheCleanup.autoCleanup = Boolean(userConfig.autoCleanStaleCaches);
+    }
     // Set search directory (respect user override when provided)
     if (userConfig.searchDirectory) {
@@ -990,74 +1050,74 @@ export async function loadConfig(workspaceDir = null) {
     }
   }
-  if (process.env.SMART_CODING_INCREMENTAL_GC_THRESHOLD_MB !== undefined) {
-    const value = parseInt(process.env.SMART_CODING_INCREMENTAL_GC_THRESHOLD_MB, 10);
-    if (!isNaN(value) && value >= 0) {
-      config.incrementalGcThresholdMb = value;
+  if (process.env.SMART_CODING_INCREMENTAL_GC_THRESHOLD_MB !== undefined) {
+    const value = parseInt(process.env.SMART_CODING_INCREMENTAL_GC_THRESHOLD_MB, 10);
+    if (!isNaN(value) && value >= 0) {
+      config.incrementalGcThresholdMb = value;
     } else {
       console.warn(
         `[Config] Invalid SMART_CODING_INCREMENTAL_GC_THRESHOLD_MB: ${process.env.SMART_CODING_INCREMENTAL_GC_THRESHOLD_MB}, using default`
-      );
-    }
-  }
-  if (process.env.SMART_CODING_INCREMENTAL_MEMORY_PROFILE !== undefined) {
-    const value = process.env.SMART_CODING_INCREMENTAL_MEMORY_PROFILE;
-    if (value === 'true' || value === 'false') {
-      config.incrementalMemoryProfile = value === 'true';
-    } else {
-      console.warn(
-        `[Config] Invalid SMART_CODING_INCREMENTAL_MEMORY_PROFILE: ${value}, using default`
-      );
-    }
-  }
-  if (process.env.SMART_CODING_RECYCLE_SERVER_ON_HIGH_RSS_AFTER_INCREMENTAL !== undefined) {
-    const value = process.env.SMART_CODING_RECYCLE_SERVER_ON_HIGH_RSS_AFTER_INCREMENTAL;
-    if (value === 'true' || value === 'false') {
-      config.recycleServerOnHighRssAfterIncremental = value === 'true';
-    } else {
-      console.warn(
-        `[Config] Invalid SMART_CODING_RECYCLE_SERVER_ON_HIGH_RSS_AFTER_INCREMENTAL: ${value}, using default`
-      );
-    }
-  }
-  if (process.env.SMART_CODING_RECYCLE_SERVER_RSS_THRESHOLD_MB !== undefined) {
-    const value = parseInt(process.env.SMART_CODING_RECYCLE_SERVER_RSS_THRESHOLD_MB, 10);
-    if (!isNaN(value) && value > 0) {
-      config.recycleServerOnHighRssThresholdMb = value;
-    } else {
-      console.warn(
-        `[Config] Invalid SMART_CODING_RECYCLE_SERVER_RSS_THRESHOLD_MB: ${process.env.SMART_CODING_RECYCLE_SERVER_RSS_THRESHOLD_MB}, using default`
-      );
-    }
-  }
-  if (process.env.SMART_CODING_RECYCLE_SERVER_COOLDOWN_MS !== undefined) {
-    const value = parseInt(process.env.SMART_CODING_RECYCLE_SERVER_COOLDOWN_MS, 10);
-    if (!isNaN(value) && value >= 0) {
-      config.recycleServerOnHighRssCooldownMs = value;
-    } else {
-      console.warn(
-        `[Config] Invalid SMART_CODING_RECYCLE_SERVER_COOLDOWN_MS: ${process.env.SMART_CODING_RECYCLE_SERVER_COOLDOWN_MS}, using default`
-      );
-    }
-  }
-  if (process.env.SMART_CODING_RECYCLE_SERVER_DELAY_MS !== undefined) {
-    const value = parseInt(process.env.SMART_CODING_RECYCLE_SERVER_DELAY_MS, 10);
-    if (!isNaN(value) && value >= 0) {
-      config.recycleServerOnHighRssDelayMs = value;
-    } else {
-      console.warn(
-        `[Config] Invalid SMART_CODING_RECYCLE_SERVER_DELAY_MS: ${process.env.SMART_CODING_RECYCLE_SERVER_DELAY_MS}, using default`
-      );
-    }
-  }
-  if (process.env.SMART_CODING_CONTENT_CACHE_ENTRIES !== undefined) {
-    const value = parseInt(process.env.SMART_CODING_CONTENT_CACHE_ENTRIES, 10);
+      );
+    }
+  }
+  if (process.env.SMART_CODING_INCREMENTAL_MEMORY_PROFILE !== undefined) {
+    const value = process.env.SMART_CODING_INCREMENTAL_MEMORY_PROFILE;
+    if (value === 'true' || value === 'false') {
+      config.incrementalMemoryProfile = value === 'true';
+    } else {
+      console.warn(
+        `[Config] Invalid SMART_CODING_INCREMENTAL_MEMORY_PROFILE: ${value}, using default`
+      );
+    }
+  }
+  if (process.env.SMART_CODING_RECYCLE_SERVER_ON_HIGH_RSS_AFTER_INCREMENTAL !== undefined) {
+    const value = process.env.SMART_CODING_RECYCLE_SERVER_ON_HIGH_RSS_AFTER_INCREMENTAL;
+    if (value === 'true' || value === 'false') {
+      config.recycleServerOnHighRssAfterIncremental = value === 'true';
+    } else {
+      console.warn(
+        `[Config] Invalid SMART_CODING_RECYCLE_SERVER_ON_HIGH_RSS_AFTER_INCREMENTAL: ${value}, using default`
+      );
+    }
+  }
+  if (process.env.SMART_CODING_RECYCLE_SERVER_RSS_THRESHOLD_MB !== undefined) {
+    const value = parseInt(process.env.SMART_CODING_RECYCLE_SERVER_RSS_THRESHOLD_MB, 10);
+    if (!isNaN(value) && value > 0) {
+      config.recycleServerOnHighRssThresholdMb = value;
+    } else {
+      console.warn(
+        `[Config] Invalid SMART_CODING_RECYCLE_SERVER_RSS_THRESHOLD_MB: ${process.env.SMART_CODING_RECYCLE_SERVER_RSS_THRESHOLD_MB}, using default`
+      );
+    }
+  }
+  if (process.env.SMART_CODING_RECYCLE_SERVER_COOLDOWN_MS !== undefined) {
+    const value = parseInt(process.env.SMART_CODING_RECYCLE_SERVER_COOLDOWN_MS, 10);
+    if (!isNaN(value) && value >= 0) {
+      config.recycleServerOnHighRssCooldownMs = value;
+    } else {
+      console.warn(
+        `[Config] Invalid SMART_CODING_RECYCLE_SERVER_COOLDOWN_MS: ${process.env.SMART_CODING_RECYCLE_SERVER_COOLDOWN_MS}, using default`
+      );
+    }
+  }
+  if (process.env.SMART_CODING_RECYCLE_SERVER_DELAY_MS !== undefined) {
+    const value = parseInt(process.env.SMART_CODING_RECYCLE_SERVER_DELAY_MS, 10);
+    if (!isNaN(value) && value >= 0) {
+      config.recycleServerOnHighRssDelayMs = value;
+    } else {
+      console.warn(
+        `[Config] Invalid SMART_CODING_RECYCLE_SERVER_DELAY_MS: ${process.env.SMART_CODING_RECYCLE_SERVER_DELAY_MS}, using default`
+      );
+    }
+  }
+  if (process.env.SMART_CODING_CONTENT_CACHE_ENTRIES !== undefined) {
+    const value = parseInt(process.env.SMART_CODING_CONTENT_CACHE_ENTRIES, 10);
     if (!isNaN(value) && value >= 0 && value <= 10000) {
       config.contentCacheEntries = value;
     } else {
@@ -1354,9 +1414,9 @@ export async function loadConfig(workspaceDir = null) {
     }
   }
-  if (
-    config.embeddingProcessGcMaxRequestsWithoutCollection !== null &&
-    config.embeddingProcessGcMaxRequestsWithoutCollection !== undefined
+  if (
+    config.embeddingProcessGcMaxRequestsWithoutCollection !== null &&
+    config.embeddingProcessGcMaxRequestsWithoutCollection !== undefined
   ) {
     const value = parseInt(config.embeddingProcessGcMaxRequestsWithoutCollection, 10);
     if (!isNaN(value) && value > 0) {
@@ -1365,14 +1425,14 @@ export async function loadConfig(workspaceDir = null) {
       console.warn(
         `[Config] Invalid embeddingProcessGcMaxRequestsWithoutCollection: ${config.embeddingProcessGcMaxRequestsWithoutCollection}, using default`
       );
-      config.embeddingProcessGcMaxRequestsWithoutCollection =
-        DEFAULT_CONFIG.embeddingProcessGcMaxRequestsWithoutCollection;
-    }
-  }
-  syncAllNamespaces(config);
-  return config;
-}
+      config.embeddingProcessGcMaxRequestsWithoutCollection =
+        DEFAULT_CONFIG.embeddingProcessGcMaxRequestsWithoutCollection;
+    }
+  }
+  syncAllNamespaces(config);
+  return config;
+}
 /**
  * Get platform-specific global cache directory