npm - mdcontext - Versions diffs - 0.1.0 → 0.2.0 - Mend

mdcontext 0.1.0 → 0.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (251) hide show

package/.changeset/config.json +9 -9
package/.claude/settings.local.json +25 -0
package/.github/workflows/claude-code-review.yml +44 -0
package/.github/workflows/claude.yml +85 -0
package/CONTRIBUTING.md +186 -0
package/NOTES/NOTES +44 -0
package/README.md +206 -3
package/biome.json +1 -1
package/dist/chunk-23UPXDNL.js +3044 -0
package/dist/chunk-2W7MO2DL.js +1366 -0
package/dist/chunk-3NUAZGMA.js +1689 -0
package/dist/chunk-7TOWB2XB.js +366 -0
package/dist/chunk-7XOTOADQ.js +3065 -0
package/dist/chunk-AH2PDM2K.js +3042 -0
package/dist/chunk-BNXWSZ63.js +3742 -0
package/dist/chunk-BTL5DJVU.js +3222 -0
package/dist/chunk-HDHYG7E4.js +104 -0
package/dist/chunk-HLR4KZBP.js +3234 -0
package/dist/chunk-IP3FRFEB.js +1045 -0
package/dist/chunk-KHU56VDO.js +3042 -0
package/dist/chunk-KRYIFLQR.js +85 -89
package/dist/chunk-LBSDNLEM.js +287 -0
package/dist/chunk-MNTQ7HCP.js +2643 -0
package/dist/chunk-MUJELQQ6.js +1387 -0
package/dist/chunk-MXJGMSLV.js +2199 -0
package/dist/chunk-N6QJGC3Z.js +2636 -0
package/dist/chunk-OBELGBPM.js +1713 -0
package/dist/chunk-OT7R5XTA.js +3192 -0
package/dist/chunk-P7X4RA2T.js +106 -0
package/dist/chunk-PIDUQNC2.js +3185 -0
package/dist/chunk-POGCDIH4.js +3187 -0
package/dist/chunk-PSIEOQGZ.js +3043 -0
package/dist/chunk-PVRT3IHA.js +3238 -0
package/dist/chunk-QNN4TT23.js +1430 -0
package/dist/chunk-RE3R45RJ.js +3042 -0
package/dist/chunk-S7E6TFX6.js +718 -657
package/dist/chunk-SG6GLU4U.js +1378 -0
package/dist/chunk-SJCDV2ST.js +274 -0
package/dist/chunk-SYE5XLF3.js +104 -0
package/dist/chunk-T5VLYBZD.js +103 -0
package/dist/chunk-TOQB7VWU.js +3238 -0
package/dist/chunk-VFNMZ4ZQ.js +3228 -0
package/dist/chunk-VVTGZNBT.js +1533 -1423
package/dist/chunk-W7Q4RFEV.js +104 -0
package/dist/chunk-XTYYVRLO.js +3190 -0
package/dist/chunk-Y6MDYVJD.js +3063 -0
package/dist/cli/main.js +4072 -629
package/dist/index.d.ts +420 -33
package/dist/index.js +8 -15
package/dist/mcp/server.js +103 -7
package/dist/schema-BAWSG7KY.js +22 -0
package/dist/schema-E3QUPL26.js +20 -0
package/dist/schema-EHL7WUT6.js +20 -0
package/docs/019-USAGE.md +44 -5
package/docs/020-current-implementation.md +8 -8
package/docs/021-DOGFOODING-FINDINGS.md +1 -1
package/docs/CONFIG.md +1123 -0
package/docs/ERRORS.md +383 -0
package/docs/summarization.md +320 -0
package/justfile +40 -0
package/package.json +39 -33
package/research/INDEX.md +315 -0
package/research/code-review/README.md +90 -0
package/research/code-review/cli-error-handling-review.md +979 -0
package/research/code-review/code-review-validation-report.md +464 -0
package/research/code-review/main-ts-review.md +1128 -0
package/research/config-docs/SUMMARY.md +357 -0
package/research/config-docs/TEST-RESULTS.md +776 -0
package/research/config-docs/TODO.md +542 -0
package/research/config-docs/analysis.md +744 -0
package/research/config-docs/fix-validation.md +502 -0
package/research/config-docs/help-audit.md +264 -0
package/research/config-docs/help-system-analysis.md +890 -0
package/research/frontmatter/COMMENTS-ARE-SKIPPED.md +149 -0
package/research/frontmatter/LLM-CODE-NAVIGATION.md +276 -0
package/research/issue-review.md +603 -0
package/research/llm-summarization/agent-cli-tools-2026.md +1082 -0
package/research/llm-summarization/alternative-providers-2026.md +1428 -0
package/research/llm-summarization/anthropic-2026.md +367 -0
package/research/llm-summarization/claude-cli-integration.md +1706 -0
package/research/llm-summarization/cli-integration-patterns.md +3155 -0
package/research/llm-summarization/openai-2026.md +473 -0
package/research/llm-summarization/openai-compatible-providers-2026.md +1022 -0
package/research/llm-summarization/opencode-cli-integration.md +1552 -0
package/research/llm-summarization/prompt-engineering-2026.md +1426 -0
package/research/llm-summarization/prototype-results.md +56 -0
package/research/llm-summarization/provider-switching-patterns-2026.md +2153 -0
package/research/llm-summarization/typescript-llm-libraries-2026.md +2436 -0
package/research/mdcontext-pudding/00-EXECUTIVE-SUMMARY.md +282 -0
package/research/mdcontext-pudding/01-index-embed.md +956 -0
package/research/mdcontext-pudding/02-search-COMMANDS.md +142 -0
package/research/mdcontext-pudding/02-search-SUMMARY.md +146 -0
package/research/mdcontext-pudding/02-search.md +970 -0
package/research/mdcontext-pudding/03-context.md +779 -0
package/research/mdcontext-pudding/04-navigation-and-analytics.md +803 -0
package/research/mdcontext-pudding/04-tree.md +704 -0
package/research/mdcontext-pudding/05-config.md +1038 -0
package/research/mdcontext-pudding/06-links-summary.txt +87 -0
package/research/mdcontext-pudding/06-links.md +679 -0
package/research/mdcontext-pudding/07-stats.md +693 -0
package/research/mdcontext-pudding/BUG-FIX-PLAN.md +388 -0
package/research/mdcontext-pudding/P0-BUG-VALIDATION.md +167 -0
package/research/mdcontext-pudding/README.md +168 -0
package/research/mdcontext-pudding/TESTING-SUMMARY.md +128 -0
package/research/research-quality-review.md +834 -0
package/research/semantic-search/embedding-text-analysis.md +156 -0
package/research/semantic-search/multi-word-failure-reproduction.md +171 -0
package/research/semantic-search/query-processing-analysis.md +207 -0
package/research/semantic-search/root-cause-and-solution.md +114 -0
package/research/semantic-search/threshold-validation-report.md +69 -0
package/research/semantic-search/vector-search-analysis.md +63 -0
package/research/test-path-issues.md +276 -0
package/review/ALP-76/1-error-type-design.md +962 -0
package/review/ALP-76/2-error-handling-patterns.md +906 -0
package/review/ALP-76/3-error-presentation.md +624 -0
package/review/ALP-76/4-test-coverage.md +625 -0
package/review/ALP-76/5-migration-completeness.md +440 -0
package/review/ALP-76/6-effect-best-practices.md +755 -0
package/scripts/apply-branch-protection.sh +47 -0
package/scripts/branch-protection-templates.json +79 -0
package/scripts/prototype-summarization.ts +346 -0
package/scripts/rebuild-hnswlib.js +32 -37
package/scripts/setup-branch-protection.sh +64 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/.mdcontext/active-provider.json +7 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/.mdcontext/bm25.json +541 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/.mdcontext/bm25.meta.json +5 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/.mdcontext/config.json +8 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/.mdcontext/embeddings/openai_text-embedding-3-small_512/vectors.bin +0 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/.mdcontext/embeddings/openai_text-embedding-3-small_512/vectors.meta.bin +0 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/.mdcontext/indexes/documents.json +60 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/.mdcontext/indexes/links.json +13 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/.mdcontext/indexes/sections.json +1197 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/configuration-management.md +99 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/distributed-systems.md +92 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/error-handling.md +78 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/failure-automation.md +55 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/job-context.md +69 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/process-orchestration.md +99 -0
package/src/cli/argv-preprocessor.test.ts +2 -2
package/src/cli/cli.test.ts +230 -33
package/src/cli/commands/config-cmd.ts +642 -0
package/src/cli/commands/context.ts +97 -9
package/src/cli/commands/duplicates.ts +122 -0
package/src/cli/commands/embeddings.ts +529 -0
package/src/cli/commands/index-cmd.ts +210 -30
package/src/cli/commands/index.ts +3 -0
package/src/cli/commands/search.ts +894 -64
package/src/cli/commands/stats.ts +3 -0
package/src/cli/commands/tree.ts +26 -5
package/src/cli/config-layer.ts +176 -0
package/src/cli/error-handler.test.ts +235 -0
package/src/cli/error-handler.ts +655 -0
package/src/cli/flag-schemas.ts +66 -0
package/src/cli/help.ts +209 -7
package/src/cli/main.ts +348 -58
package/src/cli/options.ts +10 -0
package/src/cli/shared-error-handling.ts +199 -0
package/src/cli/utils.ts +150 -17
package/src/config/file-provider.test.ts +320 -0
package/src/config/file-provider.ts +273 -0
package/src/config/index.ts +72 -0
package/src/config/integration.test.ts +667 -0
package/src/config/precedence.test.ts +277 -0
package/src/config/precedence.ts +451 -0
package/src/config/schema.test.ts +414 -0
package/src/config/schema.ts +603 -0
package/src/config/service.test.ts +320 -0
package/src/config/service.ts +243 -0
package/src/config/testing.test.ts +264 -0
package/src/config/testing.ts +110 -0
package/src/core/types.ts +6 -33
package/src/duplicates/detector.test.ts +183 -0
package/src/duplicates/detector.ts +414 -0
package/src/duplicates/index.ts +18 -0
package/src/embeddings/embedding-namespace.test.ts +300 -0
package/src/embeddings/embedding-namespace.ts +947 -0
package/src/embeddings/heading-boost.test.ts +222 -0
package/src/embeddings/hnsw-build-options.test.ts +198 -0
package/src/embeddings/hyde.test.ts +272 -0
package/src/embeddings/hyde.ts +264 -0
package/src/embeddings/index.ts +2 -0
package/src/embeddings/openai-provider.ts +332 -83
package/src/embeddings/pricing.json +22 -0
package/src/embeddings/provider-constants.ts +204 -0
package/src/embeddings/provider-errors.test.ts +967 -0
package/src/embeddings/provider-errors.ts +565 -0
package/src/embeddings/provider-factory.test.ts +240 -0
package/src/embeddings/provider-factory.ts +225 -0
package/src/embeddings/provider-integration.test.ts +788 -0
package/src/embeddings/query-preprocessing.test.ts +187 -0
package/src/embeddings/semantic-search-threshold.test.ts +508 -0
package/src/embeddings/semantic-search.ts +780 -93
package/src/embeddings/types.ts +293 -16
package/src/embeddings/vector-store.ts +486 -77
package/src/embeddings/voyage-provider.ts +313 -0
package/src/errors/errors.test.ts +845 -0
package/src/errors/index.ts +533 -0
package/src/index/ignore-patterns.test.ts +354 -0
package/src/index/ignore-patterns.ts +305 -0
package/src/index/indexer.ts +286 -48
package/src/index/storage.ts +94 -30
package/src/index/types.ts +40 -2
package/src/index/watcher.ts +67 -9
package/src/index.ts +22 -0
package/src/integration/search-keyword.test.ts +678 -0
package/src/mcp/server.ts +135 -6
package/src/parser/parser.ts +18 -19
package/src/parser/section-filter.test.ts +277 -0
package/src/parser/section-filter.ts +125 -3
package/src/search/__tests__/hybrid-search.test.ts +650 -0
package/src/search/bm25-store.ts +366 -0
package/src/search/cross-encoder.test.ts +253 -0
package/src/search/cross-encoder.ts +406 -0
package/src/search/fuzzy-search.test.ts +419 -0
package/src/search/fuzzy-search.ts +273 -0
package/src/search/hybrid-search.ts +448 -0
package/src/search/path-matcher.test.ts +276 -0
package/src/search/path-matcher.ts +33 -0
package/src/search/searcher.test.ts +99 -1
package/src/search/searcher.ts +189 -67
package/src/search/wink-bm25.d.ts +30 -0
package/src/summarization/cli-providers/claude.ts +202 -0
package/src/summarization/cli-providers/detection.test.ts +273 -0
package/src/summarization/cli-providers/detection.ts +118 -0
package/src/summarization/cli-providers/index.ts +8 -0
package/src/summarization/cost.test.ts +139 -0
package/src/summarization/cost.ts +102 -0
package/src/summarization/error-handler.test.ts +127 -0
package/src/summarization/error-handler.ts +111 -0
package/src/summarization/index.ts +102 -0
package/src/summarization/pipeline.test.ts +498 -0
package/src/summarization/pipeline.ts +231 -0
package/src/summarization/prompts.test.ts +269 -0
package/src/summarization/prompts.ts +133 -0
package/src/summarization/provider-factory.test.ts +396 -0
package/src/summarization/provider-factory.ts +178 -0
package/src/summarization/types.ts +184 -0
package/src/summarize/summarizer.ts +104 -35
package/src/types/huggingface-transformers.d.ts +66 -0
package/tests/fixtures/cli/.mdcontext/active-provider.json +7 -0
package/tests/fixtures/cli/.mdcontext/embeddings/openai_text-embedding-3-small_512/vectors.bin +0 -0
package/tests/fixtures/cli/.mdcontext/embeddings/openai_text-embedding-3-small_512/vectors.meta.bin +0 -0
package/tests/fixtures/cli/.mdcontext/indexes/documents.json +4 -4
package/tests/fixtures/cli/.mdcontext/indexes/sections.json +14 -0
package/tests/integration/embed-index.test.ts +712 -0
package/tests/integration/search-context.test.ts +469 -0
package/tests/integration/search-semantic.test.ts +522 -0
package/vitest.config.ts +1 -6
package/AGENTS.md +0 -46
package/tests/fixtures/cli/.mdcontext/vectors.bin +0 -0
package/tests/fixtures/cli/.mdcontext/vectors.meta.json +0 -1264

package/src/embeddings/query-preprocessing.test.ts ADDED Viewed

@@ -0,0 +1,187 @@
+/**
+ * Query Preprocessing Tests
+ *
+ * Tests for query preprocessing before embedding generation.
+ * Preprocessing normalizes queries to improve semantic search recall.
+ */
+import { describe, expect, it } from 'vitest'
+import { preprocessQuery, type SemanticSearchOptions } from './types.js'
+describe('Query Preprocessing', () => {
+  describe('preprocessQuery function', () => {
+    /**
+     * Feeds each [input, expected] pair to preprocessQuery, in order, and
+     * asserts the normalized result.
+     */
+    const expectNormalized = (
+      cases: ReadonlyArray<readonly [string, string]>,
+    ): void => {
+      for (const [input, expected] of cases) {
+        expect(preprocessQuery(input)).toBe(expected)
+      }
+    }
+    it('should convert query to lowercase', () => {
+      expectNormalized([
+        ['How Does Authentication Work', 'how does authentication work'],
+      ])
+    })
+    it('should replace punctuation with spaces', () => {
+      expectNormalized([
+        ['user-authentication', 'user authentication'],
+        ['what is config.json?', 'what is config json'],
+        ['test@example.com', 'test example com'],
+      ])
+    })
+    it('should collapse multiple spaces to single space', () => {
+      expectNormalized([
+        ['how   does   it   work', 'how does it work'],
+        ['user  -  auth', 'user auth'],
+      ])
+    })
+    it('should trim leading/trailing whitespace', () => {
+      expectNormalized([
+        ['  query  ', 'query'],
+        ['   how does it work   ', 'how does it work'],
+      ])
+    })
+    it('should handle empty string', () => {
+      expectNormalized([['', '']])
+    })
+    it('should handle whitespace-only string', () => {
+      expectNormalized([['   ', '']])
+    })
+    it('should preserve alphanumeric content', () => {
+      expectNormalized([
+        ['user123', 'user123'],
+        ['v2 api', 'v2 api'],
+      ])
+    })
+    it('should handle complex queries', () => {
+      expectNormalized([
+        [
+          "What's the best way to handle errors?",
+          'what s the best way to handle errors',
+        ],
+        ['API v2.0 - authentication', 'api v2 0 authentication'],
+      ])
+    })
+    it('should handle special characters', () => {
+      expectNormalized([
+        ['C++ programming', 'c programming'],
+        ['Node.js', 'node js'],
+        ['$PATH variable', 'path variable'],
+      ])
+    })
+    it('should handle unicode and accented characters', () => {
+      // Accented letters are treated like punctuation: each one becomes a
+      // space (then collapsed/trimmed), so 'naïve' splits into two tokens
+      // and the trailing 'é' of 'café' disappears. Plain ASCII is untouched.
+      expectNormalized([
+        ['café', 'caf'],
+        ['naïve', 'na ve'],
+        ['cafe', 'cafe'],
+        ['naive', 'naive'],
+      ])
+    })
+    it('should handle quotes', () => {
+      expectNormalized([
+        ['"exact match"', 'exact match'],
+        ["'single quotes'", 'single quotes'],
+      ])
+    })
+    it('should handle brackets and parentheses', () => {
+      expectNormalized([
+        ['function(args)', 'function args'],
+        ['[array]', 'array'],
+        ['{object}', 'object'],
+      ])
+    })
+  })
+  describe('SemanticSearchOptions skipPreprocessing', () => {
+    it('should accept skipPreprocessing option in interface', () => {
+      // Compile-time check: the flag is part of the options type
+      const opts: SemanticSearchOptions = { skipPreprocessing: true }
+      expect(opts.skipPreprocessing).toBe(true)
+    })
+    it('should default to undefined (preprocessing enabled)', () => {
+      // An empty options object leaves the flag unset
+      const opts: SemanticSearchOptions = {}
+      expect(opts.skipPreprocessing).toBeUndefined()
+    })
+    it('should accept skipPreprocessing with other options', () => {
+      const opts: SemanticSearchOptions = {
+        limit: 10,
+        threshold: 0.35,
+        skipPreprocessing: false,
+      }
+      const { skipPreprocessing, limit, threshold } = opts
+      expect(skipPreprocessing).toBe(false)
+      expect(limit).toBe(10)
+      expect(threshold).toBe(0.35)
+    })
+  })
+  describe('Preprocessing benefits', () => {
+    it('should normalize case variations', () => {
+      // Title-case, lower-case and upper-case spellings must all normalize
+      // to the same string
+      const [titleCase, lowerCase, upperCase] = [
+        'Authentication',
+        'authentication',
+        'AUTHENTICATION',
+      ].map((query) => preprocessQuery(query))
+      expect(titleCase).toBe(lowerCase)
+      expect(lowerCase).toBe(upperCase)
+    })
+    it('should normalize punctuation variations', () => {
+      // Hyphenated and space-separated forms must normalize identically
+      const hyphenated = preprocessQuery('user-auth')
+      const spaced = preprocessQuery('user auth')
+      expect(hyphenated).toBe(spaced)
+    })
+    it('should handle file path references gracefully', () => {
+      // Path separators and the extension dot become token boundaries
+      const normalizedPath = preprocessQuery('src/components/Button.tsx')
+      expect(normalizedPath).toBe('src components button tsx')
+    })
+    it('should handle code references gracefully', () => {
+      // Call parentheses are dropped and the identifier is lowercased
+      const normalizedSnippet = preprocessQuery('function handleClick()')
+      expect(normalizedSnippet).toBe('function handleclick')
+    })
+  })
+  describe('Edge cases', () => {
+    it('should handle only punctuation', () => {
+      // Nothing but punctuation normalizes to the empty string
+      for (const punctuationOnly of ['...', '???']) {
+        expect(preprocessQuery(punctuationOnly)).toBe('')
+      }
+    })
+    it('should handle only numbers', () => {
+      const digits = '12345'
+      expect(preprocessQuery(digits)).toBe('12345')
+    })
+    it('should handle mixed numbers and punctuation', () => {
+      const normalized = preprocessQuery('123-456-789')
+      expect(normalized).toBe('123 456 789')
+    })
+    it('should handle underscores (word characters)', () => {
+      // Underscores survive normalization unchanged (presumably because the
+      // implementation treats `_` as a word character — confirm in types.ts)
+      const normalized = preprocessQuery('user_name')
+      expect(normalized).toBe('user_name')
+    })
+    it('should handle newlines', () => {
+      const normalized = preprocessQuery('line1\nline2')
+      expect(normalized).toBe('line1 line2')
+    })
+    it('should handle tabs', () => {
+      const normalized = preprocessQuery('tab\ttab')
+      expect(normalized).toBe('tab tab')
+    })
+  })
+})
+describe('Export verification', () => {
+  it('should export preprocessQuery from types module', async () => {
+    // Dynamic import so a missing export fails this test, not module loading
+    const typesModule = await import('./types.js')
+    expect(typesModule.preprocessQuery).toBeDefined()
+    expect(typeof typesModule.preprocessQuery).toBe('function')
+  })
+  it('should export preprocessQuery from main embeddings module', async () => {
+    // The embeddings barrel module must expose the same function
+    const embeddingsModule = await import('./index.js')
+    expect(embeddingsModule.preprocessQuery).toBeDefined()
+    expect(typeof embeddingsModule.preprocessQuery).toBe('function')
+  })
+})

package/src/embeddings/semantic-search-threshold.test.ts ADDED Viewed

@@ -0,0 +1,508 @@
+/**
+ * Semantic Search Threshold Tests
+ *
+ * Tests for threshold-related functionality including:
+ * - VectorStore searchWithStats() API
+ * - Below-threshold feedback mechanism
+ * - Default threshold configuration
+ * - Threshold boundary conditions
+ *
+ * Uses pre-built test corpus at:
+ * src/__tests__/fixtures/semantic-search/multi-word-corpus/
+ */
+import * as path from 'node:path'
+import { Effect } from 'effect'
+import { describe, expect, it } from 'vitest'
+import {
+  createNamespacedVectorStore,
+  createVectorStore,
+  type VectorSearchResultWithStats,
+} from './vector-store.js'
+// Location of the fixture corpus that ships with pre-built embeddings
+const TEST_CORPUS_PATH = path.join(
+  __dirname,
+  '..',
+  '__tests__',
+  'fixtures',
+  'semantic-search',
+  'multi-word-corpus',
+)
+// The fixture embeddings are 512-dimensional
+// (text-embedding-3-small with Matryoshka reduction)
+const TEST_CORPUS_DIMENSIONS = 512
+const TEST_CORPUS_PROVIDER = 'openai'
+const TEST_CORPUS_MODEL = 'text-embedding-3-small'
+/**
+ * Builds a namespaced vector store pointing at the fixture corpus, using the
+ * provider, model and dimension constants declared above.
+ */
+const createTestVectorStore = () => {
+  return createNamespacedVectorStore(
+    TEST_CORPUS_PATH,
+    TEST_CORPUS_PROVIDER,
+    TEST_CORPUS_MODEL,
+    TEST_CORPUS_DIMENSIONS,
+  )
+}
+describe('Semantic Search Threshold', () => {
+  describe('VectorStore searchWithStats', () => {
+    // Builds a fresh uniform, non-zero query vector sized for the test corpus.
+    const uniformQuery = () => new Array(TEST_CORPUS_DIMENSIONS).fill(0.1)
+    it('should load test corpus with embeddings', async () => {
+      const vectorStore = createTestVectorStore()
+      const loadResult = await Effect.runPromise(vectorStore.load())
+      expect(loadResult.loaded).toBe(true)
+      const stats = vectorStore.getStats()
+      expect(stats.count).toBeGreaterThan(0)
+      expect(stats.dimensions).toBe(TEST_CORPUS_DIMENSIONS)
+    })
+    it('should return results with searchWithStats', async () => {
+      const vectorStore = createTestVectorStore()
+      await Effect.runPromise(vectorStore.load())
+      // Use a zero threshold to get all results
+      const result = await Effect.runPromise(
+        vectorStore.searchWithStats(uniformQuery(), 10, 0),
+      )
+      expect(result.results).toBeDefined()
+      expect(Array.isArray(result.results)).toBe(true)
+      expect(result.results.length).toBeGreaterThan(0)
+    })
+    it('should track below-threshold results count', async () => {
+      const vectorStore = createTestVectorStore()
+      await Effect.runPromise(vectorStore.load())
+      // Use a very high threshold to push all results below it
+      const result = await Effect.runPromise(
+        vectorStore.searchWithStats(uniformQuery(), 10, 0.99),
+      )
+      // With 0.99 threshold, most/all results should be below threshold
+      expect(result.belowThresholdCount).toBeGreaterThanOrEqual(0)
+      // The check above is always true for a count, so also require that the
+      // candidates were accounted for: each is either returned or counted as
+      // below threshold (same invariant as the below-threshold feedback tests).
+      expect(
+        result.results.length + result.belowThresholdCount,
+      ).toBeGreaterThan(0)
+    })
+    it('should track highest below-threshold similarity', async () => {
+      const vectorStore = createTestVectorStore()
+      await Effect.runPromise(vectorStore.load())
+      // Use high threshold to force below-threshold results
+      const result = await Effect.runPromise(
+        vectorStore.searchWithStats(uniformQuery(), 10, 0.99),
+      )
+      // When there are below-threshold results, highest should be tracked
+      if (result.belowThresholdCount > 0) {
+        expect(result.belowThresholdHighest).not.toBeNull()
+        expect(result.belowThresholdHighest).toBeLessThan(0.99)
+        expect(result.belowThresholdHighest).toBeGreaterThan(0)
+      }
+    })
+    it('should return empty results when no embeddings exist', async () => {
+      // Keep the store and the query vector on the same dimensionality so the
+      // test exercises "nothing loaded", not a dimension mismatch.
+      const dimensions = 1536
+      const vectorStore = createVectorStore('/nonexistent/path', dimensions)
+      const loadResult = await Effect.runPromise(vectorStore.load())
+      expect(loadResult.loaded).toBe(false)
+      const result = await Effect.runPromise(
+        vectorStore.searchWithStats(new Array(dimensions).fill(0), 10, 0),
+      )
+      expect(result.results).toHaveLength(0)
+      expect(result.belowThresholdCount).toBe(0)
+      expect(result.belowThresholdHighest).toBeNull()
+    })
+  })
+  describe('Threshold boundaries', () => {
+    it('should return all results with threshold of 0', async () => {
+      const store = createTestVectorStore()
+      await Effect.runPromise(store.load())
+      // Threshold 0: every hit is expected to land at or above it
+      const queryVector = new Array(TEST_CORPUS_DIMENSIONS).fill(0.1)
+      const { results, belowThresholdCount } = await Effect.runPromise(
+        store.searchWithStats(queryVector, 10, 0),
+      )
+      expect(belowThresholdCount).toBe(0)
+      expect(results.length).toBeGreaterThan(0)
+    })
+    it('should return no results with threshold of 1', async () => {
+      const store = createTestVectorStore()
+      await Effect.runPromise(store.load())
+      const queryVector = new Array(TEST_CORPUS_DIMENSIONS).fill(0.1)
+      const outcome = await Effect.runPromise(
+        store.searchWithStats(queryVector, 10, 1),
+      )
+      // In practice no similarity reaches 1; a hit with similarity exactly 1
+      // would still pass, hence "at most one" rather than "none"
+      expect(outcome.results.length).toBeLessThanOrEqual(1)
+    })
+    it('should respect the limit parameter', async () => {
+      const store = createTestVectorStore()
+      await Effect.runPromise(store.load())
+      const corpusStats = store.getStats()
+      const maxResults = 3
+      const queryVector = new Array(TEST_CORPUS_DIMENSIONS).fill(0.1)
+      const outcome = await Effect.runPromise(
+        store.searchWithStats(queryVector, maxResults, 0),
+      )
+      // Never more hits than requested
+      expect(outcome.results.length).toBeLessThanOrEqual(maxResults)
+      // A non-empty corpus must yield at least one hit
+      if (corpusStats.count > 0) {
+        expect(outcome.results.length).toBeGreaterThan(0)
+      }
+    })
+  })
+  describe('Default threshold value (0.35)', () => {
+    it('should use 0.35 as the default threshold in config schema', async () => {
+      const schemaModule = await import('../config/schema.js')
+      expect(schemaModule.defaultConfig.search.minSimilarity).toBe(0.35)
+    })
+    it('should document 0.35 threshold in help text', async () => {
+      const helpModule = await import('../cli/help.js')
+      const searchEntry = helpModule.helpContent.search
+      expect(searchEntry).toBeDefined()
+      expect(searchEntry!.notes).toBeDefined()
+      // Flatten the notes into one string and look for the default value
+      const joinedNotes = (searchEntry!.notes ?? []).join(' ')
+      expect(joinedNotes).toContain('0.35')
+    })
+    it('should mention threshold in search options', async () => {
+      const helpModule = await import('../cli/help.js')
+      const searchEntry = helpModule.helpContent.search
+      expect(searchEntry).toBeDefined()
+      // Locate the --threshold flag among the documented options
+      const thresholdFlag = searchEntry!.options.find((candidate) =>
+        candidate.name.includes('--threshold'),
+      )
+      expect(thresholdFlag).toBeDefined()
+      expect(thresholdFlag?.description).toContain('0.35')
+    })
+  })
+  describe('VectorSearchResultWithStats type shape', () => {
+    it('should have correct structure', async () => {
+      const store = createTestVectorStore()
+      await Effect.runPromise(store.load())
+      const queryVector = new Array(TEST_CORPUS_DIMENSIONS).fill(0.1)
+      const outcome = await Effect.runPromise(
+        store.searchWithStats(queryVector, 10, 0.35),
+      )
+      // The assignment doubles as a compile-time check of the return type
+      const typed: VectorSearchResultWithStats = outcome
+      for (const key of [
+        'results',
+        'belowThresholdCount',
+        'belowThresholdHighest',
+      ]) {
+        expect(key in typed).toBe(true)
+      }
+      // Every hit must carry string identifiers and a numeric similarity
+      for (const hit of typed.results) {
+        const { id, sectionId, documentPath, heading, similarity } = hit
+        expect(typeof id).toBe('string')
+        expect(typeof sectionId).toBe('string')
+        expect(typeof documentPath).toBe('string')
+        expect(typeof heading).toBe('string')
+        expect(typeof similarity).toBe('number')
+      }
+    })
+  })
+  describe('Test corpus validation', () => {
+    it('should have test corpus with multiple documents', async () => {
+      const store = createTestVectorStore()
+      const { loaded } = await Effect.runPromise(store.load())
+      expect(loaded).toBe(true)
+      // The fixture holds 6 documents, each split into several sections
+      const corpusStats = store.getStats()
+      expect(corpusStats.count).toBeGreaterThan(10)
+    })
+    it('should have correct dimensions (512 for test corpus)', async () => {
+      const store = createTestVectorStore()
+      await Effect.runPromise(store.load())
+      const corpusStats = store.getStats()
+      expect(corpusStats.dimensions).toBe(TEST_CORPUS_DIMENSIONS)
+    })
+  })
+  describe('Similarity score validation', () => {
+    it('should return similarity scores between 0 and 1', async () => {
+      const store = createTestVectorStore()
+      await Effect.runPromise(store.load())
+      const queryVector = new Array(TEST_CORPUS_DIMENSIONS).fill(0.1)
+      const outcome = await Effect.runPromise(
+        store.searchWithStats(queryVector, 20, 0),
+      )
+      // Each score must fall inside the closed interval [0, 1]
+      outcome.results.forEach((hit) => {
+        expect(hit.similarity).toBeGreaterThanOrEqual(0)
+        expect(hit.similarity).toBeLessThanOrEqual(1)
+      })
+    })
+    it('should return results sorted by similarity (highest first)', async () => {
+      const store = createTestVectorStore()
+      await Effect.runPromise(store.load())
+      const queryVector = new Array(TEST_CORPUS_DIMENSIONS).fill(0.1)
+      const outcome = await Effect.runPromise(
+        store.searchWithStats(queryVector, 20, 0),
+      )
+      // Compare every hit with its predecessor: scores must never increase
+      const hits = outcome.results
+      hits.slice(1).forEach((hit, previousIndex) => {
+        expect(hit.similarity).toBeLessThanOrEqual(
+          hits[previousIndex]!.similarity,
+        )
+      })
+    })
+  })
+  describe('Below-threshold feedback', () => {
+    it('should provide count when results are below threshold', async () => {
+      const store = createTestVectorStore()
+      await Effect.runPromise(store.load())
+      // A very high threshold is meant to leave no passing hits
+      const queryVector = new Array(TEST_CORPUS_DIMENSIONS).fill(0.1)
+      const outcome = await Effect.runPromise(
+        store.searchWithStats(queryVector, 10, 0.95),
+      )
+      // The feedback stats only matter when nothing passed
+      if (outcome.results.length !== 0) {
+        return
+      }
+      expect(outcome.belowThresholdCount).toBeGreaterThan(0)
+      expect(outcome.belowThresholdHighest).not.toBeNull()
+    })
+    it('should allow calculating suggested threshold', async () => {
+      const store = createTestVectorStore()
+      await Effect.runPromise(store.load())
+      const queryVector = new Array(TEST_CORPUS_DIMENSIONS).fill(0.1)
+      const outcome = await Effect.runPromise(
+        store.searchWithStats(queryVector, 10, 0.9),
+      )
+      const { results, belowThresholdHighest } = outcome
+      // Nothing to suggest if hits passed or no below-threshold score exists
+      if (results.length !== 0 || belowThresholdHighest === null) {
+        return
+      }
+      // Suggested threshold formula: max(0.1, highest - 0.05)
+      const suggested = Math.max(0.1, belowThresholdHighest - 0.05)
+      expect(suggested).toBeLessThan(0.9)
+      expect(suggested).toBeGreaterThanOrEqual(0.1)
+    })
+  })
+})
+describe('Hybrid Search Threshold', () => {
+  it('should export hybridSearch function', async () => {
+    // Smoke check: the hybrid search module exposes a callable entry point
+    const hybridModule = await import('../search/hybrid-search.js')
+    expect(hybridModule.hybridSearch).toBeDefined()
+    expect(typeof hybridModule.hybridSearch).toBe('function')
+  })
+})
+describe('Search Quality Modes', () => {
+  // Pins the efSearch value behind each quality mode and their relative order.
+  describe('QUALITY_EF_SEARCH constants', () => {
+    // Dynamically imports the types module and returns the constants object.
+    const loadEfSearch = async () =>
+      (await import('./types.js')).QUALITY_EF_SEARCH
+    it('should export quality mode constants', async () => {
+      const efSearch = await loadEfSearch()
+      expect(efSearch).toBeDefined()
+      expect(efSearch.fast).toBe(64)
+      expect(efSearch.balanced).toBe(100)
+      expect(efSearch.thorough).toBe(256)
+    })
+    it('should have fast mode with lowest efSearch', async () => {
+      const efSearch = await loadEfSearch()
+      const { fast, balanced } = efSearch
+      expect(fast).toBeLessThan(balanced)
+    })
+    it('should have thorough mode with highest efSearch', async () => {
+      const efSearch = await loadEfSearch()
+      const { thorough, balanced } = efSearch
+      expect(thorough).toBeGreaterThan(balanced)
+    })
+  })
+  // Exercises the optional `efSearch` setting on both vector store search
+  // methods, as well as the call that omits it.
+  describe('VectorStore efSearch support', () => {
+    // Creates the test vector store and loads it before any search runs.
+    const openStore = async () => {
+      const store = createTestVectorStore()
+      await Effect.runPromise(store.load())
+      return store
+    }
+    // Query vector with every component set to 0.1.
+    const uniformQuery = () => new Array(TEST_CORPUS_DIMENSIONS).fill(0.1)
+    it('should accept efSearch option in search method', async () => {
+      const store = await openStore()
+      // Should not throw when passing efSearch
+      const hits = await Effect.runPromise(
+        store.search(uniformQuery(), 10, 0, { efSearch: 64 }),
+      )
+      expect(Array.isArray(hits)).toBe(true)
+    })
+    it('should accept efSearch option in searchWithStats method', async () => {
+      const store = await openStore()
+      // Should not throw when passing efSearch
+      const outcome = await Effect.runPromise(
+        store.searchWithStats(uniformQuery(), 10, 0, { efSearch: 256 }),
+      )
+      expect(outcome.results).toBeDefined()
+      expect(Array.isArray(outcome.results)).toBe(true)
+    })
+    it('should work without efSearch option (defaults)', async () => {
+      const store = await openStore()
+      // Should not throw without efSearch option
+      const hits = await Effect.runPromise(store.search(uniformQuery(), 10, 0))
+      expect(Array.isArray(hits)).toBe(true)
+    })
+    it('should return consistent results for same query with different efSearch', async () => {
+      const store = await openStore()
+      const query = uniformQuery()
+      // Same store and query for both runs; only efSearch differs.
+      const runWith = (efSearch: number) =>
+        Effect.runPromise(store.search(query, 5, 0, { efSearch }))
+      const fastHits = await runWith(64)
+      const thoroughHits = await runWith(256)
+      // Both should return results
+      expect(fastHits.length).toBeGreaterThan(0)
+      expect(thoroughHits.length).toBeGreaterThan(0)
+      // The top hit is not asserted equal: HNSW does not guarantee it.
+      // Only check that each run yields a valid first result.
+      expect(fastHits[0]?.sectionId).toBeDefined()
+      expect(thoroughHits[0]?.sectionId).toBeDefined()
+    })
+  })
+  // Compile-time checks: these tests only type-check if SemanticSearchOptions
+  // declares a `quality` field that accepts the three mode names.
+  describe('SemanticSearchOptions quality field', () => {
+    type SemanticSearchOptions = import('./types.js').SemanticSearchOptions
+    it('should accept quality in SemanticSearchOptions type', async () => {
+      // Type check - if this compiles, the type has the quality field
+      const searchOptions: SemanticSearchOptions = {
+        quality: 'balanced',
+        threshold: 0.35,
+        limit: 10,
+      }
+      expect(searchOptions.quality).toBe('balanced')
+    })
+    it('should accept all three quality modes', async () => {
+      const modes = ['fast', 'balanced', 'thorough'] as const
+      for (const mode of modes) {
+        // The annotation is the check: each literal must be assignable.
+        const searchOptions: SemanticSearchOptions = { quality: mode }
+        expect(searchOptions.quality).toBe(mode)
+      }
+    })
+  })
+  // Compile-time check that HybridSearchOptions declares a `quality` field.
+  describe('HybridSearchOptions quality field', () => {
+    type Options = import('../search/hybrid-search.js').HybridSearchOptions
+    it('should accept quality in HybridSearchOptions type', async () => {
+      const hybridOptions: Options = { quality: 'thorough', limit: 10 }
+      expect(hybridOptions.quality).toBe('thorough')
+    })
+  })
+})
+// Guards the default `search.minSimilarity` value exported by the config schema.
+describe('CLI Search Threshold', () => {
+  it('should have 0.35 as config default threshold', async () => {
+    const schemaModule = await import('../config/schema.js')
+    const { minSimilarity } = schemaModule.defaultConfig.search
+    expect(minSimilarity).toBe(0.35)
+  })
+})