npm - mdcontext - Versions diffs - 0.0.1 → 0.2.0 - Mend

mdcontext 0.0.1 → 0.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (337) hide show

package/.changeset/README.md +28 -0
package/.changeset/config.json +11 -0
package/.claude/settings.local.json +25 -0
package/.github/workflows/ci.yml +83 -0
package/.github/workflows/claude-code-review.yml +44 -0
package/.github/workflows/claude.yml +85 -0
package/.github/workflows/release.yml +113 -0
package/.tldrignore +112 -0
package/BACKLOG.md +338 -0
package/CONTRIBUTING.md +186 -0
package/NOTES/NOTES +44 -0
package/README.md +434 -11
package/biome.json +36 -0
package/cspell.config.yaml +14 -0
package/dist/chunk-23UPXDNL.js +3044 -0
package/dist/chunk-2W7MO2DL.js +1366 -0
package/dist/chunk-3NUAZGMA.js +1689 -0
package/dist/chunk-7TOWB2XB.js +366 -0
package/dist/chunk-7XOTOADQ.js +3065 -0
package/dist/chunk-AH2PDM2K.js +3042 -0
package/dist/chunk-BNXWSZ63.js +3742 -0
package/dist/chunk-BTL5DJVU.js +3222 -0
package/dist/chunk-HDHYG7E4.js +104 -0
package/dist/chunk-HLR4KZBP.js +3234 -0
package/dist/chunk-IP3FRFEB.js +1045 -0
package/dist/chunk-KHU56VDO.js +3042 -0
package/dist/chunk-KRYIFLQR.js +88 -0
package/dist/chunk-LBSDNLEM.js +287 -0
package/dist/chunk-MNTQ7HCP.js +2643 -0
package/dist/chunk-MUJELQQ6.js +1387 -0
package/dist/chunk-MXJGMSLV.js +2199 -0
package/dist/chunk-N6QJGC3Z.js +2636 -0
package/dist/chunk-OBELGBPM.js +1713 -0
package/dist/chunk-OT7R5XTA.js +3192 -0
package/dist/chunk-P7X4RA2T.js +106 -0
package/dist/chunk-PIDUQNC2.js +3185 -0
package/dist/chunk-POGCDIH4.js +3187 -0
package/dist/chunk-PSIEOQGZ.js +3043 -0
package/dist/chunk-PVRT3IHA.js +3238 -0
package/dist/chunk-QNN4TT23.js +1430 -0
package/dist/chunk-RE3R45RJ.js +3042 -0
package/dist/chunk-S7E6TFX6.js +803 -0
package/dist/chunk-SG6GLU4U.js +1378 -0
package/dist/chunk-SJCDV2ST.js +274 -0
package/dist/chunk-SYE5XLF3.js +104 -0
package/dist/chunk-T5VLYBZD.js +103 -0
package/dist/chunk-TOQB7VWU.js +3238 -0
package/dist/chunk-VFNMZ4ZQ.js +3228 -0
package/dist/chunk-VVTGZNBT.js +1629 -0
package/dist/chunk-W7Q4RFEV.js +104 -0
package/dist/chunk-XTYYVRLO.js +3190 -0
package/dist/chunk-Y6MDYVJD.js +3063 -0
package/dist/cli/main.d.ts +1 -0
package/dist/cli/main.js +5458 -0
package/dist/index.d.ts +653 -0
package/dist/index.js +79 -0
package/dist/mcp/server.d.ts +1 -0
package/dist/mcp/server.js +472 -0
package/dist/schema-BAWSG7KY.js +22 -0
package/dist/schema-E3QUPL26.js +20 -0
package/dist/schema-EHL7WUT6.js +20 -0
package/docs/019-USAGE.md +625 -0
package/docs/020-current-implementation.md +364 -0
package/docs/021-DOGFOODING-FINDINGS.md +175 -0
package/docs/BACKLOG.md +80 -0
package/docs/CONFIG.md +1123 -0
package/docs/DESIGN.md +439 -0
package/docs/ERRORS.md +383 -0
package/docs/PROJECT.md +88 -0
package/docs/ROADMAP.md +407 -0
package/docs/summarization.md +320 -0
package/docs/test-links.md +9 -0
package/justfile +40 -0
package/package.json +74 -9
package/pnpm-workspace.yaml +5 -0
package/research/INDEX.md +315 -0
package/research/code-review/README.md +90 -0
package/research/code-review/cli-error-handling-review.md +979 -0
package/research/code-review/code-review-validation-report.md +464 -0
package/research/code-review/main-ts-review.md +1128 -0
package/research/config-analysis/01-current-implementation.md +470 -0
package/research/config-analysis/02-strategy-recommendation.md +428 -0
package/research/config-analysis/03-task-candidates.md +715 -0
package/research/config-analysis/033-research-configuration-management.md +828 -0
package/research/config-analysis/034-research-effect-cli-config.md +1504 -0
package/research/config-analysis/04-consolidated-task-candidates.md +277 -0
package/research/config-docs/SUMMARY.md +357 -0
package/research/config-docs/TEST-RESULTS.md +776 -0
package/research/config-docs/TODO.md +542 -0
package/research/config-docs/analysis.md +744 -0
package/research/config-docs/fix-validation.md +502 -0
package/research/config-docs/help-audit.md +264 -0
package/research/config-docs/help-system-analysis.md +890 -0
package/research/dogfood/consolidated-tool-evaluation.md +373 -0
package/research/dogfood/strategy-a/a-synthesis.md +184 -0
package/research/dogfood/strategy-a/a1-docs.md +226 -0
package/research/dogfood/strategy-a/a2-amorphic.md +156 -0
package/research/dogfood/strategy-a/a3-llm.md +164 -0
package/research/dogfood/strategy-b/b-synthesis.md +228 -0
package/research/dogfood/strategy-b/b1-architecture.md +207 -0
package/research/dogfood/strategy-b/b2-gaps.md +258 -0
package/research/dogfood/strategy-b/b3-workflows.md +250 -0
package/research/dogfood/strategy-c/c-synthesis.md +451 -0
package/research/dogfood/strategy-c/c1-explorer.md +192 -0
package/research/dogfood/strategy-c/c2-diver-memory.md +145 -0
package/research/dogfood/strategy-c/c3-diver-control.md +148 -0
package/research/dogfood/strategy-c/c4-diver-failure.md +151 -0
package/research/dogfood/strategy-c/c5-diver-execution.md +221 -0
package/research/dogfood/strategy-c/c6-diver-org.md +221 -0
package/research/effect-cli-error-handling.md +845 -0
package/research/effect-errors-as-values.md +943 -0
package/research/errors-task-analysis/00-consolidated-tasks.md +207 -0
package/research/errors-task-analysis/cli-commands-analysis.md +909 -0
package/research/errors-task-analysis/embeddings-analysis.md +709 -0
package/research/errors-task-analysis/index-search-analysis.md +812 -0
package/research/frontmatter/COMMENTS-ARE-SKIPPED.md +149 -0
package/research/frontmatter/LLM-CODE-NAVIGATION.md +276 -0
package/research/issue-review.md +603 -0
package/research/llm-summarization/agent-cli-tools-2026.md +1082 -0
package/research/llm-summarization/alternative-providers-2026.md +1428 -0
package/research/llm-summarization/anthropic-2026.md +367 -0
package/research/llm-summarization/claude-cli-integration.md +1706 -0
package/research/llm-summarization/cli-integration-patterns.md +3155 -0
package/research/llm-summarization/openai-2026.md +473 -0
package/research/llm-summarization/openai-compatible-providers-2026.md +1022 -0
package/research/llm-summarization/opencode-cli-integration.md +1552 -0
package/research/llm-summarization/prompt-engineering-2026.md +1426 -0
package/research/llm-summarization/prototype-results.md +56 -0
package/research/llm-summarization/provider-switching-patterns-2026.md +2153 -0
package/research/llm-summarization/typescript-llm-libraries-2026.md +2436 -0
package/research/mdcontext-error-analysis.md +521 -0
package/research/mdcontext-pudding/00-EXECUTIVE-SUMMARY.md +282 -0
package/research/mdcontext-pudding/01-index-embed.md +956 -0
package/research/mdcontext-pudding/02-search-COMMANDS.md +142 -0
package/research/mdcontext-pudding/02-search-SUMMARY.md +146 -0
package/research/mdcontext-pudding/02-search.md +970 -0
package/research/mdcontext-pudding/03-context.md +779 -0
package/research/mdcontext-pudding/04-navigation-and-analytics.md +803 -0
package/research/mdcontext-pudding/04-tree.md +704 -0
package/research/mdcontext-pudding/05-config.md +1038 -0
package/research/mdcontext-pudding/06-links-summary.txt +87 -0
package/research/mdcontext-pudding/06-links.md +679 -0
package/research/mdcontext-pudding/07-stats.md +693 -0
package/research/mdcontext-pudding/BUG-FIX-PLAN.md +388 -0
package/research/mdcontext-pudding/P0-BUG-VALIDATION.md +167 -0
package/research/mdcontext-pudding/README.md +168 -0
package/research/mdcontext-pudding/TESTING-SUMMARY.md +128 -0
package/research/npm_publish/011-npm-workflow-research-agent2.md +792 -0
package/research/npm_publish/012-npm-workflow-research-agent1.md +530 -0
package/research/npm_publish/013-npm-workflow-research-agent3.md +722 -0
package/research/npm_publish/014-npm-workflow-synthesis.md +556 -0
package/research/npm_publish/031-npm-workflow-task-analysis.md +134 -0
package/research/research-quality-review.md +834 -0
package/research/semantic-search/002-research-embedding-models.md +490 -0
package/research/semantic-search/003-research-rag-alternatives.md +523 -0
package/research/semantic-search/004-research-vector-search.md +841 -0
package/research/semantic-search/032-research-semantic-search.md +427 -0
package/research/semantic-search/embedding-text-analysis.md +156 -0
package/research/semantic-search/multi-word-failure-reproduction.md +171 -0
package/research/semantic-search/query-processing-analysis.md +207 -0
package/research/semantic-search/root-cause-and-solution.md +114 -0
package/research/semantic-search/threshold-validation-report.md +69 -0
package/research/semantic-search/vector-search-analysis.md +63 -0
package/research/task-management-2026/00-synthesis-recommendations.md +295 -0
package/research/task-management-2026/01-ai-workflow-tools.md +416 -0
package/research/task-management-2026/02-agent-framework-patterns.md +476 -0
package/research/task-management-2026/03-lightweight-file-based.md +567 -0
package/research/task-management-2026/04-established-tools-ai-features.md +541 -0
package/research/task-management-2026/linear/01-core-features-workflow.md +771 -0
package/research/task-management-2026/linear/02-api-integrations.md +930 -0
package/research/task-management-2026/linear/03-ai-features.md +368 -0
package/research/task-management-2026/linear/04-pricing-setup.md +205 -0
package/research/task-management-2026/linear/05-usage-patterns-best-practices.md +605 -0
package/research/test-path-issues.md +276 -0
package/review/ALP-76/1-error-type-design.md +962 -0
package/review/ALP-76/2-error-handling-patterns.md +906 -0
package/review/ALP-76/3-error-presentation.md +624 -0
package/review/ALP-76/4-test-coverage.md +625 -0
package/review/ALP-76/5-migration-completeness.md +440 -0
package/review/ALP-76/6-effect-best-practices.md +755 -0
package/scripts/apply-branch-protection.sh +47 -0
package/scripts/branch-protection-templates.json +79 -0
package/scripts/prototype-summarization.ts +346 -0
package/scripts/rebuild-hnswlib.js +58 -0
package/scripts/setup-branch-protection.sh +64 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/.mdcontext/active-provider.json +7 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/.mdcontext/bm25.json +541 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/.mdcontext/bm25.meta.json +5 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/.mdcontext/config.json +8 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/.mdcontext/embeddings/openai_text-embedding-3-small_512/vectors.bin +0 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/.mdcontext/embeddings/openai_text-embedding-3-small_512/vectors.meta.bin +0 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/.mdcontext/indexes/documents.json +60 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/.mdcontext/indexes/links.json +13 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/.mdcontext/indexes/sections.json +1197 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/configuration-management.md +99 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/distributed-systems.md +92 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/error-handling.md +78 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/failure-automation.md +55 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/job-context.md +69 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/process-orchestration.md +99 -0
package/src/cli/argv-preprocessor.test.ts +210 -0
package/src/cli/argv-preprocessor.ts +202 -0
package/src/cli/cli.test.ts +627 -0
package/src/cli/commands/backlinks.ts +54 -0
package/src/cli/commands/config-cmd.ts +642 -0
package/src/cli/commands/context.ts +285 -0
package/src/cli/commands/duplicates.ts +122 -0
package/src/cli/commands/embeddings.ts +529 -0
package/src/cli/commands/index-cmd.ts +480 -0
package/src/cli/commands/index.ts +16 -0
package/src/cli/commands/links.ts +52 -0
package/src/cli/commands/search.ts +1281 -0
package/src/cli/commands/stats.ts +149 -0
package/src/cli/commands/tree.ts +128 -0
package/src/cli/config-layer.ts +176 -0
package/src/cli/error-handler.test.ts +235 -0
package/src/cli/error-handler.ts +655 -0
package/src/cli/flag-schemas.ts +341 -0
package/src/cli/help.ts +588 -0
package/src/cli/index.ts +9 -0
package/src/cli/main.ts +435 -0
package/src/cli/options.ts +41 -0
package/src/cli/shared-error-handling.ts +199 -0
package/src/cli/typo-suggester.test.ts +105 -0
package/src/cli/typo-suggester.ts +130 -0
package/src/cli/utils.ts +259 -0
package/src/config/file-provider.test.ts +320 -0
package/src/config/file-provider.ts +273 -0
package/src/config/index.ts +72 -0
package/src/config/integration.test.ts +667 -0
package/src/config/precedence.test.ts +277 -0
package/src/config/precedence.ts +451 -0
package/src/config/schema.test.ts +414 -0
package/src/config/schema.ts +603 -0
package/src/config/service.test.ts +320 -0
package/src/config/service.ts +243 -0
package/src/config/testing.test.ts +264 -0
package/src/config/testing.ts +110 -0
package/src/core/index.ts +1 -0
package/src/core/types.ts +113 -0
package/src/duplicates/detector.test.ts +183 -0
package/src/duplicates/detector.ts +414 -0
package/src/duplicates/index.ts +18 -0
package/src/embeddings/embedding-namespace.test.ts +300 -0
package/src/embeddings/embedding-namespace.ts +947 -0
package/src/embeddings/heading-boost.test.ts +222 -0
package/src/embeddings/hnsw-build-options.test.ts +198 -0
package/src/embeddings/hyde.test.ts +272 -0
package/src/embeddings/hyde.ts +264 -0
package/src/embeddings/index.ts +10 -0
package/src/embeddings/openai-provider.ts +414 -0
package/src/embeddings/pricing.json +22 -0
package/src/embeddings/provider-constants.ts +204 -0
package/src/embeddings/provider-errors.test.ts +967 -0
package/src/embeddings/provider-errors.ts +565 -0
package/src/embeddings/provider-factory.test.ts +240 -0
package/src/embeddings/provider-factory.ts +225 -0
package/src/embeddings/provider-integration.test.ts +788 -0
package/src/embeddings/query-preprocessing.test.ts +187 -0
package/src/embeddings/semantic-search-threshold.test.ts +508 -0
package/src/embeddings/semantic-search.ts +1270 -0
package/src/embeddings/types.ts +359 -0
package/src/embeddings/vector-store.ts +708 -0
package/src/embeddings/voyage-provider.ts +313 -0
package/src/errors/errors.test.ts +845 -0
package/src/errors/index.ts +533 -0
package/src/index/ignore-patterns.test.ts +354 -0
package/src/index/ignore-patterns.ts +305 -0
package/src/index/index.ts +4 -0
package/src/index/indexer.ts +684 -0
package/src/index/storage.ts +260 -0
package/src/index/types.ts +147 -0
package/src/index/watcher.ts +189 -0
package/src/index.ts +30 -0
package/src/integration/search-keyword.test.ts +678 -0
package/src/mcp/server.ts +612 -0
package/src/parser/index.ts +1 -0
package/src/parser/parser.test.ts +291 -0
package/src/parser/parser.ts +394 -0
package/src/parser/section-filter.test.ts +277 -0
package/src/parser/section-filter.ts +392 -0
package/src/search/__tests__/hybrid-search.test.ts +650 -0
package/src/search/bm25-store.ts +366 -0
package/src/search/cross-encoder.test.ts +253 -0
package/src/search/cross-encoder.ts +406 -0
package/src/search/fuzzy-search.test.ts +419 -0
package/src/search/fuzzy-search.ts +273 -0
package/src/search/hybrid-search.ts +448 -0
package/src/search/path-matcher.test.ts +276 -0
package/src/search/path-matcher.ts +33 -0
package/src/search/query-parser.test.ts +260 -0
package/src/search/query-parser.ts +319 -0
package/src/search/searcher.test.ts +280 -0
package/src/search/searcher.ts +724 -0
package/src/search/wink-bm25.d.ts +30 -0
package/src/summarization/cli-providers/claude.ts +202 -0
package/src/summarization/cli-providers/detection.test.ts +273 -0
package/src/summarization/cli-providers/detection.ts +118 -0
package/src/summarization/cli-providers/index.ts +8 -0
package/src/summarization/cost.test.ts +139 -0
package/src/summarization/cost.ts +102 -0
package/src/summarization/error-handler.test.ts +127 -0
package/src/summarization/error-handler.ts +111 -0
package/src/summarization/index.ts +102 -0
package/src/summarization/pipeline.test.ts +498 -0
package/src/summarization/pipeline.ts +231 -0
package/src/summarization/prompts.test.ts +269 -0
package/src/summarization/prompts.ts +133 -0
package/src/summarization/provider-factory.test.ts +396 -0
package/src/summarization/provider-factory.ts +178 -0
package/src/summarization/types.ts +184 -0
package/src/summarize/budget-bugs.test.ts +620 -0
package/src/summarize/formatters.ts +419 -0
package/src/summarize/index.ts +20 -0
package/src/summarize/summarizer.test.ts +275 -0
package/src/summarize/summarizer.ts +597 -0
package/src/summarize/verify-bugs.test.ts +238 -0
package/src/types/huggingface-transformers.d.ts +66 -0
package/src/utils/index.ts +1 -0
package/src/utils/tokens.test.ts +142 -0
package/src/utils/tokens.ts +186 -0
package/tests/fixtures/cli/.mdcontext/active-provider.json +7 -0
package/tests/fixtures/cli/.mdcontext/config.json +8 -0
package/tests/fixtures/cli/.mdcontext/embeddings/openai_text-embedding-3-small_512/vectors.bin +0 -0
package/tests/fixtures/cli/.mdcontext/embeddings/openai_text-embedding-3-small_512/vectors.meta.bin +0 -0
package/tests/fixtures/cli/.mdcontext/indexes/documents.json +33 -0
package/tests/fixtures/cli/.mdcontext/indexes/links.json +12 -0
package/tests/fixtures/cli/.mdcontext/indexes/sections.json +247 -0
package/tests/fixtures/cli/README.md +9 -0
package/tests/fixtures/cli/api-reference.md +11 -0
package/tests/fixtures/cli/getting-started.md +11 -0
package/tests/integration/embed-index.test.ts +712 -0
package/tests/integration/search-context.test.ts +469 -0
package/tests/integration/search-semantic.test.ts +522 -0
package/tsconfig.json +26 -0
package/vitest.config.ts +16 -0
package/vitest.setup.ts +12 -0

package/src/search/query-parser.ts ADDED Viewed

@@ -0,0 +1,319 @@
+/**
+ * Query Parser for mdcontext search
+ *
+ * Supports:
+ * - Boolean operators: AND, OR, NOT (case-insensitive)
+ * - Implicit AND: adjacent operands with no operator between them are AND-ed
+ * - Quoted phrases: "exact phrase"
+ * - Grouping: (term1 OR term2) AND term3
+ * - Precedence: NOT > AND > OR
+ */
+// ============================================================================
+// Types
+// ============================================================================
+/**
+ * Node of the boolean-query AST, discriminated by `type`.
+ *
+ * - `term` / `phrase`: leaves carrying the text to look for
+ * - `and` / `or`: binary operators over two sub-expressions
+ * - `not`: unary negation of a single sub-expression
+ */
+export type QueryNode =
+  | { type: 'term'; value: string }
+  | { type: 'phrase'; value: string }
+  | { type: 'and'; left: QueryNode; right: QueryNode }
+  | { type: 'or'; left: QueryNode; right: QueryNode }
+  | { type: 'not'; operand: QueryNode }
+/**
+ * Result of parsing a query string.
+ */
+export interface ParsedQuery {
+  /** Root of the parsed expression tree. */
+  readonly ast: QueryNode
+  /** Values of the TERM tokens consumed while parsing. */
+  readonly terms: readonly string[]
+  /** Values of the PHRASE tokens consumed while parsing. */
+  readonly phrases: readonly string[]
+}
+// ============================================================================
+// Tokenizer
+// ============================================================================
+/** Kinds of token the tokenizer can emit. */
+type TokenType = 'AND' | 'OR' | 'NOT' | 'LPAREN' | 'RPAREN' | 'PHRASE' | 'TERM'
+/** A lexical token: its kind plus its text. */
+interface Token {
+  type: TokenType
+  // Canonical operator/paren text, the raw word for a TERM, or the text
+  // between the quotes for a PHRASE
+  value: string
+}
+/**
+ * Split a query string into tokens.
+ *
+ * Recognized forms:
+ * - `"..."` -> PHRASE holding the text between the quotes; an unterminated
+ *   quote runs to the end of the input
+ * - `(` and `)` -> LPAREN / RPAREN
+ * - any other run of characters up to whitespace, a paren or a quote ->
+ *   AND / OR / NOT when it equals that keyword case-insensitively,
+ *   otherwise TERM with its original casing
+ *
+ * Whitespace only separates tokens and is never emitted.
+ *
+ * @param query - Raw query text
+ * @returns Tokens in input order (empty for blank input)
+ */
+const tokenize = (query: string): Token[] => {
+  // One global regex walks the input left to right, so the remainder of the
+  // string is not re-sliced for every word. Every non-whitespace character is
+  // covered by one of the three alternatives, so no "skip unknown character"
+  // fallback is needed. The regex is created per call, keeping lastIndex local.
+  const tokenPattern = /"([^"]*)"?|[()]|[^\s()"]+/g
+  const tokens: Token[] = []
+  let found = tokenPattern.exec(query)
+  while (found !== null) {
+    const text = found[0]
+    if (text.startsWith('"')) {
+      // Capture group 1 is the phrase body without the surrounding quotes
+      tokens.push({ type: 'PHRASE', value: found[1] ?? '' })
+    } else if (text === '(') {
+      tokens.push({ type: 'LPAREN', value: '(' })
+    } else if (text === ')') {
+      tokens.push({ type: 'RPAREN', value: ')' })
+    } else {
+      const keyword = text.toUpperCase()
+      if (keyword === 'AND' || keyword === 'OR' || keyword === 'NOT') {
+        // Operators are stored in their canonical upper-case spelling
+        tokens.push({ type: keyword, value: keyword })
+      } else {
+        tokens.push({ type: 'TERM', value: text })
+      }
+    }
+    found = tokenPattern.exec(query)
+  }
+  return tokens
+}
+// ============================================================================
+// Parser (Recursive Descent)
+// ============================================================================
+/**
+ * Recursive-descent parser for boolean query expressions.
+ *
+ * Grammar:
+ *   expr     -> andExpr (OR andExpr)*
+ *   andExpr  -> notExpr (AND notExpr)*
+ *   notExpr  -> NOT notExpr | primary
+ *   primary  -> TERM | PHRASE | LPAREN expr RPAREN
+ *
+ * Adjacent operands with no operator between them are joined by an
+ * implicit AND.
+ *
+ * Malformed input is handled best-effort rather than rejected:
+ * - an operator whose operand is missing is dropped (`a OR` parses as `a`),
+ *   so a dangling OR cannot turn the query into "match everything"
+ * - a missing `)` is tolerated
+ * - an unmatched `)` is skipped and whatever follows it is AND-ed onto the
+ *   result instead of being silently discarded
+ *
+ * `terms` and `phrases` collect the values of the TERM / PHRASE tokens in
+ * the order they are consumed.
+ */
+class Parser {
+  private tokens: Token[]
+  private pos: number = 0
+  readonly terms: string[] = []
+  readonly phrases: string[] = []
+  constructor(tokens: Token[]) {
+    this.tokens = tokens
+  }
+  /** Join two optional operands; when one side is missing the other is returned. */
+  private static join(
+    kind: 'and' | 'or',
+    left: QueryNode | null,
+    right: QueryNode | null,
+  ): QueryNode | null {
+    if (left === null) return right
+    if (right === null) return left
+    return kind === 'and'
+      ? { type: 'and', left, right }
+      : { type: 'or', left, right }
+  }
+  /** Token at the cursor, or undefined at end of input. */
+  private current(): Token | undefined {
+    return this.tokens[this.pos]
+  }
+  /** Return the token at the cursor and move past it. */
+  private advance(): Token | undefined {
+    return this.tokens[this.pos++]
+  }
+  /** Consume the current token when it has the given type. */
+  private match(type: TokenType): boolean {
+    if (this.current()?.type === type) {
+      this.advance()
+      return true
+    }
+    return false
+  }
+  /**
+   * Parse the whole token list.
+   *
+   * @returns The AST root, or null when the tokens contain no operand at all
+   */
+  parse(): QueryNode | null {
+    let result: QueryNode | null = null
+    while (this.current() !== undefined) {
+      result = Parser.join('and', result, this.parseExpr())
+      // parseExpr can only stop before end of input on an unmatched ')'.
+      // Skipping it guarantees progress and keeps the rest of the query.
+      this.match('RPAREN')
+    }
+    return result
+  }
+  private parseExpr(): QueryNode | null {
+    let left = this.parseAndExpr()
+    while (this.match('OR')) {
+      left = Parser.join('or', left, this.parseAndExpr())
+    }
+    return left
+  }
+  private parseAndExpr(): QueryNode | null {
+    let left = this.parseNotExpr()
+    // Handle implicit AND (operands without explicit AND between them)
+    while (this.match('AND') || this.isImplicitAnd()) {
+      left = Parser.join('and', left, this.parseNotExpr())
+    }
+    return left
+  }
+  /** True when the next token can start an operand, i.e. an AND is implied. */
+  private isImplicitAnd(): boolean {
+    const tok = this.current()
+    return (
+      tok?.type === 'TERM' ||
+      tok?.type === 'PHRASE' ||
+      tok?.type === 'NOT' ||
+      tok?.type === 'LPAREN'
+    )
+  }
+  private parseNotExpr(): QueryNode | null {
+    if (this.match('NOT')) {
+      const operand = this.parseNotExpr()
+      // A NOT with nothing to negate is dropped
+      return operand === null ? null : { type: 'not', operand }
+    }
+    return this.parsePrimary()
+  }
+  private parsePrimary(): QueryNode | null {
+    const tok = this.current()
+    if (this.match('LPAREN')) {
+      const expr = this.parseExpr()
+      this.match('RPAREN') // Consume closing paren (ignore if missing)
+      return expr
+    }
+    if (tok?.type === 'PHRASE') {
+      this.advance()
+      this.phrases.push(tok.value)
+      return { type: 'phrase', value: tok.value }
+    }
+    if (tok?.type === 'TERM') {
+      this.advance()
+      this.terms.push(tok.value)
+      return { type: 'term', value: tok.value }
+    }
+    // No operand here (operator, ')' or end of input): report it as missing
+    // without consuming anything so the caller decides what to do
+    return null
+  }
+}
+// ============================================================================
+// Public API
+// ============================================================================
+/**
+ * Turn a search query string into its AST plus the terms and phrases found.
+ *
+ * @param query - Raw query text
+ * @returns The parsed query, or null when the query yields no tokens or the
+ *          parser produces no AST
+ */
+export const parseQuery = (query: string): ParsedQuery | null => {
+  const tokens = tokenize(query)
+  if (tokens.length > 0) {
+    const parser = new Parser(tokens)
+    const ast = parser.parse()
+    if (ast) {
+      // terms/phrases are filled in by the parser as a side effect of parse()
+      const { terms, phrases } = parser
+      return { ast, terms, phrases }
+    }
+  }
+  return null
+}
+/**
+ * Tell whether a query uses boolean syntax: an AND / OR / NOT operator,
+ * a quoted phrase, or an opening parenthesis.
+ *
+ * @param query - Raw query text
+ * @returns true as soon as one such token is found, false otherwise
+ */
+export const isAdvancedQuery = (query: string): boolean => {
+  for (const { type } of tokenize(query)) {
+    switch (type) {
+      case 'AND':
+      case 'OR':
+      case 'NOT':
+      case 'PHRASE':
+      case 'LPAREN':
+        return true
+    }
+  }
+  return false
+}
+/**
+ * Decide whether a text satisfies a parsed query.
+ *
+ * Terms and phrases are case-insensitive substring tests against the text;
+ * `and`, `or` and `not` combine their operands with the usual boolean
+ * semantics.
+ *
+ * @param ast - Root of the query AST
+ * @param text - Content to test
+ * @returns true when the text matches the query
+ */
+export const evaluateQuery = (ast: QueryNode, text: string): boolean => {
+  // Lower-case the text once; every leaf test reuses it
+  const haystack = text.toLowerCase()
+  const contains = (needle: string): boolean =>
+    haystack.includes(needle.toLowerCase())
+  const holds = (node: QueryNode): boolean => {
+    switch (node.type) {
+      case 'and':
+        return holds(node.left) && holds(node.right)
+      case 'or':
+        return holds(node.left) || holds(node.right)
+      case 'not':
+        return !holds(node.operand)
+      case 'phrase':
+        return contains(node.value)
+      case 'term':
+        // An empty term matches any text
+        return !node.value || contains(node.value)
+    }
+  }
+  return holds(ast)
+}
+/**
+ * Build a regex for highlighting the matches of a parsed query.
+ *
+ * The pattern is an alternation of every non-empty term and phrase with
+ * regex metacharacters escaped. Phrases are matched as literal text. Terms
+ * are anchored with `\b`, but only on an edge that is a word character:
+ * `\b` next to a non-word character (as in `c++` or `.env`) requires a word
+ * character on its other side, so an unconditional anchor would stop such a
+ * term from matching in ordinary text.
+ *
+ * @param parsed - Parsed query whose `terms` and `phrases` are highlighted
+ * @returns A regex with the `g` and `i` flags (callers reusing it with
+ *          `test`/`exec` must mind `lastIndex`), or a regex that matches
+ *          nothing when there are no non-empty terms or phrases
+ */
+export const buildHighlightPattern = (parsed: ParsedQuery): RegExp => {
+  // Escape special regex chars
+  const escapeChars = (s: string) => s.replace(/[.*+?^${}()|[\]\\]/g, '\\$&')
+  const patterns: string[] = []
+  for (const term of parsed.terms) {
+    if (!term) continue
+    // Anchor only where a word boundary can actually occur
+    const leading = /^\w/.test(term) ? '\\b' : ''
+    const trailing = /\w$/.test(term) ? '\\b' : ''
+    patterns.push(`${leading}${escapeChars(term)}${trailing}`)
+  }
+  for (const phrase of parsed.phrases) {
+    if (phrase) {
+      patterns.push(escapeChars(phrase))
+    }
+  }
+  if (patterns.length === 0) {
+    return /.^/ // Match nothing
+  }
+  return new RegExp(patterns.join('|'), 'gi')
+}

package/src/search/searcher.test.ts ADDED Viewed

@@ -0,0 +1,280 @@
+/**
+ * Tests for keyword search
+ */
+import * as fs from 'node:fs/promises'
+import * as path from 'node:path'
+import { Effect } from 'effect'
+import { afterAll, beforeAll, describe, expect, it } from 'vitest'
+import { buildIndex } from '../index/indexer.js'
+import {
+  formatContextForLLM,
+  getContext,
+  search,
+  searchContent,
+} from './searcher.js'
+// Test fixture directory, resolved against the current working directory.
+// The suite creates it in beforeAll and deletes it again in afterAll.
+const TEST_DIR = path.join(process.cwd(), 'tests', 'fixtures', 'search')
+// Run an Effect to completion and expose its outcome as a Promise
+const runEffect = <A, E>(program: Effect.Effect<A, E>) => {
+  return Effect.runPromise(program)
+}
+describe('search', () => {
+  // One-time setup: write three markdown fixtures into TEST_DIR, then index
+  // the directory so the tests below can query it.
+  beforeAll(async () => {
+    // Create test fixtures
+    await fs.mkdir(TEST_DIR, { recursive: true })
+    // Create test markdown files
+    // doc1.md: the only fixture containing a fenced code block
+    await fs.writeFile(
+      path.join(TEST_DIR, 'doc1.md'),
+      `# Document One
+## Introduction
+This is the introduction section.
+## Code Example
+Here's some code:
+\`\`\`typescript
+const x = 1;
+\`\`\`
+## Summary
+A brief summary.
+`,
+    )
+    // doc2.md: contains a table and a bullet list
+    await fs.writeFile(
+      path.join(TEST_DIR, 'doc2.md'),
+      `# Document Two
+## Overview
+An overview of the document.
+## Data Table
+| Column A | Column B |
+|----------|----------|
+| Value 1  | Value 2  |
+## Tasks
+- Task 1
+- Task 2
+- Task 3
+`,
+    )
+    // Create test file for fuzzy/stem search: several word forms of "fail"
+    // and a deliberately misspelled "configration" next to the correct word
+    await fs.writeFile(
+      path.join(TEST_DIR, 'stem-test.md'),
+      `# Failure Handling
+When the application fails, it logs the failure message.
+Failed operations are retried automatically.
+Failing gracefully is important for user experience.
+## Configuration
+The configration (typo) file is located at config.json.
+Set the configuration options carefully.
+`,
+    )
+    // Build index
+    // NOTE(review): `force: true` presumably forces a full rebuild — confirm
+    // against buildIndex
+    await runEffect(buildIndex(TEST_DIR, { force: true }))
+  })
+  // Teardown: delete the fixture directory and everything written into it
+  afterAll(() => fs.rm(TEST_DIR, { recursive: true, force: true }))
+  // Structural search over the indexed fixtures: each test applies one
+  // option and checks that every returned section honours it.
+  describe('search()', () => {
+    it('should return all sections without filters', async () => {
+      const hits = await runEffect(search(TEST_DIR))
+      expect(hits.length).toBeGreaterThan(0)
+    })
+    it('should filter by heading pattern', async () => {
+      const hits = await runEffect(
+        search(TEST_DIR, { heading: 'Introduction|Overview' }),
+      )
+      expect(hits.length).toBe(2)
+      // One section for each alternative of the heading pattern
+      const headings = hits.map((hit) => hit.section.heading)
+      expect(headings).toContain('Introduction')
+      expect(headings).toContain('Overview')
+    })
+    it('should filter by path pattern', async () => {
+      const hits = await runEffect(search(TEST_DIR, { pathPattern: 'doc1*' }))
+      expect(hits.length).toBeGreaterThan(0)
+      for (const { section } of hits) {
+        expect(section.documentPath).toMatch(/doc1/)
+      }
+    })
+    it('should filter by hasCode', async () => {
+      const hits = await runEffect(search(TEST_DIR, { hasCode: true }))
+      expect(hits.length).toBeGreaterThan(0)
+      for (const { section } of hits) {
+        expect(section.hasCode).toBe(true)
+      }
+    })
+    it('should filter by hasTable', async () => {
+      const hits = await runEffect(search(TEST_DIR, { hasTable: true }))
+      expect(hits.length).toBeGreaterThan(0)
+      for (const { section } of hits) {
+        expect(section.hasTable).toBe(true)
+      }
+    })
+    it('should filter by hasList', async () => {
+      const hits = await runEffect(search(TEST_DIR, { hasList: true }))
+      expect(hits.length).toBeGreaterThan(0)
+      for (const { section } of hits) {
+        expect(section.hasList).toBe(true)
+      }
+    })
+    it('should respect limit', async () => {
+      const hits = await runEffect(search(TEST_DIR, { limit: 2 }))
+      expect(hits.length).toBe(2)
+    })
+  })
+  // Context extraction for a single document (doc1.md)
+  describe('getContext()', () => {
+    const doc1Path = path.join(TEST_DIR, 'doc1.md')
+    it('should return document context', async () => {
+      const context = await runEffect(getContext(TEST_DIR, doc1Path))
+      expect(context.title).toBe('Document One')
+      expect(context.sections.length).toBeGreaterThan(0)
+    })
+    it('should respect maxTokens', async () => {
+      const unbounded = await runEffect(getContext(TEST_DIR, doc1Path))
+      // Budget: half of the document's token count, but never below 10
+      const budget = Math.max(10, Math.floor(unbounded.totalTokens / 2))
+      const bounded = await runEffect(
+        getContext(TEST_DIR, doc1Path, { maxTokens: budget }),
+      )
+      expect(bounded.includedTokens).toBeLessThanOrEqual(budget)
+      // A reduction can only be demanded when the document exceeds the budget
+      if (unbounded.totalTokens > budget) {
+        expect(bounded.includedTokens).toBeLessThan(unbounded.totalTokens)
+      }
+    })
+  })
+  // Text rendering of a document context (doc1.md)
+  describe('formatContextForLLM()', () => {
+    const doc1Path = path.join(TEST_DIR, 'doc1.md')
+    it('should format context as readable text', async () => {
+      const context = await runEffect(getContext(TEST_DIR, doc1Path))
+      const rendered = formatContextForLLM(context)
+      expect(rendered).toContain('# Document One')
+      expect(rendered).toContain('Path: doc1.md')
+      expect(rendered).toContain('tokens')
+    })
+    it('should include content metadata markers', async () => {
+      const context = await runEffect(getContext(TEST_DIR, doc1Path))
+      const rendered = formatContextForLLM(context)
+      // doc1.md has a fenced code block, so a code marker is expected
+      expect(rendered).toContain('[code]')
+    })
+  })
+  // Content search restricted to stem-test.md via pathPattern
+  describe('searchContent() with fuzzy/stem matching', () => {
+    it('should match stemmed variations with --stem flag', async () => {
+      // "fail" is expected to reach the other word forms in the fixture
+      // ("fails", "failed", "failing", "failure")
+      const hits = await runEffect(
+        searchContent(TEST_DIR, {
+          content: 'fail',
+          stem: true,
+          pathPattern: 'stem-test*',
+        }),
+      )
+      expect(hits.length).toBe(1)
+      expect(hits[0]?.section.heading).toBe('Failure Handling')
+      // More than one matching line, i.e. more than one word form was hit
+      expect(hits[0]?.matches?.length).toBeGreaterThan(1)
+    })
+    it('should match typos with --fuzzy flag', async () => {
+      // The misspelled query "configration" should land in the
+      // "Configuration" section
+      const hits = await runEffect(
+        searchContent(TEST_DIR, {
+          content: 'configration',
+          fuzzy: true,
+          pathPattern: 'stem-test*',
+        }),
+      )
+      expect(hits.length).toBe(1)
+      expect(hits[0]?.section.heading).toBe('Configuration')
+      // Only a lower bound of one matching line is asserted
+      expect(hits[0]?.matches?.length).toBeGreaterThanOrEqual(1)
+    })
+    it('should respect fuzzyDistance option', async () => {
+      // Intent: with distance 1, "fail" should not reach "file" (distance 2)
+      const strictHits = await runEffect(
+        searchContent(TEST_DIR, {
+          content: 'fail',
+          fuzzy: true,
+          fuzzyDistance: 1,
+          pathPattern: 'stem-test*',
+        }),
+      )
+      // Concatenate every matched line into one lower-cased string
+      const matchedText = strictHits
+        .flatMap((hit) => hit.matches?.map((match) => match.line) ?? [])
+        .join(' ')
+        .toLowerCase()
+      // NOTE(review): only the presence of "fail" is asserted; the absence
+      // of "file" described above is not checked
+      expect(matchedText).toContain('fail')
+    })
+    it('should not match without fuzzy/stem flags', async () => {
+      // NOTE(review): despite the test name, a plain search for "fail" is
+      // still expected to return results, because "fail" occurs as a
+      // substring of "fails", "failure", "failing" and "failed"; only a
+      // lower bound of one result is asserted
+      const hits = await runEffect(
+        searchContent(TEST_DIR, {
+          content: 'fail',
+          pathPattern: 'stem-test*',
+        }),
+      )
+      expect(hits.length).toBeGreaterThanOrEqual(1)
+    })
+    it('should combine fuzzy and stem matching', async () => {
+      // Both flags at once; only a lower bound of one result is asserted
+      const hits = await runEffect(
+        searchContent(TEST_DIR, {
+          content: 'fail',
+          fuzzy: true,
+          stem: true,
+          pathPattern: 'stem-test*',
+        }),
+      )
+      expect(hits.length).toBeGreaterThanOrEqual(1)
+    })
+  })
+})