npm - mdcontext - Versions diffs - 0.1.0 → 0.2.0 - Mend

mdcontext 0.1.0 → 0.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (251) hide show

package/.changeset/config.json +9 -9
package/.claude/settings.local.json +25 -0
package/.github/workflows/claude-code-review.yml +44 -0
package/.github/workflows/claude.yml +85 -0
package/CONTRIBUTING.md +186 -0
package/NOTES/NOTES +44 -0
package/README.md +206 -3
package/biome.json +1 -1
package/dist/chunk-23UPXDNL.js +3044 -0
package/dist/chunk-2W7MO2DL.js +1366 -0
package/dist/chunk-3NUAZGMA.js +1689 -0
package/dist/chunk-7TOWB2XB.js +366 -0
package/dist/chunk-7XOTOADQ.js +3065 -0
package/dist/chunk-AH2PDM2K.js +3042 -0
package/dist/chunk-BNXWSZ63.js +3742 -0
package/dist/chunk-BTL5DJVU.js +3222 -0
package/dist/chunk-HDHYG7E4.js +104 -0
package/dist/chunk-HLR4KZBP.js +3234 -0
package/dist/chunk-IP3FRFEB.js +1045 -0
package/dist/chunk-KHU56VDO.js +3042 -0
package/dist/chunk-KRYIFLQR.js +85 -89
package/dist/chunk-LBSDNLEM.js +287 -0
package/dist/chunk-MNTQ7HCP.js +2643 -0
package/dist/chunk-MUJELQQ6.js +1387 -0
package/dist/chunk-MXJGMSLV.js +2199 -0
package/dist/chunk-N6QJGC3Z.js +2636 -0
package/dist/chunk-OBELGBPM.js +1713 -0
package/dist/chunk-OT7R5XTA.js +3192 -0
package/dist/chunk-P7X4RA2T.js +106 -0
package/dist/chunk-PIDUQNC2.js +3185 -0
package/dist/chunk-POGCDIH4.js +3187 -0
package/dist/chunk-PSIEOQGZ.js +3043 -0
package/dist/chunk-PVRT3IHA.js +3238 -0
package/dist/chunk-QNN4TT23.js +1430 -0
package/dist/chunk-RE3R45RJ.js +3042 -0
package/dist/chunk-S7E6TFX6.js +718 -657
package/dist/chunk-SG6GLU4U.js +1378 -0
package/dist/chunk-SJCDV2ST.js +274 -0
package/dist/chunk-SYE5XLF3.js +104 -0
package/dist/chunk-T5VLYBZD.js +103 -0
package/dist/chunk-TOQB7VWU.js +3238 -0
package/dist/chunk-VFNMZ4ZQ.js +3228 -0
package/dist/chunk-VVTGZNBT.js +1533 -1423
package/dist/chunk-W7Q4RFEV.js +104 -0
package/dist/chunk-XTYYVRLO.js +3190 -0
package/dist/chunk-Y6MDYVJD.js +3063 -0
package/dist/cli/main.js +4072 -629
package/dist/index.d.ts +420 -33
package/dist/index.js +8 -15
package/dist/mcp/server.js +103 -7
package/dist/schema-BAWSG7KY.js +22 -0
package/dist/schema-E3QUPL26.js +20 -0
package/dist/schema-EHL7WUT6.js +20 -0
package/docs/019-USAGE.md +44 -5
package/docs/020-current-implementation.md +8 -8
package/docs/021-DOGFOODING-FINDINGS.md +1 -1
package/docs/CONFIG.md +1123 -0
package/docs/ERRORS.md +383 -0
package/docs/summarization.md +320 -0
package/justfile +40 -0
package/package.json +39 -33
package/research/INDEX.md +315 -0
package/research/code-review/README.md +90 -0
package/research/code-review/cli-error-handling-review.md +979 -0
package/research/code-review/code-review-validation-report.md +464 -0
package/research/code-review/main-ts-review.md +1128 -0
package/research/config-docs/SUMMARY.md +357 -0
package/research/config-docs/TEST-RESULTS.md +776 -0
package/research/config-docs/TODO.md +542 -0
package/research/config-docs/analysis.md +744 -0
package/research/config-docs/fix-validation.md +502 -0
package/research/config-docs/help-audit.md +264 -0
package/research/config-docs/help-system-analysis.md +890 -0
package/research/frontmatter/COMMENTS-ARE-SKIPPED.md +149 -0
package/research/frontmatter/LLM-CODE-NAVIGATION.md +276 -0
package/research/issue-review.md +603 -0
package/research/llm-summarization/agent-cli-tools-2026.md +1082 -0
package/research/llm-summarization/alternative-providers-2026.md +1428 -0
package/research/llm-summarization/anthropic-2026.md +367 -0
package/research/llm-summarization/claude-cli-integration.md +1706 -0
package/research/llm-summarization/cli-integration-patterns.md +3155 -0
package/research/llm-summarization/openai-2026.md +473 -0
package/research/llm-summarization/openai-compatible-providers-2026.md +1022 -0
package/research/llm-summarization/opencode-cli-integration.md +1552 -0
package/research/llm-summarization/prompt-engineering-2026.md +1426 -0
package/research/llm-summarization/prototype-results.md +56 -0
package/research/llm-summarization/provider-switching-patterns-2026.md +2153 -0
package/research/llm-summarization/typescript-llm-libraries-2026.md +2436 -0
package/research/mdcontext-pudding/00-EXECUTIVE-SUMMARY.md +282 -0
package/research/mdcontext-pudding/01-index-embed.md +956 -0
package/research/mdcontext-pudding/02-search-COMMANDS.md +142 -0
package/research/mdcontext-pudding/02-search-SUMMARY.md +146 -0
package/research/mdcontext-pudding/02-search.md +970 -0
package/research/mdcontext-pudding/03-context.md +779 -0
package/research/mdcontext-pudding/04-navigation-and-analytics.md +803 -0
package/research/mdcontext-pudding/04-tree.md +704 -0
package/research/mdcontext-pudding/05-config.md +1038 -0
package/research/mdcontext-pudding/06-links-summary.txt +87 -0
package/research/mdcontext-pudding/06-links.md +679 -0
package/research/mdcontext-pudding/07-stats.md +693 -0
package/research/mdcontext-pudding/BUG-FIX-PLAN.md +388 -0
package/research/mdcontext-pudding/P0-BUG-VALIDATION.md +167 -0
package/research/mdcontext-pudding/README.md +168 -0
package/research/mdcontext-pudding/TESTING-SUMMARY.md +128 -0
package/research/research-quality-review.md +834 -0
package/research/semantic-search/embedding-text-analysis.md +156 -0
package/research/semantic-search/multi-word-failure-reproduction.md +171 -0
package/research/semantic-search/query-processing-analysis.md +207 -0
package/research/semantic-search/root-cause-and-solution.md +114 -0
package/research/semantic-search/threshold-validation-report.md +69 -0
package/research/semantic-search/vector-search-analysis.md +63 -0
package/research/test-path-issues.md +276 -0
package/review/ALP-76/1-error-type-design.md +962 -0
package/review/ALP-76/2-error-handling-patterns.md +906 -0
package/review/ALP-76/3-error-presentation.md +624 -0
package/review/ALP-76/4-test-coverage.md +625 -0
package/review/ALP-76/5-migration-completeness.md +440 -0
package/review/ALP-76/6-effect-best-practices.md +755 -0
package/scripts/apply-branch-protection.sh +47 -0
package/scripts/branch-protection-templates.json +79 -0
package/scripts/prototype-summarization.ts +346 -0
package/scripts/rebuild-hnswlib.js +32 -37
package/scripts/setup-branch-protection.sh +64 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/.mdcontext/active-provider.json +7 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/.mdcontext/bm25.json +541 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/.mdcontext/bm25.meta.json +5 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/.mdcontext/config.json +8 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/.mdcontext/embeddings/openai_text-embedding-3-small_512/vectors.bin +0 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/.mdcontext/embeddings/openai_text-embedding-3-small_512/vectors.meta.bin +0 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/.mdcontext/indexes/documents.json +60 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/.mdcontext/indexes/links.json +13 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/.mdcontext/indexes/sections.json +1197 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/configuration-management.md +99 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/distributed-systems.md +92 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/error-handling.md +78 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/failure-automation.md +55 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/job-context.md +69 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/process-orchestration.md +99 -0
package/src/cli/argv-preprocessor.test.ts +2 -2
package/src/cli/cli.test.ts +230 -33
package/src/cli/commands/config-cmd.ts +642 -0
package/src/cli/commands/context.ts +97 -9
package/src/cli/commands/duplicates.ts +122 -0
package/src/cli/commands/embeddings.ts +529 -0
package/src/cli/commands/index-cmd.ts +210 -30
package/src/cli/commands/index.ts +3 -0
package/src/cli/commands/search.ts +894 -64
package/src/cli/commands/stats.ts +3 -0
package/src/cli/commands/tree.ts +26 -5
package/src/cli/config-layer.ts +176 -0
package/src/cli/error-handler.test.ts +235 -0
package/src/cli/error-handler.ts +655 -0
package/src/cli/flag-schemas.ts +66 -0
package/src/cli/help.ts +209 -7
package/src/cli/main.ts +348 -58
package/src/cli/options.ts +10 -0
package/src/cli/shared-error-handling.ts +199 -0
package/src/cli/utils.ts +150 -17
package/src/config/file-provider.test.ts +320 -0
package/src/config/file-provider.ts +273 -0
package/src/config/index.ts +72 -0
package/src/config/integration.test.ts +667 -0
package/src/config/precedence.test.ts +277 -0
package/src/config/precedence.ts +451 -0
package/src/config/schema.test.ts +414 -0
package/src/config/schema.ts +603 -0
package/src/config/service.test.ts +320 -0
package/src/config/service.ts +243 -0
package/src/config/testing.test.ts +264 -0
package/src/config/testing.ts +110 -0
package/src/core/types.ts +6 -33
package/src/duplicates/detector.test.ts +183 -0
package/src/duplicates/detector.ts +414 -0
package/src/duplicates/index.ts +18 -0
package/src/embeddings/embedding-namespace.test.ts +300 -0
package/src/embeddings/embedding-namespace.ts +947 -0
package/src/embeddings/heading-boost.test.ts +222 -0
package/src/embeddings/hnsw-build-options.test.ts +198 -0
package/src/embeddings/hyde.test.ts +272 -0
package/src/embeddings/hyde.ts +264 -0
package/src/embeddings/index.ts +2 -0
package/src/embeddings/openai-provider.ts +332 -83
package/src/embeddings/pricing.json +22 -0
package/src/embeddings/provider-constants.ts +204 -0
package/src/embeddings/provider-errors.test.ts +967 -0
package/src/embeddings/provider-errors.ts +565 -0
package/src/embeddings/provider-factory.test.ts +240 -0
package/src/embeddings/provider-factory.ts +225 -0
package/src/embeddings/provider-integration.test.ts +788 -0
package/src/embeddings/query-preprocessing.test.ts +187 -0
package/src/embeddings/semantic-search-threshold.test.ts +508 -0
package/src/embeddings/semantic-search.ts +780 -93
package/src/embeddings/types.ts +293 -16
package/src/embeddings/vector-store.ts +486 -77
package/src/embeddings/voyage-provider.ts +313 -0
package/src/errors/errors.test.ts +845 -0
package/src/errors/index.ts +533 -0
package/src/index/ignore-patterns.test.ts +354 -0
package/src/index/ignore-patterns.ts +305 -0
package/src/index/indexer.ts +286 -48
package/src/index/storage.ts +94 -30
package/src/index/types.ts +40 -2
package/src/index/watcher.ts +67 -9
package/src/index.ts +22 -0
package/src/integration/search-keyword.test.ts +678 -0
package/src/mcp/server.ts +135 -6
package/src/parser/parser.ts +18 -19
package/src/parser/section-filter.test.ts +277 -0
package/src/parser/section-filter.ts +125 -3
package/src/search/__tests__/hybrid-search.test.ts +650 -0
package/src/search/bm25-store.ts +366 -0
package/src/search/cross-encoder.test.ts +253 -0
package/src/search/cross-encoder.ts +406 -0
package/src/search/fuzzy-search.test.ts +419 -0
package/src/search/fuzzy-search.ts +273 -0
package/src/search/hybrid-search.ts +448 -0
package/src/search/path-matcher.test.ts +276 -0
package/src/search/path-matcher.ts +33 -0
package/src/search/searcher.test.ts +99 -1
package/src/search/searcher.ts +189 -67
package/src/search/wink-bm25.d.ts +30 -0
package/src/summarization/cli-providers/claude.ts +202 -0
package/src/summarization/cli-providers/detection.test.ts +273 -0
package/src/summarization/cli-providers/detection.ts +118 -0
package/src/summarization/cli-providers/index.ts +8 -0
package/src/summarization/cost.test.ts +139 -0
package/src/summarization/cost.ts +102 -0
package/src/summarization/error-handler.test.ts +127 -0
package/src/summarization/error-handler.ts +111 -0
package/src/summarization/index.ts +102 -0
package/src/summarization/pipeline.test.ts +498 -0
package/src/summarization/pipeline.ts +231 -0
package/src/summarization/prompts.test.ts +269 -0
package/src/summarization/prompts.ts +133 -0
package/src/summarization/provider-factory.test.ts +396 -0
package/src/summarization/provider-factory.ts +178 -0
package/src/summarization/types.ts +184 -0
package/src/summarize/summarizer.ts +104 -35
package/src/types/huggingface-transformers.d.ts +66 -0
package/tests/fixtures/cli/.mdcontext/active-provider.json +7 -0
package/tests/fixtures/cli/.mdcontext/embeddings/openai_text-embedding-3-small_512/vectors.bin +0 -0
package/tests/fixtures/cli/.mdcontext/embeddings/openai_text-embedding-3-small_512/vectors.meta.bin +0 -0
package/tests/fixtures/cli/.mdcontext/indexes/documents.json +4 -4
package/tests/fixtures/cli/.mdcontext/indexes/sections.json +14 -0
package/tests/integration/embed-index.test.ts +712 -0
package/tests/integration/search-context.test.ts +469 -0
package/tests/integration/search-semantic.test.ts +522 -0
package/vitest.config.ts +1 -6
package/AGENTS.md +0 -46
package/tests/fixtures/cli/.mdcontext/vectors.bin +0 -0
package/tests/fixtures/cli/.mdcontext/vectors.meta.json +0 -1264

package/src/cli/commands/search.ts CHANGED Viewed

@@ -4,23 +4,142 @@
  * Search markdown content by meaning or heading pattern.
  */
+import * as fs from 'node:fs/promises'
 import * as path from 'node:path'
 import * as readline from 'node:readline'
 import { Args, Command, Options } from '@effect/cli'
 import { Console, Effect, Option } from 'effect'
-import { handleApiKeyError } from '../../embeddings/openai-provider.js'
+import { ConfigService, defaultConfig } from '../../config/index.js'
+import type {
+  BuildEmbeddingsResult,
+  EmbeddingEstimate,
+} from '../../embeddings/semantic-search.js'
 import {
   buildEmbeddings,
   estimateEmbeddingCost,
-  semanticSearch,
+  semanticSearchWithStats,
 } from '../../embeddings/semantic-search.js'
+import type { SearchQuality } from '../../embeddings/types.js'
+import { createStorage, loadSectionIndex } from '../../index/storage.js'
+import { INDEX_DIR } from '../../index/types.js'
+import { initializeReranker } from '../../search/cross-encoder.js'
+import {
+  detectSearchModes,
+  hybridSearch,
+  type SearchMode,
+} from '../../search/hybrid-search.js'
 import { isAdvancedQuery } from '../../search/query-parser.js'
 import { search, searchContent } from '../../search/searcher.js'
+import {
+  type APIProviderName,
+  buildPrompt,
+  type CLIProviderName,
+  displaySummarizationError,
+  estimateSummaryCost,
+  formatResultsForSummary,
+  getBestAvailableSummarizer,
+  type SummarizableResult,
+} from '../../summarization/index.js'
 import { jsonOption, prettyOption } from '../options.js'
+import {
+  createCostEstimateErrorHandler,
+  createEmbeddingErrorHandler,
+} from '../shared-error-handling.js'
 import { formatJson, getIndexInfo, isRegexPattern } from '../utils.js'
-// Auto-index threshold in seconds
-const AUTO_INDEX_THRESHOLD_SECONDS = 10
+// Auto-index threshold is now configurable via search.autoIndexThreshold
+/**
+ * Check if content contains all the refine terms (case-insensitive).
+ *
+ * Both the content and each term are lower-cased and compared with plain
+ * substring containment, so a term also matches when it appears inside a
+ * longer word. An empty `terms` list yields `true`, because `every` is
+ * vacuously satisfied.
+ *
+ * @param content - Text to inspect
+ * @param terms - Terms that must all occur somewhere in `content`
+ * @returns `true` when every term occurs in `content`, otherwise `false`
+ */
+const contentMatchesAllTerms = (
+  content: string,
+  terms: readonly string[],
+): boolean => {
+  const lowerContent = content.toLowerCase()
+  return terms.every((term) => lowerContent.includes(term.toLowerCase()))
+}
+/**
+ * Section info for refine filtering.
+ *
+ * Describes where a section's text lives so it can be re-read from disk:
+ * - `documentPath` is joined onto the search root path to locate the file.
+ * - `startLine` / `endLine` are consumed as a 1-based, inclusive line range
+ *   (the filter slices from `startLine - 1` up to `endLine`).
+ */
+interface SectionInfo {
+  readonly documentPath: string
+  readonly startLine: number
+  readonly endLine: number
+}
+/**
+ * Filter search results by refine terms using parallel file loading.
+ * Uses a file cache and concurrency limit for performance.
+ *
+ * When there are no refine terms or no results, the first `limit` results
+ * are returned unfiltered and no files are read.
+ *
+ * Otherwise each result is kept only if the lines of its section (split on
+ * '\n', from `startLine` to `endLine`, 1-based inclusive) contain every
+ * refine term, compared case-insensitively. A result is dropped when
+ * `getSectionInfo` returns null, when its file cannot be read, or when the
+ * file content is empty. Read failures are swallowed and cached as null, so
+ * the returned effect never fails.
+ *
+ * NOTE(review): a cache entry is written only after the read finishes, so
+ * checks running concurrently for the same document may each read the file;
+ * confirm whether that matters for large result sets.
+ * NOTE(review): output order presumably follows input order; this relies on
+ * `Effect.all` returning results positionally - confirm.
+ *
+ * @param rootPath - Root path for file loading
+ * @param results - Search results to filter
+ * @param refineTerms - Terms that must all be present in section content
+ * @param limit - Maximum results to return
+ * @param getSectionInfo - Function to extract section info from a result
+ * @returns Effect yielding at most `limit` results that passed the filter
+ */
+const filterResultsByRefineTerms = <T>(
+  rootPath: string,
+  results: readonly T[],
+  refineTerms: readonly string[],
+  limit: number,
+  getSectionInfo: (result: T) => SectionInfo | null,
+): Effect.Effect<T[], never> =>
+  Effect.gen(function* () {
+    if (refineTerms.length === 0 || results.length === 0) {
+      return results.slice(0, limit) as T[]
+    }
+    // Cache of file contents keyed by document path; null marks a file that could not be read
+    const fileCache = new Map<string, string | null>()
+    const getFileContent = (
+      documentPath: string,
+    ): Effect.Effect<string | null, never> =>
+      Effect.gen(function* () {
+        if (fileCache.has(documentPath)) {
+          return fileCache.get(documentPath)!
+        }
+        const content = yield* Effect.promise(async () => {
+          try {
+            const filePath = path.join(rootPath, documentPath)
+            return await fs.readFile(filePath, 'utf-8')
+          } catch {
+            return null
+          }
+        })
+        fileCache.set(documentPath, content)
+        return content
+      })
+    // Check each result in parallel, with at most 10 checks in flight; non-matches become null
+    const checkedResults = yield* Effect.all(
+      results.map((result) =>
+        Effect.gen(function* () {
+          const info = getSectionInfo(result)
+          if (!info) return null
+          const fileContent = yield* getFileContent(info.documentPath)
+          if (!fileContent) return null
+          const lines = fileContent.split('\n')
+          const sectionContent = lines
+            .slice(info.startLine - 1, info.endLine)
+            .join('\n')
+          if (contentMatchesAllTerms(sectionContent, refineTerms)) {
+            return result
+          }
+          return null
+        }),
+      ),
+      { concurrency: 10 },
+    )
+    // Drop the null placeholders, then cap the survivors at `limit`
+    return checkedResults.filter((r): r is T => r !== null).slice(0, limit)
+  })
 const promptUser = (message: string): Promise<string> => {
   return new Promise((resolve) => {
@@ -55,9 +174,11 @@ export const searchCommand = Command.make(
       Options.withDescription('Search headings only (not content)'),
       Options.withDefault(false),
     ),
-    mode: Options.choice('mode', ['semantic', 'keyword']).pipe(
+    mode: Options.choice('mode', ['hybrid', 'semantic', 'keyword']).pipe(
       Options.withAlias('m'),
-      Options.withDescription('Force search mode: semantic or keyword'),
+      Options.withDescription(
+        'Search mode: hybrid (BM25+semantic), semantic, or keyword',
+      ),
       Options.optional,
     ),
     limit: Options.integer('limit').pipe(
@@ -67,7 +188,7 @@ export const searchCommand = Command.make(
     ),
     threshold: Options.float('threshold').pipe(
       Options.withDescription('Similarity threshold for semantic search (0-1)'),
-      Options.withDefault(0.45),
+      Options.withDefault(0.35),
     ),
     context: Options.integer('context').pipe(
       Options.withAlias('C'),
@@ -88,10 +209,93 @@ export const searchCommand = Command.make(
       Options.withDescription(
         'Auto-create semantic index if estimated time is under this threshold (seconds)',
       ),
-      Options.withDefault(AUTO_INDEX_THRESHOLD_SECONDS),
+      Options.optional,
+    ),
+    provider: Options.choice('provider', [
+      'openai',
+      'ollama',
+      'lm-studio',
+      'openrouter',
+      'voyage',
+    ]).pipe(
+      Options.withDescription(
+        'Embedding provider for semantic search: openai, ollama, lm-studio, openrouter, or voyage',
+      ),
+      Options.optional,
+    ),
+    rerank: Options.boolean('rerank').pipe(
+      Options.withAlias('r'),
+      Options.withDescription(
+        'Re-rank results using cross-encoder for improved precision. Downloads ~90MB model on first use. Requires @huggingface/transformers.',
+      ),
+      Options.withDefault(false),
+    ),
+    quality: Options.choice('quality', ['fast', 'balanced', 'thorough']).pipe(
+      Options.withAlias('q'),
+      Options.withDescription(
+        'Search quality mode: fast (quicker, lower recall), balanced (default), thorough (slower, better recall)',
+      ),
+      Options.optional,
+    ),
+    hyde: Options.boolean('hyde').pipe(
+      Options.withDescription(
+        'Use HyDE (Hypothetical Document Embeddings) for complex queries. Generates a hypothetical answer with LLM, then searches using that embedding. Improves recall 10-30% on complex/ambiguous queries at cost of ~1-2s latency and LLM API usage.',
+      ),
+      Options.withDefault(false),
+    ),
+    rerankInit: Options.boolean('rerank-init').pipe(
+      Options.withDescription(
+        'Pre-download the cross-encoder model (~90MB) for re-ranking. Use this before first search to avoid latency.',
+      ),
+      Options.withDefault(false),
+    ),
+    timeout: Options.integer('timeout').pipe(
+      Options.withDescription(
+        'Request timeout in milliseconds for embedding API calls (default: 30000)',
+      ),
+      Options.optional,
     ),
     json: jsonOption,
     pretty: prettyOption,
+    summarize: Options.boolean('summarize').pipe(
+      Options.withAlias('s'),
+      Options.withDescription('Generate AI summary of search results'),
+      Options.withDefault(false),
+    ),
+    yes: Options.boolean('yes').pipe(
+      Options.withAlias('y'),
+      Options.withDescription('Skip cost confirmation for paid AI providers'),
+      Options.withDefault(false),
+    ),
+    stream: Options.boolean('stream').pipe(
+      Options.withDescription('Stream AI summary output in real-time'),
+      Options.withDefault(false),
+    ),
+    fuzzy: Options.boolean('fuzzy').pipe(
+      Options.withAlias('f'),
+      Options.withDescription(
+        'Enable fuzzy matching for typo tolerance (e.g., "configration" matches "configuration")',
+      ),
+      Options.withDefault(false),
+    ),
+    stem: Options.boolean('stem').pipe(
+      Options.withDescription(
+        'Enable word stemming (e.g., "fail" matches "failure", "failed", "failing")',
+      ),
+      Options.withDefault(false),
+    ),
+    fuzzyDistance: Options.integer('fuzzy-distance').pipe(
+      Options.withDescription(
+        'Max edit distance for fuzzy matching (default: 2)',
+      ),
+      Options.optional,
+    ),
+    refine: Options.text('refine').pipe(
+      Options.withDescription(
+        'Additional filter terms to narrow results (can be used multiple times)',
+      ),
+      Options.repeated,
+    ),
   },
   ({
     query,
@@ -105,12 +309,81 @@ export const searchCommand = Command.make(
     beforeContext,
     afterContext,
     autoIndexThreshold,
+    provider,
+    rerank,
+    quality,
+    hyde,
+    rerankInit,
+    timeout,
     json,
     pretty,
+    summarize,
+    yes,
+    stream,
+    fuzzy,
+    stem,
+    fuzzyDistance,
+    refine,
   }) =>
     Effect.gen(function* () {
       const resolvedDir = path.resolve(dirPath)
+      // Handle --rerank-init: pre-download model and exit
+      if (rerankInit) {
+        yield* Console.log(
+          'Initializing cross-encoder model (~90MB download)...',
+        )
+        const cacheDir = path.join(resolvedDir, INDEX_DIR, 'models')
+        const result = yield* initializeReranker(cacheDir, (progress) => {
+          if (progress.status === 'loading' && progress.file) {
+            const pct = progress.progress
+              ? ` (${Math.round(progress.progress)}%)`
+              : ''
+            process.stdout.write(`\r  Downloading: ${progress.file}${pct}`)
+          }
+        }).pipe(
+          Effect.map(() => true),
+          Effect.catchTag('RerankerError', (e) => {
+            if (e.reason === 'DependencyMissing') {
+              return Effect.succeed(false)
+            }
+            return Effect.fail(e)
+          }),
+        )
+        if (!result) {
+          yield* Console.log('')
+          yield* Console.log('Error: @huggingface/transformers not installed.')
+          yield* Console.log(
+            'Install with: npm install @huggingface/transformers',
+          )
+          return
+        }
+        yield* Console.log('')
+        yield* Console.log('Cross-encoder model initialized successfully.')
+        yield* Console.log('Use --rerank on searches for improved precision.')
+        return
+      }
+      // Get configuration (with fallback to defaults if not available)
+      const config = yield* Effect.serviceOption(ConfigService).pipe(
+        Effect.map(Option.getOrElse(() => defaultConfig)),
+      )
+      const searchConfig = config.search
+      // Apply config-based defaults when CLI options use their static defaults
+      // Note: CLI options have static defaults for help text; config overrides those defaults
+      const effectiveLimit = limit === 10 ? searchConfig.defaultLimit : limit
+      const effectiveThreshold =
+        threshold === 0.35 ? searchConfig.minSimilarity : threshold
+      const effectiveAutoIndexThreshold = Option.getOrElse(
+        autoIndexThreshold,
+        () => searchConfig.autoIndexThreshold,
+      )
       // Get index info for display
       const indexInfo = yield* Effect.promise(() => getIndexInfo(resolvedDir))
@@ -123,54 +396,75 @@ export const searchCommand = Command.make(
         return
       }
-      // Check for embeddings
-      let embedsExist = indexInfo.embeddingsExist
+      // Determine the actual index root (may be a parent directory)
+      const indexRoot = indexInfo.indexRoot ?? resolvedDir
+      // Calculate path filter for scoped search
+      // If searching a subdirectory, filter results to that path
+      let scopedPathPattern: string | undefined
+      if (indexInfo.indexRoot && indexInfo.indexRoot !== resolvedDir) {
+        // Get relative path from index root to search dir
+        const relativePath = path.relative(indexRoot, resolvedDir)
+        // Create pattern to match files in this directory and subdirectories
+        scopedPathPattern = `${relativePath}/*`
+        if (!json) {
+          yield* Console.log(`Searching within: ${relativePath}/`)
+          yield* Console.log('')
+        }
+      }
+      // Check available search modes
+      const searchModes = yield* detectSearchModes(indexRoot)
+      let embedsExist = searchModes.hasEmbeddings
       // Determine search mode
-      // Priority: --mode flag > --keyword flag > regex pattern > embeddings availability
-      let useKeyword: boolean
+      // Priority: --mode flag > --keyword flag > advanced query > auto-detect
+      let effectiveMode: SearchMode
       let modeReason: string
       const modeValue = Option.getOrUndefined(mode)
-      if (modeValue === 'semantic') {
-        // User explicitly requested semantic search
+      if (modeValue === 'hybrid') {
+        effectiveMode = 'hybrid'
+        modeReason = '--mode hybrid'
+      } else if (modeValue === 'semantic') {
         if (!embedsExist) {
-          // Try to auto-create index
           embedsExist = yield* handleMissingEmbeddings(
-            resolvedDir,
-            autoIndexThreshold,
+            indexRoot,
+            effectiveAutoIndexThreshold,
             json,
           )
           if (!embedsExist) {
-            // User declined or error
             return
           }
         }
-        useKeyword = false
+        effectiveMode = 'semantic'
         modeReason = '--mode semantic'
       } else if (modeValue === 'keyword') {
-        useKeyword = true
+        effectiveMode = 'keyword'
         modeReason = '--mode keyword'
       } else if (keyword) {
-        useKeyword = true
+        effectiveMode = 'keyword'
         modeReason = '--keyword flag'
       } else if (isAdvancedQuery(query)) {
-        // Detect quoted phrases and boolean operators (AND, OR, NOT)
-        useKeyword = true
+        effectiveMode = 'keyword'
         modeReason = 'boolean/phrase pattern detected'
       } else if (isRegexPattern(query)) {
-        useKeyword = true
+        effectiveMode = 'keyword'
         modeReason = 'regex pattern detected'
-      } else if (!embedsExist) {
-        useKeyword = true
-        modeReason = 'no embeddings'
       } else {
-        useKeyword = false
-        modeReason = 'embeddings available'
+        // Auto-detect best mode based on available indexes
+        effectiveMode = searchModes.recommendedMode
+        if (effectiveMode === 'hybrid') {
+          modeReason = 'both indexes available'
+        } else if (effectiveMode === 'semantic') {
+          modeReason = 'embeddings available'
+        } else {
+          modeReason = 'no embeddings'
+        }
       }
-      const modeIndicator = useKeyword ? '[keyword]' : '[semantic]'
+      const modeIndicator = `[${effectiveMode}]`
       // Show index info (non-JSON mode)
       if (!json && indexInfo.lastUpdated) {
@@ -199,20 +493,202 @@ export const searchCommand = Command.make(
       const beforeValue = Option.getOrUndefined(beforeContext)
       const afterValue = Option.getOrUndefined(afterContext)
-      const contextBefore = beforeValue ?? contextValue ?? 1
-      const contextAfter = afterValue ?? contextValue ?? 1
+      const contextBefore = beforeValue ?? contextValue
+      const contextAfter = afterValue ?? contextValue
+      if (effectiveMode === 'hybrid') {
+        // Hybrid search - combines BM25 and semantic with RRF
+        const effectiveQuality = Option.getOrUndefined(quality) as
+          | SearchQuality
+          | undefined
+        // Get more results if refinement is needed (we'll filter down later)
+        const refineTerms = refine.length > 0 ? refine : []
+        const fetchLimit =
+          refineTerms.length > 0 ? effectiveLimit * 5 : effectiveLimit
+        const { results: rawResults, stats } = yield* hybridSearch(
+          indexRoot,
+          query,
+          {
+            limit: fetchLimit,
+            threshold: effectiveThreshold,
+            mode: 'hybrid',
+            rerank,
+            quality: effectiveQuality,
+            contextBefore,
+            contextAfter,
+            ...(scopedPathPattern && { pathPattern: scopedPathPattern }),
+          },
+        )
+        // Apply refine filtering if terms provided (parallel with caching)
+        let results = rawResults
+        if (refineTerms.length > 0) {
+          const storage = createStorage(indexRoot)
+          const sectionIndex = yield* loadSectionIndex(storage)
+          if (sectionIndex) {
+            results = yield* filterResultsByRefineTerms(
+              indexRoot,
+              rawResults,
+              refineTerms,
+              effectiveLimit,
+              (result) => {
+                const section = sectionIndex.sections[result.sectionId]
+                return section
+                  ? {
+                      documentPath: result.documentPath,
+                      startLine: section.startLine,
+                      endLine: section.endLine,
+                    }
+                  : null
+              },
+            )
+          }
+        }
+        // Warn if reranking was requested but not applied
+        if (rerank && !stats.reranked && !json) {
+          yield* Console.log(
+            'Note: --rerank requested but @huggingface/transformers not installed',
+          )
+          yield* Console.log(
+            '      Install with: npm install @huggingface/transformers',
+          )
+          yield* Console.log('')
+        }
+        if (json) {
+          const moreAvailable =
+            stats.totalAvailable !== undefined &&
+            stats.totalAvailable > results.length
+              ? stats.totalAvailable - results.length
+              : undefined
+          const output = {
+            mode: 'hybrid',
+            modeReason,
+            query,
+            stats,
+            moreAvailable,
+            results: results.map((r) => ({
+              path: r.documentPath,
+              heading: r.heading,
+              score: r.score,
+              similarity: r.similarity,
+              bm25Score: r.bm25Score,
+              sources: r.sources,
+              ...(r.contextLines && { contextLines: r.contextLines }),
+            })),
+          }
+          yield* Console.log(formatJson(output, pretty))
+        } else {
+          const showReason = !modeReason.startsWith('--mode')
+          const modeStr = showReason
+            ? `${modeIndicator} (${modeReason})`
+            : modeIndicator
+          yield* Console.log(`${modeStr} Searching: "${query}"`)
+          // Show results count with "more available" indicator if results were limited
+          const moreAvailable =
+            stats.totalAvailable !== undefined &&
+            stats.totalAvailable > results.length
+              ? stats.totalAvailable - results.length
+              : 0
+          if (moreAvailable > 0) {
+            yield* Console.log(
+              `Results: ${results.length} (${moreAvailable} more available, use --limit to see more)`,
+            )
+          } else {
+            yield* Console.log(`Results: ${results.length}`)
+          }
+          yield* Console.log('')
+          for (const result of results) {
+            const sources = result.sources.join('+')
+            const score = (result.score * 100).toFixed(1)
+            yield* Console.log(`  ${result.documentPath}`)
+            yield* Console.log(
+              `    ${result.heading} (${score} RRF, ${sources})`,
+            )
+            if (result.contextLines && result.contextLines.length > 0) {
+              yield* Console.log('')
+              for (const ctxLine of result.contextLines) {
+                const marker = ctxLine.isMatch ? '>' : ' '
+                yield* Console.log(
+                  `  ${marker} ${ctxLine.lineNumber}: ${ctxLine.line}`,
+                )
+              }
+            }
+            yield* Console.log('')
+          }
+        }
-      if (useKeyword) {
+        // Summarization for hybrid search
+        if (summarize && results.length > 0) {
+          const summarizableResults: SummarizableResult[] = results.map(
+            (r) => ({
+              documentPath: r.documentPath,
+              heading: r.heading,
+              score: r.score,
+              ...(r.similarity !== undefined && { similarity: r.similarity }),
+            }),
+          )
+          yield* runSummarization({
+            results: summarizableResults,
+            query,
+            searchMode: 'hybrid',
+            json,
+            yes,
+            stream,
+            config: {
+              mode: config.aiSummarization.mode,
+              provider: config.aiSummarization.provider,
+            },
+          })
+        }
+      } else if (effectiveMode === 'keyword') {
         // Keyword search - content by default, heading-only if flag set
-        const results = headingOnly
-          ? yield* search(resolvedDir, { heading: query, limit })
-          : yield* searchContent(resolvedDir, {
+        const effectiveFuzzyDistance = Option.getOrUndefined(fuzzyDistance)
+        const refineTerms = refine.length > 0 ? refine : []
+        const fetchLimit =
+          refineTerms.length > 0 ? effectiveLimit * 5 : effectiveLimit
+        let results = headingOnly
+          ? yield* search(indexRoot, {
+              heading: query,
+              limit: fetchLimit,
+              ...(scopedPathPattern && { pathPattern: scopedPathPattern }),
+            })
+          : yield* searchContent(indexRoot, {
               content: query,
-              limit,
+              limit: fetchLimit,
               contextBefore,
               contextAfter,
+              fuzzy,
+              stem,
+              ...(effectiveFuzzyDistance !== undefined && {
+                fuzzyDistance: effectiveFuzzyDistance,
+              }),
+              ...(scopedPathPattern && { pathPattern: scopedPathPattern }),
             })
+        // Apply refine filtering if terms provided (parallel with caching)
+        if (refineTerms.length > 0) {
+          results = yield* filterResultsByRefineTerms(
+            indexRoot,
+            results,
+            refineTerms,
+            effectiveLimit,
+            (result) => ({
+              documentPath: result.section.documentPath,
+              startLine: result.section.startLine,
+              endLine: result.section.endLine,
+            }),
+          )
+        }
         if (json) {
           const output = {
             mode: 'keyword',
@@ -220,6 +696,11 @@ export const searchCommand = Command.make(
             query,
             contextBefore,
             contextAfter,
+            fuzzy,
+            stem,
+            ...(effectiveFuzzyDistance !== undefined && {
+              fuzzyDistance: effectiveFuzzyDistance,
+            }),
             results: results.map((r) => ({
               path: r.section.documentPath,
               heading: r.section.heading,
@@ -236,13 +717,20 @@ export const searchCommand = Command.make(
           yield* Console.log(formatJson(output, pretty))
         } else {
           const searchType = headingOnly ? 'Heading' : 'Content'
-          // Show mode with explanation for auto-detected modes
           const showReason =
             modeReason !== '--mode keyword' && modeReason !== '--keyword flag'
           const modeStr = showReason
             ? `${modeIndicator} (${modeReason})`
             : modeIndicator
-          yield* Console.log(`${modeStr} ${searchType} search: "${query}"`)
+          // Build fuzzy/stem indicator
+          const fuzzyIndicators: string[] = []
+          if (fuzzy) fuzzyIndicators.push('fuzzy')
+          if (stem) fuzzyIndicators.push('stem')
+          const fuzzyStr =
+            fuzzyIndicators.length > 0 ? ` [${fuzzyIndicators.join('+')}]` : ''
+          yield* Console.log(
+            `${modeStr}${fuzzyStr} ${searchType} search: "${query}"`,
+          )
           yield* Console.log(`Results: ${results.length}`)
           yield* Console.log('')
@@ -255,12 +743,9 @@ export const searchCommand = Command.make(
               `    ${levelMarker} ${result.section.heading} (${result.section.tokenCount} tokens)`,
             )
-            // Show match snippets with line numbers
             if (result.matches && result.matches.length > 0) {
               yield* Console.log('')
               for (const match of result.matches.slice(0, 3)) {
-                // Show first 3 matches per section
-                // Use contextLines for formatted output with line numbers
                 if (match.contextLines && match.contextLines.length > 0) {
                   for (const ctxLine of match.contextLines) {
                     const marker = ctxLine.isMatch ? '>' : ' '
@@ -269,7 +754,6 @@ export const searchCommand = Command.make(
                     )
                   }
                 } else {
-                  // Fallback to simple snippet display
                   yield* Console.log(`    Line ${match.lineNumber}:`)
                   const snippetLines = match.snippet.split('\n')
                   for (const line of snippetLines) {
@@ -287,52 +771,395 @@ export const searchCommand = Command.make(
             yield* Console.log('')
           }
-          // Show tip for enabling semantic search if no embeddings
           if (!indexInfo.embeddingsExist) {
             yield* Console.log(
               "Tip: Run 'mdcontext index --embed' to enable semantic search",
             )
           }
         }
+        // Summarization for keyword search
+        if (summarize && results.length > 0) {
+          const summarizableResults: SummarizableResult[] = results.map(
+            (r) => ({
+              documentPath: r.section.documentPath,
+              heading: r.section.heading,
+            }),
+          )
+          yield* runSummarization({
+            results: summarizableResults,
+            query,
+            searchMode: 'keyword',
+            json,
+            yes,
+            stream,
+            config: {
+              mode: config.aiSummarization.mode,
+              provider: config.aiSummarization.provider,
+            },
+          })
+        }
       } else {
-        // Semantic search
-        const results = yield* semanticSearch(resolvedDir, query, {
-          limit,
-          threshold,
-        }).pipe(handleApiKeyError)
+        // Build provider config from CLI flag if specified
+        const cliTimeout = Option.getOrUndefined(timeout)
+        const providerConfig = Option.isSome(provider)
+          ? {
+              provider: provider.value as
+                | 'openai'
+                | 'ollama'
+                | 'lm-studio'
+                | 'openrouter'
+                | 'voyage',
+              timeout: cliTimeout,
+            }
+          : cliTimeout !== undefined
+            ? { provider: 'openai' as const, timeout: cliTimeout }
+            : undefined
+        // Semantic search with stats for below-threshold feedback
+        const refineTerms = refine.length > 0 ? refine : []
+        const fetchLimit =
+          refineTerms.length > 0 ? effectiveLimit * 5 : effectiveLimit
+        const semanticQuality = Option.getOrUndefined(quality) as
+          | SearchQuality
+          | undefined
+        const searchResult = yield* semanticSearchWithStats(indexRoot, query, {
+          limit: fetchLimit,
+          threshold: effectiveThreshold,
+          providerConfig,
+          quality: semanticQuality,
+          hyde,
+          contextBefore,
+          contextAfter,
+          ...(scopedPathPattern && { pathPattern: scopedPathPattern }),
+        })
+        let {
+          results,
+          belowThresholdCount,
+          belowThresholdHighest,
+          totalAvailable,
+        } = searchResult
+        // Apply refine filtering if terms provided (parallel with caching)
+        if (refineTerms.length > 0) {
+          const storage = createStorage(indexRoot)
+          const sectionIndex = yield* loadSectionIndex(storage)
+          if (sectionIndex) {
+            results = yield* filterResultsByRefineTerms(
+              indexRoot,
+              results,
+              refineTerms,
+              effectiveLimit,
+              (result) => {
+                const section = sectionIndex.sections[result.sectionId]
+                return section
+                  ? {
+                      documentPath: result.documentPath,
+                      startLine: section.startLine,
+                      endLine: section.endLine,
+                    }
+                  : null
+              },
+            )
+          }
+        }
         if (json) {
+          const moreAvailableSemantic =
+            totalAvailable !== undefined && totalAvailable > results.length
+              ? totalAvailable - results.length
+              : undefined
           const output = {
             mode: 'semantic',
             modeReason,
             query,
+            hyde,
             results,
+            belowThresholdCount,
+            belowThresholdHighest,
+            moreAvailable: moreAvailableSemantic,
           }
           yield* Console.log(formatJson(output, pretty))
         } else {
-          // Show mode with explanation for auto-detected modes
           const showSemanticReason = modeReason !== '--mode semantic'
           const semanticModeStr = showSemanticReason
             ? `${modeIndicator} (${modeReason})`
             : modeIndicator
-          yield* Console.log(`${semanticModeStr} Semantic search: "${query}"`)
-          yield* Console.log(`Results: ${results.length}`)
+          const hydeIndicator = hyde ? ' [HyDE]' : ''
+          yield* Console.log(
+            `${semanticModeStr}${hydeIndicator} Semantic search: "${query}"`,
+          )
+          // Show results count with "more available" indicator if results were limited
+          const moreAvailableSemantic =
+            totalAvailable !== undefined && totalAvailable > results.length
+              ? totalAvailable - results.length
+              : 0
+          if (moreAvailableSemantic > 0) {
+            yield* Console.log(
+              `Results: ${results.length} (${moreAvailableSemantic} more available, use --limit to see more)`,
+            )
+          } else {
+            yield* Console.log(`Results: ${results.length}`)
+          }
           yield* Console.log('')
           for (const result of results) {
             const similarity = (result.similarity * 100).toFixed(1)
             yield* Console.log(`  ${result.documentPath}`)
             yield* Console.log(`    ${result.heading} (${similarity}% match)`)
+            if (result.contextLines && result.contextLines.length > 0) {
+              yield* Console.log('')
+              for (const ctxLine of result.contextLines) {
+                const marker = ctxLine.isMatch ? '>' : ' '
+                yield* Console.log(
+                  `  ${marker} ${ctxLine.lineNumber}: ${ctxLine.line}`,
+                )
+              }
+            }
+            yield* Console.log('')
+          }
+          // Show below-threshold feedback when 0 results but content exists
+          if (
+            results.length === 0 &&
+            belowThresholdCount !== undefined &&
+            belowThresholdCount > 0 &&
+            belowThresholdHighest !== undefined
+          ) {
+            const highestPct = (belowThresholdHighest * 100).toFixed(1)
+            const suggestedThreshold = Math.max(
+              0.1,
+              belowThresholdHighest - 0.05,
+            ).toFixed(2)
+            yield* Console.log(
+              `Note: ${belowThresholdCount} results found below ${(effectiveThreshold * 100).toFixed(0)}% threshold (highest: ${highestPct}%)`,
+            )
+            yield* Console.log(
+              `Tip: Use --threshold ${suggestedThreshold} to see more results`,
+            )
             yield* Console.log('')
           }
-          // Show tip for keyword search alternative
           yield* Console.log('Tip: Use --mode keyword for exact text matching')
         }
+        // Summarization for semantic search
+        if (summarize && results.length > 0) {
+          const summarizableResults: SummarizableResult[] = results.map(
+            (r) => ({
+              documentPath: r.documentPath,
+              heading: r.heading,
+              similarity: r.similarity,
+            }),
+          )
+          yield* runSummarization({
+            results: summarizableResults,
+            query,
+            searchMode: 'semantic',
+            json,
+            yes,
+            stream,
+            config: {
+              mode: config.aiSummarization.mode,
+              provider: config.aiSummarization.provider,
+            },
+          })
+        }
       }
     }),
 ).pipe(Command.withDescription('Search by meaning or structure'))
+/**
+ * Input bundle shared by runSummarization and runSummarizationUnsafe.
+ */
+interface SummarizationOptions {
+  /** Search hits that get formatted into the summarizer input. */
+  readonly results: readonly SummarizableResult[]
+  /** The search query, forwarded to the prompt builder. */
+  readonly query: string
+  /** Which search mode produced the results; forwarded to the prompt builder. */
+  readonly searchMode: 'hybrid' | 'semantic' | 'keyword'
+  /** When true, human-readable console output is suppressed. */
+  readonly json: boolean
+  /** When true, the consent prompt shown for paid providers is skipped. */
+  readonly yes: boolean
+  /** When true, a summarizer exposing summarizeStream is asked to stream. */
+  readonly stream: boolean
+  /** Preferred summarizer selection, passed to getBestAvailableSummarizer. */
+  readonly config: Readonly<{
+    mode: 'cli' | 'api'
+    provider: CLIProviderName | APIProviderName
+  }>
+}
+/**
+ * Summarize search results with AI without ever failing the caller.
+ *
+ * Delegates to runSummarizationUnsafe and absorbs whatever error it raises,
+ * so search results that were already printed are unaffected. In
+ * human-readable mode the error is handed to displaySummarizationError; in
+ * JSON mode it is dropped without any output.
+ */
+const runSummarization = (
+  options: SummarizationOptions,
+): Effect.Effect<void, never> => {
+  // Turns a failure into a (possibly silent) side effect that always succeeds.
+  const reportFailure = (error: Error): Effect.Effect<void, never> =>
+    Effect.sync(() => {
+      if (options.json) {
+        return
+      }
+      displaySummarizationError(error)
+    })
+  return Effect.catchAll(runSummarizationUnsafe(options), reportFailure)
+}
+/**
+ * Internal implementation that may fail.
+ * Wrapped by runSummarization for graceful error handling.
+ *
+ * Flow: resolve a summarizer, format the results, estimate the cost, print
+ * the estimate (non-JSON mode only) and ask for consent on paid providers
+ * unless `yes` is set, then generate the summary.
+ *
+ * Streaming is only used for human-readable output: streamed chunks are
+ * written straight to stdout, which would corrupt machine-readable output,
+ * so JSON mode always takes the non-streaming path and emits one JSON object.
+ *
+ * Fails with an Error when no summarizer can be obtained or when the
+ * summarizer call rejects.
+ */
+const runSummarizationUnsafe = (
+  options: SummarizationOptions,
+): Effect.Effect<void, Error> =>
+  Effect.gen(function* () {
+    const { results, query, searchMode, json, yes, stream, config } = options
+    if (results.length === 0) {
+      if (!json) {
+        yield* Console.log('No results to summarize.')
+      }
+      return
+    }
+    // Get summarizer
+    const summarizerData = yield* Effect.tryPromise({
+      try: async () => {
+        const result = await getBestAvailableSummarizer({
+          mode: config.mode,
+          provider: config.provider,
+        })
+        if (!result) {
+          throw new Error('No summarization providers available')
+        }
+        return result
+      },
+      catch: (e) => new Error(`Failed to get summarizer: ${e}`),
+    })
+    const { summarizer, config: resolvedConfig } = summarizerData
+    // Format results for summary input
+    const resultsText = formatResultsForSummary(results)
+    // Estimate cost
+    const costEstimate = estimateSummaryCost(
+      resultsText,
+      resolvedConfig.mode,
+      resolvedConfig.provider,
+    )
+    // Single source for the cost label used in both JSON and text output
+    const costLabel = costEstimate.isPaid ? costEstimate.formattedCost : 'FREE'
+    // Display cost info
+    if (!json) {
+      if (costEstimate.isPaid) {
+        yield* Console.log('')
+        yield* Console.log('Cost Estimate:')
+        yield* Console.log(`  Provider: ${costEstimate.provider}`)
+        yield* Console.log(
+          `  Input tokens: ~${costEstimate.inputTokens.toLocaleString()}`,
+        )
+        yield* Console.log(
+          `  Output tokens: ~${costEstimate.outputTokens.toLocaleString()}`,
+        )
+        yield* Console.log(`  Estimated cost: ${costEstimate.formattedCost}`)
+        // Get user consent if needed
+        if (!yes) {
+          const answer = yield* Effect.promise(() =>
+            promptUser('Continue with summarization? [Y/n]: '),
+          )
+          // The prompt advertises "[Y/n]", so accept "N", "No", " n " as well.
+          // NOTE(review): promptUser may already normalize its result; this is
+          // defensive and harmless if it does.
+          const normalizedAnswer = answer.trim().toLowerCase()
+          if (normalizedAnswer === 'n' || normalizedAnswer === 'no') {
+            yield* Console.log('Summarization cancelled.')
+            return
+          }
+        }
+      } else {
+        yield* Console.log('')
+        yield* Console.log(
+          `Using ${resolvedConfig.provider} (subscription - FREE)`,
+        )
+      }
+    }
+    // Build prompt
+    const prompt = buildPrompt({
+      query,
+      resultCount: results.length,
+      searchMode,
+    })
+    // Generate summary
+    if (!json) {
+      yield* Console.log('')
+      yield* Console.log('--- AI Summary ---')
+      yield* Console.log('')
+    }
+    const startTime = Date.now()
+    // Never stream in JSON mode: raw chunks on stdout would break the JSON
+    // output and the summary object below would never be emitted.
+    if (stream && !json && 'summarizeStream' in summarizer) {
+      // Streaming output
+      yield* Effect.tryPromise({
+        try: () =>
+          (
+            summarizer as {
+              summarizeStream: (
+                input: string,
+                prompt: string,
+                options: { onChunk: (chunk: string) => void },
+              ) => Promise<void>
+            }
+          ).summarizeStream(resultsText, prompt, {
+            onChunk: (chunk) => {
+              process.stdout.write(chunk)
+            },
+          }),
+        catch: (e) => new Error(`Summarization failed: ${e}`),
+      })
+      yield* Console.log('') // Final newline
+    } else {
+      // Non-streaming output
+      const summaryResult = yield* Effect.tryPromise({
+        try: () => summarizer.summarize(resultsText, prompt),
+        catch: (e) => new Error(`Summarization failed: ${e}`),
+      })
+      if (json) {
+        yield* Console.log(
+          JSON.stringify(
+            {
+              summary: summaryResult.summary,
+              provider: summaryResult.provider,
+              mode: summaryResult.mode,
+              durationMs: summaryResult.durationMs,
+              cost: costLabel,
+            },
+            null,
+            2,
+          ),
+        )
+      } else {
+        yield* Console.log(summaryResult.summary)
+      }
+    }
+    const durationMs = Date.now() - startTime
+    if (!json) {
+      yield* Console.log('')
+      yield* Console.log('------------------')
+      yield* Console.log(
+        `Generated in ${(durationMs / 1000).toFixed(1)}s | ${costLabel}`,
+      )
+    }
+  })
 /**
  * Handle the case when embeddings don't exist.
  * Returns true if embeddings were created (or already exist), false to fall back to keyword search.
@@ -344,8 +1171,11 @@ const handleMissingEmbeddings = (
 ): Effect.Effect<boolean, Error> =>
   Effect.gen(function* () {
     // Get cost estimate
+    // Note: We gracefully handle errors since this is an optional auto-index feature.
+    // IndexNotFoundError is expected if index doesn't exist.
     const estimate = yield* estimateEmbeddingCost(resolvedDir).pipe(
-      Effect.catchAll(() => Effect.succeed(null)),
+      Effect.map((r): EmbeddingEstimate | null => r),
+      Effect.catchTags(createCostEstimateErrorHandler()),
     )
     if (!estimate) {
@@ -364,18 +1194,19 @@ const handleMissingEmbeddings = (
         )
       }
+      // Note: Graceful degradation - embedding errors fall back to keyword search
       const result = yield* buildEmbeddings(resolvedDir, {
         force: false,
         onFileProgress: (progress) => {
           if (!json) {
-            process.stdout.write(
-              `\r  [${progress.fileIndex}/${progress.totalFiles}] ${progress.filePath}...`,
+            console.log(
+              `  [${progress.fileIndex}/${progress.totalFiles}] ${progress.filePath}`,
             )
           }
         },
       }).pipe(
-        handleApiKeyError,
-        Effect.catchAll(() => Effect.succeed(null)),
+        Effect.map((r): BuildEmbeddingsResult | null => r),
+        Effect.catchTags(createEmbeddingErrorHandler({ silent: json })),
       )
       if (!result) {
@@ -383,7 +1214,6 @@ const handleMissingEmbeddings = (
       }
       if (!json) {
-        process.stdout.write(`\r${' '.repeat(80)}\r`)
         yield* Console.log(
           `Index created (${result.sectionsEmbedded} sections, $${result.cost.toFixed(6)})`,
         )
@@ -415,18 +1245,19 @@ const handleMissingEmbeddings = (
         yield* Console.log('Building embeddings...')
       }
+      // Note: Graceful degradation - embedding errors fall back to keyword search
       const result = yield* buildEmbeddings(resolvedDir, {
         force: false,
         onFileProgress: (progress) => {
           if (!json) {
-            process.stdout.write(
-              `\r  [${progress.fileIndex}/${progress.totalFiles}] ${progress.filePath}...`,
+            console.log(
+              `  [${progress.fileIndex}/${progress.totalFiles}] ${progress.filePath}`,
             )
           }
         },
       }).pipe(
-        handleApiKeyError,
-        Effect.catchAll(() => Effect.succeed(null)),
+        Effect.map((r): BuildEmbeddingsResult | null => r),
+        Effect.catchTags(createEmbeddingErrorHandler({ silent: json })),
       )
       if (!result) {
@@ -434,7 +1265,6 @@ const handleMissingEmbeddings = (
       }
       if (!json) {
-        process.stdout.write(`\r${' '.repeat(80)}\r`)
         yield* Console.log(
           `Index created (${result.sectionsEmbedded} sections, $${result.cost.toFixed(6)})`,
         )