npm - mdcontext - Versions diffs - 0.1.0 → 0.2.0 - Mend

mdcontext 0.1.0 → 0.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (251) hide show

package/.changeset/config.json +9 -9
package/.claude/settings.local.json +25 -0
package/.github/workflows/claude-code-review.yml +44 -0
package/.github/workflows/claude.yml +85 -0
package/CONTRIBUTING.md +186 -0
package/NOTES/NOTES +44 -0
package/README.md +206 -3
package/biome.json +1 -1
package/dist/chunk-23UPXDNL.js +3044 -0
package/dist/chunk-2W7MO2DL.js +1366 -0
package/dist/chunk-3NUAZGMA.js +1689 -0
package/dist/chunk-7TOWB2XB.js +366 -0
package/dist/chunk-7XOTOADQ.js +3065 -0
package/dist/chunk-AH2PDM2K.js +3042 -0
package/dist/chunk-BNXWSZ63.js +3742 -0
package/dist/chunk-BTL5DJVU.js +3222 -0
package/dist/chunk-HDHYG7E4.js +104 -0
package/dist/chunk-HLR4KZBP.js +3234 -0
package/dist/chunk-IP3FRFEB.js +1045 -0
package/dist/chunk-KHU56VDO.js +3042 -0
package/dist/chunk-KRYIFLQR.js +85 -89
package/dist/chunk-LBSDNLEM.js +287 -0
package/dist/chunk-MNTQ7HCP.js +2643 -0
package/dist/chunk-MUJELQQ6.js +1387 -0
package/dist/chunk-MXJGMSLV.js +2199 -0
package/dist/chunk-N6QJGC3Z.js +2636 -0
package/dist/chunk-OBELGBPM.js +1713 -0
package/dist/chunk-OT7R5XTA.js +3192 -0
package/dist/chunk-P7X4RA2T.js +106 -0
package/dist/chunk-PIDUQNC2.js +3185 -0
package/dist/chunk-POGCDIH4.js +3187 -0
package/dist/chunk-PSIEOQGZ.js +3043 -0
package/dist/chunk-PVRT3IHA.js +3238 -0
package/dist/chunk-QNN4TT23.js +1430 -0
package/dist/chunk-RE3R45RJ.js +3042 -0
package/dist/chunk-S7E6TFX6.js +718 -657
package/dist/chunk-SG6GLU4U.js +1378 -0
package/dist/chunk-SJCDV2ST.js +274 -0
package/dist/chunk-SYE5XLF3.js +104 -0
package/dist/chunk-T5VLYBZD.js +103 -0
package/dist/chunk-TOQB7VWU.js +3238 -0
package/dist/chunk-VFNMZ4ZQ.js +3228 -0
package/dist/chunk-VVTGZNBT.js +1533 -1423
package/dist/chunk-W7Q4RFEV.js +104 -0
package/dist/chunk-XTYYVRLO.js +3190 -0
package/dist/chunk-Y6MDYVJD.js +3063 -0
package/dist/cli/main.js +4072 -629
package/dist/index.d.ts +420 -33
package/dist/index.js +8 -15
package/dist/mcp/server.js +103 -7
package/dist/schema-BAWSG7KY.js +22 -0
package/dist/schema-E3QUPL26.js +20 -0
package/dist/schema-EHL7WUT6.js +20 -0
package/docs/019-USAGE.md +44 -5
package/docs/020-current-implementation.md +8 -8
package/docs/021-DOGFOODING-FINDINGS.md +1 -1
package/docs/CONFIG.md +1123 -0
package/docs/ERRORS.md +383 -0
package/docs/summarization.md +320 -0
package/justfile +40 -0
package/package.json +39 -33
package/research/INDEX.md +315 -0
package/research/code-review/README.md +90 -0
package/research/code-review/cli-error-handling-review.md +979 -0
package/research/code-review/code-review-validation-report.md +464 -0
package/research/code-review/main-ts-review.md +1128 -0
package/research/config-docs/SUMMARY.md +357 -0
package/research/config-docs/TEST-RESULTS.md +776 -0
package/research/config-docs/TODO.md +542 -0
package/research/config-docs/analysis.md +744 -0
package/research/config-docs/fix-validation.md +502 -0
package/research/config-docs/help-audit.md +264 -0
package/research/config-docs/help-system-analysis.md +890 -0
package/research/frontmatter/COMMENTS-ARE-SKIPPED.md +149 -0
package/research/frontmatter/LLM-CODE-NAVIGATION.md +276 -0
package/research/issue-review.md +603 -0
package/research/llm-summarization/agent-cli-tools-2026.md +1082 -0
package/research/llm-summarization/alternative-providers-2026.md +1428 -0
package/research/llm-summarization/anthropic-2026.md +367 -0
package/research/llm-summarization/claude-cli-integration.md +1706 -0
package/research/llm-summarization/cli-integration-patterns.md +3155 -0
package/research/llm-summarization/openai-2026.md +473 -0
package/research/llm-summarization/openai-compatible-providers-2026.md +1022 -0
package/research/llm-summarization/opencode-cli-integration.md +1552 -0
package/research/llm-summarization/prompt-engineering-2026.md +1426 -0
package/research/llm-summarization/prototype-results.md +56 -0
package/research/llm-summarization/provider-switching-patterns-2026.md +2153 -0
package/research/llm-summarization/typescript-llm-libraries-2026.md +2436 -0
package/research/mdcontext-pudding/00-EXECUTIVE-SUMMARY.md +282 -0
package/research/mdcontext-pudding/01-index-embed.md +956 -0
package/research/mdcontext-pudding/02-search-COMMANDS.md +142 -0
package/research/mdcontext-pudding/02-search-SUMMARY.md +146 -0
package/research/mdcontext-pudding/02-search.md +970 -0
package/research/mdcontext-pudding/03-context.md +779 -0
package/research/mdcontext-pudding/04-navigation-and-analytics.md +803 -0
package/research/mdcontext-pudding/04-tree.md +704 -0
package/research/mdcontext-pudding/05-config.md +1038 -0
package/research/mdcontext-pudding/06-links-summary.txt +87 -0
package/research/mdcontext-pudding/06-links.md +679 -0
package/research/mdcontext-pudding/07-stats.md +693 -0
package/research/mdcontext-pudding/BUG-FIX-PLAN.md +388 -0
package/research/mdcontext-pudding/P0-BUG-VALIDATION.md +167 -0
package/research/mdcontext-pudding/README.md +168 -0
package/research/mdcontext-pudding/TESTING-SUMMARY.md +128 -0
package/research/research-quality-review.md +834 -0
package/research/semantic-search/embedding-text-analysis.md +156 -0
package/research/semantic-search/multi-word-failure-reproduction.md +171 -0
package/research/semantic-search/query-processing-analysis.md +207 -0
package/research/semantic-search/root-cause-and-solution.md +114 -0
package/research/semantic-search/threshold-validation-report.md +69 -0
package/research/semantic-search/vector-search-analysis.md +63 -0
package/research/test-path-issues.md +276 -0
package/review/ALP-76/1-error-type-design.md +962 -0
package/review/ALP-76/2-error-handling-patterns.md +906 -0
package/review/ALP-76/3-error-presentation.md +624 -0
package/review/ALP-76/4-test-coverage.md +625 -0
package/review/ALP-76/5-migration-completeness.md +440 -0
package/review/ALP-76/6-effect-best-practices.md +755 -0
package/scripts/apply-branch-protection.sh +47 -0
package/scripts/branch-protection-templates.json +79 -0
package/scripts/prototype-summarization.ts +346 -0
package/scripts/rebuild-hnswlib.js +32 -37
package/scripts/setup-branch-protection.sh +64 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/.mdcontext/active-provider.json +7 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/.mdcontext/bm25.json +541 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/.mdcontext/bm25.meta.json +5 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/.mdcontext/config.json +8 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/.mdcontext/embeddings/openai_text-embedding-3-small_512/vectors.bin +0 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/.mdcontext/embeddings/openai_text-embedding-3-small_512/vectors.meta.bin +0 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/.mdcontext/indexes/documents.json +60 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/.mdcontext/indexes/links.json +13 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/.mdcontext/indexes/sections.json +1197 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/configuration-management.md +99 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/distributed-systems.md +92 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/error-handling.md +78 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/failure-automation.md +55 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/job-context.md +69 -0
package/src/__tests__/fixtures/semantic-search/multi-word-corpus/process-orchestration.md +99 -0
package/src/cli/argv-preprocessor.test.ts +2 -2
package/src/cli/cli.test.ts +230 -33
package/src/cli/commands/config-cmd.ts +642 -0
package/src/cli/commands/context.ts +97 -9
package/src/cli/commands/duplicates.ts +122 -0
package/src/cli/commands/embeddings.ts +529 -0
package/src/cli/commands/index-cmd.ts +210 -30
package/src/cli/commands/index.ts +3 -0
package/src/cli/commands/search.ts +894 -64
package/src/cli/commands/stats.ts +3 -0
package/src/cli/commands/tree.ts +26 -5
package/src/cli/config-layer.ts +176 -0
package/src/cli/error-handler.test.ts +235 -0
package/src/cli/error-handler.ts +655 -0
package/src/cli/flag-schemas.ts +66 -0
package/src/cli/help.ts +209 -7
package/src/cli/main.ts +348 -58
package/src/cli/options.ts +10 -0
package/src/cli/shared-error-handling.ts +199 -0
package/src/cli/utils.ts +150 -17
package/src/config/file-provider.test.ts +320 -0
package/src/config/file-provider.ts +273 -0
package/src/config/index.ts +72 -0
package/src/config/integration.test.ts +667 -0
package/src/config/precedence.test.ts +277 -0
package/src/config/precedence.ts +451 -0
package/src/config/schema.test.ts +414 -0
package/src/config/schema.ts +603 -0
package/src/config/service.test.ts +320 -0
package/src/config/service.ts +243 -0
package/src/config/testing.test.ts +264 -0
package/src/config/testing.ts +110 -0
package/src/core/types.ts +6 -33
package/src/duplicates/detector.test.ts +183 -0
package/src/duplicates/detector.ts +414 -0
package/src/duplicates/index.ts +18 -0
package/src/embeddings/embedding-namespace.test.ts +300 -0
package/src/embeddings/embedding-namespace.ts +947 -0
package/src/embeddings/heading-boost.test.ts +222 -0
package/src/embeddings/hnsw-build-options.test.ts +198 -0
package/src/embeddings/hyde.test.ts +272 -0
package/src/embeddings/hyde.ts +264 -0
package/src/embeddings/index.ts +2 -0
package/src/embeddings/openai-provider.ts +332 -83
package/src/embeddings/pricing.json +22 -0
package/src/embeddings/provider-constants.ts +204 -0
package/src/embeddings/provider-errors.test.ts +967 -0
package/src/embeddings/provider-errors.ts +565 -0
package/src/embeddings/provider-factory.test.ts +240 -0
package/src/embeddings/provider-factory.ts +225 -0
package/src/embeddings/provider-integration.test.ts +788 -0
package/src/embeddings/query-preprocessing.test.ts +187 -0
package/src/embeddings/semantic-search-threshold.test.ts +508 -0
package/src/embeddings/semantic-search.ts +780 -93
package/src/embeddings/types.ts +293 -16
package/src/embeddings/vector-store.ts +486 -77
package/src/embeddings/voyage-provider.ts +313 -0
package/src/errors/errors.test.ts +845 -0
package/src/errors/index.ts +533 -0
package/src/index/ignore-patterns.test.ts +354 -0
package/src/index/ignore-patterns.ts +305 -0
package/src/index/indexer.ts +286 -48
package/src/index/storage.ts +94 -30
package/src/index/types.ts +40 -2
package/src/index/watcher.ts +67 -9
package/src/index.ts +22 -0
package/src/integration/search-keyword.test.ts +678 -0
package/src/mcp/server.ts +135 -6
package/src/parser/parser.ts +18 -19
package/src/parser/section-filter.test.ts +277 -0
package/src/parser/section-filter.ts +125 -3
package/src/search/__tests__/hybrid-search.test.ts +650 -0
package/src/search/bm25-store.ts +366 -0
package/src/search/cross-encoder.test.ts +253 -0
package/src/search/cross-encoder.ts +406 -0
package/src/search/fuzzy-search.test.ts +419 -0
package/src/search/fuzzy-search.ts +273 -0
package/src/search/hybrid-search.ts +448 -0
package/src/search/path-matcher.test.ts +276 -0
package/src/search/path-matcher.ts +33 -0
package/src/search/searcher.test.ts +99 -1
package/src/search/searcher.ts +189 -67
package/src/search/wink-bm25.d.ts +30 -0
package/src/summarization/cli-providers/claude.ts +202 -0
package/src/summarization/cli-providers/detection.test.ts +273 -0
package/src/summarization/cli-providers/detection.ts +118 -0
package/src/summarization/cli-providers/index.ts +8 -0
package/src/summarization/cost.test.ts +139 -0
package/src/summarization/cost.ts +102 -0
package/src/summarization/error-handler.test.ts +127 -0
package/src/summarization/error-handler.ts +111 -0
package/src/summarization/index.ts +102 -0
package/src/summarization/pipeline.test.ts +498 -0
package/src/summarization/pipeline.ts +231 -0
package/src/summarization/prompts.test.ts +269 -0
package/src/summarization/prompts.ts +133 -0
package/src/summarization/provider-factory.test.ts +396 -0
package/src/summarization/provider-factory.ts +178 -0
package/src/summarization/types.ts +184 -0
package/src/summarize/summarizer.ts +104 -35
package/src/types/huggingface-transformers.d.ts +66 -0
package/tests/fixtures/cli/.mdcontext/active-provider.json +7 -0
package/tests/fixtures/cli/.mdcontext/embeddings/openai_text-embedding-3-small_512/vectors.bin +0 -0
package/tests/fixtures/cli/.mdcontext/embeddings/openai_text-embedding-3-small_512/vectors.meta.bin +0 -0
package/tests/fixtures/cli/.mdcontext/indexes/documents.json +4 -4
package/tests/fixtures/cli/.mdcontext/indexes/sections.json +14 -0
package/tests/integration/embed-index.test.ts +712 -0
package/tests/integration/search-context.test.ts +469 -0
package/tests/integration/search-semantic.test.ts +522 -0
package/vitest.config.ts +1 -6
package/AGENTS.md +0 -46
package/tests/fixtures/cli/.mdcontext/vectors.bin +0 -0
package/tests/fixtures/cli/.mdcontext/vectors.meta.json +0 -1264

package/src/summarization/types.ts ADDED Viewed

@@ -0,0 +1,184 @@
+/**
+ * Summarization Module Types
+ *
+ * Core interfaces for AI-powered summarization of search results.
+ * Supports both CLI-based providers (free with subscriptions) and
+ * API-based providers (pay-per-use via Vercel AI SDK).
+ */
+/**
+ * Summarization mode - CLI providers are free, API providers cost money
+ */
+export type SummarizationMode = 'cli' | 'api'
+/**
+ * Known CLI tools that can be used for summarization
+ */
+export type CLIProviderName =
+  | 'claude'
+  | 'copilot'
+  | 'cline'
+  | 'aider'
+  | 'opencode'
+  | 'amp'
+/**
+ * Known API providers for summarization
+ */
+export type APIProviderName =
+  | 'deepseek'
+  | 'anthropic'
+  | 'openai'
+  | 'gemini'
+  | 'qwen'
+/**
+ * Information about a detected CLI tool
+ */
+export interface CLIInfo {
+  /** Internal name identifier */
+  readonly name: CLIProviderName
+  /** Command to execute */
+  readonly command: string
+  /** Display name for UI */
+  readonly displayName: string
+  /** Arguments to pass to the CLI for summarization */
+  readonly args: readonly string[]
+  /** Whether to use stdin for input */
+  readonly useStdin: boolean
+}
+/**
+ * API provider pricing information
+ */
+export interface APIProviderPricing {
+  /** Provider name */
+  readonly provider: APIProviderName
+  /** Display name */
+  readonly displayName: string
+  /** Cost per million input tokens */
+  readonly inputCostPer1M: number
+  /** Cost per million output tokens */
+  readonly outputCostPer1M: number
+  /** Default model to use */
+  readonly defaultModel: string
+  /** Base URL for the API */
+  readonly baseURL: string
+  /** Environment variable for API key */
+  readonly apiKeyEnvVar: string
+}
+/**
+ * Result from a summarization operation
+ */
+export interface SummaryResult {
+  /** The generated summary text */
+  readonly summary: string
+  /** Provider that generated the summary */
+  readonly provider: CLIProviderName | APIProviderName
+  /** Mode used (cli or api) */
+  readonly mode: SummarizationMode
+  /** Estimated cost in USD (0 for CLI providers) */
+  readonly estimatedCost: number
+  /** Time taken in milliseconds */
+  readonly durationMs: number
+  /** Token count estimates (if available) */
+  readonly tokens?: {
+    readonly input: number
+    readonly output: number
+  }
+}
+/**
+ * Core summarizer interface - simple and focused
+ *
+ * Each provider just needs to implement this interface.
+ * CLI providers return 0 for cost, API providers calculate actual costs.
+ */
+export interface Summarizer {
+  /** Generate a summary from input text */
+  summarize(input: string, prompt: string): Promise<SummaryResult>
+  /** Estimate cost before running (optional, defaults to 0 for CLI) */
+  estimateCost?(inputTokens: number): number
+  /** Check if the provider is available/configured */
+  isAvailable(): Promise<boolean>
+}
+/**
+ * Options for streaming summarization
+ */
+export interface StreamOptions {
+  /** Callback for each chunk of text */
+  onChunk: (chunk: string) => void
+  /** Callback when streaming completes */
+  onComplete?: (result: SummaryResult) => void
+  /** Callback on error */
+  onError?: (error: Error) => void
+}
+/**
+ * Extended summarizer interface with streaming support
+ */
+export interface StreamingSummarizer extends Summarizer {
+  /** Generate a summary with streaming output */
+  summarizeStream(
+    input: string,
+    prompt: string,
+    options: StreamOptions,
+  ): Promise<void>
+}
+/**
+ * Configuration for AI summarization (distinct from existing SummarizationConfig)
+ *
+ * This configures the AI provider for generating summaries, not the
+ * token budget settings in the existing SummarizationConfig.
+ */
+export interface AISummarizationConfig {
+  /** Mode: 'cli' (free) or 'api' (pay-per-use) */
+  readonly mode: SummarizationMode
+  /** Provider name */
+  readonly provider: CLIProviderName | APIProviderName
+  /** Model name (for API providers) */
+  readonly model?: string
+  /** Enable streaming output */
+  readonly stream?: boolean
+  /** Custom API base URL */
+  readonly baseURL?: string
+  /** API key (for API providers, usually from env) */
+  readonly apiKey?: string
+}
+/**
+ * Factory function type for creating summarizers
+ */
+export type SummarizerFactory = (
+  config: AISummarizationConfig,
+) => Promise<Summarizer>
+/**
+ * Error types specific to summarization
+ */
+export class SummarizationError extends Error {
+  constructor(
+    message: string,
+    public readonly code: SummarizationErrorCode,
+    public readonly provider?: string,
+    public readonly cause?: Error,
+  ) {
+    super(message)
+    this.name = 'SummarizationError'
+  }
+}
+export type SummarizationErrorCode =
+  | 'PROVIDER_NOT_FOUND'
+  | 'PROVIDER_NOT_AVAILABLE'
+  | 'CLI_EXECUTION_FAILED'
+  | 'API_REQUEST_FAILED'
+  | 'RATE_LIMITED'
+  | 'INVALID_RESPONSE'
+  | 'TIMEOUT'
+  | 'NO_API_KEY'

package/src/summarize/summarizer.ts CHANGED Viewed

@@ -7,11 +7,19 @@
 import * as fs from 'node:fs/promises'
 import * as path from 'node:path'
 import { Effect } from 'effect'
-import type { MdDocument, MdSection } from '../core/types.js'
+import type { MdDocument, MdSection, ParseError } from '../core/types.js'
+import type { FileReadError } from '../errors/index.js'
 import { parseFile } from '../parser/parser.js'
+import { filterDocumentSections } from '../parser/section-filter.js'
 import { countTokensApprox } from '../utils/tokens.js'
 import { formatSummary as formatSummaryImpl } from './formatters.js'
+/**
+ * Error type from parseFile function
+ * Uses centralized errors from src/errors/index.ts
+ */
+type ParseFileError = ParseError | FileReadError
 // ============================================================================
 // Types
 // ============================================================================
@@ -23,6 +31,8 @@ export interface SummarizeOptions {
   readonly level?: CompressionLevel | undefined
   /** Maximum tokens for output */
   readonly maxTokens?: number | undefined
+  /** Section patterns to exclude from output */
+  readonly exclude?: readonly string[] | undefined
 }
 export interface SectionSummary {
@@ -56,6 +66,8 @@ export interface AssembleContextOptions {
   readonly budget: number
   /** Compression level for each source */
   readonly level?: CompressionLevel | undefined
+  /** Section patterns to exclude from output */
+  readonly exclude?: readonly string[] | undefined
 }
 export interface AssembledContext {
@@ -375,14 +387,27 @@ export const summarizeDocument = (
   return result
 }
+/**
+ * Summarize a markdown file
+ *
+ * @throws ParseError - File content cannot be parsed
+ * @throws FileReadError - File cannot be read from filesystem
+ */
 export const summarizeFile = (
   filePath: string,
   options: SummarizeOptions = {},
-): Effect.Effect<DocumentSummary, Error> =>
+): Effect.Effect<DocumentSummary, ParseFileError> =>
   Effect.gen(function* () {
-    const document = yield* parseFile(filePath).pipe(
-      Effect.mapError((e) => new Error(`${e._tag}: ${e.message}`)),
-    )
+    let document = yield* parseFile(filePath)
+    // Apply exclusion filter if patterns provided
+    if (options.exclude && options.exclude.length > 0) {
+      const { document: filteredDoc } = filterDocumentSections(
+        document,
+        options.exclude,
+      )
+      document = filteredDoc
+    }
     return summarizeDocument(document, options)
   })
@@ -397,14 +422,21 @@ export { type FormatSummaryOptions, formatSummary } from './formatters.js'
 // Multi-Document Context Assembly
 // ============================================================================
+/**
+ * Assemble context from multiple markdown files within a token budget
+ *
+ * @throws ParseError - File content cannot be parsed
+ * @throws FileReadError - File cannot be read from filesystem
+ */
 export const assembleContext = (
   rootPath: string,
   sourcePaths: readonly string[],
   options: AssembleContextOptions,
-): Effect.Effect<AssembledContext, Error> =>
+): Effect.Effect<AssembledContext, ParseFileError> =>
   Effect.gen(function* () {
     const budget = options.budget
     const level = options.level ?? 'summary'
+    const excludePatterns = options.exclude ?? []
     const sources: SourceContext[] = []
     const overflow: string[] = []
@@ -418,33 +450,65 @@ export const assembleContext = (
         ? sourcePath
         : path.join(rootPath, sourcePath)
-      try {
-        const summary = yield* summarizeFile(resolvedPath, {
-          level,
-          maxTokens: perSourceBudget,
-        })
-        const content = formatSummaryImpl(summary)
-        // Count actual formatted output tokens, not pre-format summary tokens
-        const tokens = countTokensApprox(content)
+      // Use catchAll for graceful degradation - individual file failures
+      // shouldn't stop the entire context assembly operation
+      const summaryResult = yield* summarizeFile(resolvedPath, {
+        level,
+        maxTokens: perSourceBudget,
+        exclude: excludePatterns,
+      }).pipe(
+        Effect.map((s): DocumentSummary | null => s),
+        // Log error for observability before gracefully degrading
+        Effect.tapError((error) =>
+          Effect.logError(`Failed to summarize ${sourcePath}`, error),
+        ),
+        // Note: catchAll intentional for batch processing - individual file
+        // failures add to overflow instead of stopping assembly
+        Effect.catchAll(() => Effect.succeed(null as DocumentSummary | null)),
+      )
+      if (!summaryResult) {
+        overflow.push(sourcePath)
+        continue
+      }
-        if (totalTokens + tokens <= budget) {
-          sources.push({
-            path: path.relative(rootPath, resolvedPath),
-            title: summary.title,
-            tokens,
-            content,
-          })
-          totalTokens += tokens
-        } else {
-          // Over budget
-          const remaining = budget - totalTokens
-          if (remaining > MIN_PARTIAL_BUDGET) {
-            // Include partial if we have some room
-            const briefSummary = yield* summarizeFile(resolvedPath, {
-              level: 'brief',
-              maxTokens: remaining,
-            })
+      const summary = summaryResult
+      const content = formatSummaryImpl(summary)
+      // Count actual formatted output tokens, not pre-format summary tokens
+      const tokens = countTokensApprox(content)
+      if (totalTokens + tokens <= budget) {
+        sources.push({
+          path: path.relative(rootPath, resolvedPath),
+          title: summary.title,
+          tokens,
+          content,
+        })
+        totalTokens += tokens
+      } else {
+        // Over budget
+        const remaining = budget - totalTokens
+        if (remaining > MIN_PARTIAL_BUDGET) {
+          // Include partial if we have some room
+          const briefSummary = yield* summarizeFile(resolvedPath, {
+            level: 'brief',
+            maxTokens: remaining,
+            exclude: excludePatterns,
+          }).pipe(
+            Effect.map((s): DocumentSummary | null => s),
+            // Log error for observability before gracefully degrading
+            Effect.tapError((error) =>
+              Effect.logError(
+                `Failed to create brief summary for ${sourcePath}`,
+                error,
+              ),
+            ),
+            Effect.catchAll(() =>
+              Effect.succeed(null as DocumentSummary | null),
+            ),
+          )
+          if (briefSummary) {
             const briefContent = formatSummaryImpl(briefSummary)
             // Count actual formatted output tokens, not pre-format summary tokens
             const briefTokens = countTokensApprox(briefContent)
@@ -459,10 +523,9 @@ export const assembleContext = (
           } else {
             overflow.push(path.relative(rootPath, resolvedPath))
           }
+        } else {
+          overflow.push(path.relative(rootPath, resolvedPath))
         }
-      } catch (_e) {
-        // Skip files that can't be processed
-        overflow.push(sourcePath)
       }
     }
@@ -500,8 +563,14 @@ export const measureReduction = async (
   const originalTokens = countTokensApprox(originalContent)
   // Get summary
+  // Note: catchAll is intentional - measureReduction is a utility function
+  // where failures should return default values (no reduction) rather than throw
   const result = await Effect.runPromise(
     summarizeFile(filePath, { level }).pipe(
+      // Log error for observability before gracefully degrading
+      Effect.tapError((error) =>
+        Effect.logError(`Failed to measure reduction for ${filePath}`, error),
+      ),
       Effect.catchAll(() => Effect.succeed(null)),
     ),
   )

package/src/types/huggingface-transformers.d.ts ADDED Viewed

@@ -0,0 +1,66 @@
+/**
+ * Type declarations for @huggingface/transformers (optional dependency)
+ *
+ * This package is an optional peer dependency used for cross-encoder re-ranking.
+ * Users who want re-ranking can install it with: npm install @huggingface/transformers
+ */
+declare module '@huggingface/transformers' {
+  export interface ProgressCallbackData {
+    file?: string
+    progress?: number
+  }
+  export type ProgressCallback = (data: ProgressCallbackData) => void
+  export interface AutoModelOptions {
+    progress_callback?: ProgressCallback | undefined
+  }
+  export interface AutoTokenizerOptions {
+    progress_callback?: ProgressCallback | undefined
+  }
+  export interface TokenizerOutput {
+    input_ids: unknown
+    attention_mask: unknown
+  }
+  export interface ModelOutput {
+    logits: {
+      data: Float32Array
+    }
+  }
+  export const env: {
+    cacheDir: string
+  }
+  export type AutoTokenizerInstance = (
+    texts: string[],
+    options: {
+      text_pair?: string[]
+      padding?: boolean
+      truncation?: boolean
+      max_length?: number
+    },
+  ) => TokenizerOutput
+  export type AutoModelInstance = (
+    input: TokenizerOutput,
+  ) => Promise<ModelOutput>
+  export const AutoTokenizer: {
+    from_pretrained(
+      model: string,
+      options?: AutoTokenizerOptions,
+    ): Promise<AutoTokenizerInstance>
+  }
+  export const AutoModelForSequenceClassification: {
+    from_pretrained(
+      model: string,
+      options?: AutoModelOptions,
+    ): Promise<AutoModelInstance>
+  }
+}

package/tests/fixtures/cli/.mdcontext/active-provider.json ADDED Viewed

@@ -0,0 +1,7 @@
+{
+  "namespace": "openai_text-embedding-3-small_512",
+  "provider": "openai",
+  "model": "text-embedding-3-small",
+  "dimensions": 512,
+  "activatedAt": "2026-01-27T07:43:50.361Z"
+}

package/tests/fixtures/cli/.mdcontext/embeddings/openai_text-embedding-3-small_512/vectors.bin ADDED Viewed

Binary file

package/tests/fixtures/cli/.mdcontext/embeddings/openai_text-embedding-3-small_512/vectors.meta.bin ADDED Viewed

Binary file

package/tests/fixtures/cli/.mdcontext/indexes/documents.json CHANGED Viewed

@@ -1,12 +1,12 @@
 {
   "version": 1,
-  "rootPath": "/Users/alphab/Dev/LLM/DEV/mdcontext/tests/fixtures/cli",
+  "rootPath": "tests/fixtures/cli",
   "documents": {
     "README.md": {
       "id": "04c6e90faac2",
       "path": "README.md",
       "title": "Test Project",
-      "mtime": 1768999918845,
+      "mtime": 1769492431399,
       "hash": "54872b0fdbf6858a",
       "tokenCount": 76,
       "sectionCount": 2
@@ -15,7 +15,7 @@
       "id": "392e93c0f22d",
       "path": "api-reference.md",
       "title": "API Reference",
-      "mtime": 1768999919391,
+      "mtime": 1769492431399,
       "hash": "4a879da54a831235",
       "tokenCount": 109,
       "sectionCount": 2
@@ -24,7 +24,7 @@
       "id": "b6885e1f8555",
       "path": "getting-started.md",
       "title": "Getting Started",
-      "mtime": 1769013198631,
+      "mtime": 1769492431400,
       "hash": "2d44a41d5d2579f2",
       "tokenCount": 66,
       "sectionCount": 3

package/tests/fixtures/cli/.mdcontext/indexes/sections.json CHANGED Viewed

@@ -110,6 +110,8 @@
       "04c6e90faac2-test-project",
       "04c6e90faac2-test-project",
       "04c6e90faac2-test-project",
+      "04c6e90faac2-test-project",
+      "04c6e90faac2-test-project",
       "04c6e90faac2-test-project"
     ],
     "overview": [
@@ -128,6 +130,8 @@
       "04c6e90faac2-overview",
       "04c6e90faac2-overview",
       "04c6e90faac2-overview",
+      "04c6e90faac2-overview",
+      "04c6e90faac2-overview",
       "04c6e90faac2-overview"
     ],
     "api reference": [
@@ -146,6 +150,8 @@
       "392e93c0f22d-api-reference",
       "392e93c0f22d-api-reference",
       "392e93c0f22d-api-reference",
+      "392e93c0f22d-api-reference",
+      "392e93c0f22d-api-reference",
       "392e93c0f22d-api-reference"
     ],
     "endpoints": [
@@ -164,6 +170,8 @@
       "392e93c0f22d-endpoints",
       "392e93c0f22d-endpoints",
       "392e93c0f22d-endpoints",
+      "392e93c0f22d-endpoints",
+      "392e93c0f22d-endpoints",
       "392e93c0f22d-endpoints"
     ],
     "getting started": [
@@ -182,6 +190,8 @@
       "b6885e1f8555-getting-started",
       "b6885e1f8555-getting-started",
       "b6885e1f8555-getting-started",
+      "b6885e1f8555-getting-started",
+      "b6885e1f8555-getting-started",
       "b6885e1f8555-getting-started"
     ],
     "installation": [
@@ -200,6 +210,8 @@
       "b6885e1f8555-installation",
       "b6885e1f8555-installation",
       "b6885e1f8555-installation",
+      "b6885e1f8555-installation",
+      "b6885e1f8555-installation",
       "b6885e1f8555-installation"
     ],
     "usage": [
@@ -218,6 +230,8 @@
       "b6885e1f8555-usage",
       "b6885e1f8555-usage",
       "b6885e1f8555-usage",
+      "b6885e1f8555-usage",
+      "b6885e1f8555-usage",
       "b6885e1f8555-usage"
     ]
   },