npm - @gmickel/gno - Versions diffs - 0.3.0 - Mend

@gmickel/gno 0.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (131) hide show

package/README.md +256 -0
package/assets/skill/SKILL.md +112 -0
package/assets/skill/cli-reference.md +327 -0
package/assets/skill/examples.md +234 -0
package/assets/skill/mcp-reference.md +159 -0
package/package.json +90 -0
package/src/app/constants.ts +313 -0
package/src/cli/colors.ts +65 -0
package/src/cli/commands/ask.ts +545 -0
package/src/cli/commands/cleanup.ts +105 -0
package/src/cli/commands/collection/add.ts +120 -0
package/src/cli/commands/collection/index.ts +10 -0
package/src/cli/commands/collection/list.ts +108 -0
package/src/cli/commands/collection/remove.ts +64 -0
package/src/cli/commands/collection/rename.ts +95 -0
package/src/cli/commands/context/add.ts +67 -0
package/src/cli/commands/context/check.ts +153 -0
package/src/cli/commands/context/index.ts +10 -0
package/src/cli/commands/context/list.ts +109 -0
package/src/cli/commands/context/rm.ts +52 -0
package/src/cli/commands/doctor.ts +393 -0
package/src/cli/commands/embed.ts +462 -0
package/src/cli/commands/get.ts +356 -0
package/src/cli/commands/index-cmd.ts +119 -0
package/src/cli/commands/index.ts +102 -0
package/src/cli/commands/init.ts +328 -0
package/src/cli/commands/ls.ts +217 -0
package/src/cli/commands/mcp/config.ts +300 -0
package/src/cli/commands/mcp/index.ts +24 -0
package/src/cli/commands/mcp/install.ts +203 -0
package/src/cli/commands/mcp/paths.ts +470 -0
package/src/cli/commands/mcp/status.ts +222 -0
package/src/cli/commands/mcp/uninstall.ts +158 -0
package/src/cli/commands/mcp.ts +20 -0
package/src/cli/commands/models/clear.ts +103 -0
package/src/cli/commands/models/index.ts +32 -0
package/src/cli/commands/models/list.ts +214 -0
package/src/cli/commands/models/path.ts +51 -0
package/src/cli/commands/models/pull.ts +199 -0
package/src/cli/commands/models/use.ts +85 -0
package/src/cli/commands/multi-get.ts +400 -0
package/src/cli/commands/query.ts +220 -0
package/src/cli/commands/ref-parser.ts +108 -0
package/src/cli/commands/reset.ts +191 -0
package/src/cli/commands/search.ts +136 -0
package/src/cli/commands/shared.ts +156 -0
package/src/cli/commands/skill/index.ts +19 -0
package/src/cli/commands/skill/install.ts +197 -0
package/src/cli/commands/skill/paths-cmd.ts +81 -0
package/src/cli/commands/skill/paths.ts +191 -0
package/src/cli/commands/skill/show.ts +73 -0
package/src/cli/commands/skill/uninstall.ts +141 -0
package/src/cli/commands/status.ts +205 -0
package/src/cli/commands/update.ts +68 -0
package/src/cli/commands/vsearch.ts +188 -0
package/src/cli/context.ts +64 -0
package/src/cli/errors.ts +64 -0
package/src/cli/format/search-results.ts +211 -0
package/src/cli/options.ts +183 -0
package/src/cli/program.ts +1330 -0
package/src/cli/run.ts +213 -0
package/src/cli/ui.ts +92 -0
package/src/config/defaults.ts +20 -0
package/src/config/index.ts +55 -0
package/src/config/loader.ts +161 -0
package/src/config/paths.ts +87 -0
package/src/config/saver.ts +153 -0
package/src/config/types.ts +280 -0
package/src/converters/adapters/markitdownTs/adapter.ts +140 -0
package/src/converters/adapters/officeparser/adapter.ts +126 -0
package/src/converters/canonicalize.ts +89 -0
package/src/converters/errors.ts +218 -0
package/src/converters/index.ts +51 -0
package/src/converters/mime.ts +163 -0
package/src/converters/native/markdown.ts +115 -0
package/src/converters/native/plaintext.ts +56 -0
package/src/converters/path.ts +48 -0
package/src/converters/pipeline.ts +159 -0
package/src/converters/registry.ts +74 -0
package/src/converters/types.ts +123 -0
package/src/converters/versions.ts +24 -0
package/src/index.ts +27 -0
package/src/ingestion/chunker.ts +238 -0
package/src/ingestion/index.ts +32 -0
package/src/ingestion/language.ts +276 -0
package/src/ingestion/sync.ts +671 -0
package/src/ingestion/types.ts +219 -0
package/src/ingestion/walker.ts +235 -0
package/src/llm/cache.ts +467 -0
package/src/llm/errors.ts +191 -0
package/src/llm/index.ts +58 -0
package/src/llm/nodeLlamaCpp/adapter.ts +133 -0
package/src/llm/nodeLlamaCpp/embedding.ts +165 -0
package/src/llm/nodeLlamaCpp/generation.ts +88 -0
package/src/llm/nodeLlamaCpp/lifecycle.ts +317 -0
package/src/llm/nodeLlamaCpp/rerank.ts +94 -0
package/src/llm/registry.ts +86 -0
package/src/llm/types.ts +129 -0
package/src/mcp/resources/index.ts +151 -0
package/src/mcp/server.ts +229 -0
package/src/mcp/tools/get.ts +220 -0
package/src/mcp/tools/index.ts +160 -0
package/src/mcp/tools/multi-get.ts +263 -0
package/src/mcp/tools/query.ts +226 -0
package/src/mcp/tools/search.ts +119 -0
package/src/mcp/tools/status.ts +81 -0
package/src/mcp/tools/vsearch.ts +198 -0
package/src/pipeline/chunk-lookup.ts +44 -0
package/src/pipeline/expansion.ts +256 -0
package/src/pipeline/explain.ts +115 -0
package/src/pipeline/fusion.ts +185 -0
package/src/pipeline/hybrid.ts +535 -0
package/src/pipeline/index.ts +64 -0
package/src/pipeline/query-language.ts +118 -0
package/src/pipeline/rerank.ts +223 -0
package/src/pipeline/search.ts +261 -0
package/src/pipeline/types.ts +328 -0
package/src/pipeline/vsearch.ts +348 -0
package/src/store/index.ts +41 -0
package/src/store/migrations/001-initial.ts +196 -0
package/src/store/migrations/index.ts +20 -0
package/src/store/migrations/runner.ts +187 -0
package/src/store/sqlite/adapter.ts +1242 -0
package/src/store/sqlite/index.ts +7 -0
package/src/store/sqlite/setup.ts +129 -0
package/src/store/sqlite/types.ts +28 -0
package/src/store/types.ts +506 -0
package/src/store/vector/index.ts +13 -0
package/src/store/vector/sqlite-vec.ts +373 -0
package/src/store/vector/stats.ts +152 -0
package/src/store/vector/types.ts +115 -0

package/src/cli/commands/ask.ts ADDED Viewed

@@ -0,0 +1,545 @@
+/**
+ * gno ask command implementation.
+ * Human-friendly query with citations and optional grounded answer.
+ *
+ * @module src/cli/commands/ask
+ */
+import { LlmAdapter } from '../../llm/nodeLlamaCpp/adapter';
+import { getActivePreset } from '../../llm/registry';
+import type {
+  EmbeddingPort,
+  GenerationPort,
+  RerankPort,
+} from '../../llm/types';
+import { type HybridSearchDeps, searchHybrid } from '../../pipeline/hybrid';
+import type {
+  AskOptions,
+  AskResult,
+  Citation,
+  SearchResult,
+} from '../../pipeline/types';
+import {
+  createVectorIndexPort,
+  type VectorIndexPort,
+} from '../../store/vector';
+import { initStore } from './shared';
+// ─────────────────────────────────────────────────────────────────────────────
+// Types
+// ─────────────────────────────────────────────────────────────────────────────
+/**
+ * Options for the `gno ask` command: the pipeline-level `AskOptions` plus
+ * CLI-specific model overrides and output-format switches.
+ */
+export type AskCommandOptions = AskOptions & {
+  /** Override config path (forwarded to `initStore`) */
+  configPath?: string;
+  /** Override embedding model; the active preset's `embed` is used otherwise */
+  embedModel?: string;
+  /** Override generation model; the active preset's `gen` is used otherwise */
+  genModel?: string;
+  /** Override rerank model; the active preset's `rerank` is used otherwise */
+  rerankModel?: string;
+  /** Output as JSON (checked before `md` by `formatAsk`) */
+  json?: boolean;
+  /** Output as Markdown */
+  md?: boolean;
+  /** Show all retrieved sources (not just cited) */
+  showSources?: boolean;
+};
+/**
+ * Outcome of `ask`: the assembled `AskResult` on success, or a
+ * human-readable error message on failure.
+ */
+export type AskCommandResult =
+  | { success: true; data: AskResult }
+  | { success: false; error: string };
+// ─────────────────────────────────────────────────────────────────────────────
+// Grounded Answer Generation
+// ─────────────────────────────────────────────────────────────────────────────
+/**
+ * Prompt template for grounded answer generation.
+ * `{query}` and `{context}` are placeholders filled in by
+ * `generateGroundedAnswer`; context blocks are numbered `[1]`, `[2]`, ...
+ */
+const ANSWER_PROMPT = `You are answering a question using ONLY the provided context blocks.
+Rules you MUST follow:
+1) Use ONLY facts stated in the context blocks. Do NOT use outside knowledge.
+2) Every factual statement must include an inline citation like [1] or [2] referring to a context block.
+3) If the context does not contain enough information to answer, reply EXACTLY:
+   "I don't have enough information in the provided sources to answer this question."
+4) Do not cite sources you did not use. Do not invent citation numbers.
+Question: {query}
+Context blocks:
+{context}
+Write a concise answer (1-3 paragraphs).`;
+/**
+ * Abstention message when LLM cannot ground answer.
+ * Same sentence the prompt (rule 3) tells the model to reply with; `ask`
+ * substitutes it when the generated answer contains no valid citation.
+ */
+const ABSTENTION_MESSAGE =
+  "I don't have enough information in the provided sources to answer this question.";
+// Max characters per snippet to avoid blowing up prompt size
+// (longer snippets are cut at this length and suffixed with "...")
+const MAX_SNIPPET_CHARS = 1500;
+// Max number of sources to include in context
+// (only the first N search results are considered for the prompt)
+const MAX_CONTEXT_SOURCES = 5;
+/**
+ * Collect the `[n]` citation markers in an answer that point at a real
+ * context block.
+ * Markers outside the range [1, maxCitation] are ignored.
+ * @param answer Answer text to scan
+ * @param maxCitation Highest citation number that was offered to the model
+ * @returns Distinct valid citation numbers (1-indexed), ascending
+ */
+function extractValidCitationNumbers(
+  answer: string,
+  maxCitation: number
+): number[] {
+  // Regex literal is created per call, so no shared lastIndex state
+  const citationPattern = /\[(\d+)\]/g;
+  const isInRange = (value: number): boolean =>
+    Number.isInteger(value) && value >= 1 && value <= maxCitation;
+  const cited = Array.from(answer.matchAll(citationPattern), (hit) =>
+    Number(hit[1])
+  ).filter(isInRange);
+  // Set removes duplicates; numeric comparator avoids lexicographic order
+  return Array.from(new Set(cited)).sort((left, right) => left - right);
+}
+/**
+ * Keep only the citations whose 1-based position was referenced in the answer.
+ * Relative order of the kept citations is unchanged.
+ * @param citations All citations provided to LLM, in context-block order
+ * @param validUsedNumbers Valid 1-indexed citation numbers from answer
+ * @returns The referenced subset of `citations`
+ */
+function filterCitationsByUse(
+  citations: Citation[],
+  validUsedNumbers: number[]
+): Citation[] {
+  const referenced = new Set(validUsedNumbers);
+  const kept: Citation[] = [];
+  citations.forEach((citation, position) => {
+    // Citation numbers are 1-based, array positions 0-based
+    if (referenced.has(position + 1)) {
+      kept.push(citation);
+    }
+  });
+  return kept;
+}
+/**
+ * Renumber citations in answer text to match filtered citations.
+ * E.g., if answer uses [2] and [5], renumber to [1] and [2].
+ * Invalid citations (not in validUsedNumbers) are removed.
+ *
+ * When a removed citation is followed by whitespace, closing punctuation or
+ * the end of the text, the spaces in front of it are removed as well, so
+ * "fact [99]." becomes "fact." rather than "fact .".
+ *
+ * @param answer Answer text containing `[n]` markers
+ * @param validUsedNumbers Sorted valid citation numbers; position i maps to i + 1
+ * @returns Answer with renumbered markers, runs of spaces collapsed, trimmed
+ */
+function renumberAnswerCitations(
+  answer: string,
+  validUsedNumbers: number[]
+): string {
+  // Build mapping: old number -> new number (1-indexed)
+  const mapping = new Map<number, number>();
+  validUsedNumbers.forEach((oldNum, idx) => {
+    mapping.set(oldNum, idx + 1);
+  });
+  // Use fresh regex to avoid lastIndex issues; group 1 captures the spaces
+  // directly in front of the marker so they can be dropped with it
+  const re = /( *)\[(\d+)\]/g;
+  // Characters after which a leftover space would look like an artifact
+  const closesGap = /[\s.,;:!?)]/;
+  const replaced = answer.replace(
+    re,
+    (
+      match: string,
+      leading: string,
+      numStr: string,
+      offset: number,
+      whole: string
+    ) => {
+      const newNum = mapping.get(Number(numStr));
+      if (newNum !== undefined) {
+        return `${leading}[${newNum}]`;
+      }
+      // Invalid citation: remove it. Keep the leading spaces only when the
+      // next character would otherwise fuse with the preceding word
+      // (e.g. "a [99][2]" must stay "a [2]", not "a[2]").
+      const next = whole.charAt(offset + match.length);
+      return next === '' || closesGap.test(next) ? '' : leading;
+    }
+  );
+  // Clean up whitespace artifacts from removed citations
+  // e.g., "See [99] for" → "See for"
+  return replaced.replace(/ {2,}/g, ' ').trim();
+}
+/**
+ * Build a citation-numbered context from the top search results and ask the
+ * generation model for an answer grounded in it.
+ *
+ * At most MAX_CONTEXT_SOURCES results are considered; results with blank
+ * snippets are skipped and snippets longer than MAX_SNIPPET_CHARS are cut
+ * and suffixed with "...". Entry i of the returned `citations` describes
+ * context block `[i + 1]`.
+ *
+ * @param genPort Generation port used to run the prompt
+ * @param query User question, inserted verbatim into the prompt
+ * @param results Ranked search results to ground the answer on
+ * @param maxTokens Token budget passed to the generation call
+ * @returns Raw answer text plus the citations offered to the model, or
+ *   `null` when no usable context exists or generation reports failure
+ */
+async function generateGroundedAnswer(
+  genPort: GenerationPort,
+  query: string,
+  results: SearchResult[],
+  maxTokens: number
+): Promise<{ answer: string; citations: Citation[] } | null> {
+  // Build context from top results with bounded snippet sizes
+  const contextParts: string[] = [];
+  const citations: Citation[] = [];
+  for (const r of results.slice(0, MAX_CONTEXT_SOURCES)) {
+    // Skip results with empty snippets
+    if (!r.snippet || r.snippet.trim().length === 0) {
+      continue;
+    }
+    // Cap snippet length to avoid prompt blowup
+    const snippet =
+      r.snippet.length > MAX_SNIPPET_CHARS
+        ? `${r.snippet.slice(0, MAX_SNIPPET_CHARS)}...`
+        : r.snippet;
+    // Push the citation first so its 1-based position is the block label;
+    // skipped results never consume a number
+    citations.push({
+      docid: r.docid,
+      uri: r.uri,
+      startLine: r.snippetRange?.startLine,
+      endLine: r.snippetRange?.endLine,
+    });
+    contextParts.push(`[${citations.length}] ${snippet}`);
+  }
+  // If no valid context, can't generate answer
+  if (contextParts.length === 0) {
+    return null;
+  }
+  const contextText = contextParts.join('\n\n');
+  // Fill both placeholders in a single pass using a replacer function.
+  // A string replacement would interpret "$&", "$'", "$`" and "$$" inside the
+  // query or snippets as special patterns, and chained replaces would let a
+  // query containing the literal "{context}" capture the context slot.
+  const prompt = ANSWER_PROMPT.replace(
+    /\{(query|context)\}/g,
+    (_placeholder: string, key: string) =>
+      key === 'query' ? query : contextText
+  );
+  const result = await genPort.generate(prompt, {
+    temperature: 0,
+    maxTokens,
+  });
+  if (!result.ok) {
+    return null;
+  }
+  return { answer: result.value, citations };
+}
+// ─────────────────────────────────────────────────────────────────────────────
+// Command Implementation
+// ─────────────────────────────────────────────────────────────────────────────
+/**
+ * Execute gno ask command.
+ *
+ * Flow: open the store, create embedding / generation / rerank ports from
+ * the option overrides or the active preset, run hybrid search, and, when
+ * `options.answer` is set without `options.noAnswer`, generate a grounded
+ * answer with validated, renumbered citations.
+ *
+ * A port whose creation fails is left `null` and passed on as such; only a
+ * missing generation port combined with an explicit answer request is
+ * treated as an error.
+ *
+ * @param query User question
+ * @param options Command options; `limit` defaults to 5 and
+ *   `maxAnswerTokens` to 512
+ * @returns `{ success: true, data }` with the search results (and answer, if
+ *   generated), or `{ success: false, error }` when store init, search, or a
+ *   requested answer generation fails
+ */
+// biome-ignore lint/complexity/noExcessiveCognitiveComplexity: CLI orchestration with multiple output formats
+export async function ask(
+  query: string,
+  options: AskCommandOptions = {}
+): Promise<AskCommandResult> {
+  const limit = options.limit ?? 5;
+  const initResult = await initStore({
+    configPath: options.configPath,
+    collection: options.collection,
+  });
+  if (!initResult.ok) {
+    return { success: false, error: initResult.error };
+  }
+  const { store, config } = initResult;
+  // Declared outside the try so the finally block can dispose whatever was created
+  let embedPort: EmbeddingPort | null = null;
+  let genPort: GenerationPort | null = null;
+  let rerankPort: RerankPort | null = null;
+  try {
+    const preset = getActivePreset(config);
+    const llm = new LlmAdapter(config);
+    // Create embedding port
+    const embedUri = options.embedModel ?? preset.embed;
+    const embedResult = await llm.createEmbeddingPort(embedUri);
+    if (embedResult.ok) {
+      embedPort = embedResult.value;
+    }
+    // Create generation port (for expansion and answer)
+    const genUri = options.genModel ?? preset.gen;
+    const genResult = await llm.createGenerationPort(genUri);
+    if (genResult.ok) {
+      genPort = genResult.value;
+    }
+    // Create rerank port
+    const rerankUri = options.rerankModel ?? preset.rerank;
+    const rerankResult = await llm.createRerankPort(rerankUri);
+    if (rerankResult.ok) {
+      rerankPort = rerankResult.value;
+    }
+    // Create vector index (only when the embedding port exists and initializes;
+    // otherwise vectorIndex stays null)
+    let vectorIndex: VectorIndexPort | null = null;
+    if (embedPort) {
+      const embedInitResult = await embedPort.init();
+      if (embedInitResult.ok) {
+        const dimensions = embedPort.dimensions();
+        const db = store.getRawDb();
+        const vectorResult = await createVectorIndexPort(db, {
+          model: embedUri,
+          dimensions,
+        });
+        if (vectorResult.ok) {
+          vectorIndex = vectorResult.value;
+        }
+      }
+    }
+    const deps: HybridSearchDeps = {
+      store,
+      config,
+      vectorIndex,
+      embedPort,
+      genPort,
+      rerankPort,
+    };
+    // Check if answer generation is explicitly requested
+    const answerRequested = options.answer && !options.noAnswer;
+    // Fail early if --answer is requested but no generation model available
+    if (answerRequested && genPort === null) {
+      return {
+        success: false,
+        error:
+          'Answer generation requested but no generation model available. ' +
+          'Run `gno models pull --gen` to download a model, or configure a preset.',
+      };
+    }
+    // Run hybrid search
+    const searchResult = await searchHybrid(deps, query, {
+      limit,
+      collection: options.collection,
+      lang: options.lang,
+    });
+    if (!searchResult.ok) {
+      return { success: false, error: searchResult.error.message };
+    }
+    const results = searchResult.value.results;
+    // Generate grounded answer if requested
+    let answer: string | undefined;
+    let citations: Citation[] | undefined;
+    let answerGenerated = false;
+    // Only generate answer if:
+    // 1. --answer was explicitly requested (not just default behavior)
+    // 2. --no-answer was not set
+    // 3. We have results to ground on (no point generating from nothing)
+    const shouldGenerateAnswer =
+      answerRequested && genPort !== null && results.length > 0;
+    // The extra `genPort` check repeats the null test so the type narrows below
+    if (shouldGenerateAnswer && genPort) {
+      const maxTokens = options.maxAnswerTokens ?? 512;
+      const answerResult = await generateGroundedAnswer(
+        genPort,
+        query,
+        results,
+        maxTokens
+      );
+      // Fail loudly if generation was requested but failed
+      // (null also covers the case where every snippet was empty)
+      if (!answerResult) {
+        return {
+          success: false,
+          error:
+            'Answer generation failed. The generation model may have encountered an error.',
+        };
+      }
+      // Extract only VALID citation numbers (in range 1..citations.length)
+      const maxCitation = answerResult.citations.length;
+      const validUsedNums = extractValidCitationNumbers(
+        answerResult.answer,
+        maxCitation
+      );
+      const filteredCitations = filterCitationsByUse(
+        answerResult.citations,
+        validUsedNums
+      );
+      // Abstention guard: if no valid citations, LLM didn't ground the answer
+      if (validUsedNums.length === 0 || filteredCitations.length === 0) {
+        answer = ABSTENTION_MESSAGE;
+        citations = [];
+      } else {
+        // Renumber citations in answer to match filtered list (e.g., [2],[5] -> [1],[2])
+        // Invalid citations are removed from the answer text
+        answer = renumberAnswerCitations(answerResult.answer, validUsedNums);
+        citations = filteredCitations;
+      }
+      // Set even when the answer was replaced by the abstention message
+      answerGenerated = true;
+    }
+    const askResult: AskResult = {
+      query,
+      mode: searchResult.value.meta.vectorsUsed ? 'hybrid' : 'bm25_only',
+      queryLanguage: searchResult.value.meta.queryLanguage ?? 'und',
+      answer,
+      citations,
+      results,
+      meta: {
+        expanded: searchResult.value.meta.expanded ?? false,
+        reranked: searchResult.value.meta.reranked ?? false,
+        vectorsUsed: searchResult.value.meta.vectorsUsed ?? false,
+        answerGenerated,
+        totalResults: results.length,
+      },
+    };
+    return { success: true, data: askResult };
+  } finally {
+    // Runs on every exit path above, including the early error returns.
+    // NOTE(review): the steps are sequential awaits; if a dispose() rejects,
+    // the remaining ports and store.close() are skipped — confirm dispose()
+    // cannot reject, or isolate each step.
+    if (embedPort) {
+      await embedPort.dispose();
+    }
+    if (genPort) {
+      await genPort.dispose();
+    }
+    if (rerankPort) {
+      await rerankPort.dispose();
+    }
+    await store.close();
+  }
+}
+// ─────────────────────────────────────────────────────────────────────────────
+// Formatters
+// ─────────────────────────────────────────────────────────────────────────────
+/** Options shared by the terminal and Markdown formatters. */
+interface FormatOptions {
+  /** List every retrieved source even when an answer is present */
+  showSources?: boolean;
+}
+/**
+ * Render an ask result as plain text for the terminal.
+ * Sections, in order: answer, cited sources, then either the full source
+ * list (no answer, or `showSources` set) or a one-line hint about
+ * `--show-sources` when more sources were retrieved than cited.
+ * @param data Ask result to render
+ * @param opts Formatting switches
+ * @returns Lines joined with "\n" (no trailing newline added)
+ */
+// biome-ignore lint/complexity/noExcessiveCognitiveComplexity: terminal formatting with conditional sections
+function formatTerminal(data: AskResult, opts: FormatOptions = {}): string {
+  const { answer, citations, results } = data;
+  const answered = Boolean(answer);
+  const out: string[] = [];
+  // Answer section
+  if (answer) {
+    out.push('Answer:', answer, '');
+  }
+  // Cited sources, numbered to match the markers in the answer
+  if (citations && citations.length > 0) {
+    out.push('Cited Sources:');
+    citations.forEach((citation, position) => {
+      if (citation) {
+        out.push(`  [${position + 1}] ${citation.uri}`);
+      }
+    });
+    out.push('');
+  }
+  // Full list in retrieval-only mode or on explicit request
+  const listEverything = !answered || opts.showSources;
+  if (results.length > 0) {
+    if (listEverything) {
+      out.push(answered ? 'All Retrieved Sources:' : 'Sources:');
+      for (const hit of results) {
+        out.push(`  [${hit.docid}] ${hit.uri}`);
+        if (hit.title) {
+          out.push(`    ${hit.title}`);
+        }
+      }
+    } else if (results.length > (citations?.length ?? 0)) {
+      // Answer shown without the full list: point at --show-sources
+      out.push(
+        `(${results.length} sources retrieved, use --show-sources to list all)`
+      );
+    }
+  }
+  if (!answer && results.length === 0) {
+    out.push('No relevant sources found.');
+  }
+  return out.join('\n');
+}
+/**
+ * Render an ask result as a Markdown document.
+ * Always emits the question heading and a footer with mode / expansion /
+ * rerank flags; answer, cited sources and the full source list are
+ * included conditionally.
+ * @param data Ask result to render
+ * @param opts Formatting switches
+ * @returns Markdown text, lines joined with "\n"
+ */
+function formatMarkdown(data: AskResult, opts: FormatOptions = {}): string {
+  const { answer, citations, results } = data;
+  const answered = Boolean(answer);
+  const out: string[] = [`# Question: ${data.query}`, ''];
+  if (answer) {
+    out.push('## Answer', '', answer, '');
+  }
+  // Cited sources, numbered to match the markers in the answer
+  if (citations && citations.length > 0) {
+    out.push('## Cited Sources', '');
+    citations.forEach((citation, position) => {
+      if (citation) {
+        out.push(`**[${position + 1}]** \`${citation.uri}\``);
+      }
+    });
+    out.push('');
+  }
+  // Full source list when there is no answer or --show-sources was given
+  if (!answered || opts.showSources) {
+    out.push(answered ? '## All Retrieved Sources' : '## Sources', '');
+    results.forEach((hit, position) => {
+      if (!hit) {
+        return;
+      }
+      out.push(`${position + 1}. **${hit.title || hit.source.relPath}**`);
+      out.push(`   - URI: \`${hit.uri}\``);
+      out.push(`   - Score: ${hit.score.toFixed(2)}`);
+    });
+    if (results.length === 0) {
+      out.push('*No relevant sources found.*');
+    }
+  }
+  // Footer
+  out.push('', '---');
+  out.push(
+    `*Mode: ${data.mode} | Expanded: ${data.meta.expanded} | Reranked: ${data.meta.reranked}*`
+  );
+  return out.join('\n');
+}
+/**
+ * Turn an ask command result into the string to print.
+ * Failures become a JSON error envelope (`--json`) or an "Error: ..." line;
+ * successes are rendered as JSON, Markdown or terminal text, with `json`
+ * checked before `md`.
+ * @param result Result returned by `ask`
+ * @param options Command options selecting the output format
+ */
+export function formatAsk(
+  result: AskCommandResult,
+  options: AskCommandOptions
+): string {
+  if (result.success) {
+    if (options.json) {
+      return JSON.stringify(result.data, null, 2);
+    }
+    const formatOpts: FormatOptions = { showSources: options.showSources };
+    return options.md
+      ? formatMarkdown(result.data, formatOpts)
+      : formatTerminal(result.data, formatOpts);
+  }
+  // Failure path
+  if (options.json) {
+    return JSON.stringify({
+      error: { code: 'ASK_FAILED', message: result.error },
+    });
+  }
+  return `Error: ${result.error}`;
+}

package/src/cli/commands/cleanup.ts ADDED Viewed

@@ -0,0 +1,105 @@
+/**
+ * gno cleanup command implementation.
+ * Remove orphaned content, chunks, vectors not referenced by active documents.
+ *
+ * @module src/cli/commands/cleanup
+ */
+import { getIndexDbPath } from '../../app/constants';
+import { isInitialized, loadConfig } from '../../config';
+import { SqliteAdapter } from '../../store/sqlite/adapter';
+import type { CleanupStats } from '../../store/types';
+/**
+ * Options for cleanup command.
+ */
+export interface CleanupOptions {
+  /** Override config path (passed to `isInitialized` and `loadConfig`) */
+  configPath?: string;
+}
+/**
+ * Result of cleanup command: removal statistics on success, or an error
+ * message on failure.
+ */
+export type CleanupResult =
+  | { success: true; stats: CleanupStats }
+  | { success: false; error: string };
+/**
+ * Execute gno cleanup command.
+ * Verifies initialization, loads the config, opens the index database and
+ * asks the store to remove orphans. The store is closed once it has been
+ * opened successfully, whether or not the cleanup itself succeeds.
+ * @param options Command options
+ * @returns Cleanup statistics, or the first error encountered
+ */
+export async function cleanup(
+  options: CleanupOptions = {}
+): Promise<CleanupResult> {
+  const fail = (error: string): CleanupResult => ({ success: false, error });
+  // Guard: must be initialized
+  if (!(await isInitialized(options.configPath))) {
+    return fail('GNO not initialized. Run: gno init');
+  }
+  // Guard: config must load
+  const loaded = await loadConfig(options.configPath);
+  if (!loaded.ok) {
+    return fail(loaded.error.message);
+  }
+  // Guard: database must open
+  const adapter = new SqliteAdapter();
+  const opened = await adapter.open(
+    getIndexDbPath(),
+    loaded.value.ftsTokenizer
+  );
+  if (!opened.ok) {
+    return fail(opened.error.message);
+  }
+  try {
+    const swept = await adapter.cleanupOrphans();
+    return swept.ok
+      ? { success: true, stats: swept.value }
+      : fail(swept.error.message);
+  } finally {
+    await adapter.close();
+  }
+}
+/**
+ * Format cleanup result for output.
+ * Failures render as "Error: ..."; a run that removed nothing renders a
+ * single "clean" line; otherwise each non-zero counter gets its own line,
+ * followed by the total.
+ * @param result Result returned by `cleanup`
+ */
+export function formatCleanup(result: CleanupResult): string {
+  if (!result.success) {
+    return `Error: ${result.error}`;
+  }
+  const { orphanedContent, orphanedChunks, orphanedVectors, expiredCache } =
+    result.stats;
+  // Label/count pairs in display order
+  const counters: Array<[string, number]> = [
+    ['Orphaned content', orphanedContent],
+    ['Orphaned chunks', orphanedChunks],
+    ['Orphaned vectors', orphanedVectors],
+    ['Expired cache', expiredCache],
+  ];
+  const total = counters.reduce((sum, [, count]) => sum + count, 0);
+  if (total === 0) {
+    return 'No orphans found. Index is clean.';
+  }
+  const detail = counters
+    .filter(([, count]) => count > 0)
+    .map(([label, count]) => `  ${label}: ${count}`);
+  return ['Cleanup complete:', ...detail, `Total removed: ${total}`].join('\n');
+}