npm - @tobilu/qmd - Versions diffs - 2.0.1 → 2.5.1 - Mend

@tobilu/qmd 2.0.1 → 2.5.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (39)

package/CHANGELOG.md +177 -0
package/README.md +64 -1
package/bin/qmd +49 -4
package/dist/ast.d.ts +65 -0
package/dist/ast.js +334 -0
package/dist/bench/bench.d.ts +23 -0
package/dist/bench/bench.js +280 -0
package/dist/bench/score.d.ts +33 -0
package/dist/bench/score.js +88 -0
package/dist/bench/types.d.ts +80 -0
package/dist/bench/types.js +8 -0
package/dist/cli/formatter.js +5 -1
package/dist/cli/qmd.d.ts +27 -0
package/dist/cli/qmd.js +1328 -115
package/dist/collections.d.ts +20 -0
package/dist/collections.js +32 -7
package/dist/db.d.ts +14 -3
package/dist/db.js +45 -4
package/dist/index.d.ts +11 -1
package/dist/index.js +18 -5
package/dist/llm.d.ts +77 -6
package/dist/llm.js +445 -62
package/dist/mcp/server.d.ts +6 -3
package/dist/mcp/server.js +68 -29
package/dist/paths.d.ts +1 -0
package/dist/paths.js +4 -0
package/dist/store.d.ts +148 -23
package/dist/store.js +1018 -255
package/package.json +48 -20
package/scripts/build.mjs +29 -0
package/scripts/check-package-grammars.mjs +29 -0
package/scripts/package-smoke.mjs +65 -0
package/scripts/test-all.mjs +27 -0
package/skills/qmd/SKILL.md +203 -0
package/skills/qmd/references/mcp-setup.md +102 -0
package/skills/release/SKILL.md +139 -0
package/skills/release/scripts/install-hooks.sh +38 -0
package/dist/embedded-skills.d.ts +0 -6
package/dist/embedded-skills.js +0 -14

package/dist/mcp/server.d.ts CHANGED Viewed

@@ -6,7 +6,10 @@
  *
  * Follows MCP spec 2025-06-18 for proper response types.
  */
-export declare function startMcpServer(): Promise<void>;
+export type McpStartupOptions = {
+    dbPath?: string;
+};
+export declare function startMcpServer(options?: McpStartupOptions): Promise<void>;
 export type HttpServerHandle = {
     httpServer: import("http").Server;
     port: number;
@@ -16,6 +19,6 @@ export type HttpServerHandle = {
  * Start MCP server over Streamable HTTP (JSON responses, no SSE).
  * Binds to localhost only. Returns a handle for shutdown and port discovery.
  */
-export declare function startMcpHttpServer(port: number, options?: {
+export declare function startMcpHttpServer(port: number, options?: ({
     quiet?: boolean;
-}): Promise<HttpServerHandle>;
+} & McpStartupOptions)): Promise<HttpServerHandle>;

package/dist/mcp/server.js CHANGED Viewed

@@ -8,13 +8,18 @@
  */
 import { createServer } from "node:http";
 import { randomUUID } from "node:crypto";
+import { readFileSync } from "node:fs";
+import { join, dirname } from "node:path";
 import { fileURLToPath } from "url";
 import { McpServer, ResourceTemplate } from "@modelcontextprotocol/sdk/server/mcp.js";
 import { StdioServerTransport } from "@modelcontextprotocol/sdk/server/stdio.js";
 import { WebStandardStreamableHTTPServerTransport } from "@modelcontextprotocol/sdk/server/webStandardStreamableHttp.js";
 import { isInitializeRequest } from "@modelcontextprotocol/sdk/types.js";
 import { z } from "zod";
+import { existsSync } from "fs";
 import { createStore, extractSnippet, addLineNumbers, getDefaultDbPath, DEFAULT_MULTI_GET_MAX_BYTES, } from "../index.js";
+import { getConfigPath } from "../collections.js";
+import { enableProductionMode } from "../store.js";
 // =============================================================================
 // Helper functions
 // =============================================================================
@@ -39,6 +44,16 @@ function formatSearchSummary(results, query) {
     }
     return lines.join('\n');
 }
+function getPackageVersion() {
+    try {
+        const pkgPath = join(dirname(fileURLToPath(import.meta.url)), "../../package.json");
+        const pkg = JSON.parse(readFileSync(pkgPath, "utf-8"));
+        return pkg.version ?? "unknown";
+    }
+    catch {
+        return "unknown";
+    }
+}
 // =============================================================================
 // MCP Server
 // =============================================================================
@@ -49,7 +64,6 @@ function formatSearchSummary(results, query) {
  */
 async function buildInstructions(store) {
     const status = await store.getStatus();
-    const contexts = await store.listContexts();
     const globalCtx = await store.getGlobalContext();
     const lines = [];
     // --- What is this? ---
@@ -57,15 +71,13 @@ async function buildInstructions(store) {
     if (globalCtx)
         lines.push(`Context: ${globalCtx}`);
     // --- What's searchable? ---
+    // Emit names only — the per-collection doc counts and descriptions can run to ~1.5 KB
+    // across a dozen collections, and the same info is available on demand via the `status` tool.
     if (status.collections.length > 0) {
         lines.push("");
-        lines.push("Collections (scope with `collection` parameter):");
-        for (const col of status.collections) {
-            // Find root context for this collection
-            const rootCtx = contexts.find(c => c.collection === col.name && (c.path === "" || c.path === "/"));
-            const desc = rootCtx ? ` — ${rootCtx.context}` : "";
-            lines.push(`  - "${col.name}" (${col.documents} docs)${desc}`);
-        }
+        const names = status.collections.map(c => c.name).join(", ");
+        lines.push(`Collections (scope with \`collection\` parameter): ${names}`);
+        lines.push("Call the `status` tool for collection descriptions, paths, and per-collection doc counts.");
     }
     // --- Capability gaps ---
     if (!status.hasVectorIndex) {
@@ -108,7 +120,7 @@ async function buildInstructions(store) {
  * Shared by both stdio and HTTP transports.
  */
 async function createMcpServer(store) {
-    const server = new McpServer({ name: "qmd", version: "0.9.9" }, { instructions: await buildInstructions(store) });
+    const server = new McpServer({ name: "qmd", version: getPackageVersion() }, { instructions: await buildInstructions(store) });
     // Pre-fetch default collection names for search tools
     const defaultCollectionNames = await store.getDefaultCollectionNames();
     // ---------------------------------------------------------------------------
@@ -155,6 +167,8 @@ async function createMcpServer(store) {
         title: "Query",
         description: `Search the knowledge base using a query document — one or more typed sub-queries combined for best recall.
+Each result includes a \`line\` field with the absolute 1-indexed line of the best match in the source markdown. To read more context around a hit, call \`get(file, fromLine = max(1, line - 20), maxLines = 80, lineNumbers = true)\`.
 ## Query Types
 **lex** — BM25 keyword search. Fast, exact, no LLM needed.
@@ -218,8 +232,9 @@ Intent-aware lex (C++ performance, not sports):
             candidateLimit: z.number().optional().describe("Maximum candidates to rerank (default: 40, lower = faster but may miss results)"),
             collections: z.array(z.string()).optional().describe("Filter to collections (OR match)"),
             intent: z.string().optional().describe("Background context to disambiguate the query. Example: query='performance', intent='web page load times and Core Web Vitals'. Does not search on its own."),
+            rerank: z.boolean().optional().default(true).describe("Rerank results using LLM (default: true). Set to false for faster results on CPU-only machines."),
         },
-    }, async ({ searches, limit, minScore, candidateLimit, collections, intent }) => {
+    }, async ({ searches, limit, minScore, candidateLimit, collections, intent, rerank }) => {
         // Map to internal format
         const queries = searches.map(s => ({
             type: s.type,
@@ -232,6 +247,8 @@ Intent-aware lex (C++ performance, not sports):
             collections: effectiveCollections.length > 0 ? effectiveCollections : undefined,
             limit,
             minScore,
+            candidateLimit,
+            rerank,
             intent,
         });
         // Use first lex or vec query for snippet extraction
@@ -239,13 +256,14 @@ Intent-aware lex (C++ performance, not sports):
             || searches.find(s => s.type === 'vec')?.query
             || searches[0]?.query || "";
         const filtered = results.map(r => {
-            const { line, snippet } = extractSnippet(r.bestChunk, primaryQuery, 300, undefined, undefined, intent);
+            const { line, snippet } = extractSnippet(r.body, primaryQuery, 300, r.bestChunkPos, r.bestChunk.length, intent);
             return {
                 docid: `#${r.docid}`,
                 file: r.displayPath,
                 title: r.title,
                 score: Math.round(r.score * 100) / 100,
                 context: r.context,
+                line,
                 snippet: addLineNumbers(snippet, line),
             };
         });
@@ -276,6 +294,8 @@ Intent-aware lex (C++ performance, not sports):
             parsedFromLine = parseInt(colonMatch[1], 10);
             lookup = lookup.slice(0, -colonMatch[0].length);
         }
+        if (parsedFromLine !== undefined)
+            parsedFromLine = Math.max(1, parsedFromLine);
         const result = await store.get(lookup, { includeBody: false });
         if ("error" in result) {
             let msg = `Document not found: ${file}`;
@@ -387,7 +407,7 @@ Intent-aware lex (C++ performance, not sports):
             `  Collections: ${status.collections.length}`,
         ];
         for (const col of status.collections) {
-            summary.push(`    - ${col.path} (${col.documents} docs)`);
+            summary.push(`    - ${col.name}: ${col.path} (${col.documents} docs)`);
         }
         return {
             content: [{ type: "text", text: summary.join('\n') }],
@@ -396,11 +416,18 @@ Intent-aware lex (C++ performance, not sports):
     });
     return server;
 }
-// =============================================================================
-// Transport: stdio (default)
-// =============================================================================
-export async function startMcpServer() {
-    const store = await createStore({ dbPath: getDefaultDbPath() });
+export async function startMcpServer(options = {}) {
+    // Opt into production mode when the MCP server is actually started, not
+    // when this module is merely imported for its exports. Importing the module
+    // at the top level flipped the global production flag and broke test
+    // isolation for downstream suites that expect the default (development)
+    // database path behaviour.
+    enableProductionMode();
+    const configPath = getConfigPath();
+    const store = await createStore({
+        dbPath: options.dbPath ?? getDefaultDbPath(),
+        ...(existsSync(configPath) ? { configPath } : {}),
+    });
     const server = await createMcpServer(store);
     const transport = new StdioServerTransport();
     await server.connect(transport);
@@ -409,8 +436,16 @@ export async function startMcpServer() {
  * Start MCP server over Streamable HTTP (JSON responses, no SSE).
  * Binds to localhost only. Returns a handle for shutdown and port discovery.
  */
-export async function startMcpHttpServer(port, options) {
-    const store = await createStore({ dbPath: getDefaultDbPath() });
+export async function startMcpHttpServer(port, options = {}) {
+    // See startMcpServer() for the rationale — flip production mode here so the
+    // HTTP transport resolves the real database path, without leaking state into
+    // callers that only import this module for its exports (e.g. tests).
+    enableProductionMode();
+    const configPath = getConfigPath();
+    const store = await createStore({
+        dbPath: options.dbPath ?? getDefaultDbPath(),
+        ...(existsSync(configPath) ? { configPath } : {}),
+    });
     // Pre-fetch default collection names for REST endpoint
     const defaultCollectionNames = await store.getDefaultCollectionNames();
     // Session map: each client gets its own McpServer + Transport pair (MCP spec requirement).
@@ -442,7 +477,7 @@ export async function startMcpHttpServer(port, options) {
     }
     /** Extract a human-readable label from a JSON-RPC body */
     function describeRequest(body) {
-        const method = body?.method ?? "unknown";
+        const method = typeof body.method === "string" ? body.method : "unknown";
         if (method === "tools/call") {
             const tool = body.params?.name ?? "?";
             const args = body.params?.arguments;
@@ -493,31 +528,35 @@ export async function startMcpHttpServer(port, options) {
                     return;
                 }
                 // Map to internal format
-                const queries = params.searches.map((s) => ({
+                const searches = params.searches;
+                const queries = searches.map((s) => ({
                     type: s.type,
                     query: String(s.query || ""),
                 }));
                 // Use default collections if none specified
-                const effectiveCollections = params.collections ?? defaultCollectionNames;
+                const effectiveCollections = Array.isArray(params.collections) ? params.collections.map(String) : defaultCollectionNames;
                 const results = await store.search({
                     queries,
                     collections: effectiveCollections.length > 0 ? effectiveCollections : undefined,
-                    limit: params.limit ?? 10,
-                    minScore: params.minScore ?? 0,
-                    intent: params.intent,
+                    limit: typeof params.limit === "number" ? params.limit : 10,
+                    minScore: typeof params.minScore === "number" ? params.minScore : 0,
+                    candidateLimit: typeof params.candidateLimit === "number" ? params.candidateLimit : undefined,
+                    intent: typeof params.intent === "string" ? params.intent : undefined,
+                    rerank: typeof params.rerank === "boolean" ? params.rerank : undefined,
                 });
                 // Use first lex or vec query for snippet extraction
-                const primaryQuery = params.searches.find((s) => s.type === 'lex')?.query
-                    || params.searches.find((s) => s.type === 'vec')?.query
-                    || params.searches[0]?.query || "";
+                const primaryQuery = searches.find((s) => s.type === 'lex')?.query
+                    || searches.find((s) => s.type === 'vec')?.query
+                    || searches[0]?.query || "";
                 const formatted = results.map(r => {
-                    const { line, snippet } = extractSnippet(r.bestChunk, primaryQuery, 300);
+                    const { line, snippet } = extractSnippet(r.body, String(primaryQuery), 300, r.bestChunkPos, r.bestChunk.length, typeof params.intent === "string" ? params.intent : undefined);
                     return {
                         docid: `#${r.docid}`,
                         file: r.displayPath,
                         title: r.title,
                         score: Math.round(r.score * 100) / 100,
                         context: r.context,
+                        line,
                         snippet: addLineNumbers(snippet, line),
                     };
                 });

package/dist/paths.d.ts ADDED Viewed

@@ -0,0 +1 @@
+export declare function qmdHomedir(): string;

package/dist/paths.js ADDED Viewed

@@ -0,0 +1,4 @@
+import { homedir as osHomedir } from "node:os";
+export function qmdHomedir() {
+    return process.env.HOME || process.env.USERPROFILE || osHomedir() || "/tmp";
+}

package/dist/store.d.ts CHANGED Viewed

@@ -13,17 +13,20 @@
 import type { Database } from "./db.js";
 import { LlamaCpp, formatQueryForEmbedding, formatDocForEmbedding, type ILLMSession } from "./llm.js";
 import type { NamedCollection, Collection, CollectionConfig } from "./collections.js";
-export declare const DEFAULT_EMBED_MODEL = "embeddinggemma";
-export declare const DEFAULT_RERANK_MODEL = "ExpedientFalcon/qwen3-reranker:0.6b-q8_0";
-export declare const DEFAULT_QUERY_MODEL = "Qwen/Qwen3-1.7B";
+export declare const DEFAULT_EMBED_MODEL = "hf:ggml-org/embeddinggemma-300M-GGUF/embeddinggemma-300M-Q8_0.gguf";
+export declare const DEFAULT_RERANK_MODEL = "hf:ggml-org/Qwen3-Reranker-0.6B-Q8_0-GGUF/qwen3-reranker-0.6b-q8_0.gguf";
+export declare const DEFAULT_QUERY_MODEL = "hf:tobil/qmd-query-expansion-1.7B-gguf/qmd-query-expansion-1.7B-q4_k_m.gguf";
 export declare const DEFAULT_GLOB = "**/*.md";
 export declare const DEFAULT_MULTI_GET_MAX_BYTES: number;
+export declare const DEFAULT_EMBED_MAX_DOCS_PER_BATCH = 64;
+export declare const DEFAULT_EMBED_MAX_BATCH_BYTES: number;
 export declare const CHUNK_SIZE_TOKENS = 900;
 export declare const CHUNK_OVERLAP_TOKENS: number;
 export declare const CHUNK_SIZE_CHARS: number;
 export declare const CHUNK_OVERLAP_CHARS: number;
 export declare const CHUNK_WINDOW_TOKENS = 200;
 export declare const CHUNK_WINDOW_CHARS: number;
+export declare function getEmbeddingFingerprint(model?: string): string;
 /**
  * A potential break point in the document with a base score indicating quality.
  */
@@ -76,6 +79,20 @@ export declare function isInsideCodeFence(pos: number, fences: CodeFenceRegion[]
  * @returns The best position to cut at
  */
 export declare function findBestCutoff(breakPoints: BreakPoint[], targetCharPos: number, windowChars?: number, decayFactor?: number, codeFences?: CodeFenceRegion[]): number;
+export type ChunkStrategy = "auto" | "regex";
+/**
+ * Merge two sets of break points (e.g. regex + AST), keeping the highest
+ * score at each position. Result is sorted by position.
+ */
+export declare function mergeBreakPoints(a: BreakPoint[], b: BreakPoint[]): BreakPoint[];
+/**
+ * Core chunk algorithm that operates on precomputed break points and code fences.
+ * This is the shared implementation used by both regex-only and AST-aware chunking.
+ */
+export declare function chunkDocumentWithBreakPoints(content: string, breakPoints: BreakPoint[], codeFences: CodeFenceRegion[], maxChars?: number, overlapChars?: number, windowChars?: number): {
+    text: string;
+    pos: number;
+}[];
 export declare const STRONG_SIGNAL_MIN_SCORE = 0.85;
 export declare const STRONG_SIGNAL_MIN_GAP = 0.15;
 export declare const RERANK_CANDIDATE_LIMIT = 40;
@@ -118,12 +135,15 @@ export declare function normalizePathSeparators(path: string): string;
 export declare function getRelativePathFromPrefix(path: string, prefix: string): string | null;
 export declare function resolve(...paths: string[]): string;
 export declare function enableProductionMode(): void;
+/** Reset production mode flag — only for testing. */
+export declare function _resetProductionModeForTesting(): void;
 export declare function getDefaultDbPath(indexName?: string): string;
 export declare function getPwd(): string;
 export declare function getRealPath(path: string): string;
 export type VirtualPath = {
     collectionName: string;
     path: string;
+    indexName?: string;
 };
 /**
  * Normalize explicit virtual path formats to standard qmd:// format.
@@ -146,7 +166,7 @@ export declare function parseVirtualPath(virtualPath: string): VirtualPath | nul
 /**
  * Build a virtual path from collection name and relative path.
  */
-export declare function buildVirtualPath(collectionName: string, path: string): string;
+export declare function buildVirtualPath(collectionName: string, path: string, indexName?: string): string;
 /**
  * Check if a path is explicitly a virtual path.
  * Only recognizes explicit virtual path formats:
@@ -167,6 +187,12 @@ export declare function resolveVirtualPath(db: Database, virtualPath: string): s
  */
 export declare function toVirtualPath(db: Database, absolutePath: string): string | null;
 export declare function verifySqliteVecLoaded(db: Database): void;
+/**
+ * FTS5's unicode61 tokenizer does not segment CJK text into searchable words.
+ * Normalize CJK runs by spacing every character so exact CJK queries can be
+ * translated into phrase queries while Latin text keeps the default tokenizer.
+ */
+export declare function normalizeCjkForFTS(text: string): string;
 export declare function getStoreCollections(db: Database): NamedCollection[];
 export declare function getStoreCollection(db: Database, name: string): NamedCollection | null;
 export declare function getStoreGlobalContext(db: Database): string | undefined;
@@ -196,9 +222,9 @@ export type Store = {
     llm?: LlamaCpp;
     close: () => void;
     ensureVecTable: (dimensions: number) => void;
-    getHashesNeedingEmbedding: () => number;
-    getIndexHealth: () => IndexHealthInfo;
-    getStatus: () => IndexStatus;
+    getHashesNeedingEmbedding: (model?: string) => number;
+    getIndexHealth: (model?: string) => IndexHealthInfo;
+    getStatus: (model?: string) => IndexStatus;
     getCacheKey: typeof getCacheKey;
     getCachedResult: (cacheKey: string) => string | null;
     setCachedResult: (cacheKey: string, result: string) => void;
@@ -266,6 +292,11 @@ export type Store = {
         hash: string;
         title: string;
     } | null;
+    findOrMigrateLegacyDocument: (collectionName: string, path: string) => {
+        id: number;
+        hash: string;
+        title: string;
+    } | null;
     updateDocumentTitle: (documentId: number, title: string, modifiedAt: string) => void;
     updateDocument: (documentId: number, title: string, hash: string, modifiedAt: string) => void;
     deactivateDocument: (collectionName: string, path: string) => void;
@@ -276,7 +307,7 @@ export type Store = {
         path: string;
     }[];
     clearAllEmbeddings: () => void;
-    insertEmbedding: (hash: string, seq: number, pos: number, embedding: Float32Array, model: string, embeddedAt: string) => void;
+    insertEmbedding: (hash: string, seq: number, pos: number, embedding: Float32Array, model: string, embeddedAt: string, totalChunks?: number, fingerprint?: string) => void;
 };
 export type ReindexProgress = {
     file: string;
@@ -298,29 +329,49 @@ export declare function reindexCollection(store: Store, collectionPath: string,
     ignorePatterns?: string[];
     onProgress?: (info: ReindexProgress) => void;
 }): Promise<ReindexResult>;
+export type EmbedFailure = {
+    path: string;
+    hash: string;
+    seq: number;
+    attempts: number;
+    reason: string;
+};
 export type EmbedProgress = {
     chunksEmbedded: number;
     totalChunks: number;
     bytesProcessed: number;
     totalBytes: number;
+    /** Active failed chunks still awaiting a successful retry. */
     errors: number;
+    failures?: EmbedFailure[];
 };
 export type EmbedResult = {
     docsProcessed: number;
     chunksEmbedded: number;
+    /** Active failed chunks that did not recover after retries. */
     errors: number;
+    failures?: EmbedFailure[];
     durationMs: number;
 };
+export type EmbedOptions = {
+    force?: boolean;
+    model?: string;
+    /**
+     * Restrict embedding to documents in a single collection.
+     * When omitted, all pending documents across every collection are embedded.
+     */
+    collection?: string;
+    maxDocsPerBatch?: number;
+    maxBatchBytes?: number;
+    chunkStrategy?: ChunkStrategy;
+    onProgress?: (info: EmbedProgress) => void;
+};
 /**
  * Generate vector embeddings for documents that need them.
  * Pure function — no console output, no db lifecycle management.
  * Uses the store's LlamaCpp instance if set, otherwise the global singleton.
  */
-export declare function generateEmbeddings(store: Store, options?: {
-    force?: boolean;
-    model?: string;
-    onProgress?: (info: EmbedProgress) => void;
-}): Promise<EmbedResult>;
+export declare function generateEmbeddings(store: Store, options?: EmbedOptions): Promise<EmbedResult>;
 /**
  * Create a new store instance with the given database path.
  * If no path is provided, uses the default path (~/.cache/qmd/index.sqlite).
@@ -432,13 +483,19 @@ export type IndexStatus = {
     hasVectorIndex: boolean;
     collections: CollectionInfo[];
 };
-export declare function getHashesNeedingEmbedding(db: Database): number;
+export declare function getHashesNeedingEmbedding(db: Database, collection?: string, model?: string): number;
 export type IndexHealthInfo = {
     needsEmbedding: number;
     totalDocs: number;
     daysStale: number | null;
 };
-export declare function getIndexHealth(db: Database): IndexHealthInfo;
+export type LegacyFingerprintAdoptionResult = {
+    checked: boolean;
+    adopted: number;
+    reason: string;
+};
+export declare function maybeAdoptLegacyEmbeddingFingerprint(store: Store, model?: string): Promise<LegacyFingerprintAdoptionResult>;
+export declare function getIndexHealth(db: Database, model?: string): IndexHealthInfo;
 export declare function getCacheKey(url: string, body: object): string;
 export declare function getCachedResult(db: Database, cacheKey: string): string | null;
 export declare function setCachedResult(db: Database, cacheKey: string, result: string): void;
@@ -454,7 +511,9 @@ export declare function deleteLLMCache(db: Database): number;
  */
 export declare function deleteInactiveDocuments(db: Database): number;
 /**
- * Remove orphaned content hashes that are not referenced by any active document.
+ * Remove orphaned content hashes that are not referenced by any document.
+ * Inactive documents are soft-deleted tombstones, so their content rows must
+ * remain referenced until deleteInactiveDocuments() hard-deletes them.
  * Returns the number of orphaned content hashes deleted.
  */
 export declare function cleanupOrphanedContent(db: Database): number;
@@ -487,6 +546,20 @@ export declare function findActiveDocument(db: Database, collectionName: string,
     hash: string;
     title: string;
 } | null;
+/**
+ * Find an active document, falling back to a case-insensitive path match.
+ * If found under a different casing, renames it in-place and rebuilds the
+ * FTS entry. Embeddings are keyed by content hash, so the rename is
+ * safe — no re-embedding required.
+ *
+ * @internal Used by reindexCollection and indexFiles during qmd update.
+ * Returns null if the document does not exist under either path.
+ */
+export declare function findOrMigrateLegacyDocument(db: Database, collectionName: string, path: string): {
+    id: number;
+    hash: string;
+    title: string;
+} | null;
 /**
  * Update the title and modified_at timestamp for a document.
  */
@@ -505,15 +578,34 @@ export declare function deactivateDocument(db: Database, collectionName: string,
  */
 export declare function getActiveDocumentPaths(db: Database, collectionName: string): string[];
 export { formatQueryForEmbedding, formatDocForEmbedding };
+/**
+ * Chunk a document using regex-only break point detection.
+ * This is the sync, backward-compatible API used by tests and legacy callers.
+ */
 export declare function chunkDocument(content: string, maxChars?: number, overlapChars?: number, windowChars?: number): {
     text: string;
     pos: number;
 }[];
+/**
+ * Async AST-aware chunking. Detects language from filepath, computes AST
+ * break points for supported code files, merges with regex break points,
+ * and delegates to the shared chunk algorithm.
+ *
+ * Falls back to regex-only when strategy is "regex", filepath is absent,
+ * or language is unsupported.
+ */
+export declare function chunkDocumentAsync(content: string, maxChars?: number, overlapChars?: number, windowChars?: number, filepath?: string, chunkStrategy?: ChunkStrategy): Promise<{
+    text: string;
+    pos: number;
+}[]>;
 /**
  * Chunk a document by actual token count using the LLM tokenizer.
  * More accurate than character-based chunking but requires async.
+ *
+ * When filepath and chunkStrategy are provided, uses AST-aware break points
+ * for supported code files.
  */
-export declare function chunkDocumentByTokens(content: string, maxTokens?: number, overlapTokens?: number, windowTokens?: number): Promise<{
+export declare function chunkDocumentByTokens(content: string, maxTokens?: number, overlapTokens?: number, windowTokens?: number, filepath?: string, chunkStrategy?: ChunkStrategy, signal?: AbortSignal): Promise<{
     text: string;
     pos: number;
     tokens: number;
@@ -640,6 +732,7 @@ export declare function getCollectionsWithoutContext(db: Database): {
  * Useful for suggesting where context might be needed.
  */
 export declare function getTopLevelPathsWithoutContext(db: Database, collectionName: string): string[];
+export declare function sanitizeFTS5Term(term: string): string;
 /**
  * Validate that a vec/hyde query doesn't use lex-only syntax.
  * Returns error message if invalid, null if valid.
@@ -652,21 +745,39 @@ export declare function searchVec(db: Database, query: string, model: string, li
  * Get all unique content hashes that need embeddings (from active documents).
  * Returns hash, document body, and a sample path for display purposes.
  */
-export declare function getHashesForEmbedding(db: Database): {
+export declare function getHashesForEmbedding(db: Database, model?: string): {
     hash: string;
     body: string;
     path: string;
 }[];
 /**
- * Clear all embeddings from the database (force re-index).
- * Deletes all rows from content_vectors and drops the vectors_vec table.
+ * Clear embeddings for the whole index, or just for one collection.
+ *
+ * When `collection` is omitted the entire content_vectors table is emptied and
+ * the vectors_vec virtual table is dropped (it is recreated with the right
+ * dimensions on the next embed run).
+ *
+ * When `collection` is provided, only vectors whose hash is referenced
+ * exclusively by active documents in that collection are removed. Hashes
+ * shared with active documents in other collections are left in place so
+ * vector search keeps working there (content_vectors is keyed globally by
+ * content hash; identical document bodies across collections share a row).
+ * vectors_vec is preserved so other collections keep working unless the scoped
+ * clear empties content_vectors entirely, in which case it is dropped so the
+ * next embed can recreate the table with the current dimensions.
  */
-export declare function clearAllEmbeddings(db: Database): void;
+export declare function clearAllEmbeddings(db: Database, collection?: string): void;
 /**
  * Insert a single embedding into both content_vectors and vectors_vec tables.
  * The hash_seq key is formatted as "hash_seq" for the vectors_vec table.
+ *
+ * content_vectors is inserted first so that getHashesForEmbedding (which checks
+ * only content_vectors) won't re-select the hash on a crash between the two inserts.
+ *
+ * vectors_vec uses DELETE + INSERT instead of INSERT OR REPLACE because sqlite-vec's
+ * vec0 virtual tables silently ignore the OR REPLACE conflict clause.
  */
-export declare function insertEmbedding(db: Database, hash: string, seq: number, pos: number, embedding: Float32Array, model: string, embeddedAt: string): void;
+export declare function insertEmbedding(db: Database, hash: string, seq: number, pos: number, embedding: Float32Array, model: string, embeddedAt: string, totalChunks?: number, fingerprint?: string): void;
 export declare function expandQuery(query: string, model: string | undefined, db: Database, intent?: string, llmOverride?: LlamaCpp): Promise<ExpandedQuery[]>;
 export declare function rerank(query: string, documents: {
     file: string;
@@ -711,7 +822,7 @@ export declare function findDocuments(db: Database, pattern: string, options?: {
     docs: MultiGetResult[];
     errors: string[];
 };
-export declare function getStatus(db: Database): IndexStatus;
+export declare function getStatus(db: Database, model?: string): IndexStatus;
 export type SnippetResult = {
     line: number;
     snippet: string;
@@ -763,6 +874,7 @@ export interface HybridQueryOptions {
     explain?: boolean;
     intent?: string;
     skipRerank?: boolean;
+    chunkStrategy?: ChunkStrategy;
     hooks?: SearchHooks;
 }
 export interface HybridQueryResult {
@@ -782,6 +894,18 @@ export type RankedListMeta = {
     queryType: "original" | "lex" | "vec" | "hyde";
     query: string;
 };
+/**
+ * RRF list weights for hybridQuery.
+ *
+ * Original-query retrieval paths are the primary evidence and get 2x weight:
+ * - original FTS
+ * - original vector search
+ *
+ * Expansion-derived lists (lex/vec/hyde) stay at 1x regardless of list order,
+ * so a lex expansion inserted before original vector search cannot steal the
+ * original vector boost.
+ */
+export declare function getHybridRrfWeights(rankedListMeta: RankedListMeta[]): number[];
 /**
  * Hybrid search: BM25 + vector + query expansion + RRF + chunked reranking.
  *
@@ -836,6 +960,7 @@ export interface StructuredSearchOptions {
     intent?: string;
     /** Skip LLM reranking, use only RRF scores */
     skipRerank?: boolean;
+    chunkStrategy?: ChunkStrategy;
     hooks?: SearchHooks;
 }
 /**