npm - @tryformation/querylight-cli - Versions diffs - 0.2.2 → 0.2.4 - Mend

@tryformation/querylight-cli 0.2.2 → 0.2.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (13)

package/README.md +33 -3
package/dist/cli/format.d.ts +2 -2
package/dist/cli/main.js +694 -135
package/dist/core/constants.d.ts +1 -1
package/dist/index/querylight-indexer.d.ts +2 -2
package/dist/index.d.ts +1 -0
package/dist/index.js +592 -123
package/dist/query/search-service.d.ts +14 -1
package/dist/server/search-api.d.ts +15 -0
package/dist/types/models.d.ts +36 -1
package/dist/vector/dense.d.ts +6 -1
package/package.json +2 -2
package/scripts/sparse-encode.py +29 -8

package/dist/cli/main.js CHANGED

@@ -2,8 +2,8 @@
 // src/cli/run-cli.ts
 import { Command, Option } from "commander";
-import { stat as stat4 } from "fs/promises";
-import path21 from "path";
+import { readFile as readFile11, stat as stat5 } from "fs/promises";
+import path22 from "path";
 // src/chunk/chunker.ts
 import { readFile as readFile3 } from "fs/promises";
@@ -16,7 +16,7 @@ import path from "path";
 import YAML from "yaml";
 // src/core/constants.ts
-var PACKAGE_VERSION = "0.2.1";
+var PACKAGE_VERSION = "0.2.3";
 var DEFAULT_WORKSPACE = ".kb";
 var DEFAULT_SHARED_MODEL_CACHE_DIR = "~/.qli/models/huggingface";
 var LEGACY_WORKSPACE_MODEL_CACHE_DIR = ".kb/models/huggingface";
@@ -53,7 +53,7 @@ var defaultConfig = () => ({
     defaultMode: "lexical",
     dense: {
       enabled: true,
-      modelId: "Xenova/all-MiniLM-L6-v2",
+      modelId: "Xenova/paraphrase-MiniLM-L3-v2",
       cacheDir: DEFAULT_SHARED_MODEL_CACHE_DIR,
       indexHashTables: 8,
       indexRandomSeed: 42,
@@ -61,7 +61,7 @@ var defaultConfig = () => ({
     },
     sparse: {
       enabled: true,
-      modelId: "opensearch-project/opensearch-neural-sparse-encoding-doc-v3-distill",
+      modelId: "opensearch-project/opensearch-neural-sparse-encoding-doc-v2-mini",
       cacheDir: DEFAULT_SHARED_MODEL_CACHE_DIR,
       documentTopTokens: 128,
       queryEncoding: "tokenizer-token-weights",
@@ -374,7 +374,7 @@ async function assertWorkspaceExists(workspacePath) {
 }
 // src/index/querylight-indexer.ts
-import { Analyzer, DocumentIndex, KeywordTokenizer, LowerCaseTextFilter, RankingAlgorithm, TextFieldIndex } from "@tryformation/querylight-ts";
+import { Analyzer, DateFieldIndex, DocumentIndex, KeywordTokenizer, LowerCaseTextFilter, RankingAlgorithm, StoredSourceIndex, TextFieldIndex } from "@tryformation/querylight-ts";
 import path11 from "path";
 // src/vector/dense.ts
@@ -682,15 +682,26 @@ function createSparseChunkText(chunk) {
 // src/vector/dense.ts
 var denseEmbedderFactory = null;
 var EXACT_DENSE_RERANK_THRESHOLD = 5e3;
+function normalizeDenseEmbedder(embedder) {
+  if (typeof embedder === "function") {
+    return { embed: embedder };
+  }
+  return embedder;
+}
 async function createEmbedder(cacheDir, modelId) {
   if (denseEmbedderFactory) {
-    return denseEmbedderFactory(cacheDir, modelId);
+    return normalizeDenseEmbedder(await denseEmbedderFactory(cacheDir, modelId));
   }
   const runtime = await getDenseTransformersRuntime(cacheDir);
   const extractor = await runtime.pipeline("feature-extraction", modelId);
-  return async (text) => {
-    const output = await extractor(text, { pooling: "mean", normalize: true });
-    return output.tolist()[0];
+  return {
+    async embed(text) {
+      const output = await extractor(text, { pooling: "mean", normalize: true });
+      return output.tolist()[0];
+    },
+    async dispose() {
+      await extractor.dispose();
+    }
   };
 }
 function exactDenseQuery(payload, vector, topK) {
@@ -699,8 +710,12 @@ function exactDenseQuery(payload, vector, topK) {
 async function pullDenseModel(workspacePath, config) {
   const cacheDir = resolveCacheDir(workspacePath, config.cacheDir);
   await mkdir4(cacheDir, { recursive: true });
-  const embed = await createEmbedder(cacheDir, config.modelId);
-  await embed("warm dense model cache");
+  const embedder = await createEmbedder(cacheDir, config.modelId);
+  try {
+    await embedder.embed("warm dense model cache");
+  } finally {
+    await embedder.dispose?.();
+  }
 }
 async function buildDenseVectors({
   workspacePath,
@@ -710,53 +725,57 @@ async function buildDenseVectors({
   const chunks = await readJsonl(path8.join(workspacePath, "chunks", "chunks.jsonl"));
   const cacheDir = resolveCacheDir(workspacePath, config.cacheDir);
   await mkdir4(cacheDir, { recursive: true });
-  const embed = await createEmbedder(cacheDir, config.modelId);
-  const records = [];
-  let dimensions = 0;
-  reportProgress(progress, `Encoding ${chunks.length} chunk${chunks.length === 1 ? "" : "s"} for dense retrieval`);
-  for (const chunk of chunks) {
-    const embedding = await embed(createDenseChunkText(chunk));
-    dimensions ||= embedding.length;
-    records.push({
-      chunkId: chunk.id,
-      documentId: chunk.documentId,
-      sourceId: chunk.sourceId,
-      title: chunk.title,
-      uri: chunk.uri,
-      headingPath: chunk.headingPath,
-      text: chunk.text,
-      embedding
+  const embedder = await createEmbedder(cacheDir, config.modelId);
+  try {
+    const records = [];
+    let dimensions = 0;
+    reportProgress(progress, `Encoding ${chunks.length} chunk${chunks.length === 1 ? "" : "s"} for dense retrieval`);
+    for (const chunk of chunks) {
+      const embedding = await embedder.embed(createDenseChunkText(chunk));
+      dimensions ||= embedding.length;
+      records.push({
+        chunkId: chunk.id,
+        documentId: chunk.documentId,
+        sourceId: chunk.sourceId,
+        title: chunk.title,
+        uri: chunk.uri,
+        headingPath: chunk.headingPath,
+        text: chunk.text,
+        embedding
+      });
+      if (records.length === 1 || records.length % 100 === 0 || records.length === chunks.length) {
+        reportProgressDetail(progress, `Encoded ${records.length}/${chunks.length} chunks for dense retrieval`);
+      }
+    }
+    reportProgress(progress, "Building dense vector index");
+    const index = new VectorFieldIndex({
+      numHashTables: config.indexHashTables,
+      dimensions,
+      random: createSeededRandom(config.indexRandomSeed)
     });
-    if (records.length === 1 || records.length % 100 === 0 || records.length === chunks.length) {
-      reportProgressDetail(progress, `Encoded ${records.length}/${chunks.length} chunks for dense retrieval`);
+    for (const record of records) {
+      index.insert(record.chunkId, [record.embedding]);
     }
+    const metadata = {
+      createdAt: (/* @__PURE__ */ new Date()).toISOString(),
+      modelId: config.modelId,
+      dimensions,
+      hashTables: config.indexHashTables,
+      randomSeed: config.indexRandomSeed,
+      chunkCount: records.length,
+      indexHash: sha256(JSON.stringify(index.indexState))
+    };
+    const payload = {
+      metadata,
+      indexState: index.indexState,
+      chunks: records
+    };
+    await writeDensePayload(workspacePath, payload);
+    reportProgress(progress, `Dense vectors written for ${records.length} chunk${records.length === 1 ? "" : "s"}`);
+    return payload;
+  } finally {
+    await embedder.dispose?.();
   }
-  reportProgress(progress, "Building dense vector index");
-  const index = new VectorFieldIndex({
-    numHashTables: config.indexHashTables,
-    dimensions,
-    random: createSeededRandom(config.indexRandomSeed)
-  });
-  for (const record of records) {
-    index.insert(record.chunkId, [record.embedding]);
-  }
-  const metadata = {
-    createdAt: (/* @__PURE__ */ new Date()).toISOString(),
-    modelId: config.modelId,
-    dimensions,
-    hashTables: config.indexHashTables,
-    randomSeed: config.indexRandomSeed,
-    chunkCount: records.length,
-    indexHash: sha256(JSON.stringify(index.indexState))
-  };
-  const payload = {
-    metadata,
-    indexState: index.indexState,
-    chunks: records
-  };
-  await writeDensePayload(workspacePath, payload);
-  reportProgress(progress, `Dense vectors written for ${records.length} chunk${records.length === 1 ? "" : "s"}`);
-  return payload;
 }
 async function denseQuery({
   workspacePath,
@@ -766,21 +785,25 @@ async function denseQuery({
 }) {
   const payload = await readDensePayload(workspacePath);
   const cacheDir = resolveCacheDir(workspacePath, config.cacheDir);
-  const embed = await createEmbedder(cacheDir, config.modelId);
-  const vector = await embed(query);
-  if (payload.chunks.length <= EXACT_DENSE_RERANK_THRESHOLD) {
+  const embedder = await createEmbedder(cacheDir, config.modelId);
+  try {
+    const vector = await embedder.embed(query);
+    if (payload.chunks.length <= EXACT_DENSE_RERANK_THRESHOLD) {
+      return exactDenseQuery(payload, vector, topK);
+    }
+    const index = new VectorFieldIndex({
+      numHashTables: payload.metadata.hashTables,
+      dimensions: payload.metadata.dimensions,
+      random: createSeededRandom(payload.metadata.randomSeed)
+    }).loadState(payload.indexState);
+    const approximateHits = index.query(vector, topK);
+    if (approximateHits.length >= topK) {
+      return approximateHits;
+    }
     return exactDenseQuery(payload, vector, topK);
+  } finally {
+    await embedder.dispose?.();
   }
-  const index = new VectorFieldIndex({
-    numHashTables: payload.metadata.hashTables,
-    dimensions: payload.metadata.dimensions,
-    random: createSeededRandom(payload.metadata.randomSeed)
-  }).loadState(payload.indexState);
-  const approximateHits = index.query(vector, topK);
-  if (approximateHits.length >= topK) {
-    return approximateHits;
-  }
-  return exactDenseQuery(payload, vector, topK);
 }
 // src/vector/sparse.ts
@@ -1091,12 +1114,19 @@ function keywordFieldIndex() {
 function createIndexMapping(extraFields = []) {
   const lexical = new TextFieldIndex(void 0, void 0, RankingAlgorithm.BM25);
   const mapping = {
+    _source: new StoredSourceIndex(),
     text: lexical,
     title: new TextFieldIndex(void 0, void 0, RankingAlgorithm.BM25),
     uri: keywordFieldIndex(),
     sourceId: keywordFieldIndex(),
+    sourceName: keywordFieldIndex(),
     tags: keywordFieldIndex(),
-    sourceType: keywordFieldIndex()
+    sourceType: keywordFieldIndex(),
+    publicationDate: new DateFieldIndex(),
+    firstSeenAt: new DateFieldIndex(),
+    lastSeenAt: new DateFieldIndex(),
+    lastChangedAt: new DateFieldIndex(),
+    crawledAt: new DateFieldIndex()
   };
   for (const field of extraFields) {
     mapping[field] = keywordFieldIndex();
@@ -1132,8 +1162,12 @@ async function buildIndex({
   const sources = await readJsonl(path11.join(workspacePath, "sources", "sources.jsonl"));
   const metadataFields = [...new Set(chunks.flatMap((chunk) => Object.keys(chunk.metadata).map((key) => `metadata.${key}`)))];
   const index = new DocumentIndex(createIndexMapping(metadataFields));
+  const documentsById = new Map(documents.map((document) => [document.id, document]));
+  const sourcesById = new Map(sources.map((source) => [source.id, source]));
   reportProgress(progress, `Building lexical index from ${chunks.length} chunk${chunks.length === 1 ? "" : "s"}`);
   for (const chunk of chunks) {
+    const document = documentsById.get(chunk.documentId);
+    const source = sourcesById.get(chunk.sourceId);
     index.index({
       id: chunk.id,
       fields: {
@@ -1141,9 +1175,33 @@ async function buildIndex({
         title: [chunk.title],
         uri: [chunk.uri.toLowerCase()],
         sourceId: [chunk.sourceId.toLowerCase()],
+        sourceName: source ? [source.name.toLowerCase()] : [],
         tags: Array.isArray(chunk.metadata.tags) ? chunk.metadata.tags.map((tag) => String(tag).toLowerCase()) : [],
         sourceType: [String(chunk.metadata.sourceType ?? "").toLowerCase()],
+        publicationDate: document?.publicationDate ? [document.publicationDate] : [],
+        firstSeenAt: [document?.firstSeenAt ?? chunk.firstSeenAt],
+        lastSeenAt: [document?.lastSeenAt ?? chunk.lastSeenAt],
+        lastChangedAt: [document?.lastChangedAt ?? chunk.lastChangedAt],
+        crawledAt: document?.crawledAt ? [document.crawledAt] : [],
         ...flattenMetadata(chunk.metadata)
+      },
+      source: {
+        chunkId: chunk.id,
+        documentId: chunk.documentId,
+        sourceId: chunk.sourceId,
+        sourceType: document?.sourceType ?? "text",
+        sourceName: source?.name,
+        title: chunk.title,
+        uri: chunk.uri,
+        headingPath: chunk.headingPath,
+        text: chunk.text,
+        normalizedPath: document?.normalizedPath,
+        publicationDate: document?.publicationDate ?? null,
+        crawledAt: document?.crawledAt,
+        firstSeenAt: document?.firstSeenAt ?? chunk.firstSeenAt,
+        lastSeenAt: document?.lastSeenAt ?? chunk.lastSeenAt,
+        lastChangedAt: document?.lastChangedAt ?? chunk.lastChangedAt,
+        metadata: chunk.metadata
       }
     });
   }
@@ -1152,7 +1210,7 @@ async function buildIndex({
   const metadata = {
     id: `index_${createdAt.replace(/[:.]/g, "-")}`,
     createdAt,
-    querylightVersion: "0.10.0",
+    querylightVersion: "0.11.0",
     kbVersion: "0.1.0",
     documentCount: documents.length,
     chunkCount: chunks.length,
@@ -2138,13 +2196,17 @@ function isAllowed(url, baseUrl, includePatterns, excludePatterns, disallowRules
   if (url.search.length > 0) {
     return false;
   }
-  if (url.pathname.endsWith(".xml")) {
+  const pathname = url.pathname.toLowerCase();
+  if (pathname.endsWith(".xml")) {
     return false;
   }
-  if (url.pathname.includes("/cdn-cgi/")) {
+  if (pathname.endsWith(".pdf")) {
     return false;
   }
-  if (url.pathname === "/search" || url.pathname === "/search/" || url.pathname.endsWith("/search/")) {
+  if (pathname.includes("/cdn-cgi/")) {
+    return false;
+  }
+  if (pathname === "/search" || pathname === "/search/" || pathname.endsWith("/search/")) {
     return false;
   }
   if (disallowRules.some((rule) => rule !== "/" && url.pathname.startsWith(rule))) {
@@ -2778,7 +2840,7 @@ async function discoverWebsiteFeed(websiteUrl, userAgent) {
 // src/query/search-service.ts
 import { readFile as readFile10 } from "fs/promises";
-import { BoolQuery, MatchQuery, OP, TermQuery, reciprocalRankFusion } from "@tryformation/querylight-ts";
+import { reciprocalRankFusion, searchJsonDsl } from "@tryformation/querylight-ts";
 import path18 from "path";
 async function loadHydratedIndex(workspacePath) {
   let state;
@@ -2806,24 +2868,6 @@ function matchesPrefix(value, prefixes) {
   const lower = value.toLowerCase();
   return prefixes.some((prefix) => lower.startsWith(prefix));
 }
-function buildSearchQuery(query, filters) {
-  const sourceIds = normalizeFilterValues([filters.sourceId, ...filters.sourceIds ?? []].filter((value) => Boolean(value)));
-  const sourceTypes = normalizeFilterValues([filters.sourceType, ...filters.sourceTypes ?? []].filter((value) => Boolean(value)));
-  const tags = normalizeFilterValues([filters.tag, ...filters.tags ?? []].filter((value) => Boolean(value)));
-  return new BoolQuery({
-    should: [
-      new MatchQuery({ field: "title", text: query, operation: OP.AND, boost: 6 }),
-      new MatchQuery({ field: "text", text: query, operation: OP.AND, boost: 4 }),
-      new MatchQuery({ field: "text", text: query, operation: OP.OR, boost: 2 })
-    ],
-    filter: [
-      ...sourceIds.length === 1 ? [new TermQuery({ field: "sourceId", text: sourceIds[0] })] : [],
-      ...sourceTypes.length === 1 ? [new TermQuery({ field: "sourceType", text: sourceTypes[0] })] : [],
-      ...tags.length === 1 ? [new TermQuery({ field: "tags", text: tags[0] })] : [],
-      ...(filters.metadata ?? []).map(({ key, value }) => new TermQuery({ field: `metadata.${key}`, text: value.toLowerCase() }))
-    ]
-  });
-}
 function isValidDate(value) {
   return typeof value === "string" && !Number.isNaN(new Date(value).getTime());
 }
@@ -3022,6 +3066,185 @@ async function buildSnippetWithAdjacentChunks(chunk, query, {
   }
   return buildExpandedParagraphSnippet(paragraphs, currentIndex, query);
 }
+function buildSearchDslRequest({
+  query,
+  topK,
+  filters,
+  dateRanges
+}) {
+  const filterClauses = [];
+  const sourceIds = normalizeFilterValues([filters.sourceId, ...filters.sourceIds ?? []].filter((value) => Boolean(value)));
+  const sourceNames = normalizeFilterValues([filters.sourceName, ...filters.sourceNames ?? []].filter((value) => Boolean(value)));
+  const sourceTypes = normalizeFilterValues([filters.sourceType, ...filters.sourceTypes ?? []].filter((value) => Boolean(value)));
+  const uriPrefixes = normalizeFilterValues([filters.uriPrefix, ...filters.uriPrefixes ?? []].filter((value) => Boolean(value)));
+  const tags = normalizeFilterValues([filters.tag, ...filters.tags ?? []].filter((value) => Boolean(value)));
+  if (sourceIds.length > 0) {
+    filterClauses.push({ terms: { sourceId: sourceIds } });
+  }
+  if (sourceNames.length > 0) {
+    filterClauses.push({ terms: { sourceName: sourceNames } });
+  }
+  if (sourceTypes.length > 0) {
+    filterClauses.push({ terms: { sourceType: sourceTypes } });
+  }
+  if (uriPrefixes.length > 0) {
+    filterClauses.push({
+      bool: {
+        should: uriPrefixes.map((prefix) => ({ prefix: { uri: prefix } })),
+        minimum_should_match: 1
+      }
+    });
+  }
+  if (tags.length > 0) {
+    filterClauses.push({ terms: { tags } });
+  }
+  if (filters.hasPublicationDate) {
+    filterClauses.push({ exists: { field: "publicationDate" } });
+  }
+  for (const { key, value } of filters.metadata ?? []) {
+    filterClauses.push({ term: { [`metadata.${key}`]: value.toLowerCase() } });
+  }
+  for (const { field, from, to } of dateRanges) {
+    filterClauses.push({
+      range: {
+        [field]: {
+          ...from ? { gte: from } : {},
+          ...to ? { lte: to } : {}
+        }
+      }
+    });
+  }
+  return {
+    size: topK,
+    query: {
+      bool: {
+        should: [
+          { match: { title: { query, operator: "and", boost: 6 } } },
+          { match: { text: { query, operator: "and", boost: 4 } } },
+          { match: { text: { query, operator: "or", boost: 2 } } }
+        ],
+        filter: filterClauses,
+        minimum_should_match: 1
+      }
+    }
+  };
+}
+function sourceToChunkRecord(source) {
+  return {
+    id: source.chunkId,
+    documentId: source.documentId,
+    sourceId: source.sourceId,
+    title: source.title,
+    uri: source.uri,
+    headingPath: source.headingPath,
+    text: source.text,
+    contentHash: "",
+    metadata: source.metadata,
+    firstSeenAt: source.firstSeenAt,
+    lastSeenAt: source.lastSeenAt,
+    lastChangedAt: source.lastChangedAt
+  };
+}
+function sourceToDocumentRecord(source) {
+  return {
+    id: source.documentId,
+    sourceId: source.sourceId,
+    sourceType: source.sourceType,
+    title: source.title,
+    uri: source.uri,
+    sourceUri: source.uri,
+    mimeType: "text/plain",
+    normalizedPath: source.normalizedPath ?? "",
+    contentHash: "",
+    metadata: source.metadata,
+    publicationDate: source.publicationDate ?? null,
+    crawledAt: source.crawledAt,
+    firstSeenAt: source.firstSeenAt,
+    lastSeenAt: source.lastSeenAt,
+    lastChangedAt: source.lastChangedAt
+  };
+}
+async function materializeSearchHit(hit, query, config, orderedChunkCache, showChunks) {
+  const source = hit._source;
+  const chunk = sourceToChunkRecord(source);
+  const document = sourceToDocumentRecord(source);
+  const snippet = await buildSnippetWithAdjacentChunks(chunk, query, { document, config, orderedChunkCache });
+  const enrichedSource = {
+    ...source,
+    snippet
+  };
+  const result = {
+    chunkId: source.chunkId,
+    documentId: source.documentId,
+    sourceId: source.sourceId,
+    sourceType: source.sourceType,
+    score: hit._score,
+    title: chooseResultTitle(chunk),
+    uri: source.uri,
+    snippet,
+    text: showChunks ? source.text : void 0,
+    publicationDate: source.publicationDate ?? null,
+    firstSeenAt: source.firstSeenAt,
+    lastSeenAt: source.lastSeenAt,
+    lastChangedAt: source.lastChangedAt,
+    metadata: source.metadata
+  };
+  return {
+    hit: {
+      ...hit,
+      _source: enrichedSource
+    },
+    result
+  };
+}
+function createSearchResponse(retrievalMode, hits, took, aggregations) {
+  return {
+    retrievalMode,
+    took,
+    hits: {
+      total: {
+        value: hits.length,
+        relation: "eq"
+      },
+      max_score: hits.length > 0 ? Math.max(...hits.map((hit) => hit._score)) : null,
+      hits
+    },
+    aggregations
+  };
+}
+function searchResultsFromResponse(response2, showChunks = false) {
+  return response2.hits.hits.map((hit) => ({
+    chunkId: hit._source.chunkId,
+    documentId: hit._source.documentId,
+    sourceId: hit._source.sourceId,
+    sourceType: hit._source.sourceType,
+    score: hit._score,
+    title: chooseResultTitle(sourceToChunkRecord(hit._source)),
+    uri: hit._source.uri,
+    snippet: hit._source.snippet ?? hit.highlight?.text?.join("\n\n") ?? buildSnippet(hit._source.text, hit._source.title),
+    text: showChunks ? hit._source.text : void 0,
+    publicationDate: hit._source.publicationDate ?? null,
+    firstSeenAt: hit._source.firstSeenAt,
+    lastSeenAt: hit._source.lastSeenAt,
+    lastChangedAt: hit._source.lastChangedAt,
+    metadata: hit._source.metadata
+  }));
+}
+async function searchJsonRequest({
+  index,
+  request,
+  indexName = "querylight"
+}) {
+  return searchJsonDsl({ index, request, indexName });
+}
+async function searchJsonIndex({
+  workspacePath,
+  request,
+  indexName = "querylight"
+}) {
+  const index = await loadHydratedIndex(workspacePath);
+  return searchJsonRequest({ index, request, indexName });
+}
 function normalizeDisplayTitle(title) {
   return title.replace(/\s*\|\s*Querylight TS Demo\s*$/i, "").replace(/\s+/g, " ").trim();
 }
@@ -3159,6 +3382,7 @@ async function searchIndex({
   retrievalMode,
   showChunks = false
 }) {
+  const startedAt = Date.now();
   const config = await loadConfig(workspacePath);
   const mode = retrievalMode ?? config.retrieval.defaultMode;
   const candidateLimit = Math.max(topK * 5, 50);
@@ -3215,12 +3439,48 @@ async function searchIndex({
         };
       })
     );
-    return { retrievalMode: "lexical", results: latestResults.filter((result) => result != null) };
+    const hits2 = latestResults.filter((result) => result != null).map((result) => {
+      const chunk = chunks.get(result.chunkId);
+      const document = documents.get(result.documentId);
+      const source = sources.get(result.sourceId);
+      return {
+        _index: "querylight",
+        _id: result.chunkId,
+        _score: result.score,
+        _source: {
+          chunkId: result.chunkId,
+          documentId: result.documentId,
+          sourceId: result.sourceId,
+          sourceType: result.sourceType,
+          sourceName: source?.name,
+          title: chunk.title,
+          uri: result.uri,
+          headingPath: chunk.headingPath,
+          text: chunk.text,
+          snippet: result.snippet,
+          normalizedPath: document.normalizedPath,
+          publicationDate: result.publicationDate ?? null,
+          crawledAt: document.crawledAt,
+          firstSeenAt: result.firstSeenAt,
+          lastSeenAt: result.lastSeenAt,
+          lastChangedAt: result.lastChangedAt,
+          metadata: result.metadata
+        }
+      };
+    });
+    return createSearchResponse("lexical", hits2, Date.now() - startedAt);
   }
   const lexicalHits = async () => {
-    const index = await loadHydratedIndex(workspacePath);
-    const all = await index.searchRequest({ query: buildSearchQuery(normalizedQuery, { sourceId, sourceIds, sourceType, sourceTypes, tag, tags, metadata }), limit: candidateLimit });
-    return all.filter(([chunkId]) => filterIds.includes(chunkId)).slice(0, candidateLimit);
+    const response2 = await searchJsonIndex({
+      workspacePath,
+      request: buildSearchDslRequest({
+        query: normalizedQuery,
+        topK: candidateLimit,
+        filters: { sourceId, sourceIds, sourceName, sourceNames, sourceType, sourceTypes, uriPrefix, uriPrefixes, hasPublicationDate, tag, tags, metadata },
+        dateRanges
+      })
+    });
+    return response2.hits.hits;
   };
   const denseHits = async () => {
     if (!await fileExists(denseVectorPath(workspacePath))) {
@@ -3234,15 +3494,18 @@ async function searchIndex({
     }
     return sparseQuery({ workspacePath, config: config.retrieval.sparse, query: normalizedQuery, topK: candidateLimit }).then((hits2) => hits2.filter(([chunkId]) => filterIds.includes(chunkId)).slice(0, candidateLimit));
   };
+  let lexicalResponseHits = [];
   let hits;
   if (mode === "lexical") {
-    hits = await lexicalHits();
+    lexicalResponseHits = await lexicalHits();
+    hits = lexicalResponseHits.map((hit) => [hit._id, hit._score]);
   } else if (mode === "dense") {
     hits = await denseHits();
   } else if (mode === "sparse") {
     hits = await sparseHits();
   } else {
-    const rankings = [await lexicalHits()];
+    lexicalResponseHits = await lexicalHits();
+    const rankings = [lexicalResponseHits.map((hit) => [hit._id, hit._score])];
     if (await fileExists(denseVectorPath(workspacePath))) {
       rankings.push(await denseQuery({ workspacePath, config: config.retrieval.dense, query: normalizedQuery, topK: candidateLimit }).then((dense) => dense.filter(([chunkId]) => filterIds.includes(chunkId)).slice(0, candidateLimit)));
     }
@@ -3251,38 +3514,242 @@ async function searchIndex({
     }
     hits = reciprocalRankFusion(rankings, { rankConstant: 20, weights: rankings.map((_, index) => index === 0 ? 3 : 1) }).slice(0, candidateLimit);
   }
-  const rawResults = await Promise.all(hits.map(async ([chunkId, score]) => {
+  const baseHits = mode === "lexical" ? lexicalResponseHits : hits.flatMap(([chunkId, score]) => {
     const chunk = chunks.get(chunkId);
     if (!chunk) {
-      return null;
+      return [];
     }
+    const document = documents.get(chunk.documentId);
+    const source = sources.get(chunk.sourceId);
+    return [{
+      _index: "querylight",
+      _id: chunkId,
+      _score: score,
+      _source: {
+        chunkId,
+        documentId: chunk.documentId,
+        sourceId: chunk.sourceId,
+        sourceType: document?.sourceType ?? "text",
+        sourceName: source?.name,
+        title: chunk.title,
+        uri: chunk.uri,
+        headingPath: chunk.headingPath,
+        text: chunk.text,
+        normalizedPath: document?.normalizedPath,
+        publicationDate: document?.publicationDate ?? null,
+        crawledAt: document?.crawledAt,
+        firstSeenAt: document?.firstSeenAt ?? chunk.firstSeenAt,
+        lastSeenAt: document?.lastSeenAt ?? chunk.lastSeenAt,
+        lastChangedAt: document?.lastChangedAt ?? chunk.lastChangedAt,
+        metadata: chunk.metadata
+      }
+    }];
+  });
+  const materialized = await Promise.all(baseHits.map((hit) => materializeSearchHit(hit, normalizedQuery, config, orderedChunkCache, showChunks)));
+  if (showChunks) {
+    const topHits = materialized.sort((left, right) => right.result.score - left.result.score).slice(0, topK).map(({ hit, result }) => ({ ...hit, _score: result.score }));
+    return createSearchResponse(mode, topHits, Date.now() - startedAt);
+  }
+  const reranked = rerankResultsByDocument(materialized.map(({ result }) => result), topK);
+  const byChunkId = new Map(materialized.map(({ hit }) => [hit._id, hit]));
+  const finalHits = reranked.map((result) => {
+    const hit = byChunkId.get(result.chunkId);
+    return hit ? { ...hit, _score: result.score, _source: { ...hit._source, snippet: result.snippet } } : null;
+  }).filter((hit) => hit != null);
+  return createSearchResponse(mode, finalHits, Date.now() - startedAt);
+}
+// src/server/search-api.ts
+import { createServer } from "http";
+import { readdir, stat as stat4 } from "fs/promises";
+import path19 from "path";
+async function pathIsDirectory(candidatePath) {
+  try {
+    return (await stat4(candidatePath)).isDirectory();
+  } catch {
+    return false;
+  }
+}
+async function discoverKnowledgeBases(workspacePath) {
+  try {
+    const singleWorkspace = await assertWorkspaceExists(workspacePath);
+    const config = await loadConfig(singleWorkspace);
+    const index = await loadHydratedIndex(singleWorkspace);
     return {
-      chunkId,
-      documentId: chunk.documentId,
-      sourceId: chunk.sourceId,
-      sourceType: documents.get(chunk.documentId)?.sourceType ?? "text",
-      score,
-      title: chooseResultTitle(chunk),
-      uri: chunk.uri,
-      snippet: await buildSnippetWithAdjacentChunks(chunk, normalizedQuery, {
-        document: documents.get(chunk.documentId),
-        config,
-        orderedChunkCache
-      }),
-      text: showChunks ? chunk.text : void 0,
-      publicationDate: documents.get(chunk.documentId)?.publicationDate ?? null,
-      firstSeenAt: documents.get(chunk.documentId)?.firstSeenAt ?? chunk.firstSeenAt,
-      lastSeenAt: documents.get(chunk.documentId)?.lastSeenAt ?? chunk.lastSeenAt,
-      lastChangedAt: documents.get(chunk.documentId)?.lastChangedAt ?? chunk.lastChangedAt,
-      metadata: chunk.metadata
+      mode: "single",
+      knowledgeBases: [{
+        name: config.index.name,
+        workspacePath: singleWorkspace,
+        configuredIndexName: config.index.name,
+        index
+      }]
     };
-  }));
-  const results = rawResults.filter((result) => result != null);
-  return { retrievalMode: mode, results: rerankResultsByDocument(results, topK) };
+  } catch (error) {
+    if (!(error instanceof CliError) || error.code !== "WORKSPACE_ERROR") {
+      throw error;
+    }
+  }
+  const resolvedRoot = path19.resolve(workspacePath);
+  if (!await pathIsDirectory(resolvedRoot)) {
+    throw new CliError(`workspace path does not exist: ${resolvedRoot}`, "WORKSPACE_ERROR", 3 /* WorkspaceError */);
+  }
+  const entries = await readdir(resolvedRoot, { withFileTypes: true });
+  const knowledgeBases = (await Promise.all(entries.filter((entry) => entry.isDirectory()).map(async (entry) => {
+    const candidateWorkspace = path19.join(resolvedRoot, entry.name, ".kb");
+    try {
+      const workspace = await assertWorkspaceExists(candidateWorkspace);
+      const config = await loadConfig(workspace);
+      const index = await loadHydratedIndex(workspace);
+      return {
+        name: entry.name,
+        workspacePath: workspace,
+        configuredIndexName: config.index.name,
+        index
+      };
+    } catch (error) {
+      if (error instanceof CliError && error.code === "WORKSPACE_ERROR") {
+        return null;
+      }
+      throw error;
+    }
+  }))).filter((knowledgeBase) => knowledgeBase != null);
+  if (knowledgeBases.length === 0) {
+    throw new CliError(
+      `no knowledge bases found at ${resolvedRoot}; use a .kb workspace or a directory of named subdirectories that each contain .kb`,
+      "WORKSPACE_ERROR",
+      3 /* WorkspaceError */
+    );
+  }
+  return { mode: "multi", knowledgeBases };
+}
+function sendJson(response2, statusCode, payload) {
+  response2.statusCode = statusCode;
+  response2.setHeader("content-type", "application/json; charset=utf-8");
+  response2.end(JSON.stringify(payload));
+}
+function sendError(response2, statusCode, type, reason) {
+  sendJson(response2, statusCode, {
+    error: {
+      type,
+      reason
+    },
+    status: statusCode
+  });
+}
+/**
+ * Drain an async-iterable request and return its full body decoded as UTF-8.
+ * Chunks that are not already Buffers are converted with `Buffer.from`.
+ */
+async function readRequestBody(request) {
+  const parts = [];
+  for await (const piece of request) {
+    if (Buffer.isBuffer(piece)) {
+      parts.push(piece);
+    } else {
+      parts.push(Buffer.from(piece));
+    }
+  }
+  const whole = Buffer.concat(parts);
+  return whole.toString("utf8");
+}
+/**
+ * Parse the raw HTTP body of a search request.
+ *
+ * A blank body yields an empty request object. Anything else must be JSON
+ * that decodes to a non-null, non-array object; otherwise a `CliError` with
+ * code `INVALID_ARGUMENT` is thrown.
+ */
+function parseSearchRequest(raw) {
+  const text = raw.trim();
+  if (text === "") {
+    return {};
+  }
+  const invalid = (detail) => new CliError(`invalid JSON request: ${detail}`, "INVALID_ARGUMENT", 2 /* InvalidArguments */);
+  let value;
+  try {
+    value = JSON.parse(text);
+  } catch (error) {
+    throw invalid(error instanceof Error ? error.message : String(error));
+  }
+  const isJsonObject = value !== null && typeof value === "object" && !Array.isArray(value);
+  if (!isJsonObject) {
+    throw invalid("expected a JSON object");
+  }
+  return value;
+}
+/**
+ * Return the search route advertised for a knowledge base: `/_search` in
+ * single mode, `/<name>/_search` otherwise.
+ */
+function routeForKnowledgeBase(mode, knowledgeBase) {
+  if (mode === "single") {
+    return "/_search";
+  }
+  return `/${knowledgeBase.name}/_search`;
+}
+/**
+ * Map a request pathname to the knowledge base it addresses.
+ *
+ * Single mode accepts `/_search` and `/<configuredIndexName>/_search` for the
+ * first (only) entry of `knowledgeBases`. Multi mode accepts
+ * `/<name>/_search`, where `<name>` is a key of `knowledgeBases`.
+ *
+ * The name segment is matched verbatim first and then percent-decoded, so
+ * names that need URL escaping (e.g. `my docs` requested as `my%20docs`) are
+ * reachable. The pathname is split on `/` before decoding, so an encoded
+ * slash never introduces an extra segment.
+ *
+ * @returns the matching knowledge base, or `null` when the path is not a
+ *   recognised search route.
+ */
+function resolveKnowledgeBaseForPath(pathname, mode, knowledgeBases) {
+  const segments = pathname.split("/").filter(Boolean);
+  // Malformed escapes must not throw out of routing; fall back to the raw text.
+  const decodeSegment = (segment) => {
+    try {
+      return decodeURIComponent(segment);
+    } catch {
+      return segment;
+    }
+  };
+  if (mode === "single") {
+    const knowledgeBase = [...knowledgeBases.values()][0];
+    if (!knowledgeBase) {
+      return null;
+    }
+    if (segments.length === 1 && segments[0] === "_search") {
+      return knowledgeBase;
+    }
+    if (segments.length === 2 && segments[1] === "_search") {
+      const requested = segments[0];
+      const configured = knowledgeBase.configuredIndexName;
+      if (requested === configured || decodeSegment(requested) === configured) {
+        return knowledgeBase;
+      }
+    }
+    return null;
+  }
+  if (segments.length === 2 && segments[1] === "_search") {
+    const requested = segments[0];
+    // Raw match first keeps every previously working route resolving identically.
+    return knowledgeBases.get(requested) ?? knowledgeBases.get(decodeSegment(requested)) ?? null;
+  }
+  return null;
+}
+/**
+ * Handle one HTTP request against the search API.
+ *
+ * Responds with 405 for methods other than GET/POST, 404 when the path does
+ * not resolve to a knowledge base, 400 when a `CliError` with code
+ * `INVALID_ARGUMENT` is raised while reading/parsing/searching, 500 for any
+ * other failure, and 200 with the search result otherwise.
+ */
+async function handleSearchRequest(request, response2, pathname, mode, knowledgeBases) {
+  const methodAllowed = request.method === "GET" || request.method === "POST";
+  if (!methodAllowed) {
+    response2.setHeader("allow", "GET, POST");
+    sendError(response2, 405, "method_not_allowed", `unsupported method for ${pathname}`);
+    return;
+  }
+  const target = resolveKnowledgeBaseForPath(pathname, mode, knowledgeBases);
+  if (!target) {
+    sendError(response2, 404, "resource_not_found_exception", `unknown search route: ${pathname}`);
+    return;
+  }
+  try {
+    const rawBody = await readRequestBody(request);
+    const requestBody = parseSearchRequest(rawBody);
+    // Multi mode reports the knowledge base name; single mode reports the configured index name.
+    const indexName = mode === "multi" ? target.name : target.configuredIndexName;
+    const result = await searchJsonRequest({ index: target.index, request: requestBody, indexName });
+    sendJson(response2, 200, result);
+  } catch (error) {
+    const isBadRequest = error instanceof CliError && error.code === "INVALID_ARGUMENT";
+    if (isBadRequest) {
+      sendError(response2, 400, "parse_exception", error.message);
+    } else {
+      const message = error instanceof Error ? error.message : String(error);
+      sendError(response2, 500, "search_phase_execution_exception", message);
+    }
+  }
+}
+/**
+ * Discover the knowledge bases under `workspacePath`, start an HTTP server
+ * that routes requests to `handleSearchRequest`, and resolve once it is
+ * listening.
+ *
+ * @param workspacePath path passed to `discoverKnowledgeBases`.
+ * @param host interface to bind (default `127.0.0.1`).
+ * @param port port to bind (default 3000).
+ * @returns the discovery mode, the base URL (using the port actually bound),
+ *   one `{ name, workspacePath, route }` entry per knowledge base, and a
+ *   `close()` that stops the server.
+ * @throws CliError `SERVER_ERROR` when the server did not bind to a TCP
+ *   address; rejects with the listen error if binding fails.
+ */
+async function startSearchApiServer({
+  workspacePath,
+  host = "127.0.0.1",
+  port = 3e3
+}) {
+  const { mode, knowledgeBases } = await discoverKnowledgeBases(workspacePath);
+  const byName = new Map(knowledgeBases.map((knowledgeBase) => [knowledgeBase.name, knowledgeBase]));
+  const server = createServer((request, response2) => {
+    let pathname;
+    try {
+      // Only the pathname is used for routing, so resolve against a fixed base
+      // instead of the client-controlled Host header, which may not be a valid authority.
+      pathname = new URL(request.url ?? "/", "http://localhost").pathname;
+    } catch {
+      sendError(response2, 400, "illegal_argument_exception", `invalid request target: ${request.url}`);
+      return;
+    }
+    // Last-resort guard: a rejection escaping the handler must not become an
+    // unhandled rejection, which would take the whole server process down.
+    handleSearchRequest(request, response2, pathname, mode, byName).catch((error) => {
+      if (response2.headersSent) {
+        response2.destroy();
+        return;
+      }
+      const message = error instanceof Error ? error.message : String(error);
+      sendError(response2, 500, "search_phase_execution_exception", message);
+    });
+  });
+  await new Promise((resolve2, reject) => {
+    server.once("error", reject);
+    server.listen(port, host, () => {
+      server.off("error", reject);
+      resolve2();
+    });
+  });
+  const address = server.address();
+  if (!address || typeof address === "string") {
+    throw new CliError("server failed to bind to a TCP address", "SERVER_ERROR", 1 /* GeneralError */);
+  }
+  // IPv6 literals must be bracketed to form a valid URL authority.
+  const urlHost = host.includes(":") && !host.startsWith("[") ? `[${host}]` : host;
+  const url = `http://${urlHost}:${address.port}`;
+  return {
+    mode,
+    url,
+    knowledgeBases: knowledgeBases.map((knowledgeBase) => ({
+      name: knowledgeBase.name,
+      workspacePath: knowledgeBase.workspacePath,
+      route: routeForKnowledgeBase(mode, knowledgeBase)
+    })),
+    close: async () => new Promise((resolve2, reject) => {
+      server.close((error) => error ? reject(error) : resolve2());
+    })
+  };
 }
 // src/query/related-service.ts
-import path19 from "path";
+import path20 from "path";
 function cosineSimilarity2(left, right) {
   let dot = 0;
   let leftNorm = 0;
@@ -3358,7 +3825,7 @@ async function findRelatedDocuments({
   if (!await fileExists(denseVectorPath(workspacePath))) {
     throw new CliError("dense vector index is not built; run `qli models pull --dense` and `qli rebuild`", "DENSE_INDEX_MISSING", 7 /* QueryError */);
   }
-  const documents = await readJsonl(path19.join(workspacePath, "documents", "documents.jsonl"));
+  const documents = await readJsonl(path20.join(workspacePath, "documents", "documents.jsonl"));
   const selected = resolveDocumentSelector(documents, document);
   const densePayload = await readDensePayload(workspacePath);
   const vectors = buildDocumentVectors(documents, densePayload.chunks, densePayload.metadata.dimensions);
@@ -3395,9 +3862,10 @@ async function createContext({
   retrievalMode
 }) {
   const search = await searchIndex({ workspacePath, query, topK, showChunks: true, retrievalMode });
+  const results = searchResultsFromResponse(search, true);
   const sources = [];
   let total = 0;
-  for (const result of search.results) {
+  for (const result of results) {
     const text = result.text ?? "";
     if (total + text.length > maxChars && sources.length > 0) {
       break;
@@ -3430,7 +3898,7 @@ async function createContext({
 }
 // src/report/diff-service.ts
-import path20 from "path";
+import path21 from "path";
 function chooseBaselineRun(runs, since) {
   if (since === "last-run") {
     return runs.at(-1);
@@ -3446,7 +3914,7 @@ async function diffWorkspace({
   documentId,
   since
 }) {
-  const current = await readJsonl(path20.join(workspacePath, "documents", "documents.jsonl"));
+  const current = await readJsonl(path21.join(workspacePath, "documents", "documents.jsonl"));
   const baseline = chooseBaselineRun(await listRuns(workspacePath), since);
   const previous = new Map((baseline?.documentsSnapshot ?? []).map((document) => [document.id, document]));
   const changedDocuments = current.filter((document) => (!sourceId || document.sourceId === sourceId) && (!documentId || document.id === documentId)).filter((document) => {
@@ -3498,7 +3966,8 @@ function formatSourcesTable(sources) {
   }
   return table.toString();
 }
-function formatSearchResults(results) {
+function formatSearchResults(response2) {
+  const results = searchResultsFromResponse(response2);
   return results.map((result, index) => [
     `${index + 1}. ${colors.bold(result.title)}`,
     `   URL: ${result.uri}`,
@@ -3803,6 +4272,19 @@ function parseDateValue(input, optionName) {
   }
   return parsed.toISOString();
 }
+/**
+ * Resolve a CLI JSON argument into a request object.
+ *
+ * `input` is either inline JSON or `@path`, in which case the file at `path`
+ * (resolved against the current working directory) is read as UTF-8.
+ *
+ * @returns the parsed value, which is always a non-null, non-array object.
+ * @throws CliError `INVALID_ARGUMENT` when the file cannot be read, the text
+ *   is not valid JSON, or the JSON is not an object.
+ */
+async function parseJsonArgument(input) {
+  let raw = input;
+  if (input.startsWith("@")) {
+    const requestPath = path22.resolve(input.slice(1));
+    try {
+      raw = await readFile11(requestPath, "utf8");
+    } catch (error) {
+      // Report an unreadable request file as a usage error rather than a raw fs failure.
+      const message = error instanceof Error ? error.message : String(error);
+      throw new CliError(`unable to read JSON request file ${requestPath}: ${message}`, "INVALID_ARGUMENT", 2 /* InvalidArguments */);
+    }
+  }
+  try {
+    const parsed = JSON.parse(raw);
+    if (!parsed || typeof parsed !== "object" || Array.isArray(parsed)) {
+      throw new Error("expected a JSON object");
+    }
+    return parsed;
+  } catch (error) {
+    const message = error instanceof Error ? error.message : String(error);
+    throw new CliError(`invalid JSON request: ${message}`, "INVALID_ARGUMENT", 2 /* InvalidArguments */);
+  }
+}
 function searchDateRanges(options) {
   const entries = [];
   if (options.since || options.until) {
@@ -3835,14 +4317,14 @@ function searchDateRanges(options) {
   return entries;
 }
 async function resolveWorkspace(options) {
-  return path21.resolve(options.workspace ?? DEFAULT_WORKSPACE);
+  return path22.resolve(options.workspace ?? DEFAULT_WORKSPACE);
 }
 function workspaceFromArgv(argv) {
   const index = argv.findIndex((arg) => arg === "--workspace");
   if (index >= 0 && argv[index + 1]) {
-    return path21.resolve(argv[index + 1]);
+    return path22.resolve(argv[index + 1]);
   }
-  return path21.resolve(DEFAULT_WORKSPACE);
+  return path22.resolve(DEFAULT_WORKSPACE);
 }
 async function runCli(argv, io = {}) {
   const capture = { stdout: [], stderr: [], ...io };
@@ -3936,7 +4418,7 @@ Notes:
     }
     const stored = await addSource(workspace, {
       type,
-      uri: ["file", "directory"].includes(type) ? path21.resolve(uri) : uri,
+      uri: ["file", "directory"].includes(type) ? path22.resolve(uri) : uri,
       name: options.name,
       enabled: true,
       tags: options.tag ?? [],
@@ -4147,7 +4629,7 @@ Examples:
     progress?.("info", "Rebuild complete");
     emit(global.json, capture, response("rebuild", workspace, data), `Processed ${ingest.processedSources} sources, wrote ${chunk.chunksWritten} chunks`);
   });
-  program.command("search").description("Search the built index and return ranked matching documents or chunks.").argument("[query]", "Text query. Omit it to list the latest matching documents.").option("--top-k <n>", "Maximum number of results to return.", "12").option("--source <sourceIds>", "Restrict results to one or more source ids. Use comma-separated values.").option("--source-name <names>", "Restrict results to one or more source names. Use comma-separated values.").option("--source-type <types>", `Restrict results to one or more source types. Use comma-separated values: ${SOURCE_TYPE_LIST.join(", ")}`).option("--uri-prefix <prefixes>", "Restrict results to one or more URI prefixes. Use comma-separated values.").option("--tag <tags>", "Restrict results to one or more source tags. Use comma-separated values.").option("--metadata <key=value...>", "Restrict results to sources with matching metadata.").option("--since <date>", "Shortcut for --publication-date-from.").option("--until <date>", "Shortcut for --publication-date-to.").option("--changed-since <date>", "Only include documents changed on or after this date.").option("--has-publication-date", "Only include documents with a publication date.").option("--publication-date-from <date>", "Only include documents published on or after this date.").option("--publication-date-to <date>", "Only include documents published on or before this date.").option("--first-seen-at-from <date>", "Only include documents first seen on or after this date.").option("--first-seen-at-to <date>", "Only include documents first seen on or before this date.").option("--last-seen-at-from <date>", "Only include documents last seen on or after this date.").option("--last-seen-at-to <date>", "Only include documents last seen on or before this date.").option("--last-changed-at-from <date>", "Only include documents changed on or after this date.").option("--last-changed-at-to <date>", "Only include documents changed on or before this 
date.").option("--crawled-at-from <date>", "Only include documents crawled on or after this date.").option("--crawled-at-to <date>", "Only include documents crawled on or before this date.").option("--retrieval <mode>", `Retrieval mode: ${RETRIEVAL_MODE_LIST.join(", ")}`).option("--show-chunks", "Return chunk-level matches when available.").addHelpText("after", `
+  program.command("search").description("Search the built index and return ranked matching documents or chunks. Use search-json for raw JSON DSL queries.").argument("[query]", "Text query. Omit it to list the latest matching documents.").option("--top-k <n>", "Maximum number of results to return.", "12").option("--source <sourceIds>", "Restrict results to one or more source ids. Use comma-separated values.").option("--source-name <names>", "Restrict results to one or more source names. Use comma-separated values.").option("--source-type <types>", `Restrict results to one or more source types. Use comma-separated values: ${SOURCE_TYPE_LIST.join(", ")}`).option("--uri-prefix <prefixes>", "Restrict results to one or more URI prefixes. Use comma-separated values.").option("--tag <tags>", "Restrict results to one or more source tags. Use comma-separated values.").option("--metadata <key=value...>", "Restrict results to sources with matching metadata.").option("--since <date>", "Shortcut for --publication-date-from.").option("--until <date>", "Shortcut for --publication-date-to.").option("--changed-since <date>", "Only include documents changed on or after this date.").option("--has-publication-date", "Only include documents with a publication date.").option("--publication-date-from <date>", "Only include documents published on or after this date.").option("--publication-date-to <date>", "Only include documents published on or before this date.").option("--first-seen-at-from <date>", "Only include documents first seen on or after this date.").option("--first-seen-at-to <date>", "Only include documents first seen on or before this date.").option("--last-seen-at-from <date>", "Only include documents last seen on or after this date.").option("--last-seen-at-to <date>", "Only include documents last seen on or before this date.").option("--last-changed-at-from <date>", "Only include documents changed on or after this date.").option("--last-changed-at-to <date>", "Only 
include documents changed on or before this date.").option("--crawled-at-from <date>", "Only include documents crawled on or after this date.").option("--crawled-at-to <date>", "Only include documents crawled on or before this date.").option("--retrieval <mode>", `Retrieval mode: ${RETRIEVAL_MODE_LIST.join(", ")}`).option("--show-chunks", "Return chunk-level matches when available.").addHelpText("after", `
 Examples:
   qli search "pricing api limits"
   qli search "authentication" --top-k 20 --tag docs
@@ -4160,6 +4642,7 @@ Examples:
 Notes:
   lexical works without vector models.
   dense, sparse, and hybrid require the relevant index artifacts to exist.
+  Use search-json when you want the raw Querylight 0.11 JSON DSL and hit format.
   When you omit the query, qli returns the latest matching documents sorted by publication date.`).action(async function command(query, options) {
     const global = this.optsWithGlobals();
     const workspace = await resolveWorkspace({ workspace: global.workspace });
@@ -4178,7 +4661,83 @@ Notes:
       retrievalMode: parseRetrievalMode(options.retrieval),
       showChunks: Boolean(options.showChunks)
     });
-    emit(global.json, capture, response("search", workspace, result), formatSearchResults(result.results));
+    emit(global.json, capture, response("search", workspace, result), formatSearchResults(result));
+  });
+  program.command("search-json").description("Run a raw Querylight 0.11 JSON DSL search request against the lexical index.").argument("<request>", "Inline JSON request or @path/to/request.json.").addHelpText("after", `
+Examples:
+  qli search-json '{"query":{"match":{"text":"authentication"}},"size":5}'
+  qli search-json @./search-request.json
+  qli search-json '{"query":{"bool":{"filter":[{"term":{"sourceType":"rss"}}]}},"aggs":{"types":{"terms":{"field":"sourceType","size":5}}}}' --json
+Notes:
+  search-json uses the lexical index and Querylight 0.11 JSON DSL fields.
+  Stored hit payloads are returned under _source.
+  Use --json when another tool needs the full response envelope.`).action(async function command(requestInput) {
+    const global = this.optsWithGlobals();
+    const workspace = await resolveWorkspace({ workspace: global.workspace });
+    const request = await parseJsonArgument(requestInput);
+    const result = await searchJsonIndex({
+      workspacePath: workspace,
+      request
+    });
+    emit(global.json, capture, response("search-json", workspace, result), JSON.stringify(result, null, 2));
+  });
+  program.command("serve").description("Start a small HTTP API that exposes Querylight JSON DSL search through an OpenSearch-like _search endpoint.").option("--host <host>", "Host interface to bind. Defaults to 127.0.0.1.", "127.0.0.1").option("--port <n>", "Port to bind. Use 0 to let the OS choose a free port.", "3000").addHelpText("after", `
+Examples:
+  qli serve
+  qli serve --workspace ./docs/.kb --port 4000
+  qli serve --workspace ./kbs --host 0.0.0.0 --port 4000
+Routes:
+  Single workspace: POST /_search
+  Single workspace: POST /<configured-index-name>/_search
+  Multi-KB root: POST /<directory-name>/_search
+Notes:
+  The request body must be a Querylight JSON DSL object.
+  serve only exposes lexical _search for now.
+  When --workspace points to a directory of knowledge bases, each child directory must contain its own .kb workspace.
+  Index files are loaded once at startup and reused across requests.`).action(async function command(options) {
+    const global = this.optsWithGlobals();
+    const workspace = await resolveWorkspace({ workspace: global.workspace });
+    const port = Number(options.port);
+    if (!Number.isInteger(port) || port < 0 || port > 65535) {
+      throw new CliError(`invalid port: ${options.port}`, "INVALID_ARGUMENT", 2 /* InvalidArguments */);
+    }
+    const server = await startSearchApiServer({
+      workspacePath: workspace,
+      host: options.host,
+      port
+    });
+    const data = {
+      url: server.url,
+      mode: server.mode,
+      knowledgeBases: server.knowledgeBases
+    };
+    const human = [
+      `Listening on ${server.url}`,
+      ...server.knowledgeBases.map((knowledgeBase) => `${knowledgeBase.route} -> ${knowledgeBase.workspacePath}`)
+    ].join("\n");
+    emit(global.json, capture, response("serve", workspace, data), human);
+    const shutdown = async () => {
+      for (const signal of ["SIGINT", "SIGTERM"]) {
+        process.off(signal, stop);
+      }
+      await server.close();
+    };
+    const stop = () => {
+      void shutdown().then(() => resolveStop(), rejectStop);
+    };
+    let resolveStop;
+    let rejectStop;
+    const waitForStop = new Promise((resolve2, reject) => {
+      resolveStop = resolve2;
+      rejectStop = reject;
+    });
+    for (const signal of ["SIGINT", "SIGTERM"]) {
+      process.once(signal, stop);
+    }
+    await waitForStop;
   });
   program.command("related").description("Find documents similar to an existing document by id or URI.").argument("<document>", "Document id, uri, or canonical uri").option("--top-k <n>", "Maximum number of related documents to return.", "12").addHelpText("after", `
 Examples:
@@ -4303,7 +4862,7 @@ Examples:
     try {
       const meta = await readLatestIndexMetadata(workspace);
       latestIndex = meta.createdAt;
-      indexSize = (await stat4(await resolveLatestIndexArtifactPath(workspace))).size;
+      indexSize = (await stat5(await resolveLatestIndexArtifactPath(workspace))).size;
     } catch {
       latestIndex = void 0;
     }