npm - xindex - Versions diffs - 1.0.17 → 1.0.19 - Mend

xindex 1.0.17 → 1.0.19

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (62)

package/.mcp.json +0 -4
package/.xindex.json +2 -1
package/apps/indexApp.ts +1 -1
package/apps/mcpApp.ts +18 -4
package/apps/run.mcp.ts +12 -6
package/apps/run.search.ts +2 -2
package/apps/searchApp.ts +18 -6
package/apps/watchApp.ts +1 -1
package/components/buildComponents.ts +2 -0
package/components/config/loadConfig.ts +6 -0
package/components/config/xindexConfig.ts +2 -0
package/components/index/contentIndexDriver.ts +3 -2
package/components/keywords/cleanUpKeywords.ts +23 -3
package/components/locate/locateInFile.ts +61 -57
package/components/locate/windowsOf.ts +3 -1
package/features/searchIndex.ts +71 -9
package/package.json +2 -2
package/packages/fun/src/array-finder.ts +1 -1
package/packages/fun/src/array-index.ts +1 -1
package/packages/fun/src/asyncRequest.ts +1 -1
package/packages/fun/src/concurrency.ts +5 -5
package/packages/fun/src/counter.ts +1 -1
package/packages/fun/src/flatten.ts +12 -6
package/packages/fun/src/hash128.ts +2 -2
package/packages/fun/src/hash256.ts +2 -2
package/packages/fun/src/hub.ts +1 -1
package/packages/fun/src/interval.ts +1 -1
package/packages/fun/src/mailbox.ts +1 -1
package/packages/fun/src/match-left-and-right-arrays.ts +1 -1
package/packages/fun/src/memos.ts +1 -1
package/packages/fun/src/pubsub.ts +2 -2
package/packages/fun/src/tick.ts +1 -1
package/packages/fun/src/time-behavior.ts +1 -1
package/packages/fun/src/timedFallback.ts +1 -1
package/packages/fun/src/value.ts +1 -1
package/packages/fun/src/waitForCounter.ts +2 -2
package/packages/streamx/src/batch.ts +2 -2
package/packages/streamx/src/batchTimed.ts +5 -5
package/packages/streamx/src/buffer.ts +4 -4
package/packages/streamx/src/concatenate.ts +1 -1
package/packages/streamx/src/filter.ts +2 -2
package/packages/streamx/src/flat.ts +1 -1
package/packages/streamx/src/flatMap.ts +3 -3
package/packages/streamx/src/from.ts +1 -1
package/packages/streamx/src/interval.ts +3 -3
package/packages/streamx/src/loop.ts +2 -2
package/packages/streamx/src/map.ts +2 -2
package/packages/streamx/src/merge.ts +4 -4
package/packages/streamx/src/nodeReadable.ts +1 -1
package/packages/streamx/src/nodeTransform.ts +2 -2
package/packages/streamx/src/nodeWritable.ts +3 -3
package/packages/streamx/src/objectReader.ts +2 -2
package/packages/streamx/src/reader.ts +1 -1
package/packages/streamx/src/reduce.ts +2 -2
package/packages/streamx/src/scale.ts +7 -7
package/packages/streamx/src/scaleSync.ts +5 -5
package/packages/streamx/src/sequence.ts +1 -1
package/packages/streamx/src/tap.ts +3 -3
package/packages/streamx/src/toArray.ts +1 -1
package/packages/streamx/src/writer.ts +4 -4
package/tsconfig.json +1 -1
package/components/index/documentContentIndexDriver.ts +0 -127

package/.mcp.json CHANGED Viewed

@@ -1,9 +1,5 @@
 {
   "mcpServers": {
-    "fetch": {
-      "command": "docker",
-      "args": ["run", "-i", "--rm", "mcp/fetch"]
-    },
     "xindex": {
       "command": "xindex-mcp",
       "args": []

package/.xindex.json CHANGED Viewed

@@ -105,5 +105,6 @@
   ],
   "maxLines": 30,
   "maxFileBytes": 100000,
-  "followSymlinks": false
+  "followSymlinks": false,
+  "searchDefaultLimit": 7
 }

package/apps/indexApp.ts CHANGED Viewed

@@ -6,7 +6,7 @@ import {run} from "../packages/streamx/src/index.js";
 import {IWalkFiles} from "../components/walkFiles.js";
 import {IIndexContent} from "../features/indexContent.js";
 import {ILogger} from "../components/logger.js";
-import {INDEXING_BATCH_SIZE} from "../components/config/INDEXING_BATCH_SIZE";
+import {INDEXING_BATCH_SIZE} from "../components/config/INDEXING_BATCH_SIZE.js";
 import {SafeIndexBatch} from "../components/io/safeIndexBatch.js";
 export type IIndexApp = (inputs: string[]) => Promise<void>;

package/apps/mcpApp.ts CHANGED Viewed

@@ -50,14 +50,28 @@ export function McpApp({
             inputSchema: z.object({
                 query: z.string()
                     .describe("Natural language search query"),
-                limit: z.number().int().min(1).max(50).default(7)
-                    .describe("Max results to return, 7 by default, 50 max"),
+                limit: z.number().int().min(1).max(50).default(config.searchDefaultLimit)
+                    .describe(`Max results to return default ${config.searchDefaultLimit}, max 50)`),
+                windowLines: z.number().int().min(1).default(config.maxLines).optional()
+                    .describe("Optional line-window size for per-file snippet locating"),
+                includePaths: z.array(z.string()).optional()
+                    .describe("Optional gitignore-style include patterns (e.g. 'src/**', '**/*.ts', '!src/vendor/**')"),
+                excludePaths: z.array(z.string()).optional()
+                    .describe("Optional gitignore-style exclude patterns (e.g. 'node_modules/**', '**/*.test.ts')"),
+                scoreThreshold: z.number().min(0).max(1).optional()
+                    .describe("Optional minimum semantic score threshold (0..1)"),
             }),
             annotations: {readOnlyHint: true},
-        }, async ({query, limit}) => {
+        }, async ({query, limit, scoreThreshold, windowLines, includePaths, excludePaths}) => {
             try {
                 const format = FormatSearchResults();
-                const results = await search(query, limit);
+                const results = await search(query, {
+                    limit,
+                    scoreThreshold,
+                    windowLines,
+                    includePaths,
+                    excludePaths,
+                });
                 const text = await format(query, results);
                 return {content: [{type: "text" as const, text}]};
             } catch (e) {

package/apps/run.mcp.ts CHANGED Viewed

@@ -29,7 +29,7 @@ const indexApp = async (inputs: string[]) => {
     await rawIndexApp(inputs);
     await flush();
 };
-const search = SearchApp({searchContentIndex});
+const search = SearchApp({searchIndex: searchContentIndex, searchDefaultLimit: config.searchDefaultLimit});
 const appId = AppId();
 const watcherLock = WatcherLock({
@@ -45,16 +45,22 @@ const watch = watchDisabled ? undefined : {
     watcherLock,
 };
-process.on("SIGINT", async () => {
-    log(`shutting down — stopping heartbeat...`);
+let shuttingDown = false;
+const shutdown = async (reason: string) => {
+    if (shuttingDown) return;
+    shuttingDown = true;
+    log(`shutdown (${reason}) — stopping heartbeat...`);
     watcherLock.stopHeartbeat();
     log(`releasing lock...`);
     await watcherLock.release();
-    log(`waiting 7s for another watcher to take over...`);
-    await new Promise(r => setTimeout(r, 7000));
     log(`exiting`);
     process.exit(0);
-});
+};
+process.on("SIGINT",  () => shutdown("SIGINT"));
+process.on("SIGTERM", () => shutdown("SIGTERM"));
+process.on("SIGHUP",  () => shutdown("SIGHUP"));
+process.stdin.on("close", () => shutdown("stdin-close"));
+process.stdin.on("end",   () => shutdown("stdin-end"));
 log(`[${appId}] started`);
 const mcpApp = McpApp({search, indexApp, getIndexStats, resetIndex, log, watch, config});

package/apps/run.search.ts CHANGED Viewed

@@ -4,8 +4,8 @@ import {SearchApp} from "./searchApp.js";
 import {FormatSearchResults} from "../components/index/formatSearchResults.js";
 const log = BufferedLoggerToStdOut();
-const {searchContentIndex} = await BuildComponents({log});
-const search = SearchApp({searchContentIndex});
+const {searchContentIndex, config} = await BuildComponents({log});
+const search = SearchApp({searchIndex: searchContentIndex, searchDefaultLimit: config.searchDefaultLimit});
 const query = process.argv.slice(2).join(" ");
 if (!query) {

package/apps/searchApp.ts CHANGED Viewed

@@ -1,11 +1,23 @@
-import {ISearchIndex, IIndexRecord} from "../features/searchIndex.js";
+import {IIndexRecord, ISearchIndex, ISearchIndexOptions} from "../features/searchIndex.js";
-export type ISearchApp = (query: string, limit?: number) => Promise<IIndexRecord[]>;
+export type ISearchApp = (query: string, options?: Partial<ISearchIndexOptions>) => Promise<IIndexRecord[]>;
-export function SearchApp({searchContentIndex}: {
-    searchContentIndex: ISearchIndex;
+export function SearchApp({searchIndex, searchDefaultLimit = 7}: {
+    searchIndex: ISearchIndex;
+    searchDefaultLimit?: number;
 }): ISearchApp {
-    return async function search(query, limit = 7) {
-        return searchContentIndex(query, limit);
+    return async function search(query, options = {}) {
+        const normalizedOptions: ISearchIndexOptions = {
+            limit: options.limit ?? searchDefaultLimit,
+            prefetchMultiplier: options.prefetchMultiplier,
+            scoreThreshold: options.scoreThreshold,
+            locateInFiles: options.locateInFiles,
+            windowLines: options.windowLines,
+            useKeywordsSearch: options.useKeywordsSearch,
+            includePaths: options.includePaths ?? [],
+            excludePaths: options.excludePaths ?? [],
+        };
+        return searchIndex({query, options: normalizedOptions});
     }
 }

package/apps/watchApp.ts CHANGED Viewed

@@ -10,7 +10,7 @@ import {ILogger} from "../components/logger.js";
 import {IWatcherLock} from "../components/index/watcherLock.js";
 import {WatchFileEventsApp} from "./watchFileEventsApp.js";
 import {IIndexContent} from "../features/indexContent.js";
-import {INDEXING_BATCH_SIZE} from "../components/config/INDEXING_BATCH_SIZE";
+import {INDEXING_BATCH_SIZE} from "../components/config/INDEXING_BATCH_SIZE.js";
 import {SafeIndexBatch} from "../components/io/safeIndexBatch.js";
 export type IWatchApp = {

package/components/buildComponents.ts CHANGED Viewed

@@ -23,6 +23,7 @@ export async function BuildComponents({log, watchCoalesceMs = 0, indexingCoalesc
         extractKeywords,
         cleanUpKeywords,
         windowLines: config.maxLines,
+        embedConcurrency: config.searchConcurrency,
         maxFileBytes: config.maxFileBytes,
     });
@@ -38,6 +39,7 @@ export async function BuildComponents({log, watchCoalesceMs = 0, indexingCoalesc
         cleanUpKeywords,
         locateInFile,
         scoreThreshold: SCORE_THRESHOLD,
+        searchConcurrency: config.searchConcurrency,
         log,
         indexingWatchCoalesceMs: watchCoalesceMs,
         indexingCoalesceMs,

package/components/config/loadConfig.ts CHANGED Viewed

@@ -3,6 +3,8 @@ import {IXindexConfig} from "./xindexConfig.js";
 import {ILogger} from "../logger.js";
 const DEFAULT_MAX_LINES = 30;
+const DEFAULT_SEARCH_DEFAULT_LIMIT = 7;
+const DEFAULT_SEARCH_CONCURRENCY = 4;
 const DEFAULT_MAX_FILE_BYTES = 50_000;
 const DEFAULT_FOLLOW_SYMLINKS = false;
 const DEFAULT_IGNORE_FILES = ['.xindex', 'node_modules'];
@@ -11,6 +13,8 @@ const DEFAULTS: IXindexConfig = {
     ignoreKeywords: [],
     ignoreFiles: DEFAULT_IGNORE_FILES,
     maxLines: DEFAULT_MAX_LINES,
+    searchDefaultLimit: DEFAULT_SEARCH_DEFAULT_LIMIT,
+    searchConcurrency: DEFAULT_SEARCH_CONCURRENCY,
     maxFileBytes: DEFAULT_MAX_FILE_BYTES,
     followSymlinks: DEFAULT_FOLLOW_SYMLINKS,
 };
@@ -45,6 +49,8 @@ export function LoadConfig({configPath, log}: { configPath: string, log: ILogger
             ignoreKeywords: toStrings(parsed.ignoreKeywords),
             ignoreFiles: toStrings(parsed.ignoreFiles),
             maxLines: toNum(parsed.maxLines, DEFAULT_MAX_LINES),
+            searchDefaultLimit: Math.max(1, toNum(parsed.searchDefaultLimit, DEFAULT_SEARCH_DEFAULT_LIMIT)),
+            searchConcurrency: Math.max(1, toNum(parsed.searchConcurrency, DEFAULT_SEARCH_CONCURRENCY)),
             maxFileBytes: toNum(parsed.maxFileBytes, DEFAULT_MAX_FILE_BYTES),
             followSymlinks: typeof parsed.followSymlinks === "boolean" ? parsed.followSymlinks : DEFAULT_FOLLOW_SYMLINKS,
         };

package/components/config/xindexConfig.ts CHANGED Viewed

@@ -2,6 +2,8 @@ export type IXindexConfig = {
     ignoreKeywords: string[];
     ignoreFiles: string[];
     maxLines: number;
+    searchDefaultLimit: number;
+    searchConcurrency: number;
     maxFileBytes: number;
     followSymlinks: boolean;
 };

package/components/index/contentIndexDriver.ts CHANGED Viewed

@@ -23,7 +23,7 @@ export type IContentIndexDriver = Readonly<{
 }>;
 export async function ContentIndexDriver({
-    path, embed, extractKeywords, cleanUpKeywords, locateInFile, scoreThreshold, log,
+    path, embed, extractKeywords, cleanUpKeywords, locateInFile, scoreThreshold, searchConcurrency, log,
     indexingWatchCoalesceMs = 0, indexingCoalesceMs = 0,
 }: {
     path: string,
@@ -32,6 +32,7 @@ export async function ContentIndexDriver({
     cleanUpKeywords: ICleanUpKeywords,
     locateInFile: ILocateInFile,
     scoreThreshold: number,
+    searchConcurrency: number,
     log: ILogger,
     indexingWatchCoalesceMs?: number,
     indexingCoalesceMs?: number,
@@ -62,7 +63,7 @@ export async function ContentIndexDriver({
         indexContentWatch: IndexContent({extractKeywords, cleanUpKeywords, embed, indexApi: watchCoalesce, log}),
         indexContentBatch: IndexContent({extractKeywords, cleanUpKeywords, embed, indexApi: batchCoalesce, log}),
         removeContent: RemoveContent({indexApi: drainingApi}),
-        searchContentIndex: SearchIndex({extractKeywords, cleanUpKeywords, embed, index, locateInFile, scoreThreshold}),
+        searchContentIndex: SearchIndex({extractKeywords, cleanUpKeywords, embed, index, locateInFile, scoreThreshold, searchConcurrency}),
         resetIndex: ResetIndex({indexApi: drainingApi}),
         flush: flushAll,
     };

package/components/keywords/cleanUpKeywords.ts CHANGED Viewed

@@ -13,7 +13,16 @@ export function CleanUpKeywords({maxNgrams, minLength, ignoreKeywords = []}: {
     const ignoreSet = new Set(ignoreKeywords.map(normalize));
     return function cleanUpKeywords(keywords) {
-        const cleaned = keywords.join(" ").replace(/\W+/gm, " ").trim();
+        const joined = keywords.join(" ");
+        const expanded = joined + " " + splitIdentifiers(joined);
+        const tokens = expanded.replace(/[\W_]+/gm, " ").trim().split(/\s+/);
+        const seenTokens = new Set<string>();
+        const cleaned = tokens.filter(t => {
+            const k = t.toLowerCase();
+            if (!k || seenTokens.has(k)) return false;
+            seenTokens.add(k);
+            return true;
+        }).join(" ");
         const extracted: string[] = keyword_extractor.extract(cleaned, {
             language: "english",
@@ -25,14 +34,25 @@ export function CleanUpKeywords({maxNgrams, minLength, ignoreKeywords = []}: {
         const seen = new Set<string>();
-        return extracted
+        const output = extracted
             .map(normalize)
             .filter((kw: string) => {
-                if (kw.length <= minLength || !/[a-z]/i.test(kw)) return false;
+                // if (kw.length <= minLength || !/[a-z]/i.test(kw)) return false;
+                if (kw.length <= minLength) return false;
                 if (ignoreSet.has(kw)) return false;
                 if (seen.has(kw)) return false;
                 seen.add(kw);
                 return true;
             });
+        // console.log(`CleanUpKeywords: input=${JSON.stringify(keywords, null, 2)} output=${JSON.stringify(output, null, 2)}`);
+        return output;
     }
 }
+function splitIdentifiers(text: string): string {
+    return text
+        .replace(/[_\-.]+/g, " ")
+        .replace(/([a-z0-9])([A-Z])/g, "$1 $2")
+        .replace(/([A-Z]+)([A-Z][a-z])/g, "$1 $2");
+}

package/components/locate/locateInFile.ts CHANGED Viewed

@@ -6,20 +6,20 @@ import {IIndexRecord} from "../../features/searchIndex.js";
 import {IInMemoryIndex, InMemoryIndex} from "./inMemoryIndex.js";
 import {IWindow, windowsOf} from "./windowsOf.js";
 import {Bm25, IBm25Doc, tokenizeForBm25} from "./bm25.js";
+import {DEFAULT_LOCATE_BATCH_SIZE} from "../config/DEFAULT_LOCATE_BATCH_SIZE.js";
 import {from} from "../../packages/streamx/src/from.js";
 import {filter} from "../../packages/streamx/src/filter.js";
 import {map} from "../../packages/streamx/src/map.js";
 import {flatMap} from "../../packages/streamx/src/flatMap.js";
-import {tap} from "../../packages/streamx/src/tap.js";
-import {run} from "../../packages/streamx/src/index.js";
-import {DEFAULT_LOCATE_BATCH_SIZE} from "../config/DEFAULT_LOCATE_BATCH_SIZE";
-import {scaleSync} from "../../packages/streamx/src/scaleSync";
+import {scaleSync} from "../../packages/streamx/src/scaleSync.js";
+import {toArray} from "../../packages/streamx/src/toArray.js";
 export type ILocateInFile = (
     query: string,
     queryVector: number[],
     candidates: IIndexRecord[],
     limit: number,
+    windowLinesOverride?: number,
 ) => Promise<IIndexRecord[]>;
 export function LocateInFile({
@@ -41,67 +41,70 @@ export function LocateInFile({
     type IWindowWithKeywords = IWindow & { keywords: string };
     type IWindowWithVector = IWindowWithKeywords & { vector: number[] };
-    return async function locateInFile(query, queryVector, candidates, limit) {
+    return async function locateInFile(query, queryVector, candidates, limit, windowLinesOverride) {
+        const effectiveWindowLines = windowLinesOverride ?? windowLines;
+        const effectiveConcurrency = Math.max(1, embedConcurrency);
         const memIndex: IInMemoryIndex = InMemoryIndex({dimensions: queryVector.length});
         try {
-            const ids = candidates.map(c => c.id);
+            const ids: string[] = await toArray(
+                from<IIndexRecord>(candidates)
+                    .pipe(scaleSync<IIndexRecord, string | null>(effectiveConcurrency, async (c) => {
+                        try {
+                            const s = await stat(c.id);
+                            if (!s.isFile()) return null;
+                            if (s.size > maxFileBytes) return null;
+                            return c.id;
+                        } catch {
+                            return null;
+                        }
+                    }))
+                    .pipe(filter((id: string | null) => id !== null))
+                    .pipe(map<string | null, string>((id) => id as string)),
+            );
             const bm25Docs: IBm25Doc[] = [];
             const metaById = new Map<string, { fileId: string; startLine: number; endLine: number; snippet: string }>();
-            const SCALE_FILE_READS = embedConcurrency;
-            const windows = from<string>(ids)
-                .pipe(filter(async (id: string) => {
-                    try {
-                        const s = await stat(id);
-                        if (!s.isFile()) return false;
-                        if (s.size > maxFileBytes) return false;
-                        return true;
-                    } catch {
-                        return false;
-                    }
-                }))
-                .pipe(scaleSync(SCALE_FILE_READS, async (id: string): Promise<{ id: string, text: string } | null> => {
-                    try {
-                        const text = await readFile(id, "utf8");
-                        return {id, text};
-                    } catch {
-                        return null;
-                    }
-                }))
-                .pipe(filter(async (r: { id: string, text: string } | null) => r !== null))
-                .pipe(flatMap((r: { id: string, text: string } | null): IWindow[] => {
-                    return windowsOf({text: r!.text, id: r!.id, windowLines});
-                }));
+            const withVectors: IWindowWithVector[] = await toArray(
+                from<string>(ids)
+                    .pipe(scaleSync<string, {id: string, text: string} | null>(effectiveConcurrency, async (id) => {
+                        try {
+                            const text = await readFile(id, "utf8");
+                            return {id, text};
+                        } catch {
+                            return null;
+                        }
+                    }))
+                    .pipe(filter((r: {id: string, text: string} | null) => r !== null))
+                    .pipe(flatMap((r: {id: string, text: string} | null): IWindow[] =>
+                        windowsOf({text: r!.text, id: r!.id, windowLines: effectiveWindowLines})))
+                    .pipe(map<IWindow, IWindowWithKeywords>((w: IWindow) => {
+                        const kw = cleanUpKeywords(extractKeywords(w.snippet)).join(", ");
+                        return {...w, keywords: kw || w.snippet.slice(0, 200)};
+                    }))
+                    .pipe(scaleSync<IWindowWithKeywords, IWindowWithVector>(effectiveConcurrency, async (w) => {
+                        const vector = await embed(w.keywords);
+                        return {...w, vector};
+                    })),
+            );
-            const withVectors = from<IWindow>(windows)
-                .pipe(map<IWindow, IWindowWithKeywords>(w => {
-                    const kw = cleanUpKeywords(extractKeywords(w.snippet)).join(", ");
-                    return {...w, keywords: kw || w.snippet.slice(0, 200)};
-                }))
-                .pipe(scaleSync<IWindowWithKeywords, IWindowWithVector>(embedConcurrency, async (w) => {
-                    const vector = await embed(w.keywords);
-                    return {...w, vector};
-                }))
-                .pipe(tap(async (w: IWindowWithVector) => {
-                    const id = `${w.fileId}:${w.startLine}:${w.endLine}`;
-                    await memIndex.upsertItem(
-                        id,
-                        w.vector,
-                        {fileId: w.fileId, startLine: w.startLine, endLine: w.endLine, snippet: w.snippet},
-                    );
-                    bm25Docs.push({id, tokens: tokenizeForBm25(w.snippet)});
-                    metaById.set(id, {
-                        fileId: w.fileId,
-                        startLine: w.startLine,
-                        endLine: w.endLine,
-                        snippet: w.snippet
-                    });
-                }));
-            await run(withVectors);
+            for (const w of withVectors) {
+                const id = `${w.fileId}:${w.startLine}:${w.endLine}`;
+                await memIndex.upsertItem(
+                    id,
+                    w.vector,
+                    {fileId: w.fileId, startLine: w.startLine, endLine: w.endLine, snippet: w.snippet},
+                );
+                bm25Docs.push({id, tokens: tokenizeForBm25(w.snippet)});
+                metaById.set(id, {
+                    fileId: w.fileId,
+                    startLine: w.startLine,
+                    endLine: w.endLine,
+                    snippet: w.snippet,
+                });
+            }
-            const poolSize = Math.max(limit * 8, 40);
+            const poolSize = Math.min(limit * 10, 100);
             const vecHits = await memIndex.query(queryVector, query, poolSize);
             const bm25 = Bm25({docs: bm25Docs});
@@ -151,3 +154,4 @@ export function LocateInFile({
         }
     };
 }

package/components/locate/windowsOf.ts CHANGED Viewed

@@ -12,7 +12,9 @@ export function windowsOf({text, id, windowLines}: {
 }): IWindow[] {
     const lines = text.split("\n");
     const windows: IWindow[] = [];
-    const scales = [Math.max(1, Math.floor(windowLines / 2)), windowLines];
+    const a12 = Math.max(1, Math.floor(windowLines / 2));
+    // const a13 = Math.max(1, Math.floor(windowLines / 3));
+    const scales = [a12, windowLines];
     for (const size of scales) {
         const step = Math.max(1, Math.floor(size / 2));
         for (let i = 0; i < lines.length; i += step) {

package/features/searchIndex.ts CHANGED Viewed

@@ -1,8 +1,10 @@
 import {LocalIndex} from "vectra";
+import ignore from "ignore";
 import {IEmbed} from "../components/llm/embed.js";
 import {IExtractKeywords} from "../components/keywords/extractKeywords.js";
 import {ICleanUpKeywords} from "../components/keywords/cleanUpKeywords.js";
 import {ILocateInFile} from "../components/locate/locateInFile.js";
+import {Concurrency} from "../packages/fun/src/concurrency.js";
 export type IIndexRecord = {
     score: number;
@@ -15,25 +17,66 @@ export type IIndexRecord = {
     endLine?: number;
 };
-export type ISearchIndex = (query: string, limit: number) => Promise<IIndexRecord[]>;
+export type ISearchIndexOptions = {
+    limit: number;
+    prefetchMultiplier?: number;
+    scoreThreshold?: number;
+    locateInFiles?: boolean;
+    windowLines?: number;
+    useKeywordsSearch?: boolean;
+    includePaths?: string[];
+    excludePaths?: string[];
+};
+export type ISearchIndexQuery = Readonly<{
+    query: string;
+    options: ISearchIndexOptions;
+}>;
+export type ISearchIndex = (query: ISearchIndexQuery) => Promise<IIndexRecord[]>;
-export function SearchIndex({extractKeywords, cleanUpKeywords, embed, index, locateInFile, scoreThreshold = 0.05}: {
+export function SearchIndex({
+                                extractKeywords,
+                                cleanUpKeywords,
+                                embed,
+                                index,
+                                locateInFile,
+                                searchConcurrency = 3,
+                                scoreThreshold = 0.05
+                            }: {
     extractKeywords: IExtractKeywords,
     cleanUpKeywords: ICleanUpKeywords,
     embed: IEmbed,
     index: LocalIndex,
     locateInFile: ILocateInFile,
     scoreThreshold: number
+    searchConcurrency?: number
 }): ISearchIndex {
-    return async function searchContentIndex(query, limit) {
-        const keywords = cleanUpKeywords(extractKeywords(query));
-        const searchText = keywords.length > 0 ? keywords.join(", ") : query;
+    const worker: ISearchIndex = async function searchContentIndex({
+                                                                       query, options: {
+            limit,
+            prefetchMultiplier = 3,
+            scoreThreshold: threshold = scoreThreshold,
+            locateInFiles = true,
+            windowLines,
+            useKeywordsSearch = false,
+            includePaths = [],
+            excludePaths = [],
+        }
+                                                                   }: ISearchIndexQuery) {
+        const keywords = useKeywordsSearch ? cleanUpKeywords(extractKeywords(query)) : [];
+        const searchText = useKeywordsSearch && keywords.length > 0 ? keywords.join(", ") : query;
         const vector = await embed(searchText);
+        const includeMatcher = createGitignoreMatcher(includePaths);
+        const excludeMatcher = createGitignoreMatcher(excludePaths);
-        const results = await index.queryItems(vector, searchText, limit * 2);
+        const expectedMultiplier = limit * prefetchMultiplier;
+        const pathPatternBoost = Math.max(1, includePaths.length + excludePaths.length);
+        const results = await index.queryItems(vector, searchText, expectedMultiplier + pathPatternBoost);
         const candidates = results
-            .filter(r => r.score >= scoreThreshold)
+            .filter(r => r.score >= threshold)
+            .filter(r => includePaths.length === 0 || includeMatcher(r.item.id))
+            .filter(r => excludePaths.length === 0 || !excludeMatcher(r.item.id))
             .sort((a, b) => b.score - a.score)
             .map(r => ({
                 score: r.score,
@@ -41,10 +84,29 @@ export function SearchIndex({extractKeywords, cleanUpKeywords, embed, index, loc
                 keywords: typeof r.item.metadata?.keywords === "string" ? r.item.metadata.keywords : "",
             }));
-        if (!locateInFile || candidates.length === 0) {
+        if (!locateInFile || !locateInFiles || candidates.length === 0) {
             return candidates;
         }
-        return locateInFile(query, vector, candidates, limit);
+        return locateInFile(query, vector, candidates, limit, windowLines);
+    };
+    const control = Concurrency(searchConcurrency, worker);
+    return async (input) => {
+        const resolve = await control(input);
+        return await resolve();
+    };
+}
+function createGitignoreMatcher(patterns: string[]): (path: string) => boolean {
+    const ig = ignore();
+    for (const pattern of patterns) {
+        ig.add(pattern);
     }
+    return (path: string) => ig.ignores(normalizePath(path));
+}
+function normalizePath(path: string): string {
+    return path.replaceAll("\\", "/").replace(/^\.\/+/, "");
 }

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "xindex",
-  "version": "1.0.17",
+  "version": "1.0.19",
   "description": "Local semantic code search — index codebase, search by meaning or keywords",
   "type": "module",
   "main": "xindex.ts",
@@ -21,7 +21,7 @@
     "mcp": "tsx apps/run.mcp.ts",
     "watch": "tsx apps/run.watch.ts",
     "test.functional": "bash test/functional.sh",
-    "test.compilation": "npx -y tsc --ignoreConfig --noEmit --target ES2022 --module ESNext --moduleResolution bundler --esModuleInterop --skipLibCheck --strict false $(git ls-files '*.ts')",
+    "test.compilation": "tsc --ignoreConfig --noEmit --target ES2022 --module ESNext --moduleResolution bundler --esModuleInterop --skipLibCheck --strict false $(git ls-files '*.ts') && tsc -p tsconfig.json --noEmit",
     "test.npx": "docker run --rm -it -w /tmp node:22 bash -c 'npm i -g xindex && xindex-index tsx-0 && xindex-search streamx map | grep \"await mapper\" && which xindex | grep bin/xindex' ",
     "console": "docker run --rm -it -v \"$PWD:/app\" -w /app node:22 bash"
   },

package/packages/fun/src/array-finder.ts CHANGED Viewed

@@ -1,4 +1,4 @@
-import { sortObject } from './sort-object';
+import { sortObject } from './sort-object.js';
 export function ArrayFinder<Type, ID>(
   items: Type[] | ReadonlyArray<Type>,

package/packages/fun/src/array-index.ts CHANGED Viewed

@@ -1,4 +1,4 @@
-import { sortObject } from './sort-object';
+import { sortObject } from './sort-object.js';
 export function ArrayIndex<Type, ID>(
   items: Type[] | ReadonlyArray<Type>,

package/packages/fun/src/asyncRequest.ts CHANGED Viewed

@@ -1,4 +1,4 @@
-import { Defer, IDefer } from './defer';
+import { Defer, IDefer } from './defer.js';
 export type IAsyncRequest<Request = any, Response = void, Cancellation = void> = Omit<
   IDefer<Response>,

package/packages/fun/src/concurrency.ts CHANGED Viewed

@@ -1,7 +1,7 @@
-import { Counter, ICounter } from './counter';
-import { Defer, IDefer } from './defer';
-import { IValue, Value } from './value';
-import { waitForCounter, waitForZeroCounter } from './waitForCounter';
+import { Counter, ICounter } from './counter.js';
+import { Defer, IDefer } from './defer.js';
+import { IValue, Value } from './value.js';
+import { waitForCounter, waitForZeroCounter } from './waitForCounter.js';
 export type IStopKeepConcurrency = () => Promise<void>;
@@ -168,7 +168,7 @@ export function KeyedConcurrency<Input, Output = any>(
         const keyedControl = Concurrency<Input>(workerConcurrency, worker);
         registry[key] = keyedControl;
-        const unsubscribe = keyedControl.quantity.subscribe(value => {
+        const unsubscribe = keyedControl.quantity.subscribe((value: number) => {
           if (value <= 0) {
             unsubscribe();

package/packages/fun/src/counter.ts CHANGED Viewed

@@ -1,4 +1,4 @@
-import { IPubSubSubscribe, SyncPubSub } from './pubsub';
+import { IPubSubSubscribe, SyncPubSub } from './pubsub.js';
 export type ICounter = {
   increment: (n?: number) => number;