npm - @nusoft/nuos-build-catalogue - Versions diffs - 0.19.1 → 0.20.1 - Mend

@nusoft/nuos-build-catalogue 0.19.1 → 0.20.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (5) hide show

package/dist/cli.js +10 -0
package/dist/commands/init.js +19 -0
package/dist/setup/auto-index.d.ts +59 -0
package/dist/setup/auto-index.js +138 -0
package/package.json +1 -1

package/dist/cli.js CHANGED Viewed

@@ -460,7 +460,17 @@ async function main() {
             // when the user switched machines and needs to pull the model
             // freshly. Same orchestrator that `init` calls internally.
             const { runLlmSetup } = await import('./setup/run-llm-setup.js');
+            const { ensureIndexBuilt } = await import('./setup/auto-index.js');
             const result = await runLlmSetup({ nonInteractive: false });
+            // After the LLM stack is ready, auto-build the search index when
+            // it isn't already present. Same helper init and install-protocols
+            // use — keeps the three commands aligned on "after this finishes
+            // the project is search-ready".
+            if (result.kind === 'already_ready' ||
+                result.kind === 'pulled_only' ||
+                result.kind === 'installed_and_pulled') {
+                await ensureIndexBuilt({});
+            }
             // Most failure paths emit guidance in-band; we exit non-zero only
             // when a pull actually failed (so CI scripting can branch on it).
             const exitCode = result.kind === 'pull_failed' || result.kind === 'install_failed' ? 1 : 0;

package/dist/commands/init.js CHANGED Viewed

@@ -211,6 +211,7 @@ export async function cmdInit(prompt, options = {}) {
     // `nuos-catalogue setup-llm` later.
     if (!options.noLlm) {
         const { runLlmSetup } = await import('../setup/run-llm-setup.js');
+        const { ensureIndexBuilt } = await import('../setup/auto-index.js');
         await runLlmSetup({
             // The setup module writes its own progress directly to stderr; we
             // don't route through `prompt.print` because the in-place progress
@@ -224,6 +225,17 @@ export async function cmdInit(prompt, options = {}) {
             // so this is safe in unattended runs too.
             nonInteractive: false,
         });
+        // Once LLM setup returns, auto-build the first search index. On a
+        // fresh project this is ~30s of starter-kit boilerplate; trivial,
+        // and finishing here means `search` works out of the box. The setup
+        // result is not checked here; if the LLM stack isn't ready,
+        // `ensureIndexBuilt` skips with a hint pointing back to setup-llm.
+        const indexResult = await ensureIndexBuilt({ cwd });
+        if (indexResult.kind === 'skipped_llm_not_ready') {
+            prompt.print('');
+            prompt.print(`  · Skipping first-index build: ${indexResult.reason}.`);
+            prompt.print(`  · ${indexResult.hint}`);
+        }
     }
     else {
         prompt.print('');
@@ -284,6 +296,13 @@ export async function cmdInstallProtocols(prompt, options = {}) {
     prompt.print('');
     prompt.print('Checking local semantic search (Ollama + qwen3-embedding:0.6b):');
     await reportLlmStatus((msg) => prompt.print(`  ${msg}`));
+    // Auto-build/refresh the search index when the LLM is ready. The
+    // indexer is incremental via per-file SHA hashes: a no-change project
+    // takes ~1s, a project with N changed files takes O(N) embed calls.
+    // When the LLM stack isn't ready the helper skips silently — the
+    // status was already reported above by reportLlmStatus.
+    const { ensureIndexBuilt } = await import('../setup/auto-index.js');
+    await ensureIndexBuilt({ cwd });
     return { output: '', exitCode: 0 };
 }
 /**

package/dist/setup/auto-index.d.ts ADDED Viewed

@@ -0,0 +1,59 @@
+/**
+ * Shared helper that runs the first search index build automatically
+ * from `init`, `install-protocols`, and `setup-llm`.
+ *
+ * Gated on the LLM stack being ready (Ollama + the configured embedding
+ * model). If the LLM isn't ready, this helper returns a
+ * `skipped_llm_not_ready` result with a hint string the caller prints.
+ * The hint references `setup-llm` so the user has a clear path forward.
+ *
+ * Indexing on a fresh project takes ~30s — small enough that auto-
+ * running on first install is friendlier than asking. Subsequent calls
+ * are incremental via the per-file SHA hashes, so re-running on an
+ * existing index is cheap.
+ *
+ * @module setup/auto-index
+ */
+/** Outcome of an auto-index attempt, discriminated by `kind`. */
+export type AutoIndexResult =
+/**
+ * The indexer ran. `indexed` is the sum of the newly indexed and the
+ * updated file counts from the indexer's report; `unchanged`, `chunks`
+ * and `durationMs` are passed through from that report as-is.
+ */
+{
+    kind: 'ran';
+    indexPath: string; // resolved index location that was opened as the store
+    indexed: number; // new + updated files
+    unchanged: number; // files the indexer reported as unchanged
+    chunks: number; // chunk count reported by the indexer
+    durationMs: number; // indexer-reported duration in milliseconds
+} | {
+    kind: 'skipped_llm_not_ready'; // Ollama unreachable, or the model is not present
+    reason: string; // which of the two probes failed
+    hint: string; // next-step text pointing at `nuos-catalogue setup-llm`
+} | {
+    kind: 'skipped_no_catalogue'; // path resolution threw; nothing was indexed
+} | {
+    kind: 'failed'; // the index run threw; the message was also written to `out`
+    error: string; // message of the thrown error (or its string form)
+};
+export interface AutoIndexOptions {
+    /** Project root used for path resolution. Defaults to `process.cwd()`. */
+    cwd?: string;
+    /** Receives progress and summary text. Defaults to writing to `process.stderr`. */
+    out?: (text: string) => void;
+    /** Force a full reindex; forwarded to the indexer as a boolean (omitted means `false`). */
+    force?: boolean;
+}
+/**
+ * Create or refresh the search index when the LLM stack is ready. The
+ * implementation has no "index already exists" short-circuit, so one
+ * call both *creates* the index and *refreshes* it later. Resolves to
+ * `skipped_no_catalogue` when path resolution throws, to
+ * `skipped_llm_not_ready` (with a hint naming `setup-llm`) when Ollama
+ * or the model is missing, and to `failed` when the index run throws.
+ *
+ * NOTE(review): "never throws" assumes the Ollama probes never reject.
+ */
+export declare function ensureIndexBuilt(opts?: AutoIndexOptions): Promise<AutoIndexResult>;

package/dist/setup/auto-index.js ADDED Viewed

@@ -0,0 +1,138 @@
+/**
+ * Shared helper that runs the first search index build automatically
+ * from `init`, `install-protocols`, and `setup-llm`.
+ *
+ * Gated on the LLM stack being ready (Ollama + the configured embedding
+ * model). If the LLM isn't ready, this helper returns a
+ * `skipped_llm_not_ready` result with a hint string the caller prints.
+ * The hint references `setup-llm` so the user has a clear path forward.
+ *
+ * Indexing on a fresh project takes ~30s — small enough that auto-
+ * running on first install is friendlier than asking. Subsequent calls
+ * are incremental via the per-file SHA hashes, so re-running on an
+ * existing index is cheap.
+ *
+ * @module setup/auto-index
+ */
+import { existsSync } from 'node:fs';
+import { resolveBuildRoot, resolveCatalogueRoot, resolveHashPath, resolveIndexPath, } from '../path-resolution.js';
+import { DEFAULT_OLLAMA_HOST, detectModelPresent, detectOllamaApi } from './ollama-detect.js';
+import { DEFAULT_EMBEDDING_MODEL } from './run-llm-setup.js';
+/**
+ * Run the indexer when conditions allow. Always runs (the indexer is
+ * incremental — unchanged files are SHA-skipped without embedding work),
+ * so this both *creates* the index on first call and *refreshes* it on
+ * subsequent calls. Returns `skipped_llm_not_ready` with a hint when
+ * the Ollama probe fails — the caller prints the hint and the user runs
+ * `setup-llm` to fix things.
+ *
+ * Never throws on user-facing failures.
+ */
+export async function ensureIndexBuilt(opts = {}) {
+    const cwd = opts.cwd ?? process.cwd();
+    const out = opts.out ?? ((text) => process.stderr.write(text));
+    // Resolve where the index file lives without forcing the LLM stack to
+    // load — path resolution is cheap and offline. When the project has
+    // no `docs/build/` yet (e.g. install-protocols invoked in a non-
+    // scaffolded directory), resolveBuildRoot throws — we treat that as a
+    // silent no-op, since there is nothing meaningful to index.
+    const ctx = { cwd, env: process.env };
+    let buildRoot;
+    let catalogueRoot;
+    let indexPath;
+    let hashPath;
+    try {
+        buildRoot = resolveBuildRoot(undefined, ctx);
+        catalogueRoot = resolveCatalogueRoot(undefined, ctx);
+        indexPath = resolveIndexPath(buildRoot, undefined, ctx);
+        hashPath = resolveHashPath(buildRoot, undefined, ctx);
+    }
+    catch {
+        return { kind: 'skipped_no_catalogue' };
+    }
+    // We do not short-circuit on `existsSync(indexPath)` — the indexer is
+    // already incremental via the per-file SHA hash store, so running it
+    // when the index is up-to-date is cheap (~1s on a 270-file catalogue
+    // with no changes). Short-circuiting here would leave newer files
+    // un-embedded until the user ran `nuos-catalogue index` manually,
+    // which is exactly the discoverability gap the auto-index is meant to
+    // close.
+    // Probe the LLM stack — index requires Ollama + the model. If either
+    // is missing, skip with a hint pointing at setup-llm.
+    const apiHost = process.env.NUOS_CATALOGUE_OLLAMA_HOST ?? DEFAULT_OLLAMA_HOST;
+    const modelId = process.env.NUOS_CATALOGUE_OLLAMA_MODEL ?? DEFAULT_EMBEDDING_MODEL;
+    const api = await detectOllamaApi(apiHost);
+    if (!api.reachable) {
+        return {
+            kind: 'skipped_llm_not_ready',
+            reason: `Ollama is not running at ${apiHost}`,
+            hint: 'Run `nuos-catalogue setup-llm` to set up local semantic search, then re-run `nuos-catalogue index`.',
+        };
+    }
+    const model = await detectModelPresent(apiHost, modelId);
+    if (!model.present) {
+        return {
+            kind: 'skipped_llm_not_ready',
+            reason: `${modelId} is not pulled`,
+            hint: 'Run `nuos-catalogue setup-llm` to pull the embedding model (~600 MB), then re-run `nuos-catalogue index`.',
+        };
+    }
+    // LLM is ready. Run the indexer. The first run on a fresh project is
+    // ~30s of starter-kit content; subsequent runs are fast — the
+    // per-file SHA hashes mean unchanged files are skipped without
+    // embedding.
+    const isFirstRun = !existsSync(indexPath);
+    if (isFirstRun) {
+        out('Building search index for docs/build/ … (first run may take ~30 seconds)\n');
+    }
+    else {
+        out('Refreshing search index (incremental — only changed files are re-embedded)…\n');
+    }
+    try {
+        const { selectEmbedderFromEnv } = await import('../embedder/select.js');
+        const { openStore } = await import('../store/open.js');
+        const { runIndex } = await import('../indexer/upsert.js');
+        const embedder = await selectEmbedderFromEnv();
+        const store = await openStore({ storagePath: indexPath, dimensions: embedder.dimensions });
+        try {
+            const report = await runIndex({
+                catalogueRoot,
+                hashFilePath: hashPath,
+                store,
+                embedder,
+                force: Boolean(opts.force),
+                dryRun: false,
+            });
+            const changed = report.indexed + report.updated;
+            const secs = (report.durationMs / 1000).toFixed(1);
+            if (isFirstRun) {
+                out(`✓ Indexed ${report.indexed} file(s), ${report.chunks} chunks embedded in ${secs}s\n`);
+            }
+            else if (changed === 0) {
+                out(`✓ Index up-to-date (${report.unchanged} files checked, none changed) in ${secs}s\n`);
+            }
+            else {
+                out(`✓ Re-indexed ${changed} changed file(s) (${report.unchanged} unchanged), ` +
+                    `${report.chunks} chunks embedded in ${secs}s\n`);
+            }
+            return {
+                kind: 'ran',
+                indexPath,
+                indexed: changed,
+                unchanged: report.unchanged,
+                chunks: report.chunks,
+                durationMs: report.durationMs,
+            };
+        }
+        finally {
+            // Unload-after-use commitment — embedder releases the model.
+            await embedder.dispose();
+        }
+    }
+    catch (err) {
+        const message = err instanceof Error ? err.message : String(err);
+        out(`\n✗ Index refresh failed: ${message}\n`);
+        out('Re-run `nuos-catalogue index` manually to retry.\n');
+        return { kind: 'failed', error: message };
+    }
+}

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@nusoft/nuos-build-catalogue",
-  "version": "0.19.1",
+  "version": "0.20.1",
   "description": "NuOS build-catalogue tooling: semantic search (WU 110) + migration runner that lifts markdown artefacts into JSON-backed workflow records (WU 111, Phase G).",
   "type": "module",
   "bin": {