@phren/cli 0.0.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (185) hide show
  1. package/LICENSE +21 -0
  2. package/README.md +590 -0
  3. package/mcp/dist/capabilities/cli.js +61 -0
  4. package/mcp/dist/capabilities/index.js +15 -0
  5. package/mcp/dist/capabilities/mcp.js +61 -0
  6. package/mcp/dist/capabilities/types.js +57 -0
  7. package/mcp/dist/capabilities/vscode.js +61 -0
  8. package/mcp/dist/capabilities/web-ui.js +61 -0
  9. package/mcp/dist/cli-actions.js +302 -0
  10. package/mcp/dist/cli-config.js +580 -0
  11. package/mcp/dist/cli-extract.js +305 -0
  12. package/mcp/dist/cli-govern.js +371 -0
  13. package/mcp/dist/cli-graph.js +169 -0
  14. package/mcp/dist/cli-hooks-citations.js +44 -0
  15. package/mcp/dist/cli-hooks-context.js +56 -0
  16. package/mcp/dist/cli-hooks-globs.js +83 -0
  17. package/mcp/dist/cli-hooks-output.js +130 -0
  18. package/mcp/dist/cli-hooks-retrieval.js +2 -0
  19. package/mcp/dist/cli-hooks-session.js +1402 -0
  20. package/mcp/dist/cli-hooks.js +350 -0
  21. package/mcp/dist/cli-namespaces.js +989 -0
  22. package/mcp/dist/cli-ops.js +253 -0
  23. package/mcp/dist/cli-search.js +407 -0
  24. package/mcp/dist/cli.js +108 -0
  25. package/mcp/dist/content-archive.js +278 -0
  26. package/mcp/dist/content-citation.js +391 -0
  27. package/mcp/dist/content-dedup.js +622 -0
  28. package/mcp/dist/content-learning.js +472 -0
  29. package/mcp/dist/content-metadata.js +186 -0
  30. package/mcp/dist/content-validate.js +462 -0
  31. package/mcp/dist/core-finding.js +54 -0
  32. package/mcp/dist/core-project.js +36 -0
  33. package/mcp/dist/core-search.js +50 -0
  34. package/mcp/dist/data-access.js +400 -0
  35. package/mcp/dist/data-tasks.js +821 -0
  36. package/mcp/dist/embedding.js +344 -0
  37. package/mcp/dist/entrypoint.js +387 -0
  38. package/mcp/dist/finding-context.js +172 -0
  39. package/mcp/dist/finding-impact.js +181 -0
  40. package/mcp/dist/finding-journal.js +122 -0
  41. package/mcp/dist/finding-lifecycle.js +259 -0
  42. package/mcp/dist/governance-audit.js +22 -0
  43. package/mcp/dist/governance-locks.js +96 -0
  44. package/mcp/dist/governance-policy.js +648 -0
  45. package/mcp/dist/governance-scores.js +355 -0
  46. package/mcp/dist/hooks.js +449 -0
  47. package/mcp/dist/impact-scoring.js +22 -0
  48. package/mcp/dist/index-query.js +168 -0
  49. package/mcp/dist/index.js +205 -0
  50. package/mcp/dist/init-config.js +336 -0
  51. package/mcp/dist/init-preferences.js +62 -0
  52. package/mcp/dist/init-setup.js +1305 -0
  53. package/mcp/dist/init-shared.js +29 -0
  54. package/mcp/dist/init.js +1730 -0
  55. package/mcp/dist/link-checksums.js +62 -0
  56. package/mcp/dist/link-context.js +257 -0
  57. package/mcp/dist/link-doctor.js +591 -0
  58. package/mcp/dist/link-skills.js +212 -0
  59. package/mcp/dist/link.js +596 -0
  60. package/mcp/dist/logger.js +15 -0
  61. package/mcp/dist/machine-identity.js +38 -0
  62. package/mcp/dist/mcp-config.js +254 -0
  63. package/mcp/dist/mcp-data.js +315 -0
  64. package/mcp/dist/mcp-extract-facts.js +78 -0
  65. package/mcp/dist/mcp-extract.js +133 -0
  66. package/mcp/dist/mcp-finding.js +557 -0
  67. package/mcp/dist/mcp-graph.js +339 -0
  68. package/mcp/dist/mcp-hooks.js +256 -0
  69. package/mcp/dist/mcp-memory.js +58 -0
  70. package/mcp/dist/mcp-ops.js +328 -0
  71. package/mcp/dist/mcp-search.js +628 -0
  72. package/mcp/dist/mcp-session.js +651 -0
  73. package/mcp/dist/mcp-skills.js +189 -0
  74. package/mcp/dist/mcp-tasks.js +551 -0
  75. package/mcp/dist/mcp-types.js +7 -0
  76. package/mcp/dist/memory-ui-assets.js +6 -0
  77. package/mcp/dist/memory-ui-data.js +513 -0
  78. package/mcp/dist/memory-ui-graph.js +1910 -0
  79. package/mcp/dist/memory-ui-page.js +353 -0
  80. package/mcp/dist/memory-ui-scripts.js +1387 -0
  81. package/mcp/dist/memory-ui-server.js +1218 -0
  82. package/mcp/dist/memory-ui-styles.js +555 -0
  83. package/mcp/dist/memory-ui.js +9 -0
  84. package/mcp/dist/package-metadata.js +13 -0
  85. package/mcp/dist/phren-art.js +52 -0
  86. package/mcp/dist/phren-core.js +108 -0
  87. package/mcp/dist/phren-dotenv.js +67 -0
  88. package/mcp/dist/phren-paths.js +476 -0
  89. package/mcp/dist/proactivity.js +172 -0
  90. package/mcp/dist/profile-store.js +228 -0
  91. package/mcp/dist/project-config.js +85 -0
  92. package/mcp/dist/project-locator.js +25 -0
  93. package/mcp/dist/project-topics.js +1134 -0
  94. package/mcp/dist/provider-adapters.js +176 -0
  95. package/mcp/dist/runtime-profile.js +18 -0
  96. package/mcp/dist/session-checkpoints.js +131 -0
  97. package/mcp/dist/session-utils.js +68 -0
  98. package/mcp/dist/shared-content.js +8 -0
  99. package/mcp/dist/shared-embedding-cache.js +143 -0
  100. package/mcp/dist/shared-fragment-graph.js +456 -0
  101. package/mcp/dist/shared-governance.js +4 -0
  102. package/mcp/dist/shared-index.js +1334 -0
  103. package/mcp/dist/shared-ollama.js +192 -0
  104. package/mcp/dist/shared-paths.js +1 -0
  105. package/mcp/dist/shared-retrieval.js +796 -0
  106. package/mcp/dist/shared-search-fallback.js +375 -0
  107. package/mcp/dist/shared-sqljs.js +42 -0
  108. package/mcp/dist/shared-stemmer.js +171 -0
  109. package/mcp/dist/shared-vector-index.js +199 -0
  110. package/mcp/dist/shared.js +114 -0
  111. package/mcp/dist/shell-entry.js +209 -0
  112. package/mcp/dist/shell-input.js +943 -0
  113. package/mcp/dist/shell-palette.js +119 -0
  114. package/mcp/dist/shell-render.js +252 -0
  115. package/mcp/dist/shell-state-store.js +81 -0
  116. package/mcp/dist/shell-types.js +13 -0
  117. package/mcp/dist/shell-view-list.js +14 -0
  118. package/mcp/dist/shell-view.js +707 -0
  119. package/mcp/dist/shell.js +352 -0
  120. package/mcp/dist/skill-files.js +117 -0
  121. package/mcp/dist/skill-registry.js +279 -0
  122. package/mcp/dist/skill-state.js +28 -0
  123. package/mcp/dist/startup-embedding.js +57 -0
  124. package/mcp/dist/status.js +323 -0
  125. package/mcp/dist/synonyms.json +670 -0
  126. package/mcp/dist/task-hygiene.js +251 -0
  127. package/mcp/dist/task-lifecycle.js +347 -0
  128. package/mcp/dist/tasks-github.js +76 -0
  129. package/mcp/dist/telemetry.js +165 -0
  130. package/mcp/dist/test-global-setup.js +37 -0
  131. package/mcp/dist/tool-registry.js +104 -0
  132. package/mcp/dist/update.js +97 -0
  133. package/mcp/dist/utils.js +543 -0
  134. package/package.json +67 -0
  135. package/skills/README.md +7 -0
  136. package/skills/consolidate/SKILL.md +152 -0
  137. package/skills/discover/SKILL.md +175 -0
  138. package/skills/init/SKILL.md +216 -0
  139. package/skills/profiles/SKILL.md +121 -0
  140. package/skills/sync/SKILL.md +261 -0
  141. package/starter/README.md +74 -0
  142. package/starter/global/CLAUDE.md +89 -0
  143. package/starter/global/skills/humanize.md +30 -0
  144. package/starter/global/skills/pipeline.md +35 -0
  145. package/starter/global/skills/release.md +35 -0
  146. package/starter/machines.yaml +8 -0
  147. package/starter/my-api/.claude/skills/README.md +7 -0
  148. package/starter/my-api/CLAUDE.md +33 -0
  149. package/starter/my-api/FINDINGS.md +9 -0
  150. package/starter/my-api/summary.md +7 -0
  151. package/starter/my-api/tasks.md +7 -0
  152. package/starter/my-first-project/.claude/skills/README.md +7 -0
  153. package/starter/my-first-project/CLAUDE.md +49 -0
  154. package/starter/my-first-project/FINDINGS.md +24 -0
  155. package/starter/my-first-project/summary.md +11 -0
  156. package/starter/my-first-project/tasks.md +25 -0
  157. package/starter/my-frontend/.claude/skills/README.md +7 -0
  158. package/starter/my-frontend/CLAUDE.md +33 -0
  159. package/starter/my-frontend/FINDINGS.md +9 -0
  160. package/starter/my-frontend/summary.md +7 -0
  161. package/starter/my-frontend/tasks.md +7 -0
  162. package/starter/profiles/default.yaml +4 -0
  163. package/starter/profiles/personal.yaml +4 -0
  164. package/starter/profiles/work.yaml +4 -0
  165. package/starter/templates/README.md +7 -0
  166. package/starter/templates/frontend/CLAUDE.md +23 -0
  167. package/starter/templates/frontend/FINDINGS.md +7 -0
  168. package/starter/templates/frontend/reference/README.md +4 -0
  169. package/starter/templates/frontend/summary.md +7 -0
  170. package/starter/templates/frontend/tasks.md +11 -0
  171. package/starter/templates/library/CLAUDE.md +22 -0
  172. package/starter/templates/library/FINDINGS.md +7 -0
  173. package/starter/templates/library/reference/README.md +4 -0
  174. package/starter/templates/library/summary.md +7 -0
  175. package/starter/templates/library/tasks.md +11 -0
  176. package/starter/templates/monorepo/CLAUDE.md +21 -0
  177. package/starter/templates/monorepo/FINDINGS.md +7 -0
  178. package/starter/templates/monorepo/reference/README.md +4 -0
  179. package/starter/templates/monorepo/summary.md +7 -0
  180. package/starter/templates/monorepo/tasks.md +11 -0
  181. package/starter/templates/python-project/CLAUDE.md +21 -0
  182. package/starter/templates/python-project/FINDINGS.md +7 -0
  183. package/starter/templates/python-project/reference/README.md +4 -0
  184. package/starter/templates/python-project/summary.md +7 -0
  185. package/starter/templates/python-project/tasks.md +10 -0
@@ -0,0 +1,375 @@
1
+ import { createHash } from "crypto";
2
+ import { debugLog } from "./shared.js";
3
+ import { STOP_WORDS } from "./utils.js";
4
+ import { porterStem } from "./shared-stemmer.js";
5
+ import { classifyFile, normalizeIndexedContent, rowToDocWithRowid } from "./shared-index.js";
6
+ import { embedText, cosineSimilarity, getEmbeddingModel, getOllamaUrl, getCloudEmbeddingUrl } from "./shared-ollama.js";
7
+ import { getEmbeddingCache } from "./shared-embedding-cache.js";
8
+ import { getPersistentVectorIndex } from "./shared-vector-index.js";
9
+ import * as fs from "fs";
10
+ import * as path from "path";
11
// Environment variable name for the hybrid-search feature flag
// (default ON; values "0"/"false"/"off"/"no" disable it — see cosineFallback).
const HYBRID_SEARCH_FLAG = "PHREN_FEATURE_HYBRID_SEARCH";
// Minimum TF-IDF cosine score for a document to be included in fallback results.
const COSINE_SIMILARITY_MIN = 0.15;
// Cosine fallback is skipped entirely when the corpus exceeds this many docs.
const COSINE_MAX_CORPUS = 10000;
const COSINE_CANDIDATE_CAP = 500; // max docs loaded into memory for cosine scoring
// Number of deterministic rowid windows used to top up candidates when the FTS pre-filter falls short.
const COSINE_WINDOW_COUNT = 4;
16
/** Split a path on forward/back slashes, dropping empty segments. */
function splitPathSegments(filePath) {
    const segments = [];
    for (const part of filePath.split(/[\\/]+/)) {
        if (part)
            segments.push(part);
    }
    return segments;
}
19
/**
 * Derive the project name, bare filename, and project-relative file path for a
 * doc stored under the phren root. Tries a normalized string-prefix match
 * first, falls back to path.relative for mismatched separators, and keeps the
 * raw fullPath when the file lives outside the phren root entirely.
 */
export function deriveVectorDocIdentity(phrenPath, fullPath) {
    const normRoot = phrenPath.replace(/[\\/]+/g, "/").replace(/\/+$/, "");
    const normFull = fullPath.replace(/[\\/]+/g, "/");
    let rel;
    if (normFull === normRoot) {
        rel = "";
    }
    else if (normFull.startsWith(`${normRoot}/`)) {
        rel = normFull.slice(normRoot.length + 1);
    }
    else {
        // Separator-agnostic fallback; an escaping ("../") or absolute result
        // means the doc is outside the root, so keep the original full path.
        const relative = path.relative(phrenPath, fullPath);
        const inside = !relative.startsWith("..") && !path.isAbsolute(relative);
        rel = inside ? relative : fullPath;
    }
    const relParts = splitPathSegments(rel);
    const [projectSegment = ""] = relParts;
    return {
        project: projectSegment,
        filename: splitPathSegments(fullPath).at(-1) ?? "",
        relFile: relParts.slice(1).join("/"),
    };
}
42
// Module-level cache for TF-IDF document frequencies.
// Keyed by a fingerprint of the candidate doc IDs so that different candidate subsets and
// incremental index mutations produce distinct cache entries rather than reusing stale counts.
// Intentionally not locked: single-threaded JS event loop, cache is eventually consistent,
// worst case is a redundant recompute. No data loss is possible since this is a pure computation cache.
// Max 100 entries to bound memory (LRU-style: oldest key evicted on overflow).
const MAX_DF_CACHE_SIZE = 100;
// Map<fingerprint string, Map<term, doc-frequency count>> — populated/read by tfidfCosine().
const dfCache = new Map();
50
/** Invalidate the DF cache. Call after a full index rebuild. */
export function invalidateDfCache() {
    // The DF and token caches share the same lifecycle: drop them together.
    for (const cache of [dfCache, tokenCache])
        cache.clear();
}
55
// Module-level cache for tokenized document content.
// Keyed by a short content hash so the same document content is only tokenized once per server lifetime.
// Cleared on full rebuild (same lifecycle as dfCache). Max 2000 entries to bound memory.
// Intentionally not locked: single-threaded JS event loop, cache is eventually consistent,
// worst case is a redundant recompute. No data loss is possible since this is a pure computation cache.
const MAX_TOKEN_CACHE = 2000;
// Map<16-hex-char sha256 prefix, stemmed token array> — populated/read by cachedTokenize().
const tokenCache = new Map();
62
/**
 * Tokenize `text`, memoizing by a 16-hex-char SHA-256 prefix of the content so
 * identical document content is only tokenized once per process lifetime.
 */
function cachedTokenize(text) {
    const key = createHash("sha256").update(text).digest("hex").slice(0, 16);
    const cached = tokenCache.get(key);
    if (cached)
        return cached;
    const tokens = tokenize(text);
    // Bound the cache: evict the oldest (first-inserted) key on overflow.
    if (tokenCache.size >= MAX_TOKEN_CACHE) {
        const oldestKey = tokenCache.keys().next().value;
        tokenCache.delete(oldestKey ?? "");
    }
    tokenCache.set(key, tokens);
    return tokens;
}
75
/**
 * 32-bit FNV-1a hash of `text` (over UTF-16 code units), used as a stable,
 * query-dependent seed for deterministic candidate sampling.
 */
function deterministicSeed(text) {
    // FNV-1a: offset basis 0x811c9dc5, prime 16777619; xor then multiply per unit.
    let hash = 0x811c9dc5;
    for (let idx = 0; idx < text.length; idx += 1) {
        hash = Math.imul(hash ^ text.charCodeAt(idx), 16777619);
    }
    // Coerce to an unsigned 32-bit integer.
    return hash >>> 0;
}
83
/**
 * Load up to `limit` doc rows ordered by rowid. Without `wrapBefore`, reads
 * forward from `startRowid`; with `wrapBefore`, reads rows strictly below it
 * (the wrap-around half of a window scan).
 */
function loadCosineFallbackWindow(db, startRowid, limit, wrapBefore) {
    const where = wrapBefore === undefined ? "rowid >= ?" : "rowid < ?";
    const anchor = wrapBefore ?? startRowid;
    const result = db.exec(`SELECT rowid, project, filename, type, content, path FROM docs WHERE ${where} ORDER BY rowid LIMIT ?`, [anchor, limit]);
    return result?.[0]?.values ?? [];
}
89
/**
 * Tokenize text into non-stop-word tokens for TF-IDF computation, with stemming.
 */
function tokenize(text) {
    const stems = [];
    const words = text.toLowerCase().replace(/[^\w\s]/g, " ").split(/\s+/);
    for (const word of words) {
        if (word.length > 1 && !STOP_WORDS.has(word))
            stems.push(porterStem(word));
    }
    return stems;
}
100
/**
 * Compute TF-IDF cosine similarity scores for a query against a corpus of documents.
 * Returns an array of similarity scores in the same order as docs.
 * @param docs - Array of document content strings to score.
 * @param query - The search query text.
 * @param corpusN - Total number of documents in the full corpus (for IDF denominator).
 * Defaults to docs.length, which is correct when docs IS the full corpus.
 * Pass the real total when docs is a pre-filtered subset so IDF scores are not inflated.
 * @returns number[] — one score per doc; all zeros when the query has no usable tokens.
 */
function tfidfCosine(docs, query, corpusN) {
    const queryTokens = tokenize(query);
    if (queryTokens.length === 0)
        return docs.map(() => 0);
    // Collect all unique terms from query + all docs (use cached tokenization for repeated content)
    const allTokens = new Set(queryTokens);
    const docTokenLists = docs.map(d => {
        const tokens = cachedTokenize(d);
        for (const t of tokens)
            allTokens.add(t);
        return tokens;
    });
    // Build a Set per document for O(1) term lookups
    const docTokenSets = docTokenLists.map(tokens => new Set(tokens));
    const terms = [...allTokens];
    // Use the full corpus N for IDF so scores are comparable even when docs is a subset.
    const N = corpusN ?? docs.length;
    // Compute document frequency for each term, keyed by a fingerprint of the candidate doc set
    // so that different subsets and incremental index mutations get distinct cache entries.
    // The fingerprint is the first 4 tokens of each doc, joined, truncated to 128 chars —
    // a heuristic identity, so distinct candidate sets sharing a long prefix can collide.
    const candidateFingerprint = docTokenLists.map(tl => tl.slice(0, 4).join(",")).join("|").slice(0, 128);
    const cacheKey = `fp:${candidateFingerprint}`;
    const cachedDf = dfCache.get(cacheKey);
    const df = cachedDf ?? new Map();
    // Compute DF for any terms not yet in cache.
    // NOTE: on a cache hit this mutates the cached Map in place, adding counts for
    // query terms not seen before under this fingerprint (eventually consistent by design).
    for (const term of terms) {
        if (!df.has(term)) {
            let count = 0;
            for (const docSet of docTokenSets) {
                if (docSet.has(term))
                    count++;
            }
            df.set(term, count);
        }
    }
    if (!cachedDf) {
        // Insert the freshly built DF map, evicting the oldest key on overflow.
        if (dfCache.size >= MAX_DF_CACHE_SIZE)
            dfCache.delete(dfCache.keys().next().value ?? "");
        dfCache.set(cacheKey, df);
    }
    // Dense TF-IDF vector over `terms`; TF is length-normalized (|| 1 guards empty docs),
    // IDF uses the smoothed form log((N+1)/(df+1)) + 1 so unseen terms still get weight.
    function buildVector(tokens) {
        const tf = new Map();
        for (const t of tokens)
            tf.set(t, (tf.get(t) ?? 0) + 1);
        return terms.map(term => {
            const termTf = (tf.get(term) ?? 0) / (tokens.length || 1);
            const idf = Math.log((N + 1) / ((df.get(term) ?? 0) + 1)) + 1;
            return termTf * idf;
        });
    }
    // Standard cosine similarity; returns 0 (not NaN) when either vector is all-zero.
    function cosine(a, b) {
        let dot = 0, normA = 0, normB = 0;
        for (let i = 0; i < a.length; i++) {
            dot += a[i] * b[i];
            normA += a[i] * a[i];
            normB += b[i] * b[i];
        }
        const denom = Math.sqrt(normA) * Math.sqrt(normB);
        return denom === 0 ? 0 : dot / denom;
    }
    const queryVec = buildVector(queryTokens);
    return docTokenLists.map(docTokens => cosine(queryVec, buildVector(docTokens)));
}
169
/**
 * Cosine fallback search: when FTS5 returns fewer than COSINE_FALLBACK_THRESHOLD results,
 * load all docs and rank by TF-IDF cosine similarity.
 * Only activated when PHREN_FEATURE_HYBRID_SEARCH=1 and corpus size <= COSINE_MAX_CORPUS.
 * Returns DocRow[] ranked by similarity (threshold > COSINE_SIMILARITY_MIN), excluding already-found rowids.
 * @param db - sql.js database handle for the docs index.
 * @param query - The search query text.
 * @param excludeRowids - Set of rowids already returned by FTS, skipped here.
 * @param limit - Maximum number of docs to return.
 */
export function cosineFallback(db, query, excludeRowids, limit) {
    // FIX: the debug guards previously read `(process.env.PHREN_DEBUG || process.env.PHREN_DEBUG)`
    // — a duplicated operand. Consolidated into one helper with a single check.
    const debugErr = (stage, err) => {
        if (process.env.PHREN_DEBUG)
            process.stderr.write(`[phren] cosineFallback ${stage}: ${err instanceof Error ? err.message : String(err)}\n`);
    };
    // Feature flag guard — default ON; set PHREN_FEATURE_HYBRID_SEARCH=0 to disable
    const flagVal = process.env[HYBRID_SEARCH_FLAG];
    if (flagVal !== undefined && ["0", "false", "off", "no"].includes(flagVal.trim().toLowerCase())) {
        return [];
    }
    // Corpus stats: count for the size guard, min/max rowid for deterministic windowing.
    let totalDocs = 0;
    let minRowid = 0;
    let maxRowid = 0;
    try {
        const statsResult = db.exec("SELECT MIN(rowid), MAX(rowid), COUNT(*) FROM docs");
        if (statsResult?.length && statsResult[0]?.values?.length) {
            minRowid = Number(statsResult[0].values[0][0] ?? 0);
            maxRowid = Number(statsResult[0].values[0][1] ?? 0);
            totalDocs = Number(statsResult[0].values[0][2] ?? 0);
        }
    }
    catch (err) {
        debugErr("count", err);
        return [];
    }
    if (totalDocs > COSINE_MAX_CORPUS) {
        debugLog(`cosineFallback: corpus size ${totalDocs} exceeds ${COSINE_MAX_CORPUS}, skipping`);
        return [];
    }
    // Load docs with candidate capping to bound memory usage.
    // If corpus fits in cap, load all; otherwise use FTS5 keyword pre-filter to get relevant candidates.
    let allRows = null;
    try {
        if (totalDocs <= COSINE_CANDIDATE_CAP) {
            const results = db.exec("SELECT rowid, project, filename, type, content, path FROM docs");
            if (!Array.isArray(results) || !results.length || !results[0]?.values?.length)
                return [];
            allRows = results[0].values;
        }
        else {
            // Pre-filter: use FTS5 to get top candidates, then fill to cap with deterministic rowid windows.
            // Strip punctuation so the MATCH expression stays syntactically safe for FTS5.
            const safeQ = query.replace(/[^\w\s]/g, " ").trim().split(/\s+/).filter(w => w.length > 2).slice(0, 5).join(" OR ");
            const ftsRows = [];
            if (safeQ) {
                try {
                    const ftsRes = db.exec(`SELECT rowid, project, filename, type, content, path FROM docs WHERE docs MATCH ? ORDER BY rank LIMIT ${COSINE_CANDIDATE_CAP}`, [safeQ]);
                    if (ftsRes?.length && ftsRes[0]?.values?.length)
                        ftsRows.push(...ftsRes[0].values);
                }
                catch (err) {
                    debugErr("FTS pre-filter", err);
                }
            }
            // If FTS gave fewer than cap, supplement with deterministic rowid windows
            // seeded by the query so repeated searches sample the same rows.
            if (ftsRows.length < COSINE_CANDIDATE_CAP && totalDocs > 0 && maxRowid >= minRowid) {
                const ftsRowIds = new Set(ftsRows.map(r => Number(r[0])));
                const remaining = COSINE_CANDIDATE_CAP - ftsRows.length;
                const span = Math.max(1, maxRowid - minRowid + 1);
                const windowCount = Math.min(COSINE_WINDOW_COUNT, remaining);
                const perWindow = Math.max(1, Math.ceil(remaining / Math.max(1, windowCount)));
                const stride = Math.max(1, Math.floor(span / Math.max(1, windowCount)));
                const seed = deterministicSeed(query);
                // Append rows not already collected, stopping at the cap.
                const pushRows = (rows) => {
                    for (const row of rows) {
                        const rowid = Number(row[0]);
                        if (ftsRowIds.has(rowid))
                            continue;
                        ftsRowIds.add(rowid);
                        ftsRows.push(row);
                        if (ftsRows.length >= COSINE_CANDIDATE_CAP)
                            break;
                    }
                };
                try {
                    for (let i = 0; i < windowCount && ftsRows.length < COSINE_CANDIDATE_CAP; i++) {
                        const offset = (seed + i * stride) % span;
                        const startRowid = minRowid + offset;
                        // Forward read from the window start, then wrap below it if still short.
                        pushRows(loadCosineFallbackWindow(db, startRowid, perWindow));
                        if (ftsRows.length >= COSINE_CANDIDATE_CAP)
                            break;
                        pushRows(loadCosineFallbackWindow(db, startRowid, perWindow, startRowid));
                    }
                    // Final top-up from the lowest rowids if the windows still fell short.
                    if (ftsRows.length < COSINE_CANDIDATE_CAP) {
                        pushRows(loadCosineFallbackWindow(db, minRowid, COSINE_CANDIDATE_CAP - ftsRows.length));
                    }
                }
                catch (err) {
                    debugErr("deterministicSample", err);
                }
            }
            if (ftsRows.length === 0)
                return [];
            allRows = ftsRows;
            debugLog(`cosineFallback: pre-filtered ${totalDocs} docs to ${allRows.length} candidates`);
        }
    }
    catch (err) {
        debugErr("loadDocs", err);
        return [];
    }
    // Separate rowids, DocRows, and content strings for scoring
    const docContents = [];
    const docMeta = [];
    for (const row of allRows ?? []) {
        const { rowid, doc } = rowToDocWithRowid(row);
        if (excludeRowids.has(rowid))
            continue;
        docContents.push(doc.content);
        docMeta.push(doc);
    }
    if (docContents.length === 0)
        return [];
    // Pass totalDocs so IDF denominators reflect the full corpus, not just the candidate subset.
    const scores = tfidfCosine(docContents, query, totalDocs);
    // Collect scored results above threshold
    const scored = [];
    for (let i = 0; i < scores.length; i++) {
        if (scores[i] > COSINE_SIMILARITY_MIN) {
            scored.push({ score: scores[i], doc: docMeta[i] });
        }
    }
    // Sort descending by score and return top-limit
    scored.sort((a, b) => b.score - a.score);
    return scored.slice(0, limit).map(s => s.doc);
}
301
/**
 * Vector-based semantic search fallback using pre-computed Ollama embeddings.
 * Only runs when Ollama is configured (PHREN_OLLAMA_URL is set or defaults).
 * Returns DocRow[] sorted by cosine similarity, above 0.5 threshold.
 * @param phrenPath - Root path of the phren data directory.
 * @param query - The search query text (embedded via embedText).
 * @param excludePaths - Set of file paths already returned elsewhere, skipped here.
 * @param limit - Maximum number of docs to return.
 * @param project - Optional active project name; when set, results are scoped
 *   to that project plus "global" docs to prevent cross-project memory injection.
 */
export async function vectorFallback(phrenPath, query, excludePaths, limit, project) {
    // FIX: the debug guards previously read `(process.env.PHREN_DEBUG || process.env.PHREN_DEBUG)`
    // — a duplicated operand. Consolidated into one helper with a single check.
    const debugErr = (stage, err) => {
        if (process.env.PHREN_DEBUG)
            process.stderr.write(`[phren] vectorFallback ${stage}: ${err instanceof Error ? err.message : String(err)}\n`);
    };
    // Run when either Ollama or a cloud embedding endpoint is available
    if (!getOllamaUrl() && !getCloudEmbeddingUrl())
        return [];
    const cache = getEmbeddingCache(phrenPath);
    // Ensure the cache is loaded from disk — in hook subprocesses the singleton
    // starts empty because load() is only called in the MCP server / CLI entry.
    if (cache.size() === 0) {
        try {
            await cache.load();
        }
        catch (err) {
            debugErr("cacheLoad", err);
        }
    }
    if (cache.size() === 0)
        return [];
    const queryVec = await embedText(query);
    if (!queryVec || queryVec.length === 0)
        return [];
    const model = getEmbeddingModel();
    // Apply project scoping: when a project is detected, restrict vector results to that
    // project and the global project to prevent cross-project memory injection.
    const entries = cache.getAllEntries().filter(e => {
        if (e.model !== model)
            return false;
        if (excludePaths.has(e.path))
            return false;
        if (project) {
            // Allow global docs and docs from the active project
            const entryProject = deriveVectorDocIdentity(phrenPath, e.path).project;
            if (entryProject !== project && entryProject !== "global")
                return false;
        }
        return true;
    });
    if (entries.length === 0)
        return [];
    // Narrow candidates via the persistent vector index when it returns anything;
    // otherwise fall back to scoring every eligible entry.
    const eligiblePaths = new Set(entries.map((entry) => entry.path));
    const vectorIndex = getPersistentVectorIndex(phrenPath);
    vectorIndex.ensure(cache.getAllEntries());
    const indexedPaths = vectorIndex.query(model, queryVec, limit, eligiblePaths);
    const candidatePaths = indexedPaths.length > 0 ? new Set(indexedPaths) : eligiblePaths;
    const scored = entries
        .filter((entry) => candidatePaths.has(entry.path))
        .map(e => ({ path: e.path, score: cosineSimilarity(queryVec, e.vec) }))
        .filter(e => e.score > 0.50)
        .sort((a, b) => b.score - a.score)
        .slice(0, limit);
    return scored.map(e => {
        const { project: entryProject, filename, relFile } = deriveVectorDocIdentity(phrenPath, e.path);
        // Use the same path-aware classifyFile logic as the indexer so reference/skills/etc.
        // get their correct type instead of always falling back to "other".
        const type = classifyFile(filename, relFile);
        // Hydrate and normalize content from disk with the same pipeline as the indexer.
        let content = "";
        try {
            if (e.path && fs.existsSync(e.path)) {
                const raw = fs.readFileSync(e.path, "utf-8");
                content = normalizeIndexedContent(raw, type, phrenPath, 10000);
            }
        }
        catch (err) {
            debugErr("fileRead", err);
        }
        return { project: entryProject, filename, type, content, path: e.path };
    });
}
@@ -0,0 +1,42 @@
1
+ import * as fs from "fs";
2
+ import * as path from "path";
3
+ import { fileURLToPath } from "url";
4
+ import { createRequire } from "module";
5
+ const require = createRequire(import.meta.url);
6
+ /**
7
+ * Locate the sql.js-fts5 WASM binary by require.resolve with path-probe fallback.
8
+ * Shared between shared-index.ts and embedding.ts to avoid duplication.
9
+ */
10
+ function findWasmBinary() {
11
+ try {
12
+ const resolved = require.resolve("sql.js-fts5/dist/sql-wasm.wasm");
13
+ if (fs.existsSync(resolved))
14
+ return fs.readFileSync(resolved);
15
+ }
16
+ catch (err) {
17
+ if ((process.env.PHREN_DEBUG || process.env.PHREN_DEBUG))
18
+ process.stderr.write(`[phren] findWasmBinary requireResolve: ${err instanceof Error ? err.message : String(err)}\n`);
19
+ // fall through to path probing
20
+ }
21
+ const __filename = fileURLToPath(import.meta.url);
22
+ let dir = path.dirname(__filename);
23
+ for (let i = 0; i < 5; i++) {
24
+ const candidateA = path.join(dir, "node_modules", "sql.js-fts5", "dist", "sql-wasm.wasm");
25
+ if (fs.existsSync(candidateA))
26
+ return fs.readFileSync(candidateA);
27
+ const candidateB = path.join(dir, "sql.js-fts5", "dist", "sql-wasm.wasm");
28
+ if (fs.existsSync(candidateB))
29
+ return fs.readFileSync(candidateB);
30
+ dir = path.dirname(dir);
31
+ }
32
+ return undefined;
33
+ }
34
// sql.js-fts5 ships as CommonJS; load its init function via the createRequire shim.
const _initSqlJs = require("sql.js-fts5");
/**
 * Bootstrap sql.js-fts5: find the WASM binary and initialise the library.
 * Shared across shared-index.ts and embedding.ts to avoid duplication.
 */
export async function bootstrapSqlJs() {
    const wasmBinary = findWasmBinary();
    // When the binary can't be located, let sql.js fall back to its own loading strategy.
    const config = wasmBinary ? { wasmBinary } : {};
    return _initSqlJs(config);
}
+ }
@@ -0,0 +1,171 @@
1
/**
 * Porter stemmer implementation for English words.
 * Based on the Porter (1980) algorithm.
 * Reduces an English word to its stem (e.g. "relational" -> "relat").
 * Assumes lowercase input; words of length <= 2 are returned unchanged.
 * NOTE(review): minor deviations from the canonical paper — step 1a's plural
 * rule and step 1c carry extra length guards; confirm against the reference
 * implementation if exact Porter compatibility matters.
 */
export function porterStem(word) {
    if (word.length <= 2)
        return word;
    // Porter consonant test: a/e/i/o/u are vowels; 'y' is a consonant at the
    // start of the word or after a vowel, a vowel after a consonant.
    function isConsonant(w, i) {
        const c = w[i];
        if (c === 'a' || c === 'e' || c === 'i' || c === 'o' || c === 'u')
            return false;
        if (c === 'y')
            return i === 0 ? true : !isConsonant(w, i - 1);
        return true;
    }
    // Porter's measure m: the number of VC (vowel-run then consonant-run)
    // sequences in the stem, per the [C](VC)^m[V] decomposition.
    function measure(stem) {
        if (stem.length === 0)
            return 0;
        let m = 0;
        let i = 0;
        // skip initial consonants
        while (i < stem.length && isConsonant(stem, i))
            i++;
        while (i < stem.length) {
            // count vowel sequence
            while (i < stem.length && !isConsonant(stem, i))
                i++;
            if (i >= stem.length)
                break;
            m++;
            // count consonant sequence
            while (i < stem.length && isConsonant(stem, i))
                i++;
        }
        return m;
    }
    // True when the stem contains at least one vowel (condition *v* in the paper).
    function hasVowel(stem) {
        for (let i = 0; i < stem.length; i++) {
            if (!isConsonant(stem, i))
                return true;
        }
        return false;
    }
    // True when the word ends in a double consonant (condition *d).
    function endsDoubleConsonant(w) {
        if (w.length < 2)
            return false;
        return w[w.length - 1] === w[w.length - 2] && isConsonant(w, w.length - 1);
    }
    // True when the word ends consonant-vowel-consonant where the final
    // consonant is not w, x, or y (condition *o).
    function endsCVC(w) {
        if (w.length < 3)
            return false;
        const l = w.length;
        if (!isConsonant(w, l - 1) || isConsonant(w, l - 2) || !isConsonant(w, l - 3))
            return false;
        const last = w[l - 1];
        return last !== 'w' && last !== 'x' && last !== 'y';
    }
    // Returns the stem with `suffix` removed, or null when w does not end in suffix.
    function endsWith(w, suffix) {
        if (w.length < suffix.length)
            return null;
        if (w.endsWith(suffix))
            return w.slice(0, -suffix.length);
        return null;
    }
    let w = word;
    // Step 1a: plurals — sses -> ss, ies -> i, trailing s dropped (but not ss).
    if (w.endsWith("sses")) {
        w = w.slice(0, -2);
    }
    else if (w.endsWith("ies")) {
        w = w.slice(0, -2);
    }
    else if (!w.endsWith("ss") && w.endsWith("s") && w.length > 2) {
        w = w.slice(0, -1);
    }
    // Step 1b: past tense / gerund — eed -> ee (if m>0), else strip ed/ing
    // when the remaining stem contains a vowel.
    let step1bExtra = false;
    if (w.endsWith("eed")) {
        const stem = w.slice(0, -3);
        if (measure(stem) > 0)
            w = w.slice(0, -1); // eed -> ee
    }
    else {
        let stemFound = null;
        if (w.endsWith("ed")) {
            stemFound = w.slice(0, -2);
        }
        else if (w.endsWith("ing")) {
            stemFound = w.slice(0, -3);
        }
        if (stemFound !== null && hasVowel(stemFound)) {
            w = stemFound;
            step1bExtra = true;
        }
    }
    // Step 1b repair: after stripping ed/ing, restore an 'e' (conflat/troubl/siz),
    // undouble a final consonant (hopp -> hop, but not ll/ss/zz), or add 'e'
    // to a short CVC stem (fil -> file).
    if (step1bExtra) {
        if (w.endsWith("at") || w.endsWith("bl") || w.endsWith("iz")) {
            w += "e";
        }
        else if (endsDoubleConsonant(w) && !w.endsWith("l") && !w.endsWith("s") && !w.endsWith("z")) {
            w = w.slice(0, -1);
        }
        else if (measure(w) === 1 && endsCVC(w)) {
            w += "e";
        }
    }
    // Step 1c: terminal y -> i when the rest of the word contains a vowel.
    if (w.endsWith("y") && w.length > 2 && hasVowel(w.slice(0, -1))) {
        w = w.slice(0, -1) + "i";
    }
    // Step 2: map double suffixes to single ones when the stem has m > 0.
    // Object key insertion order is preserved, so longer suffixes listed first
    // (e.g. "ational" before "ation") win — only the first match applies.
    const step2Map = {
        ational: "ate", tional: "tion", enci: "ence", anci: "ance",
        izer: "ize", abli: "able", alli: "al", entli: "ent", eli: "e",
        ousli: "ous", ization: "ize", ation: "ate", ator: "ate",
        alism: "al", iveness: "ive", fulness: "ful", ousness: "ous",
        aliti: "al", iviti: "ive", biliti: "ble",
    };
    for (const [suffix, replacement] of Object.entries(step2Map)) {
        const stem = endsWith(w, suffix);
        if (stem !== null && measure(stem) > 0) {
            w = stem + replacement;
            break;
        }
    }
    // Step 3: -icate/-ative/-ful/-ness etc. reduced when the stem has m > 0.
    const step3Map = {
        icate: "ic", ative: "", iciti: "ic",
        ical: "ic", ful: "", ness: "",
    };
    for (const [suffix, replacement] of Object.entries(step3Map)) {
        const stem = endsWith(w, suffix);
        if (stem !== null && measure(stem) > 0) {
            w = stem + replacement;
            break;
        }
    }
    // Step 4: strip remaining suffixes when m > 1; "ion" additionally requires
    // the stem to end in s or t (e.g. adoption -> adopt).
    const step4Suffixes = [
        "al", "ance", "ence", "er", "ic", "able", "ible", "ant",
        "ement", "ment", "ent", "ion", "ou", "ism", "ate", "iti",
        "ous", "ive", "ize",
    ];
    for (const suffix of step4Suffixes) {
        const stem = endsWith(w, suffix);
        if (stem !== null && measure(stem) > 1) {
            if (suffix === "ion") {
                if (stem.endsWith("s") || stem.endsWith("t")) {
                    w = stem;
                }
            }
            else {
                w = stem;
            }
            break;
        }
    }
    // Step 5a: drop a final 'e' when m > 1, or m == 1 and the stem is not CVC.
    if (w.endsWith("e")) {
        const stem = w.slice(0, -1);
        const m = measure(stem);
        if (m > 1 || (m === 1 && !endsCVC(stem))) {
            w = stem;
        }
    }
    // Step 5b: undouble a final 'll' when m > 1 (controll -> control).
    if (measure(w) > 1 && endsDoubleConsonant(w) && w.endsWith("l")) {
        w = w.slice(0, -1);
    }
    return w;
}
+ }