npm - notoken-core - Versions diffs - 1.5.1 → 2.0.0 - Mend

notoken-core 1.5.1 → 2.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (99)

package/config/chat-responses.json +767 -0
package/config/concept-clusters.json +31 -0
package/config/entities.json +93 -0
package/config/image-prompts.json +20 -0
package/config/intent-vectors.json +1 -0
package/config/intents.json +5023 -65
package/config/ollama-models.json +193 -0
package/config/rules.json +32 -1
package/dist/automation/discordPatchright.d.ts +35 -0
package/dist/automation/discordPatchright.js +424 -0
package/dist/automation/discordSetup.d.ts +31 -0
package/dist/automation/discordSetup.js +338 -0
package/dist/conversation/coreference.js +44 -4
package/dist/conversation/pendingActions.d.ts +55 -0
package/dist/conversation/pendingActions.js +127 -0
package/dist/conversation/store.d.ts +72 -0
package/dist/conversation/store.js +140 -1
package/dist/conversation/topicTracker.d.ts +36 -0
package/dist/conversation/topicTracker.js +141 -0
package/dist/execution/ssh.d.ts +42 -1
package/dist/execution/ssh.js +532 -3
package/dist/handlers/executor.js +3981 -16
package/dist/index.d.ts +25 -3
package/dist/index.js +36 -2
package/dist/nlp/batchParser.d.ts +30 -0
package/dist/nlp/batchParser.js +77 -0
package/dist/nlp/conceptExpansion.d.ts +54 -0
package/dist/nlp/conceptExpansion.js +136 -0
package/dist/nlp/conceptRouter.d.ts +49 -0
package/dist/nlp/conceptRouter.js +302 -0
package/dist/nlp/confidenceCalibrator.d.ts +62 -0
package/dist/nlp/confidenceCalibrator.js +116 -0
package/dist/nlp/correctionLearner.d.ts +45 -0
package/dist/nlp/correctionLearner.js +207 -0
package/dist/nlp/entitySpellCorrect.d.ts +35 -0
package/dist/nlp/entitySpellCorrect.js +141 -0
package/dist/nlp/knowledgeGraph.d.ts +70 -0
package/dist/nlp/knowledgeGraph.js +380 -0
package/dist/nlp/llmFallback.js +28 -1
package/dist/nlp/multiClassifier.js +91 -6
package/dist/nlp/multiIntent.d.ts +43 -0
package/dist/nlp/multiIntent.js +154 -0
package/dist/nlp/parseIntent.d.ts +6 -1
package/dist/nlp/parseIntent.js +180 -5
package/dist/nlp/ruleParser.js +315 -0
package/dist/nlp/semanticSimilarity.d.ts +30 -0
package/dist/nlp/semanticSimilarity.js +174 -0
package/dist/nlp/vocabularyBuilder.d.ts +43 -0
package/dist/nlp/vocabularyBuilder.js +224 -0
package/dist/nlp/wikidata.d.ts +49 -0
package/dist/nlp/wikidata.js +228 -0
package/dist/policy/confirm.d.ts +10 -0
package/dist/policy/confirm.js +39 -0
package/dist/policy/safety.js +6 -4
package/dist/utils/aliases.d.ts +5 -0
package/dist/utils/aliases.js +39 -0
package/dist/utils/analysis.js +71 -15
package/dist/utils/browser.d.ts +64 -0
package/dist/utils/browser.js +364 -0
package/dist/utils/commandHistory.d.ts +20 -0
package/dist/utils/commandHistory.js +108 -0
package/dist/utils/completer.d.ts +17 -0
package/dist/utils/completer.js +79 -0
package/dist/utils/config.js +32 -2
package/dist/utils/dbQuery.d.ts +25 -0
package/dist/utils/dbQuery.js +248 -0
package/dist/utils/discordDiag.d.ts +35 -0
package/dist/utils/discordDiag.js +826 -0
package/dist/utils/diskCleanup.d.ts +36 -0
package/dist/utils/diskCleanup.js +775 -0
package/dist/utils/entityResolver.d.ts +107 -0
package/dist/utils/entityResolver.js +468 -0
package/dist/utils/imageGen.d.ts +92 -0
package/dist/utils/imageGen.js +2031 -0
package/dist/utils/installTracker.d.ts +57 -0
package/dist/utils/installTracker.js +160 -0
package/dist/utils/multiExec.d.ts +21 -0
package/dist/utils/multiExec.js +141 -0
package/dist/utils/openclawDiag.d.ts +29 -0
package/dist/utils/openclawDiag.js +1035 -0
package/dist/utils/output.js +4 -0
package/dist/utils/platform.js +2 -1
package/dist/utils/progressReporter.d.ts +50 -0
package/dist/utils/progressReporter.js +58 -0
package/dist/utils/projectDetect.d.ts +44 -0
package/dist/utils/projectDetect.js +319 -0
package/dist/utils/projectScanner.d.ts +44 -0
package/dist/utils/projectScanner.js +312 -0
package/dist/utils/shellCompat.d.ts +78 -0
package/dist/utils/shellCompat.js +186 -0
package/dist/utils/smartArchive.d.ts +16 -0
package/dist/utils/smartArchive.js +172 -0
package/dist/utils/smartRetry.d.ts +26 -0
package/dist/utils/smartRetry.js +114 -0
package/dist/utils/updater.d.ts +1 -0
package/dist/utils/updater.js +1 -1
package/dist/utils/version.d.ts +20 -0
package/dist/utils/version.js +212 -0
package/package.json +6 -3

package/dist/nlp/knowledgeGraph.js ADDED Viewed

@@ -0,0 +1,380 @@
+/**
+ * Knowledge Graph — persistent entity-relationship store.
+ * Persists to ~/.notoken/knowledge-graph.json.
+ * Auto-populates from entities.json, rules.json, and running system state.
+ */
+import { execSync } from "node:child_process";
+import { existsSync, mkdirSync, readFileSync, writeFileSync } from "node:fs";
+import { homedir } from "node:os";
+import { join } from "node:path";
+import { fileURLToPath } from "node:url";
+import { loadEntities } from "../utils/entityResolver.js";
+// ─── Persistence ────────────────────────────────────────────────────────────
+const GRAPH_DIR = join(homedir(), ".notoken");
+const GRAPH_PATH = join(GRAPH_DIR, "knowledge-graph.json");
+let _graph = null;
+export function loadKnowledgeGraph() {
+    if (_graph)
+        return _graph;
+    if (existsSync(GRAPH_PATH)) {
+        try {
+            _graph = JSON.parse(readFileSync(GRAPH_PATH, "utf-8"));
+            return _graph;
+        }
+        catch { /* rebuild */ }
+    }
+    _graph = buildGraph();
+    saveKnowledgeGraph(_graph);
+    return _graph;
+}
+export function saveKnowledgeGraph(graph) {
+    const g = graph ?? _graph;
+    if (!g)
+        return;
+    if (!existsSync(GRAPH_DIR))
+        mkdirSync(GRAPH_DIR, { recursive: true });
+    writeFileSync(GRAPH_PATH, JSON.stringify(g, null, 2) + "\n");
+    _graph = g;
+}
+// ─── Mutation ───────────────────────────────────────────────────────────────
+export function addEntity(name, type, aliases = [], properties = {}) {
+    const g = loadKnowledgeGraph();
+    const entity = { name, type, aliases, properties };
+    g.entities[name] = entity;
+    return entity;
+}
+export function addRelation(from, to, relation, properties) {
+    const g = loadKnowledgeGraph();
+    const rel = { from, to, relation, properties };
+    if (!g.relations.some((r) => r.from === from && r.to === to && r.relation === relation))
+        g.relations.push(rel);
+    return rel;
+}
+// ─── Queries ────────────────────────────────────────────────────────────────
+/** Find an entity by exact name, alias, or prefix (min 3 chars). */
+export function getEntity(name) {
+    const g = loadKnowledgeGraph();
+    const lower = name.toLowerCase();
+    if (g.entities[name])
+        return g.entities[name];
+    for (const [key, ent] of Object.entries(g.entities)) {
+        if (key.toLowerCase() === lower)
+            return ent;
+    }
+    for (const ent of Object.values(g.entities)) {
+        if (ent.aliases.some((a) => a.toLowerCase() === lower))
+            return ent;
+    }
+    if (lower.length >= 3) {
+        for (const ent of Object.values(g.entities)) {
+            if (ent.name.toLowerCase().startsWith(lower))
+                return ent;
+        }
+    }
+    return null;
+}
+/** Find all entities related to entityName, optionally filtered by relation type. */
+export function getRelated(entityName, relation) {
+    const g = loadKnowledgeGraph();
+    const results = [];
+    for (const rel of g.relations) {
+        if (relation && rel.relation !== relation)
+            continue;
+        if (rel.from === entityName && g.entities[rel.to])
+            results.push({ entity: g.entities[rel.to], relation: rel, direction: "outgoing" });
+        else if (rel.to === entityName && g.entities[rel.from])
+            results.push({ entity: g.entities[rel.from], relation: rel, direction: "incoming" });
+    }
+    return results;
+}
+/**
+ * Resolve "it", "the server", "that service" using graph context + recent entities.
+ * Returns the best candidate. Use resolveCandidates() for all scored options.
+ */
+export function resolveReference(text, recentEntities) {
+    const candidates = resolveCandidates(text, recentEntities);
+    return candidates.length > 0 ? candidates[0].entity : null;
+}
+/**
+ * Get all resolution candidates, scored and ranked.
+ * Scores: recent entity = 1.0 - (0.1 * position), type match = +0.2, relation match = +0.15
+ */
+export function resolveCandidates(text, recentEntities) {
+    const lower = text.toLowerCase().trim();
+    const g = loadKnowledgeGraph();
+    const candidates = [];
+    // Direct match — highest confidence
+    const direct = getEntity(lower);
+    if (direct)
+        return [{ entity: direct, score: 1.0, reason: "direct match" }];
+    // Determine what type we're looking for
+    let wantType = null;
+    const typed = lower.match(/^(?:the|that|this)\s+(server|service|database|container|port|package|llm|channel|path|user)$/);
+    if (typed)
+        wantType = typed[1];
+    // For "it"/"that"/"this" — prefer services and containers (actionable things)
+    const isAnaphoric = /^(it|that|this)$/.test(lower);
+    if (isAnaphoric)
+        wantType = null; // consider all types
+    // Score recent entities
+    for (let i = 0; i < recentEntities.length; i++) {
+        const ent = g.entities[recentEntities[i]];
+        if (!ent)
+            continue;
+        let score = 1.0 - (i * 0.15); // Recency: most recent = 1.0, then 0.85, 0.7, ...
+        let reason = `recent entity (#${i + 1})`;
+        // Type match bonus
+        if (wantType && ent.type === wantType) {
+            score += 0.2;
+            reason += `, type match (${wantType})`;
+        }
+        // For "it" — prefer services/containers over servers/ports
+        if (isAnaphoric) {
+            if (ent.type === "service" || ent.type === "container") {
+                score += 0.15;
+                reason += ", actionable type";
+            }
+            else if (ent.type === "server") {
+                score += 0.05;
+                reason += ", server";
+            }
+        }
+        // Relationship bonus — if this entity is related to other recent entities
+        for (const other of recentEntities.slice(0, 3)) {
+            if (other === recentEntities[i])
+                continue;
+            const rels = g.relations.filter(r => (r.from === ent.name && r.to === other) || (r.to === ent.name && r.from === other));
+            if (rels.length > 0) {
+                score += 0.1;
+                reason += `, related to ${other}`;
+                break;
+            }
+        }
+        candidates.push({ entity: ent, score: Math.min(score, 1.0), reason });
+    }
+    // If no recent entities matched and we want a type, search all entities of that type
+    if (candidates.length === 0 && wantType) {
+        for (const ent of Object.values(g.entities)) {
+            if (ent.type === wantType) {
+                candidates.push({ entity: ent, score: 0.3, reason: `type match (${wantType}), no recency` });
+            }
+        }
+    }
+    return candidates.sort((a, b) => b.score - a.score);
+}
+/** Use relationships to infer intent context from tokens. Resolves anaphora and finds target/location. */
+export function inferIntent(tokens, recentEntities = []) {
+    const resolvedEntities = [];
+    const impliedRelations = [];
+    let target, location;
+    for (const token of tokens) {
+        const resolved = resolveReference(token, recentEntities) ?? getEntity(token);
+        if (!resolved)
+            continue;
+        resolvedEntities.push({ token, entity: resolved });
+        if (!target && (resolved.type === "service" || resolved.type === "container" || resolved.type === "package"))
+            target = resolved;
+        else if (!location && resolved.type === "server")
+            location = resolved;
+    }
+    if (target && location) {
+        const g = loadKnowledgeGraph();
+        for (const rel of g.relations) {
+            if ((rel.from === target.name && rel.to === location.name) || (rel.from === location.name && rel.to === target.name)) {
+                impliedRelations.push(rel);
+            }
+        }
+    }
+    return { resolvedEntities, impliedRelations, target, location };
+}
+/** General-purpose query — find entities by type and/or property filter. */
+export function queryGraph(filter) {
+    const g = loadKnowledgeGraph();
+    return Object.values(g.entities).filter((ent) => {
+        if (filter.type && ent.type !== filter.type)
+            return false;
+        if (filter.property !== undefined) {
+            const val = ent.properties[filter.property];
+            if (val === undefined)
+                return false;
+            if (filter.value !== undefined && val !== filter.value)
+                return false;
+        }
+        return true;
+    });
+}
+// ─── Graph Builder ──────────────────────────────────────────────────────────
+function loadRulesConfig() {
+    for (const p of [
+        join(import.meta.url.replace("file://", "").replace(/\/[^/]+\/[^/]+$/, ""), "../config/rules.json"),
+        join(process.cwd(), "packages/core/config/rules.json"),
+        join(process.cwd(), "config/rules.json"),
+    ]) {
+        if (existsSync(p)) {
+            try {
+                return JSON.parse(readFileSync(p, "utf-8")).serviceAliases ?? {};
+            }
+            catch { /* skip */ }
+        }
+    }
+    return {};
+}
+function populateFromEntities(g, ents) {
+    for (const [name, srv] of Object.entries(ents.servers)) {
+        g.entities[name] = { name, type: "server", aliases: srv.aliases ?? [],
+            properties: { host: srv.host, ...(srv.user ? { user: srv.user } : {}), ...(srv.description ? { description: srv.description } : {}) } };
+        if (srv.host)
+            g.relations.push({ from: name, to: `ip:${srv.host}`, relation: "has_ip" });
+    }
+    for (const [name, db] of Object.entries(ents.databases)) {
+        g.entities[name] = { name, type: "database", aliases: db.aliases ?? [],
+            properties: { dbType: db.type, host: db.host, dbName: db.name, ...(db.port ? { port: db.port } : {}), ...(db.user ? { user: db.user } : {}) } };
+        if (db.port)
+            g.relations.push({ from: name, to: `port:${db.port}`, relation: "has_port" });
+    }
+    for (const [id, inst] of Object.entries(ents.installations ?? {})) {
+        const props = { service: inst.service, environment: inst.environment };
+        if (inst.path)
+            props.path = inst.path;
+        if (inst.version)
+            props.version = inst.version;
+        if (inst.port)
+            props.port = inst.port;
+        if (inst.model)
+            props.model = inst.model;
+        if (inst.status)
+            props.status = inst.status;
+        g.entities[id] = { name: id, type: "service", aliases: inst.aliases ?? [], properties: props };
+        if (inst.port)
+            g.relations.push({ from: id, to: `port:${inst.port}`, relation: "has_port" });
+        if (inst.model) {
+            const llmName = `llm:${inst.model}`;
+            if (!g.entities[llmName])
+                g.entities[llmName] = { name: llmName, type: "llm", aliases: [inst.model.split("/").pop()], properties: { model: inst.model } };
+            g.relations.push({ from: id, to: llmName, relation: "uses" });
+        }
+        const serverName = Object.keys(ents.servers).find((s) => inst.environment === s || inst.aliases.some((a) => a.includes(s)));
+        if (serverName)
+            g.relations.push({ from: id, to: serverName, relation: "runs_on" });
+    }
+}
+function populateFromRules(g, serviceAliases) {
+    for (const [svc, aliases] of Object.entries(serviceAliases)) {
+        if (!g.entities[svc]) {
+            g.entities[svc] = { name: svc, type: "service", aliases, properties: {} };
+        }
+        else {
+            for (const a of aliases) {
+                if (!g.entities[svc].aliases.includes(a))
+                    g.entities[svc].aliases.push(a);
+            }
+        }
+    }
+}
+function populateFromSystem(g) {
+    let execSync;
+    try {
+        execSync = require("node:child_process").execSync;
+    }
+    catch {
+        return;
+    }
+    const tryExec = (cmd) => { try {
+        return execSync(cmd, { timeout: 5_000, encoding: "utf-8", stdio: ["pipe", "pipe", "pipe"] }).trim();
+    }
+    catch {
+        return "";
+    } };
+    // Docker containers
+    const dockerPs = tryExec("docker ps --format '{{.Names}}\\t{{.Image}}\\t{{.Ports}}' 2>/dev/null");
+    for (const line of (dockerPs || "").split("\n").filter(Boolean)) {
+        const [name, image, ports] = line.split("\t");
+        if (name)
+            g.entities[`container:${name}`] = { name: `container:${name}`, type: "container", aliases: [name], properties: { image: image ?? "", ports: ports ?? "" } };
+    }
+    // Listening ports
+    const ssOut = tryExec("ss -tlnp 2>/dev/null | tail -n +2");
+    for (const line of (ssOut || "").split("\n").filter(Boolean)) {
+        const portM = line.match(/:(\d+)\s/), procM = line.match(/users:\(\("([^"]+)"/);
+        if (!portM)
+            continue;
+        const key = `port:${portM[1]}`, proc = procM?.[1] ?? "unknown";
+        if (!g.entities[key])
+            g.entities[key] = { name: key, type: "port", aliases: [`port ${portM[1]}`], properties: { port: Number(portM[1]), process: proc } };
+        if (proc !== "unknown" && g.entities[proc])
+            g.relations.push({ from: proc, to: key, relation: "has_port" });
+    }
+}
+/** Build the full knowledge graph from all sources. */
+export function buildGraph() {
+    const g = { entities: {}, relations: [], lastBuilt: new Date().toISOString() };
+    populateFromEntities(g, loadEntities(true));
+    populateFromRules(g, loadRulesConfig());
+    populateFromSystem(g);
+    return g;
+}
+/** Force a rebuild of the graph from all sources and persist. */
+export function rebuildGraph() {
+    _graph = buildGraph();
+    saveKnowledgeGraph(_graph);
+    return _graph;
+}
+// ─── Learning from execution ──────────────────────────────────────────────
+/**
+ * Learn from a successfully executed intent.
+ * Grows the graph over time by recording:
+ *   - Services that were restarted/checked (type: service)
+ *   - Servers that were targeted (type: server)
+ *   - Relationships discovered (service → runs_on → server)
+ *   - New entities mentioned by the user
+ *
+ * Called after every successful execution. Persists periodically.
+ */
+let _learnCount = 0;
+export function learnFromExecution(intent, fields, rawText) {
+    const g = loadKnowledgeGraph();
+    const service = fields.service;
+    const environment = fields.environment;
+    const path = fields.path;
+    const target = fields.target;
+    // Learn services
+    if (service && !g.entities[service]) {
+        const type = intent.startsWith("docker.") ? "container" : "service";
+        g.entities[service] = { name: service, type, aliases: [], properties: {} };
+    }
+    // Learn servers/environments
+    if (environment && environment !== "local" && environment !== "localhost" && environment !== "dev") {
+        if (!g.entities[environment]) {
+            g.entities[environment] = { name: environment, type: "server", aliases: [], properties: {} };
+        }
+        // Learn relationship: service runs_on environment
+        if (service) {
+            const rel = { from: service, to: environment, relation: "runs_on" };
+            if (!g.relations.some(r => r.from === rel.from && r.to === rel.to && r.relation === rel.relation)) {
+                g.relations.push(rel);
+            }
+        }
+    }
+    // Learn paths
+    if (path && path !== "." && !g.entities[`path:${path}`]) {
+        g.entities[`path:${path}`] = { name: `path:${path}`, type: "path", aliases: [path], properties: { path } };
+    }
+    // Learn targets (from disk.scan, file operations, etc.)
+    if (target && !g.entities[target]) {
+        g.entities[target] = { name: target, type: "service", aliases: [], properties: {} };
+    }
+    // Learn from specific intents
+    if (intent === "entity.define") {
+        // User taught us a new entity — already handled by entityResolver
+        // but mark the graph as needing a rebuild next time
+        g.lastBuilt = undefined;
+    }
+    // Persist every 5 learn calls (not every single one — too much I/O)
+    _learnCount++;
+    if (_learnCount % 5 === 0) {
+        saveKnowledgeGraph(g);
+    }
+}
+/** Flush any pending graph changes to disk. */
+export function flushGraph() {
+    if (_graph)
+        saveKnowledgeGraph(_graph);
+}

package/dist/nlp/llmFallback.js CHANGED Viewed

@@ -18,7 +18,7 @@ import { detectLocalPlatform } from "../utils/platform.js";
  * Order: explicit config → auto-detect Ollama → nothing.
  */
 export function isLLMConfigured() {
-    return !!(process.env.NOTOKEN_LLM_ENDPOINT || process.env.NOTOKEN_LLM_CLI || detectOllama());
+    return !!(process.env.NOTOKEN_LLM_ENDPOINT || process.env.NOTOKEN_LLM_CLI || detectOllama() || detectCodex());
 }
 /** Which LLM backend is active? */
 export function getLLMBackend() {
@@ -28,8 +28,25 @@ export function getLLMBackend() {
         return "api";
     if (detectOllama())
         return "ollama";
+    if (detectCodex())
+        return "codex";
     return null;
 }
+let codexChecked = false;
+let codexAvailable = false;
+function detectCodex() {
+    if (codexChecked)
+        return codexAvailable;
+    codexChecked = true;
+    try {
+        execSync("command -v codex", { timeout: 1000, stdio: "pipe" });
+        codexAvailable = true;
+    }
+    catch {
+        codexAvailable = false;
+    }
+    return codexAvailable;
+}
 let ollamaChecked = false;
 let ollamaAvailable = false;
 function detectOllama() {
@@ -67,6 +84,12 @@ export async function llmFallback(rawText, context) {
         if (apiResult)
             return apiResult;
     }
+    // Try Codex (auto-detected local)
+    if (detectCodex()) {
+        const codexResult = await tryLLMCli(rawText, { ...context, _cli: "codex" });
+        if (codexResult)
+            return codexResult;
+    }
     // Try Ollama (auto-detected local)
     if (detectOllama()) {
         const ollamaResult = await tryOllama(rawText, context);
@@ -91,6 +114,10 @@ async function tryLLMCli(rawText, context) {
             execSync("command -v chatgpt", { stdio: "pipe" });
             cmd = `chatgpt ${JSON.stringify(prompt)}`;
         }
+        else if (cli === "codex") {
+            execSync("command -v codex", { stdio: "pipe" });
+            cmd = `codex ${JSON.stringify(prompt)}`;
+        }
         else {
             return null;
         }

package/dist/nlp/multiClassifier.js CHANGED Viewed

@@ -1,9 +1,14 @@
 import { loadIntents, loadRules } from "../utils/config.js";
 import { semanticParse, fuzzyMatch } from "./semantic.js";
 import { parseByRules } from "./ruleParser.js";
+import { existsSync, readFileSync } from "node:fs";
+import { resolve, dirname } from "node:path";
+import { fileURLToPath } from "node:url";
+import { expandQuery } from "./conceptExpansion.js";
 const CLASSIFIER_WEIGHTS = {
     synonym: 1.0,
     semantic: 0.8,
+    vector: 0.7,
     context: 0.6,
     fuzzy: 0.5,
 };
@@ -12,8 +17,24 @@ const CLASSIFIER_WEIGHTS = {
  */
 export function classifyMulti(rawText, recentIntents) {
     const votes = [];
-    // 1. Synonym classifier (existing rule parser)
+    // 0. Expand query with synonym clusters for better matching
+    // "reboot the server" → "reboot the server restart cycle reload bounce"
+    let expandedText = rawText;
+    try {
+        expandedText = expandQuery(rawText);
+    }
+    catch { /* concept expansion not available */ }
+    // 1. Synonym classifier — run on both original AND expanded text
     votes.push(...classifySynonym(rawText));
+    if (expandedText !== rawText) {
+        // Run again on expanded text but with lower weight
+        const expandedVotes = classifySynonym(expandedText);
+        for (const v of expandedVotes) {
+            v.confidence *= 0.7; // Expansion matches are less certain
+            v.reason += " (expanded)";
+        }
+        votes.push(...expandedVotes);
+    }
     // 2. Semantic classifier (compromise-powered)
     votes.push(...classifySemantic(rawText));
     // 3. Context classifier (recent history)
@@ -22,19 +43,23 @@ export function classifyMulti(rawText, recentIntents) {
     }
     // 4. Fuzzy classifier (keyboard distance)
     votes.push(...classifyFuzzy(rawText));
-    // Merge votes into weighted scores
+    // 5. Vector classifier (precomputed TF-IDF cosine similarity)
+    votes.push(...classifyVector(rawText));
+    // Merge votes: max weighted score + bonus for agreement
     const scoreMap = new Map();
     for (const vote of votes) {
         const weight = CLASSIFIER_WEIGHTS[vote.classifier] ?? 1.0;
-        const existing = scoreMap.get(vote.intent) ?? { total: 0, count: 0 };
-        existing.total += vote.confidence * weight;
+        const weighted = vote.confidence * weight;
+        const existing = scoreMap.get(vote.intent) ?? { maxWeighted: 0, totalWeighted: 0, count: 0 };
+        existing.maxWeighted = Math.max(existing.maxWeighted, weighted);
+        existing.totalWeighted += weighted;
         existing.count += 1;
         scoreMap.set(vote.intent, existing);
     }
     const scores = Array.from(scoreMap.entries())
-        .map(([intent, { total, count }]) => ({
+        .map(([intent, { maxWeighted, count }]) => ({
         intent,
-        score: total / count,
+        score: maxWeighted + Math.min(0.15, (count - 1) * 0.05),
         votes: count,
     }))
         .sort((a, b) => b.score - a.score);
@@ -179,3 +204,63 @@ function scoreEntityMatch(parse, def) {
     }
     return matches / total;
 }
+let _vectorData = null;
+function loadVectors() {
+    if (_vectorData)
+        return _vectorData;
+    const paths = [
+        resolve(dirname(fileURLToPath(import.meta.url)), "../../config/intent-vectors.json"),
+        resolve(process.cwd(), "config/intent-vectors.json"),
+    ];
+    for (const p of paths) {
+        if (existsSync(p)) {
+            try {
+                _vectorData = JSON.parse(readFileSync(p, "utf-8"));
+                return _vectorData;
+            }
+            catch { /* skip */ }
+        }
+    }
+    return null;
+}
+const VECTOR_STOP = new Set(["a", "an", "the", "is", "it", "in", "on", "to", "for", "of", "and", "or", "my", "me", "i", "we", "you", "do", "does", "did", "be", "am", "are", "was", "were", "have", "has", "had", "this", "that", "what", "which", "who", "how", "where", "when", "why", "not", "no", "but", "if", "so", "at", "by", "with", "from", "up", "out", "can", "could", "would", "should", "will", "may", "might", "just", "about", "all", "please"]);
+function classifyVector(rawText) {
+    const data = loadVectors();
+    if (!data)
+        return [];
+    const tokens = rawText.toLowerCase().replace(/[^a-z0-9_.\-\/]/g, " ").split(/\s+/).filter((w) => w.length > 1 && !VECTOR_STOP.has(w));
+    if (tokens.length === 0)
+        return [];
+    const vocabIndex = new Map(data.vocab.map((v, i) => [v, i]));
+    const inputVec = {};
+    let magnitude = 0;
+    const tf = new Map();
+    for (const t of tokens)
+        tf.set(t, (tf.get(t) ?? 0) + 1);
+    for (const [term, count] of tf) {
+        const idx = vocabIndex.get(term);
+        if (idx !== undefined) {
+            inputVec[idx] = count;
+            magnitude += count * count;
+        }
+    }
+    magnitude = Math.sqrt(magnitude);
+    if (magnitude === 0)
+        return [];
+    for (const idx of Object.keys(inputVec))
+        inputVec[Number(idx)] /= magnitude;
+    const votes = [];
+    for (const [intentName, intentVec] of Object.entries(data.vectors)) {
+        let dot = 0;
+        for (const [idx, val] of Object.entries(inputVec)) {
+            const iv = intentVec[idx];
+            if (iv)
+                dot += val * iv;
+        }
+        if (dot > 0.1) {
+            votes.push({ classifier: "vector", intent: intentName, confidence: Math.min(0.95, dot), reason: `TF-IDF cosine: ${dot.toFixed(3)}` });
+        }
+    }
+    votes.sort((a, b) => b.confidence - a.confidence);
+    return votes.slice(0, 3);
+}

package/dist/nlp/multiIntent.d.ts ADDED Viewed

@@ -0,0 +1,43 @@
+/**
+ * Multi-intent parser.
+ *
+ * Splits compound sentences into individual intents and creates a plan.
+ *
+ * "check if the firewall is blocking port 443 and also check dns for my domain"
+ * →  Step 1: firewall.list (check port 443)
+ *    Step 2: dns.lookup (check domain)
+ *
+ * "show me disk usage, check memory, and list running containers"
+ * →  Step 1: server.check_disk
+ *    Step 2: server.check_memory
+ *    Step 3: docker.list
+ *
+ * Splitting rules:
+ *   - Split on: "and", "also", "then", "after that", ",", ";"
+ *   - But NOT inside quoted strings or after "and" that joins nouns ("cats and dogs")
+ *   - Each part is parsed independently through rule parser + concept router
+ *   - Only creates a plan if 2+ distinct intents are found
+ */
+export interface PlanStep { // one step of a multi-intent plan
+    intent: string; // intent name, e.g. "firewall.list" or "docker.list" as in the examples above
+    rawText: string; // NOTE(review): presumably the part of the sentence this step was parsed from — confirm
+    confidence: number; // NOTE(review): scale is not visible in this declaration file — confirm range
+    description: string; // human-readable summary of the step
+    requiresConfirmation: boolean; // NOTE(review): presumably set for steps the user must approve first — confirm
+    riskLevel: string; // NOTE(review): allowed values are not declared here — confirm against the implementation
+}
+export interface MultiIntentPlan { // result of parsing a possibly compound sentence
+    steps: PlanStep[]; // the plan's steps
+    originalText: string; // NOTE(review): presumably the unsplit input sentence — confirm
+    isSingleIntent: boolean; // NOTE(review): presumably true when only one intent was found — confirm
+}
+/**
+ * Split a compound sentence into parts.
+ *
+ * @param text the sentence to split
+ * @returns the parts as strings
+ */
+export declare function splitCompoundSentence(text: string): string[];
+/**
+ * Parse a potentially compound sentence into a multi-step plan.
+ * Returns a single-step plan if only one intent is found.
+ *
+ * @param rawText the sentence to parse
+ * @returns the resulting plan
+ */
+export declare function parseMultiIntent(rawText: string): MultiIntentPlan;
+export declare function formatPlanSteps(plan: MultiIntentPlan): string; // NOTE(review): presumably renders the plan's steps as display text — confirm