npm - knolo-core - Versions diffs - 0.3.0 → 3.1.1 - Mend

knolo-core 0.3.0 → 3.1.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (26)

package/DOCS.md +16 -2
package/README.md +376 -46
package/bin/knolo.mjs +256 -45
package/dist/agent.d.ts +53 -0
package/dist/agent.js +175 -0
package/dist/builder.d.ts +2 -0
package/dist/builder.js +28 -6
package/dist/index.d.ts +14 -2
package/dist/index.js +9 -2
package/dist/pack.d.ts +2 -0
package/dist/pack.js +22 -3
package/dist/query.d.ts +1 -0
package/dist/query.js +43 -1
package/dist/router.d.ts +28 -0
package/dist/router.js +74 -0
package/dist/routing_profile.d.ts +19 -0
package/dist/routing_profile.js +102 -0
package/dist/tool_gate.d.ts +3 -0
package/dist/tool_gate.js +8 -0
package/dist/tool_parse.d.ts +2 -0
package/dist/tool_parse.js +102 -0
package/dist/tools.d.ts +27 -0
package/dist/tools.js +34 -0
package/dist/trace.d.ts +45 -0
package/dist/trace.js +12 -0
package/package.json +4 -2

package/DOCS.md CHANGED Viewed

@@ -71,8 +71,16 @@ npx knolo docs.json knowledge.knolo
 # semantic-enabled build (embeddings JSON + model id)
 npx knolo docs.json knowledge.knolo --embeddings embeddings.json --model-id text-embedding-3-small
+# embed agents from a local directory (.json/.yml/.yaml)
+npx knolo docs.json knowledge.knolo --agents ./examples/agents
 ```
+### Agents and namespace binding
+When agent definitions are embedded into `meta.agents`, `resolveAgent(pack, { agentId, query, patch })` enforces **strict namespace binding**: the agent's `retrievalDefaults.namespace` always overrides any caller-supplied `query.namespace`. This keeps retrieval deterministic and on-policy for each agent.
 ---
 ## Concepts
@@ -176,9 +184,15 @@ const hits: Hit[] = query(pack, '“react native bridge” throttling', {
 ### Semantic helper ergonomics
 ```ts
-import { hasSemantic, validateSemanticQueryOptions } from "knolo-core";
+import { hasSemantic, validateQueryOptions, validateSemanticQueryOptions } from "knolo-core";
 if (hasSemantic(pack)) {
+  validateQueryOptions({
+    topK: 10,
+    namespace: "mobile",
+    queryExpansion: { enabled: true, docs: 3, terms: 4 },
+  });
   validateSemanticQueryOptions({
     enabled: true,
     topN: 40,
@@ -188,7 +202,7 @@ if (hasSemantic(pack)) {
 }
 ```
-`validateSemanticQueryOptions(...)` throws useful errors for invalid option types/ranges (`topN`, `minLexConfidence`, blend weights, missing `Float32Array` embedding type).
+`validateQueryOptions(...)` and `validateSemanticQueryOptions(...)` throw useful errors for invalid option types/ranges (for example `topK`, `queryExpansion.docs`, `topN`, `minLexConfidence`, blend weights, and missing `Float32Array` embedding types).
 **What the ranker does**

package/README.md CHANGED Viewed

@@ -16,7 +16,7 @@ Build a portable `.knolo` pack and run deterministic lexical retrieval with opti
 ---
-## ✨ What’s in v0.3.0
+## ✨ What’s in v0.3.1
 - **Deterministic lexical quality upgrades**
   - required phrase enforcement (quoted + `requirePhrases`)
@@ -31,6 +31,10 @@ Build a portable `.knolo` pack and run deterministic lexical retrieval with opti
 - **Stability & diversity**
   - near-duplicate suppression + MMR diversity
   - KNS tie-break signal for stable close-score ordering
+- **Agent/runtime utilities**
+  - embedded agent registries with strict namespace binding
+  - tool call parsing + policy gating helpers
+  - provider-agnostic routing profile + route decision validators
 - **Portable packs**
   - single `.knolo` artifact
   - semantic payload embedded directly in pack when enabled
@@ -54,26 +58,34 @@ npm run build
 ---
+## 🧪 Playground
+Try KnoLo Core directly in your browser with the hosted playground:
+- https://playgrounds.knolo.dev
+---
 ## 🚀 Quickstart
 ### 1) Build + mount + query
 ```ts
-import { buildPack, mountPack, query, makeContextPatch } from "knolo-core";
+import { buildPack, mountPack, query, makeContextPatch } from 'knolo-core';
 const docs = [
   {
-    id: "bridge-guide",
-    namespace: "mobile",
-    heading: "React Native Bridge",
-    text: "The bridge sends messages between JS and native modules. Throttling limits event frequency."
+    id: 'bridge-guide',
+    namespace: 'mobile',
+    heading: 'React Native Bridge',
+    text: 'The bridge sends messages between JS and native modules. Throttling limits event frequency.',
   },
   {
-    id: "perf-notes",
-    namespace: "mobile",
-    heading: "Debounce vs Throttle",
-    text: "Debounce waits for silence; throttle enforces a maximum trigger rate."
-  }
+    id: 'perf-notes',
+    namespace: 'mobile',
+    heading: 'Debounce vs Throttle',
+    text: 'Debounce waits for silence; throttle enforces a maximum trigger rate.',
+  },
 ];
 const bytes = await buildPack(docs);
@@ -81,11 +93,11 @@ const kb = await mountPack({ src: bytes });
 const hits = query(kb, '"react native" throttle', {
   topK: 5,
-  requirePhrases: ["maximum trigger rate"],
-  namespace: "mobile"
+  requirePhrases: ['maximum trigger rate'],
+  namespace: 'mobile',
 });
-const patch = makeContextPatch(hits, { budget: "small" });
+const patch = makeContextPatch(hits, { budget: 'small' });
 console.log(hits, patch);
 ```
@@ -95,34 +107,45 @@ console.log(hits, patch);
 ```json
 [
-  { "id": "guide", "heading": "Guide", "text": "Install deps.\n\n## Throttle\nLimit event frequency." },
-  { "id": "faq", "heading": "FAQ", "text": "What is throttling? It reduces event frequency." }
+  {
+    "id": "guide",
+    "heading": "Guide",
+    "text": "Install deps.\n\n## Throttle\nLimit event frequency."
+  },
+  {
+    "id": "faq",
+    "heading": "FAQ",
+    "text": "What is throttling? It reduces event frequency."
+  }
 ]
 ```
 ```bash
 npx knolo docs.json knowledge.knolo
+# embed agents from a local directory (.json/.yml/.yaml)
+npx knolo docs.json knowledge.knolo --agents ./examples/agents
 ```
 Then query in app:
 ```ts
-import { mountPack, query } from "knolo-core";
+import { mountPack, query } from 'knolo-core';
-const kb = await mountPack({ src: "./knowledge.knolo" });
-const hits = query(kb, "throttle events", { topK: 3 });
+const kb = await mountPack({ src: './knowledge.knolo' });
+const hits = query(kb, 'throttle events', { topK: 3 });
 ```
 ---
-## 🔀 Hybrid retrieval with embeddings (recommended direction)
+## 🔀 Hybrid retrieval with embeddings (optional)
 KnoLo’s core retrieval remains lexical-first and deterministic. Semantic signals are added as an **optional rerank stage** when lexical confidence is low (or forced).
 ### Build a semantic-enabled pack
 ```ts
-import { buildPack } from "knolo-core";
+import { buildPack } from 'knolo-core';
 // embeddings must align 1:1 with docs/block order
 const embeddings: Float32Array[] = await embedDocumentsInOrder(docs);
@@ -130,32 +153,32 @@ const embeddings: Float32Array[] = await embedDocumentsInOrder(docs);
 const bytes = await buildPack(docs, {
   semantic: {
     enabled: true,
-    modelId: "text-embedding-3-small",
+    modelId: 'text-embedding-3-small',
     embeddings,
-    quantization: { type: "int8_l2norm", perVectorScale: true }
-  }
+    quantization: { type: 'int8_l2norm', perVectorScale: true },
+  },
 });
 ```
 ### Query with semantic rerank
 ```ts
-import { mountPack, query, hasSemantic } from "knolo-core";
+import { mountPack, query, hasSemantic } from 'knolo-core';
 const kb = await mountPack({ src: bytes });
-const queryEmbedding = await embedQuery("react native bridge throttling");
+const queryEmbedding = await embedQuery('react native bridge throttling');
-const hits = query(kb, "react native bridge throttling", {
+const hits = query(kb, 'react native bridge throttling', {
   topK: 8,
   semantic: {
     enabled: hasSemantic(kb),
-    mode: "rerank",
+    mode: 'rerank',
     topN: 50,
     minLexConfidence: 0.35,
     blend: { enabled: true, wLex: 0.75, wSem: 0.25 },
     queryEmbedding,
-    force: false
-  }
+    force: false,
+  },
 });
 ```
@@ -165,8 +188,8 @@ const hits = query(kb, "react native bridge throttling", {
 import {
   quantizeEmbeddingInt8L2Norm,
   encodeScaleF16,
-  decodeScaleF16
-} from "knolo-core";
+  decodeScaleF16,
+} from 'knolo-core';
 const { q, scale } = quantizeEmbeddingInt8L2Norm(queryEmbedding);
 const packed = encodeScaleF16(scale);
@@ -188,25 +211,74 @@ type BuildInputDoc = {
 };
 type BuildPackOptions = {
+  agents?: AgentRegistry | AgentDefinitionV1[];
   semantic?: {
     enabled: boolean;
     modelId: string;
     embeddings: Float32Array[];
     quantization?: {
-      type: "int8_l2norm";
+      type: 'int8_l2norm';
       perVectorScale?: true;
     };
   };
 };
 ```
+### Agents in pack metadata
+Agents are optional and embedded in `meta.agents`, so a single `.knolo` artifact can ship retrieval behavior and prompt defaults together (for example, to on-prem deployments). Agent registries are validated once at `mountPack()` time, so an invalid embedded registry fails fast during mount.
+Agent namespace binding is **strict**: when `resolveAgent()` composes retrieval options, `retrievalDefaults.namespace` is always enforced and caller-provided `query.namespace` is ignored.
+```ts
+type AgentPromptTemplate = string[] | { format: 'markdown'; template: string };
+type AgentRegistry = {
+  version: 1;
+  agents: AgentDefinitionV1[];
+};
+type PackMeta = {
+  version: number;
+  stats: { docs: number; blocks: number; terms: number; avgBlockLen?: number };
+  agents?: AgentRegistry;
+};
+type AgentDefinitionV1 = {
+  id: string;
+  version: 1;
+  name?: string;
+  description?: string;
+  systemPrompt: AgentPromptTemplate;
+  retrievalDefaults: {
+    namespace: string[]; // required
+    topK?: number;
+    queryExpansion?: QueryOptions['queryExpansion'];
+    semantic?: Omit<
+      NonNullable<QueryOptions['semantic']>,
+      'queryEmbedding' | 'enabled' | 'force'
+    > & { enabled?: boolean };
+    minScore?: number;
+    requirePhrases?: string[];
+    source?: string[];
+  };
+  toolPolicy?: { mode: 'allow' | 'deny'; tools: string[] };
+  metadata?: Record<string, string | number | boolean | null>;
+};
+```
 ### `mountPack({ src }) => Promise<Pack>`
 ```ts
 type Pack = {
   meta: {
     version: number;
-    stats: { docs: number; blocks: number; terms: number; avgBlockLen?: number };
+    stats: {
+      docs: number;
+      blocks: number;
+      terms: number;
+      avgBlockLen?: number;
+    };
   };
   lexicon: Map<string, number>;
   postings: Uint32Array;
@@ -219,7 +291,7 @@ type Pack = {
     version: 1;
     modelId: string;
     dims: number;
-    encoding: "int8_l2norm";
+    encoding: 'int8_l2norm';
     perVectorScale: boolean;
     vecs: Int8Array;
     scales?: Uint16Array;
@@ -245,7 +317,7 @@ type QueryOptions = {
   };
   semantic?: {
     enabled?: boolean;
-    mode?: "rerank";
+    mode?: 'rerank';
     topN?: number;
     minLexConfidence?: number;
     blend?: {
@@ -267,6 +339,264 @@ type Hit = {
 };
 ```
+### Agent runtime helpers
+- `listAgents(pack) => string[]`
+- `getAgent(pack, agentId) => AgentDefinitionV1 | undefined`
+- `resolveAgent(pack, { agentId, query?, patch? }) => { agent, systemPrompt, retrievalOptions }`
+- `buildSystemPrompt(agent, patch?) => string`
+- `isToolAllowed(agent, toolId) => boolean` (defaults to allow-all when the agent has no `toolPolicy`)
+- `assertToolAllowed(agent, toolId) => void` (throws a deterministic error when the tool is blocked)
+- `parseToolCallV1FromText(text) => ToolCallV1 | null` (safe parser for model outputs)
+- `assertToolCallAllowed(agent, call) => void` (policy gate for parsed calls)
+- `isToolCallV1(value) / isToolResultV1(value)` (runtime-safe type guards)
+- `getAgentRoutingProfileV1(agent) => AgentRoutingProfileV1`
+- `getPackRoutingProfilesV1(pack) => AgentRoutingProfileV1[]`
+- `isRouteDecisionV1(value) => boolean` (strict contract guard for router output)
+- `validateRouteDecisionV1(decision, registryById) => { ok: true } | { ok: false; error: string }`
+- `selectAgentIdFromRouteDecisionV1(decision, registryById, { fallbackAgentId? }) => { agentId, reason }`
+### Routing discoverability conventions
+To make an agent easier to route, use these optional `metadata` keys on `AgentDefinitionV1`:
+- `tags`: comma-separated (`"shopping,checkout"`) or JSON array string (`"[\"shopping\",\"checkout\"]"`)
+- `examples`: comma-separated, newline-separated, or JSON array string
+- `capabilities`: comma-separated, newline-separated, or JSON array string
+- `heading`: short UI heading shown in routing cards
+`knolo-core` parses these into a compact routing profile, trimming values, removing duplicates, and applying caps. It never throws on badly formatted metadata.
+```ts
+type AgentRoutingProfileV1 = {
+  agentId: string;
+  namespace?: string;
+  heading?: string;
+  description?: string;
+  tags: string[];
+  examples: string[];
+  capabilities: string[];
+  toolPolicy?: unknown;
+  toolPolicySummary?: {
+    mode: 'allow_all' | 'deny_all' | 'mixed' | 'unknown';
+    allowed?: string[];
+    denied?: string[];
+  };
+};
+```
+Example profile payload:
+```json
+{
+  "agentId": "shopping.agent",
+  "namespace": "shopping",
+  "heading": "Shopping Assistant",
+  "description": "Handles product lookup, checkout help, and order tracking.",
+  "tags": ["shopping", "checkout", "order-status"],
+  "examples": ["track my order", "find running shoes under $120"],
+  "capabilities": ["catalog_search", "order_lookup"],
+  "toolPolicySummary": {
+    "mode": "mixed",
+    "allowed": ["search_docs", "order_lookup"]
+  }
+}
+```
+### Route decision contract
+`knolo-core` does not call Ollama (or any model provider). A runtime can call any router model, then validate the output with this contract:
+```ts
+type RouteCandidateV1 = {
+  agentId: string;
+  score: number; // 0..1
+  why?: string;
+};
+type RouteDecisionV1 = {
+  type: 'route_decision';
+  intent?: string;
+  entities?: Record<string, unknown>;
+  candidates: RouteCandidateV1[];
+  selected: string;
+  needsTools?: string[];
+  risk?: 'low' | 'med' | 'high';
+};
+```
+JSON example:
+```json
+{
+  "type": "route_decision",
+  "intent": "order_tracking",
+  "entities": { "orderId": "A-1023" },
+  "candidates": [
+    { "agentId": "shopping.agent", "score": 0.91, "why": "Order-related intent" },
+    { "agentId": "returns.agent", "score": 0.37 }
+  ],
+  "selected": "shopping.agent",
+  "needsTools": ["order_lookup"],
+  "risk": "low"
+}
+```
+Validation and selection notes:
+- `isRouteDecisionV1(...)` is strict and rejects malformed payloads.
+- `validateRouteDecisionV1(...)` requires `selected` and every candidate `agentId` to exist in the mounted registry and rejects duplicate candidate ids.
+- `selectAgentIdFromRouteDecisionV1(...)` is deterministic and never throws; it returns the first of the following that applies:
+  1. use `selected` if registered,
+  2. else highest-score registered candidate,
+  3. else caller `fallbackAgentId` if valid,
+  4. else lexicographically first registered agent id.
+### Router runtime flow (provider-agnostic)
+1. Receive user input text.
+2. Build routing profiles from mounted pack agents via `getPackRoutingProfilesV1(pack)`.
+3. Send input + profiles to your router model (Ollama or any provider) outside `knolo-core`.
+4. Parse model output JSON and gate with `isRouteDecisionV1`.
+5. Validate against mounted registry with `validateRouteDecisionV1`.
+6. Pick final agent using `selectAgentIdFromRouteDecisionV1`.
+7. Call `resolveAgent(pack, { agentId, ... })` and run your existing loop.
+### Tool call + result contracts
+```ts
+type ToolCallV1 = {
+  type: 'tool_call';
+  callId: string;
+  tool: string;
+  args: Record<string, unknown>;
+};
+type ToolResultV1 = {
+  type: 'tool_result';
+  callId: string;
+  tool: string;
+  ok: boolean;
+  output?: unknown; // when ok=true
+  error?: { message: string; code?: string; details?: unknown }; // when ok=false
+};
+```
+JSON examples:
+```json
+{
+  "type": "tool_call",
+  "callId": "call-42",
+  "tool": "search_docs",
+  "args": { "query": "bridge throttle" }
+}
+```
+```json
+{
+  "type": "tool_result",
+  "callId": "call-42",
+  "tool": "search_docs",
+  "ok": true,
+  "output": { "hits": [{ "id": "mobile-doc" }] }
+}
+```
+### Runtime loop shape (model-agnostic)
+1. Run model with current conversation state.
+2. Parse text output with `parseToolCallV1FromText(...)`.
+3. If parsed: gate with `assertToolCallAllowed(resolved.agent, call)`.
+4. Runtime executes the tool and creates `ToolResultV1`.
+5. Feed the tool result back into the conversation and continue until completion.
+### Trace events for timeline UIs
+```ts
+type TraceEventV1 =
+  | {
+      type: 'route.requested';
+      ts: string;
+      text: string;
+      agentCount: number;
+    }
+  | {
+      type: 'route.decided';
+      ts: string;
+      decision: RouteDecisionV1;
+      selectedAgentId: string;
+    }
+  | { type: 'agent.selected'; ts: string; agentId: string; namespace?: string }
+  | {
+      type: 'prompt.resolved';
+      ts: string;
+      agentId: string;
+      promptHash?: string;
+      patchKeys?: string[];
+    }
+  | { type: 'tool.requested'; ts: string; agentId: string; call: ToolCallV1 }
+  | {
+      type: 'tool.executed';
+      ts: string;
+      agentId: string;
+      result: ToolResultV1;
+      durationMs?: number;
+    }
+  | {
+      type: 'run.completed';
+      ts: string;
+      agentId: string;
+      status: 'ok' | 'error';
+    };
+```
+Helpers: `nowIso()` for timestamps and `createTrace()` for lightweight trace collection.
+### Build a pack with agents and resolve at runtime
+```ts
+import {
+  buildPack,
+  mountPack,
+  resolveAgent,
+  query,
+  isToolAllowed,
+  assertToolAllowed,
+} from 'knolo-core';
+const bytes = await buildPack(docs, {
+  agents: [
+    {
+      id: 'mobile.agent',
+      version: 1,
+      systemPrompt: {
+        format: 'markdown',
+        template: 'You are {{team}} support.',
+      },
+      retrievalDefaults: { namespace: ['mobile'], topK: 5 },
+      toolPolicy: { mode: 'allow', tools: ['search_docs'] },
+    },
+  ],
+});
+const pack = await mountPack({ src: bytes });
+const resolved = resolveAgent(pack, {
+  agentId: 'mobile.agent',
+  patch: { team: 'mobile' },
+  query: { namespace: ['backend'], topK: 8 },
+});
+console.log(resolved.retrievalOptions.namespace); // ['mobile'] (strict binding)
+if (isToolAllowed(resolved.agent, 'search_docs')) {
+  // invoke search_docs
+}
+assertToolAllowed(resolved.agent, 'search_docs');
+const hits = query(pack, 'bridge throttle', resolved.retrievalOptions);
+```
 ### `makeContextPatch(hits, { budget }) => ContextPatch`
 Budgets: `"mini" | "small" | "full"`
@@ -278,10 +608,10 @@ Budgets: `"mini" | "small" | "full"`
 ### Namespace + source filtering
 ```ts
-const hits = query(kb, "retry backoff", {
-  namespace: ["sdk", "api"],
-  source: ["errors-guide", "http-reference"],
-  topK: 6
+const hits = query(kb, 'retry backoff', {
+  namespace: ['sdk', 'api'],
+  source: ['errors-guide', 'http-reference'],
+  topK: 6,
 });
 ```
@@ -290,29 +620,29 @@ const hits = query(kb, "retry backoff", {
 If your query has no free (unquoted) tokens but includes required phrases, KnoLo still forms candidates from the phrase tokens and enforces phrase presence.
 ```ts
-const hits = query(kb, '"event loop"', { requirePhrases: ["single thread"] });
+const hits = query(kb, '"event loop"', { requirePhrases: ['single thread'] });
 ```
 ### Precision mode with minimum score
 ```ts
-const strictHits = query(kb, "jwt refresh token rotation", {
+const strictHits = query(kb, 'jwt refresh token rotation', {
   topK: 5,
-  minScore: 2.5
+  minScore: 2.5,
 });
 ```
 ### Validate semantic query options early
 ```ts
-import { validateSemanticQueryOptions } from "knolo-core";
+import { validateSemanticQueryOptions } from 'knolo-core';
 validateSemanticQueryOptions({
   enabled: true,
   topN: 40,
   minLexConfidence: 0.3,
   blend: { enabled: true, wLex: 0.8, wSem: 0.2 },
-  queryEmbedding
+  queryEmbedding,
 });
 ```
@@ -356,7 +686,7 @@ Yes. Runtime text encoder/decoder compatibility is included.
 ---
-## 🗺️ Direction / roadmap
+## 🗺️ Roadmap
 - stronger hybrid retrieval evaluation tooling
 - richer pack introspection and diagnostics