npm - @kaleidorg/mind - Versions diffs - 0.2.0 → 0.4.0 - Mend

@kaleidorg/mind 0.2.0 → 0.4.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (130) hide show

package/dist/capabilities.d.ts +4 -0
package/dist/capabilities.d.ts.map +1 -1
package/dist/capabilities.js +7 -0
package/dist/capabilities.js.map +1 -1
package/dist/engine.d.ts +9 -0
package/dist/engine.d.ts.map +1 -1
package/dist/engine.js +1 -0
package/dist/engine.js.map +1 -1
package/dist/funnel.d.ts +6 -0
package/dist/funnel.d.ts.map +1 -1
package/dist/funnel.js +26 -6
package/dist/funnel.js.map +1 -1
package/dist/index.d.ts +9 -1
package/dist/index.d.ts.map +1 -1
package/dist/index.js +8 -0
package/dist/index.js.map +1 -1
package/dist/kaleidoswap/contract.d.ts +72 -0
package/dist/kaleidoswap/contract.d.ts.map +1 -0
package/dist/kaleidoswap/contract.js +125 -0
package/dist/kaleidoswap/contract.js.map +1 -0
package/dist/knowledge/btc-map.d.ts +87 -0
package/dist/knowledge/btc-map.d.ts.map +1 -0
package/dist/knowledge/btc-map.js +365 -0
package/dist/knowledge/btc-map.js.map +1 -0
package/dist/lsps1/contract.d.ts +55 -0
package/dist/lsps1/contract.d.ts.map +1 -0
package/dist/lsps1/contract.js +91 -0
package/dist/lsps1/contract.js.map +1 -0
package/dist/memory/store.d.ts +7 -1
package/dist/memory/store.d.ts.map +1 -1
package/dist/memory/store.js +43 -3
package/dist/memory/store.js.map +1 -1
package/dist/memory/types.d.ts +12 -0
package/dist/memory/types.d.ts.map +1 -1
package/dist/qvac/assistant.d.ts +73 -0
package/dist/qvac/assistant.d.ts.map +1 -0
package/dist/qvac/assistant.js +97 -0
package/dist/qvac/assistant.js.map +1 -0
package/dist/qvac/config.d.ts +64 -0
package/dist/qvac/config.d.ts.map +1 -0
package/dist/qvac/config.js +71 -0
package/dist/qvac/config.js.map +1 -0
package/dist/qvac/delegate.d.ts +48 -0
package/dist/qvac/delegate.d.ts.map +1 -0
package/dist/qvac/delegate.js +51 -0
package/dist/qvac/delegate.js.map +1 -0
package/dist/qvac/index.d.ts +19 -0
package/dist/qvac/index.d.ts.map +1 -0
package/dist/qvac/index.js +19 -0
package/dist/qvac/index.js.map +1 -0
package/dist/qvac/parse.d.ts +44 -0
package/dist/qvac/parse.d.ts.map +1 -0
package/dist/qvac/parse.js +28 -0
package/dist/qvac/parse.js.map +1 -0
package/dist/qvac/provider.d.ts +49 -0
package/dist/qvac/provider.d.ts.map +1 -0
package/dist/qvac/provider.js +68 -0
package/dist/qvac/provider.js.map +1 -0
package/dist/qvac/stream.d.ts +37 -0
package/dist/qvac/stream.d.ts.map +1 -0
package/dist/qvac/stream.js +29 -0
package/dist/qvac/stream.js.map +1 -0
package/dist/qvac/text.d.ts +19 -0
package/dist/qvac/text.d.ts.map +1 -0
package/dist/qvac/text.js +56 -0
package/dist/qvac/text.js.map +1 -0
package/dist/qvac/voice.d.ts +69 -0
package/dist/qvac/voice.d.ts.map +1 -0
package/dist/qvac/voice.js +51 -0
package/dist/qvac/voice.js.map +1 -0
package/dist/recipe/kaleidoswap-atomic.d.ts +27 -0
package/dist/recipe/kaleidoswap-atomic.d.ts.map +1 -0
package/dist/recipe/kaleidoswap-atomic.js +111 -0
package/dist/recipe/kaleidoswap-atomic.js.map +1 -0
package/dist/recipe/runner.d.ts.map +1 -1
package/dist/recipe/runner.js +13 -1
package/dist/recipe/runner.js.map +1 -1
package/dist/skills/registry.d.ts.map +1 -1
package/dist/skills/registry.js +20 -2
package/dist/skills/registry.js.map +1 -1
package/dist/wallet/confirm.d.ts +12 -0
package/dist/wallet/confirm.d.ts.map +1 -0
package/dist/wallet/confirm.js +67 -0
package/dist/wallet/confirm.js.map +1 -0
package/package.json +16 -1
package/skills/README.md +6 -1
package/skills/kaleido-lsps/SKILL.md +56 -0
package/skills/kaleido-trading/SKILL.md +85 -18
package/skills/merchant-finder/SKILL.md +87 -0
package/skills/paid-data/SKILL.md +12 -0
package/skills/wallet-assistant/SKILL.md +38 -0
package/src/capabilities.ts +12 -0
package/src/context/context.test.ts +6 -2
package/src/engine.ts +6 -0
package/src/funnel.ts +32 -7
package/src/index.ts +43 -0
package/src/kaleidoswap/contract.test.ts +147 -0
package/src/kaleidoswap/contract.ts +212 -0
package/src/knowledge/btc-map.test.ts +188 -0
package/src/knowledge/btc-map.ts +446 -0
package/src/lsps1/contract.test.ts +81 -0
package/src/lsps1/contract.ts +132 -0
package/src/memory/memory.test.ts +55 -0
package/src/memory/store.ts +49 -4
package/src/memory/types.ts +13 -0
package/src/qvac/assistant.test.ts +132 -0
package/src/qvac/assistant.ts +146 -0
package/src/qvac/config.test.ts +44 -0
package/src/qvac/config.ts +76 -0
package/src/qvac/delegate.test.ts +68 -0
package/src/qvac/delegate.ts +71 -0
package/src/qvac/index.ts +72 -0
package/src/qvac/parse.test.ts +52 -0
package/src/qvac/parse.ts +57 -0
package/src/qvac/provider.test.ts +107 -0
package/src/qvac/provider.ts +124 -0
package/src/qvac/stream.test.ts +79 -0
package/src/qvac/stream.ts +56 -0
package/src/qvac/text.test.ts +70 -0
package/src/qvac/text.ts +60 -0
package/src/qvac/voice.test.ts +151 -0
package/src/qvac/voice.ts +122 -0
package/src/recipe/kaleidoswap-atomic.test.ts +138 -0
package/src/recipe/kaleidoswap-atomic.ts +117 -0
package/src/recipe/runner.ts +13 -1
package/src/skills/registry.ts +21 -2
package/src/skills/skills.test.ts +42 -0
package/src/wallet/confirm.test.ts +57 -0
package/src/wallet/confirm.ts +74 -0
package/skills/kaleido-wallet/SKILL.md +0 -28

package/src/qvac/delegate.ts ADDED Viewed

@@ -0,0 +1,71 @@
+/**
+ * Delegation helpers — the provider firewall (who may connect) and the
+ * consumer-side delegate config. Pure data builders (no `@qvac/sdk` import) so
+ * they stay shared + testable; the host passes the result to
+ * `startQVACProvider({ firewall })` / `loadModel({ delegate })`.
+ *
+ * Security note: a QVAC provider is reachable by anyone who learns its
+ * Hyperswarm public key. Advertising with no firewall means any such peer can
+ * run inference on your machine. Use {@link allowListFirewall} so a desktop
+ * provider serves ONLY its paired phone(s).
+ */
+/**
+ * Access policy handed to `startQVACProvider({ firewall })`. `mode` decides
+ * whether `publicKeys` lists the peers that are admitted or the peers that are
+ * turned away.
+ */
+export interface ProviderFirewall {
+  /** `'allow'`: only the listed keys may delegate. `'deny'`: everyone except the listed keys may. */
+  mode: 'deny' | 'allow';
+  /** Consumer public keys the mode applies to. */
+  publicKeys: Array<string>;
+}
+/** Trim every key, discard blank entries and drop duplicates (first occurrence wins). */
+function normalizeKeys(keys: Iterable<string>): string[] {
+  const unique = new Set<string>();
+  for (const candidate of keys) {
+    const trimmed = candidate.trim();
+    if (trimmed) unique.add(trimmed);
+  }
+  return Array.from(unique);
+}
+/**
+ * Zero-trust firewall: only the given consumer public keys may delegate. Feed
+ * it the paired phone(s)' public keys so that a peer who merely learns the
+ * desktop's public key still cannot use the desktop brain.
+ */
+export function allowListFirewall(consumerPublicKeys: Iterable<string>): ProviderFirewall {
+  const publicKeys = normalizeKeys(consumerPublicKeys);
+  return { mode: 'allow', publicKeys };
+}
+/** Block-list firewall: the given consumer public keys are refused, every other peer may connect. */
+export function denyListFirewall(consumerPublicKeys: Iterable<string>): ProviderFirewall {
+  const publicKeys = normalizeKeys(consumerPublicKeys);
+  return { mode: 'deny', publicKeys };
+}
+/**
+ * Turn a key list separated by commas, spaces or newlines (for instance an env
+ * var or a pairing store value) into an allow-list firewall. Returns
+ * `undefined` when no key is configured; the caller then advertises openly and
+ * should warn.
+ */
+export function firewallFromKeyList(raw: string | null | undefined): ProviderFirewall | undefined {
+  if (raw === null || raw === undefined || raw === '') return undefined;
+  const keys: string[] = [];
+  for (const piece of raw.split(/[\s,]+/)) {
+    const key = piece.trim();
+    if (key) keys.push(key);
+  }
+  if (keys.length === 0) return undefined;
+  return allowListFirewall(keys);
+}
+/** Shape of the `delegate` option a consumer passes to `loadModel({ delegate })`. */
+export interface DelegateConfig {
+  /** Public key of the provider to delegate to. */
+  providerPublicKey: string;
+  /** Whether a local load may be used as fallback; `buildDelegateConfig` defaults it to `false`. */
+  fallbackToLocal: boolean;
+  /** Optional timeout, passed through untouched (unit not visible here; confirm against the SDK). */
+  timeout?: number;
+  /** Optional flag, passed through untouched. */
+  forceNewConnection?: boolean;
+}
+/**
+ * Assemble the `delegate` config for a delegated `loadModel`. The provider key
+ * is trimmed; `fallbackToLocal` is `false` unless the caller says otherwise
+ * (the host owns recovery), matching rate's existing LLM/Whisper/TTS delegated
+ * loads. `timeout` and `forceNewConnection` only appear in the result when the
+ * caller supplied a non-nullish value.
+ */
+export function buildDelegateConfig(
+  providerPublicKey: string,
+  opts: { fallbackToLocal?: boolean; timeout?: number; forceNewConnection?: boolean } = {},
+): DelegateConfig {
+  const { fallbackToLocal, timeout, forceNewConnection } = opts;
+  const config: DelegateConfig = {
+    providerPublicKey: providerPublicKey.trim(),
+    fallbackToLocal: fallbackToLocal ?? false,
+  };
+  // Optional knobs are attached only when given, in the same key order as before.
+  if (timeout != null) config.timeout = timeout;
+  if (forceNewConnection != null) config.forceNewConnection = forceNewConnection;
+  return config;
+}

package/src/qvac/index.ts ADDED Viewed

@@ -0,0 +1,72 @@
+/**
+ * @kaleidorg/mind-qvac — the single home for all @qvac/sdk logic behind
+ * @kaleidorg/mind. Hosts (rate mobile, desktop provider, cli) supply @qvac/sdk
+ * as a peer dependency; this package owns the orchestration so the logic lives
+ * in one place instead of drifting copies per host.
+ *
+ * Exports the platform-agnostic core (pure text helpers, model configs,
+ * completion parsing and stream consumption) together with the wrappers built
+ * on top of it: the provider, the voice and voice-assistant helpers, and the
+ * delegation/firewall builders.
+ */
+export {
+  cleanAssistantVisibleText,
+  sanitizeForSupertonic,
+} from './text.js';
+export {
+  LOCAL_LLM_CONFIG,
+  LOCAL_LLM_CONFIG_GPU,
+  DELEGATE_LLM_CONFIG,
+  TTS_SAMPLE_RATE,
+  DEFAULT_VOICE_STREAM_PARAMS,
+  WHISPER_LANGS,
+  normalizeWhisperLang,
+} from './config.js';
+export {
+  finalToTurn,
+  type QvacFinalLike,
+  type ParsedTurn,
+} from './parse.js';
+export {
+  consumeRun,
+  type CompletionEventLike,
+  type CompletionRunLike,
+  type StreamHandlers,
+  type ConsumedTurn,
+} from './stream.js';
+export {
+  createQvacProvider,
+  type QvacProviderOptions,
+  type QvacTurnInput,
+} from './provider.js';
+export {
+  createQvacVoice,
+  type QvacVoice,
+  type QvacVoiceOptions,
+  type VoiceSession,
+  type PcmAudio,
+} from './voice.js';
+export {
+  runVoiceAssistant,
+  shouldHandleUtterance,
+  DEFAULT_IGNORED_UTTERANCES,
+  type VoiceAssistantSession,
+  type VoiceAssistantHandlers,
+  type VoiceAssistantOptions,
+  type VoiceAssistantState,
+  type VoiceTranscriptEvent,
+} from './assistant.js';
+export {
+  allowListFirewall,
+  denyListFirewall,
+  firewallFromKeyList,
+  buildDelegateConfig,
+  type ProviderFirewall,
+  type DelegateConfig,
+} from './delegate.js';

package/src/qvac/parse.test.ts ADDED Viewed

@@ -0,0 +1,52 @@
+import { describe, it, expect } from 'vitest';
+import { finalToTurn } from './parse.js';
+// Spec for finalToTurn: which text becomes visible, what is pushed back as
+// rawContent, how tool calls are mapped, and when a turn counts as truncated.
+describe('finalToTurn', () => {
+  it('uses contentText for visible text and strips reasoning', () => {
+    const out = finalToTurn({ contentText: '<think>x</think>Hello' });
+    expect(out.text).toBe('Hello');
+  });
+  it('falls back to the streamed text when contentText is empty', () => {
+    // Second argument is the text accumulated from streamed deltas.
+    const out = finalToTurn({ contentText: '' }, 'streamed answer');
+    expect(out.text).toBe('streamed answer');
+  });
+  it('prefers raw.fullText for rawContent (history push-back)', () => {
+    const out = finalToTurn({ contentText: 'Hi', raw: { fullText: 'FRAMED<tool/>Hi' } });
+    expect(out.rawContent).toBe('FRAMED<tool/>Hi');
+    expect(out.text).toBe('Hi');
+  });
+  it('falls back to the raw text for rawContent when no framed form', () => {
+    const out = finalToTurn({ contentText: 'Hi' });
+    expect(out.rawContent).toBe('Hi');
+  });
+  it('maps tool calls and defaults missing arguments to {}', () => {
+    // First call has no arguments, second has no id.
+    const out = finalToTurn({
+      contentText: '',
+      toolCalls: [{ id: 'a', name: 'get_balance' }, { name: 'send', arguments: { sats: 5000 } }],
+    });
+    expect(out.toolCalls).toEqual([
+      { id: 'a', name: 'get_balance', arguments: {} },
+      { id: undefined, name: 'send', arguments: { sats: 5000 } },
+    ]);
+  });
+  it('flags truncation when the SDK stops on length', () => {
+    const out = finalToTurn({ contentText: 'partial', stopReason: 'length' });
+    expect(out.truncated).toBe(true);
+    expect(out.stopReason).toBe('length');
+  });
+  it('does not flag truncation on a natural stop', () => {
+    // No stopReason at all is the natural-stop case.
+    const out = finalToTurn({ contentText: 'done' });
+    expect(out.truncated).toBe(false);
+  });
+  it('handles an empty final without throwing', () => {
+    const out = finalToTurn({});
+    expect(out).toEqual({ text: '', rawContent: '', toolCalls: [], truncated: false, stopReason: undefined });
+  });
+});

package/src/qvac/parse.ts ADDED Viewed

@@ -0,0 +1,57 @@
+/**
+ * Pure mapping from a QVAC completion `final` frame to the shape the shared
+ * @kaleidorg/mind Engine consumes. Kept SDK-free (structural input type) so it
+ * is testable without loading a model, and so the same mapping runs on mobile,
+ * desktop, and the eval harness.
+ */
+import { cleanAssistantVisibleText } from './text.js';
+/**
+ * The fields of a QVAC `completion().final` frame this module reads. Declared
+ * structurally so no SDK type is needed.
+ */
+export interface QvacFinalLike {
+  /** Assistant text meant for display; `<think>` reasoning is not part of it. */
+  contentText?: string;
+  /** Raw assistant frame, tool-call framing included, used for history push-back. */
+  raw?: { fullText?: string };
+  /** Tool calls requested in this turn; an empty list means a final answer. */
+  toolCalls?: { id?: string; name: string; arguments?: Record<string, unknown> }[];
+  /**
+   * Reason generation ended. QVAC 0.13 reports `"length"` once the token budget
+   * runs out, `"cancelled"` on abort and `undefined` for a natural stop. It is
+   * surfaced so the funnel can tell a truncated tool-call from a complete one.
+   */
+  stopReason?: 'length' | 'cancelled' | string;
+}
+/** Result of mapping a completion `final` frame: the shape `finalToTurn` returns. */
+export interface ParsedTurn {
+  /** Assistant content after cleaning, ready for display. */
+  text: string;
+  /** Raw assistant frame that goes back into history for the next turn. */
+  rawContent: string;
+  /** Requested tool calls; missing `arguments` are replaced by `{}`. */
+  toolCalls: { id?: string; name: string; arguments: Record<string, unknown> }[];
+  /** `true` when the token budget cut generation short, so the output is incomplete. */
+  truncated: boolean;
+  /** Stop reason exactly as the SDK reported it, if any. */
+  stopReason?: string;
+}
+/**
+ * Map a completion `final` (plus the streamed fallback text) into a ParsedTurn.
+ *
+ * - `text` is `final.contentText`, or `streamed` when that is empty, passed
+ *   through `cleanAssistantVisibleText`.
+ * - `rawContent` prefers the SDK's framed `raw.fullText` so the Engine can
+ *   anchor the next turn. When the frame is missing OR empty it falls back to
+ *   the same uncleaned text `text` was derived from, so a turn that shows text
+ *   never pushes an empty assistant frame into history.
+ * - `toolCalls` are copied with missing `arguments` defaulted to `{}`.
+ * - `truncated` is true only when `stopReason` is `'length'`.
+ *
+ * @param final    The completion's final frame.
+ * @param streamed Text accumulated from streamed content deltas (default `''`).
+ * @returns The parsed turn.
+ */
+export function finalToTurn(final: QvacFinalLike, streamed = ''): ParsedTurn {
+  const rawText = final.contentText || streamed;
+  const text = cleanAssistantVisibleText(rawText);
+  return {
+    text,
+    // `||`, not `??`: an empty `fullText` carries no frame, so treat it like a
+    // missing one. This mirrors how an empty `contentText` falls back above.
+    rawContent: final.raw?.fullText || rawText,
+    toolCalls: (final.toolCalls ?? []).map((c) => ({
+      id: c.id,
+      name: c.name,
+      arguments: c.arguments ?? {},
+    })),
+    truncated: final.stopReason === 'length',
+    stopReason: final.stopReason,
+  };
+}

package/src/qvac/provider.test.ts ADDED Viewed

@@ -0,0 +1,107 @@
+import { describe, it, expect, vi } from 'vitest';
+import { createQvacProvider } from './provider.js';
+/**
+ * Test double for the SDK `completion`: every params object it receives is
+ * appended to `calls`, and the returned run replays the scripted `events` and
+ * resolves `final`.
+ */
+function fakeCompletion(
+  final: Record<string, unknown>,
+  events: Array<{ type: string; text?: string }> = [],
+) {
+  const calls: any[] = [];
+  async function* replay() {
+    yield* events;
+  }
+  function fn(params: any) {
+    calls.push(params);
+    return { requestId: 'req-1', events: replay(), final: Promise.resolve(final) };
+  }
+  return { fn, calls };
+}
+// Stand-in for the SDK `cancel` in tests that never cancel.
+const noopCancel = (async () => {}) as any;
+// runTurn: model-id guard, request shape sent to `completion`, token streaming.
+describe('createQvacProvider.runTurn', () => {
+  it('throws when no model is loaded', async () => {
+    const p = createQvacProvider({
+      // Must never be reached: the missing model id has to fail first.
+      completion: (() => { throw new Error('should not be called'); }) as any,
+      cancel: noopCancel,
+      getModelId: () => null,
+    });
+    await expect(p.runTurn({ messages: [{ role: 'user', content: 'hi' }], tools: [] }))
+      .rejects.toThrow(/not loaded/);
+  });
+  it('prepends the system message and sets generationParams + captureThinking', async () => {
+    const { fn, calls } = fakeCompletion({ contentText: 'Hello', toolCalls: [], raw: { fullText: 'Hello' } });
+    const p = createQvacProvider({
+      completion: fn as any,
+      cancel: noopCancel,
+      getModelId: () => 'm1',
+      defaultTemperature: 0.5,
+      defaultMaxTokens: 256,
+    });
+    const out = await p.runTurn({ system: 'You are X', messages: [{ role: 'user', content: 'hi' }], tools: [] });
+    expect(out.text).toBe('Hello');
+    // Inspect the params object the provider handed to `completion`.
+    const params = calls[0];
+    expect(params.modelId).toBe('m1');
+    expect(params.history).toEqual([
+      { role: 'system', content: 'You are X' },
+      { role: 'user', content: 'hi' },
+    ]);
+    expect(params.stream).toBe(true);
+    expect(params.captureThinking).toBe(true);
+    expect(params.generationParams).toEqual({ temp: 0.5, predict: 256 });
+    // An empty tools list is not forwarded at all.
+    expect(params.tools).toBeUndefined();
+  });
+  it('maps tools by schema and honours per-call temperature/maxTokens', async () => {
+    const { fn, calls } = fakeCompletion({
+      contentText: '',
+      toolCalls: [{ id: 'a', name: 'get_balance', arguments: {} }],
+      raw: { fullText: '' },
+    });
+    const p = createQvacProvider({ completion: fn as any, cancel: noopCancel, getModelId: () => 'm1' });
+    const out = await p.runTurn({
+      messages: [{ role: 'user', content: 'balance?' }],
+      tools: [{ name: 'get_balance', description: 'balance', parameters: { shape: true } }],
+      temperature: 0.9,
+      maxTokens: 99,
+    } as any);
+    expect(out.toolCalls).toEqual([{ id: 'a', name: 'get_balance', arguments: {} }]);
+    const params = calls[0];
+    expect(params.tools).toEqual([{ name: 'get_balance', description: 'balance', parameters: { shape: true } }]);
+    expect(params.generationParams).toEqual({ temp: 0.9, predict: 99 });
+  });
+  it('omits generationParams when no temperature/maxTokens is set (keeps SDK defaults)', async () => {
+    const { fn, calls } = fakeCompletion({ contentText: 'ok', toolCalls: [], raw: { fullText: 'ok' } });
+    const p = createQvacProvider({ completion: fn as any, cancel: noopCancel, getModelId: () => 'm1' });
+    await p.runTurn({ messages: [{ role: 'user', content: 'x' }], tools: [] });
+    expect(calls[0].generationParams).toBeUndefined();
+  });
+  it('streams visible content tokens to onToken', async () => {
+    const { fn } = fakeCompletion(
+      { contentText: 'Hi there', toolCalls: [], raw: { fullText: 'Hi there' } },
+      [{ type: 'contentDelta', text: 'Hi ' }, { type: 'contentDelta', text: 'there' }],
+    );
+    const tokens: string[] = [];
+    const p = createQvacProvider({ completion: fn as any, cancel: noopCancel, getModelId: () => 'm1' });
+    await p.runTurn({ messages: [{ role: 'user', content: 'x' }], tools: [], onToken: (t) => tokens.push(t) });
+    expect(tokens).toEqual(['Hi ', 'there']);
+  });
+});
+// cancel: the provider wraps the request id in the object form the SDK cancel takes.
+describe('createQvacProvider.cancel', () => {
+  it('forwards the requestId to the SDK cancel', async () => {
+    const cancel = vi.fn(async () => {});
+    const { fn } = fakeCompletion({ contentText: 'ok', toolCalls: [], raw: { fullText: 'ok' } });
+    const p = createQvacProvider({ completion: fn as any, cancel: cancel as any, getModelId: () => 'm1' });
+    await p.cancel!('req-9');
+    expect(cancel).toHaveBeenCalledWith({ requestId: 'req-9' });
+  });
+});

package/src/qvac/provider.ts ADDED Viewed

@@ -0,0 +1,124 @@
+/**
+ * createQvacProvider — turns `@qvac/sdk` `completion()` into the shared
+ * `@kaleidorg/mind` `LLMProvider` the Engine/Funnel consumes. This is the one
+ * place the SDK is called for inference; every host (rate, desktop provider,
+ * cli) uses it instead of hand-rolling its own completion wrapper.
+ *
+ * The SDK functions are *injected*, not imported, so this package carries no
+ * runtime dependency on `@qvac/sdk` (the import below is type-only and erased).
+ * Hosts pass their own `completion`/`cancel` — rate the static RN import, the
+ * desktop sidecar its lazily-loaded SDK facade — which also makes this provider
+ * unit-testable with a fake completion.
+ *
+ * The host owns model lifecycle (load/unload, local-vs-delegated) and passes
+ * `getModelId()` so a turn always runs against the currently-loaded model.
+ * Tools are forwarded by schema only; the Engine executes them via its
+ * ToolSources, so signing/spending stays on the host even when inference is
+ * delegated to a desktop peer.
+ */
+import type * as QvacSdk from '@qvac/sdk';
+import type { LLMProvider, TurnInput, TurnOutput } from '../providers/types.js';
+import { consumeRun } from './stream.js';
+/** Signature of the SDK's `completion`, derived from the type-only `@qvac/sdk` import. */
+type CompletionFn = typeof QvacSdk.completion;
+/** Signature of the SDK's `cancel`, derived from the type-only `@qvac/sdk` import. */
+type CancelFn = typeof QvacSdk.cancel;
+/** Everything the host injects when building a provider with `createQvacProvider`. */
+export interface QvacProviderOptions {
+  /** SDK `completion`, handed in by the host rather than imported here. */
+  completion: CompletionFn;
+  /** SDK `cancel`, handed in by the host. */
+  cancel: CancelFn;
+  /** Returns the id of the loaded model for this turn; `null` makes `runTurn` throw. */
+  getModelId: () => string | null;
+  /**
+   * Fallback sampling temperature. Leave unset to defer to the SDK/model
+   * default: `generationParams` is sent only when a temperature or a max-tokens
+   * value exists, so a host supplying neither keeps the SDK's own defaults.
+   */
+  defaultTemperature?: number;
+  /** Fallback cap on output tokens so a turn can't ramble. Leave unset for no cap. */
+  defaultMaxTokens?: number;
+  /** Receives the model's `<think>` reasoning as it streams, for hosts that surface it. */
+  onThinking?: (token: string) => void;
+}
+/**
+ * `TurnInput` extended with the per-call knobs the funnel/voice paths pass
+ * through. Each one takes precedence over the matching provider-level option.
+ */
+export interface QvacTurnInput extends TurnInput {
+  /** Sampling temperature for this call. */
+  temperature?: number;
+  /** Output-token cap for this call. */
+  maxTokens?: number;
+  /** Reasoning-token sink for this call. */
+  onThinking?: (token: string) => void;
+}
+/**
+ * Wrap the injected SDK `completion`/`cancel` as the `LLMProvider` named
+ * `'qvac'`.
+ *
+ * `runTurn` throws `'QVAC model not loaded'` when `getModelId()` returns a
+ * falsy id. Otherwise it sends one streaming completion request and returns the
+ * text, raw content, tool calls and request id produced by `consumeRun`.
+ * `cancel` forwards the request id to the SDK and only logs a failure.
+ */
+export function createQvacProvider(options: QvacProviderOptions): LLMProvider {
+  return {
+    name: 'qvac',
+    async runTurn(input: QvacTurnInput): Promise<TurnOutput> {
+      const modelId = options.getModelId();
+      if (!modelId) throw new Error('QVAC model not loaded');
+
+      // A system prompt, when given, becomes the first history entry.
+      const history = !input.system
+        ? input.messages
+        : [{ role: 'system', content: input.system }, ...input.messages];
+
+      // Only the schema (name/description/parameters) of each tool is
+      // forwarded. `parameters` travels as-is (Zod for in-process tools, JSON
+      // Schema for MCP): the model just needs the shape to choose a call, while
+      // the Engine validates + executes.
+      const toolSchemas =
+        input.tools.length === 0
+          ? undefined
+          : input.tools.map(({ name, description, parameters }) => ({ name, description, parameters }));
+
+      // QVAC 0.13 expects sampling settings nested under `generationParams`;
+      // top-level `temperature`/`max_tokens` (as older rate code passed) are
+      // dropped by validation, so the cap silently no-op'd. The object is built
+      // only when at least one value exists, so a host passing neither keeps
+      // the SDK defaults.
+      const temp = input.temperature ?? options.defaultTemperature;
+      const predict = input.maxTokens ?? options.defaultMaxTokens;
+      let generationParams: { temp?: number; predict?: number } | undefined;
+      if (temp !== undefined || predict !== undefined) {
+        generationParams = {};
+        if (temp !== undefined) generationParams.temp = temp;
+        if (predict !== undefined) generationParams.predict = predict;
+      }
+
+      // `captureThinking` splits `<think>` into separate thinkingDelta events so
+      // reasoning never pollutes the visible answer.
+      const request: Record<string, unknown> = {
+        modelId,
+        history,
+        stream: true,
+        captureThinking: true,
+      };
+      if (generationParams) request.generationParams = generationParams;
+      if (toolSchemas) request.tools = toolSchemas;
+
+      const run = options.completion(request as unknown as Parameters<CompletionFn>[0]);
+      const { text, rawContent, toolCalls, requestId } = await consumeRun(run, {
+        onToken: input.onToken,
+        onThinking: input.onThinking ?? options.onThinking,
+      });
+      return { text, rawContent, toolCalls, requestId };
+    },
+    async cancel(requestId: string): Promise<void> {
+      // A cancel takes effect only after the server has begun the request; one
+      // issued in the same tick may race the begin and is logged as a no-match
+      // by the SDK.
+      try {
+        await options.cancel({ requestId });
+      } catch (reason) {
+        console.warn('[qvac] cancel failed:', reason);
+      }
+    },
+  };
+}

package/src/qvac/stream.test.ts ADDED Viewed

@@ -0,0 +1,79 @@
+import { describe, it, expect } from 'vitest';
+import { consumeRun, type CompletionEventLike, type CompletionRunLike } from './stream.js';
+import type { QvacFinalLike } from './parse.js';
+/** Build a scripted run: replays `events`, resolves `final`, and carries `requestId`. */
+function fakeRun(
+  events: CompletionEventLike[],
+  final: QvacFinalLike,
+  requestId = 'req-1',
+): CompletionRunLike {
+  async function* replay() {
+    yield* events;
+  }
+  return { requestId, events: replay(), final: Promise.resolve(final) };
+}
+// Spec for consumeRun: token routing per event type, the streamed-text
+// fallback, and what is carried over from the final frame.
+describe('consumeRun', () => {
+  it('forwards visible content tokens and accumulates the streamed fallback', async () => {
+    const tokens: string[] = [];
+    const run = fakeRun(
+      [
+        { type: 'contentDelta', text: 'Hel' },
+        { type: 'contentDelta', text: 'lo' },
+      ],
+      { contentText: '', toolCalls: [], raw: { fullText: '' } },
+    );
+    const out = await consumeRun(run, { onToken: (t) => tokens.push(t) });
+    expect(tokens).toEqual(['Hel', 'lo']);
+    // contentText empty ⇒ falls back to the streamed accumulation.
+    expect(out.text).toBe('Hello');
+  });
+  it('routes thinkingDelta to onThinking, not onToken', async () => {
+    const visible: string[] = [];
+    const thinking: string[] = [];
+    const run = fakeRun(
+      [
+        { type: 'thinkingDelta', text: 'plan…' },
+        { type: 'contentDelta', text: 'Answer' },
+      ],
+      { contentText: 'Answer', toolCalls: [], raw: { fullText: 'Answer' } },
+    );
+    await consumeRun(run, {
+      onToken: (t) => visible.push(t),
+      onThinking: (t) => thinking.push(t),
+    });
+    expect(visible).toEqual(['Answer']);
+    expect(thinking).toEqual(['plan…']);
+  });
+  it('returns parsed tool calls + requestId and flags truncation from stopReason', async () => {
+    // No events at all: everything asserted here comes from the final frame.
+    const run = fakeRun(
+      [],
+      {
+        contentText: 'partial',
+        toolCalls: [{ id: 't1', name: 'get_balance', arguments: {} }],
+        raw: { fullText: 'partial' },
+        stopReason: 'length',
+      },
+      'req-xyz',
+    );
+    const out = await consumeRun(run);
+    expect(out.requestId).toBe('req-xyz');
+    expect(out.toolCalls).toEqual([{ id: 't1', name: 'get_balance', arguments: {} }]);
+    expect(out.truncated).toBe(true);
+  });
+  it('ignores delta events with no text', async () => {
+    const tokens: string[] = [];
+    // A text-less contentDelta and an unrelated event type must both be skipped.
+    const run = fakeRun(
+      [{ type: 'contentDelta' }, { type: 'toolCall' }, { type: 'contentDelta', text: 'hi' }],
+      { contentText: 'hi', toolCalls: [], raw: { fullText: 'hi' } },
+    );
+    await consumeRun(run, { onToken: (t) => tokens.push(t) });
+    expect(tokens).toEqual(['hi']);
+  });
+});

package/src/qvac/stream.ts ADDED Viewed

@@ -0,0 +1,56 @@
+/**
+ * Consume a QVAC `completion()` run: drain the event stream (forwarding visible
+ * + thinking tokens) and fold the `final` frame into a ParsedTurn.
+ *
+ * Defined over a structural `CompletionRunLike` (not the SDK type) so it stays
+ * SDK-free and unit-testable with a fake run — the real `CompletionRun` is
+ * assignable to it. The actual `@qvac/sdk` import lives in `provider.ts`.
+ */
+import { finalToTurn, type ParsedTurn, type QvacFinalLike } from './parse.js';
+/** The part of a QVAC completion event that `consumeRun` looks at. */
+export interface CompletionEventLike {
+  /** Event discriminator; `consumeRun` reacts to `contentDelta` and `thinkingDelta`. */
+  type: string;
+  /** Token text, set on `contentDelta` / `thinkingDelta` / `rawDelta` events. */
+  text?: string;
+}
+/** The part of `completion()`'s return value that `consumeRun` relies on. */
+export interface CompletionRunLike {
+  /** Id of the request, returned to the caller alongside the parsed turn. */
+  requestId: string;
+  /** Stream of completion events, drained to the end. */
+  events: AsyncIterable<CompletionEventLike>;
+  /** Final frame, awaited after the event stream ends. */
+  final: Promise<QvacFinalLike>;
+}
+/** Optional sinks for the tokens `consumeRun` sees while streaming. */
+export interface StreamHandlers {
+  /** Called with each visible assistant token (`<think>` reasoning excluded). */
+  onToken?: (token: string) => void;
+  /** Called with each token of the model's `<think>` reasoning, streamed separately. */
+  onThinking?: (token: string) => void;
+}
+/** A `ParsedTurn` tagged with the id of the run that produced it. */
+export interface ConsumedTurn extends ParsedTurn {
+  /** `requestId` of the consumed run. */
+  requestId: string;
+}
+/**
+ * Stream a run to completion. `contentDelta` → onToken (and the streamed
+ * fallback text), `thinkingDelta` → onThinking; events of any other type, or
+ * without string `text`, are ignored. Returns the parsed turn plus the run's
+ * `requestId` (for cancellation bookkeeping by the caller).
+ *
+ * @param run      The completion run to drain.
+ * @param handlers Optional token sinks.
+ * @returns The parsed final frame together with `run.requestId`.
+ * @throws Whatever the event stream, a handler, or `run.final` rejects with.
+ */
+export async function consumeRun(
+  run: CompletionRunLike,
+  handlers: StreamHandlers = {},
+): Promise<ConsumedTurn> {
+  // Mark `final` as observed before draining. If the event loop below throws
+  // (stream error or a throwing handler) we leave without awaiting `final`, and
+  // a later rejection of it would otherwise be reported as an unhandled
+  // rejection. The `await` further down still propagates a rejection on the
+  // normal path.
+  const finalFrame = run.final;
+  void finalFrame.catch(() => undefined);
+  let streamed = '';
+  for await (const event of run.events) {
+    if (event.type === 'contentDelta' && typeof event.text === 'string') {
+      streamed += event.text;
+      handlers.onToken?.(event.text);
+    } else if (event.type === 'thinkingDelta' && typeof event.text === 'string') {
+      handlers.onThinking?.(event.text);
+    }
+  }
+  const final = await finalFrame;
+  return { ...finalToTurn(final, streamed), requestId: run.requestId };
+}