npm - @alexkroman1/aai - Versions diffs - 1.4.5 → 1.5.0 - Mend

@alexkroman1/aai 1.4.5 → 1.5.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (78)

package/.turbo/turbo-build.log +9 -9
package/CHANGELOG.md +13 -0
package/dist/assemblyai-C969QGi4.js +35 -0
package/dist/cartesia-BfQPOQ7Y.js +37 -0
package/dist/host/_pipeline-test-fakes.d.ts +3 -1
package/dist/host/providers/stt/deepgram.d.ts +28 -0
package/dist/host/providers/tts/cartesia.d.ts +1 -1
package/dist/host/providers/tts/rime.d.ts +44 -0
package/dist/host/runtime-barrel.d.ts +4 -2
package/dist/host/runtime-barrel.js +1432 -1208
package/dist/host/runtime.d.ts +2 -2
package/dist/host/s2s.d.ts +16 -16
package/dist/host/session-core.d.ts +37 -0
package/dist/host/transports/pipeline-transport.d.ts +48 -0
package/dist/host/transports/s2s-transport.d.ts +19 -0
package/dist/host/transports/types.d.ts +45 -0
package/dist/host/ws-handler.d.ts +14 -10
package/dist/sdk/protocol.d.ts +6 -5
package/dist/sdk/providers/llm-barrel.js +1 -1
package/dist/sdk/providers/stt/deepgram.d.ts +35 -0
package/dist/sdk/providers/stt-barrel.d.ts +1 -0
package/dist/sdk/providers/stt-barrel.js +2 -2
package/dist/sdk/providers/tts/cartesia.d.ts +12 -4
package/dist/sdk/providers/tts/rime.d.ts +42 -0
package/dist/sdk/providers/tts-barrel.d.ts +1 -0
package/dist/sdk/providers/tts-barrel.js +2 -2
package/host/_pipeline-test-fakes.ts +6 -3
package/host/_test-utils.ts +209 -128
package/host/cleanup.test.ts +25 -298
package/host/integration/pipeline-reference.integration.test.ts +30 -35
package/host/providers/resolve.ts +10 -2
package/host/providers/stt/deepgram.test.ts +229 -0
package/host/providers/stt/deepgram.ts +172 -0
package/host/providers/tts/cartesia.ts +7 -3
package/host/providers/tts/rime.test.ts +251 -0
package/host/providers/tts/rime.ts +322 -0
package/host/runtime-barrel.ts +4 -2
package/host/runtime.test.ts +13 -46
package/host/runtime.ts +131 -23
package/host/s2s.test.ts +122 -131
package/host/s2s.ts +44 -52
package/host/session-core.test.ts +257 -0
package/host/session-core.ts +262 -0
package/host/transports/pipeline-transport.test.ts +651 -0
package/host/transports/pipeline-transport.ts +532 -0
package/host/{fixture-replay.test.ts → transports/s2s-transport-fixtures.test.ts} +76 -106
package/host/transports/s2s-transport.test.ts +56 -0
package/host/transports/s2s-transport.ts +116 -0
package/host/transports/types.test.ts +22 -0
package/host/transports/types.ts +51 -0
package/host/ws-handler.test.ts +324 -242
package/host/ws-handler.ts +56 -59
package/package.json +2 -1
package/sdk/__snapshots__/exports.test.ts.snap +3 -3
package/sdk/protocol-compat.test.ts +8 -0
package/sdk/protocol.ts +6 -5
package/sdk/providers/stt/deepgram.ts +43 -0
package/sdk/providers/stt-barrel.ts +2 -0
package/sdk/providers/tts/cartesia.ts +15 -5
package/sdk/providers/tts/rime.ts +52 -0
package/sdk/providers/tts-barrel.ts +2 -0
package/dist/assemblyai-Cxg9eobY.js +0 -18
package/dist/cartesia-DwDk2tEu.js +0 -10
package/dist/host/pipeline-session-ctx.d.ts +0 -24
package/dist/host/pipeline-session.d.ts +0 -52
package/dist/host/session-ctx.d.ts +0 -73
package/dist/host/session.d.ts +0 -62
package/host/pipeline-session-ctx.test.ts +0 -31
package/host/pipeline-session-ctx.ts +0 -36
package/host/pipeline-session.test.ts +0 -672
package/host/pipeline-session.ts +0 -533
package/host/s2s-fixtures.test.ts +0 -237
package/host/session-ctx.test.ts +0 -387
package/host/session-ctx.ts +0 -134
package/host/session-fixture-replay.test.ts +0 -128
package/host/session.test.ts +0 -634
package/host/session.ts +0 -412
/package/dist/{anthropic-BrUCPKUc.js → anthropic-CcLZygAr.js} +0 -0

package/host/{fixture-replay.test.ts → transports/s2s-transport-fixtures.test.ts} RENAMED

@@ -1,6 +1,6 @@
 // Copyright 2025 the AAI authors. MIT license.
 /**
- * Fixture replay tests with a REAL Runtime.
+ * Fixture replay tests with a REAL Runtime — now wired to the transport layer.
  *
  * Replays recorded AssemblyAI S2S messages (from Kokoro TTS audio) through
  * a real agent session — real tool execution, real Zod arg validation, real
@@ -9,12 +9,16 @@
  * This exercises: AgentDef → toAgentConfig → tool schemas → Zod validation
  * → executeToolCall → session orchestration (reply guards, tool buffering,
  * turnPromise chaining, conversation history).
+ *
+ * Migrated from host/fixture-replay.test.ts (Task 19). Uses createFixtureSession
+ * which spies on s2s-transport.ts _internals.connectS2s and fires S2sCallbacks
+ * directly — no nanoevents / old S2sEvents system.
  */
 import { afterEach, describe, expect, test, vi } from "vitest";
 import { z } from "zod";
-import type { AgentDef } from "../sdk/types.ts";
-import { createFixtureSession, flush } from "./_test-utils.ts";
+import type { AgentDef } from "../../sdk/types.ts";
+import { createFixtureSession, flush } from "../_test-utils.ts";
 // ─── Test agents with deterministic tools ────────────────────────────────────
@@ -67,7 +71,7 @@ const statefulAgent: AgentDef<{ callCount: number }> = {
 // ─── Tests ───────────────────────────────────────────────────────────────────
-describe("fixture replay with real executor", () => {
+describe("fixture replay with real executor (transport layer)", () => {
   let cleanup: () => void;
   afterEach(() => {
@@ -79,15 +83,15 @@ describe("fixture replay with real executor", () => {
   test("tool call fixture: Zod validates args, real tool executes, result sent to S2S", async () => {
     const ctx = createFixtureSession(weatherAgent);
     cleanup = ctx.cleanup;
-    await ctx.session.start();
+    await ctx.start();
     ctx.replay("tool-call-sequence.json");
     // Wait for the async tool execution pipeline to complete
-    await vi.waitFor(() => expect(ctx.mockHandle.sendToolResult).toHaveBeenCalled());
+    await vi.waitFor(() => expect(ctx.fakeHandle.sendToolResult).toHaveBeenCalled());
     // Verify the real tool was called and produced correct output
-    const [callId, resultStr] = vi.mocked(ctx.mockHandle.sendToolResult).mock.calls[0] as [
+    const [callId, resultStr] = vi.mocked(ctx.fakeHandle.sendToolResult).mock.calls[0] as [
       string,
       string,
     ];
@@ -101,34 +105,30 @@ describe("fixture replay with real executor", () => {
   test("tool call fixture: client receives tool_call with validated args", async () => {
     const ctx = createFixtureSession(weatherAgent);
     cleanup = ctx.cleanup;
-    await ctx.session.start();
+    await ctx.start();
     ctx.replay("tool-call-sequence.json");
-    await vi.waitFor(() => expect(ctx.mockHandle.sendToolResult).toHaveBeenCalled());
+    await vi.waitFor(() => expect(ctx.fakeHandle.sendToolResult).toHaveBeenCalled());
-    const toolStart = ctx.client.events.find((e) => (e as { type: string }).type === "tool_call") as
-      | { toolName: string; args: Record<string, unknown> }
-      | undefined;
-    expect(toolStart?.toolName).toBe("get_weather");
-    expect(toolStart?.args).toEqual({ city: "San Francisco" });
+    expect(ctx.client.toolCallEvents.length).toBeGreaterThan(0);
+    const toolEvent = ctx.client.toolCallEvents[0];
+    expect(toolEvent?.name).toBe("get_weather");
+    expect(toolEvent?.args).toEqual({ city: "San Francisco" });
   });
   test("tool call fixture: conversation history accumulates user + assistant messages", async () => {
     const ctx = createFixtureSession(weatherAgent);
     cleanup = ctx.cleanup;
-    await ctx.session.start();
+    await ctx.start();
     ctx.replay("tool-call-sequence.json");
-    await vi.waitFor(() => expect(ctx.mockHandle.sendToolResult).toHaveBeenCalled());
+    await vi.waitFor(() => expect(ctx.fakeHandle.sendToolResult).toHaveBeenCalled());
     await flush();
     // Client received user transcript
-    const turns = ctx.client.events.filter(
-      (e) => (e as { type: string }).type === "user_transcript",
-    );
-    expect(turns.length).toBeGreaterThan(0);
-    const userText = (turns.at(-1) as { text: string }).text;
-    expect(userText.toLowerCase()).toContain("weather");
+    expect(ctx.client.userTranscripts.length).toBeGreaterThan(0);
+    const lastUserText = ctx.client.userTranscripts.at(-1) ?? "";
+    expect(lastUserText.toLowerCase()).toContain("weather");
   });
   // ── Simple question: no tools, just session lifecycle ──────────────────
@@ -136,29 +136,25 @@ describe("fixture replay with real executor", () => {
   test("simple question fixture: greeting + agent response reach client", async () => {
     const ctx = createFixtureSession(simpleAgent);
     cleanup = ctx.cleanup;
-    await ctx.session.start();
+    await ctx.start();
     ctx.replay("simple-question-sequence.json");
     await flush();
-    const chats = ctx.client.events.filter(
-      (e) => (e as { type: string }).type === "agent_transcript",
-    );
-    expect(chats.length).toBeGreaterThanOrEqual(2); // greeting + answer
+    expect(ctx.client.agentTranscripts.length).toBeGreaterThanOrEqual(2); // greeting + answer
   });
   test("simple question fixture: user speech events forwarded to client", async () => {
     const ctx = createFixtureSession(simpleAgent);
     cleanup = ctx.cleanup;
-    await ctx.session.start();
+    await ctx.start();
     ctx.replay("simple-question-sequence.json");
     await flush();
-    const types = ctx.client.events.map((e) => (e as { type: string }).type);
-    expect(types).toContain("speech_started");
-    expect(types).toContain("speech_stopped");
-    expect(types).toContain("user_transcript");
+    expect(ctx.client.speechStartedCount).toBeGreaterThan(0);
+    expect(ctx.client.speechStoppedCount).toBeGreaterThan(0);
+    expect(ctx.client.userTranscripts.length).toBeGreaterThan(0);
   });
   // ── Stateful agent: session state persists across tool calls ───────────
@@ -166,12 +162,12 @@ describe("fixture replay with real executor", () => {
   test("stateful agent: tool accesses and mutates session state", async () => {
     const ctx = createFixtureSession(statefulAgent);
     cleanup = ctx.cleanup;
-    await ctx.session.start();
+    await ctx.start();
     ctx.replay("tool-call-sequence.json");
-    await vi.waitFor(() => expect(ctx.mockHandle.sendToolResult).toHaveBeenCalled());
+    await vi.waitFor(() => expect(ctx.fakeHandle.sendToolResult).toHaveBeenCalled());
-    const [, resultStr] = vi.mocked(ctx.mockHandle.sendToolResult).mock.calls[0] as [
+    const [, resultStr] = vi.mocked(ctx.fakeHandle.sendToolResult).mock.calls[0] as [
       string,
       string,
     ];
@@ -181,17 +177,16 @@ describe("fixture replay with real executor", () => {
   // ── Greeting only: session lifecycle without user audio ────────────────
-  test("greeting fixture: session setup completes with tts_done", async () => {
+  test("greeting fixture: session setup completes with reply_done", async () => {
     const ctx = createFixtureSession(simpleAgent);
     cleanup = ctx.cleanup;
-    await ctx.session.start();
+    await ctx.start();
     ctx.replay("greeting-session-sequence.json");
     await flush();
-    const types = ctx.client.events.map((e) => (e as { type: string }).type);
-    expect(types).toContain("agent_transcript");
-    expect(types).toContain("reply_done");
+    expect(ctx.client.agentTranscripts.length).toBeGreaterThan(0);
+    expect(ctx.client.replyDoneCount).toBeGreaterThan(0);
   });
   // ── Tool schemas: real agent produces correct S2S tool schemas ─────────
@@ -231,13 +226,13 @@ describe("fixture replay with real executor", () => {
     const ctx = createFixtureSession(agent);
     cleanup = ctx.cleanup;
-    await ctx.session.start();
+    await ctx.start();
     ctx.replay("tool-call-sequence.json");
-    await vi.waitFor(() => expect(ctx.mockHandle.sendToolResult).toHaveBeenCalled());
+    await vi.waitFor(() => expect(ctx.fakeHandle.sendToolResult).toHaveBeenCalled());
     // Tool result should contain the error
-    const [, resultStr] = vi.mocked(ctx.mockHandle.sendToolResult).mock.calls[0] as [
+    const [, resultStr] = vi.mocked(ctx.fakeHandle.sendToolResult).mock.calls[0] as [
       string,
       string,
     ];
@@ -266,13 +261,13 @@ describe("fixture replay with real executor", () => {
     const ctx = createFixtureSession(agent);
     cleanup = ctx.cleanup;
-    await ctx.session.start();
+    await ctx.start();
     ctx.replay("tool-call-sequence.json");
-    await vi.waitFor(() => expect(ctx.mockHandle.sendToolResult).toHaveBeenCalled());
+    await vi.waitFor(() => expect(ctx.fakeHandle.sendToolResult).toHaveBeenCalled());
     // The result should contain a Zod validation error
-    const [, resultStr] = vi.mocked(ctx.mockHandle.sendToolResult).mock.calls[0] as [
+    const [, resultStr] = vi.mocked(ctx.fakeHandle.sendToolResult).mock.calls[0] as [
       string,
       string,
     ];
@@ -304,45 +299,31 @@ describe("fixture replay with real executor", () => {
     const ctx = createFixtureSession(agent);
     cleanup = ctx.cleanup;
-    await ctx.session.start();
+    await ctx.start();
-    const h = ctx.mockHandle;
+    const cbs = ctx.mockCallbacks;
     // Fire an interrupted transcript — should NOT go into conversation history
-    h._fire("replyStarted", { replyId: "r1" });
-    h._fire("event", {
-      type: "agent_transcript",
-      text: "This was interrupted",
-      _interrupted: true,
-    });
-    h._fire("event", { type: "cancelled" });
+    cbs.onReplyStarted("r1");
+    cbs.onAgentTranscript("This was interrupted", true);
+    cbs.onCancelled();
     await flush();
     // Client sees both agent_transcript and cancelled events
-    const types = ctx.client.events.map((e) => (e as { type: string }).type);
-    expect(types).toContain("agent_transcript");
-    expect(types).toContain("cancelled");
+    expect(ctx.client.agentTranscripts).toContain("This was interrupted");
+    expect(ctx.client.cancelledCount).toBeGreaterThan(0);
     // Fire a non-interrupted transcript — SHOULD go into conversation history
-    h._fire("replyStarted", { replyId: "r2" });
-    h._fire("event", {
-      type: "agent_transcript",
-      text: "This was completed",
-      _interrupted: false,
-    });
-    h._fire("event", { type: "reply_done" });
+    cbs.onReplyStarted("r2");
+    cbs.onAgentTranscript("This was completed", false);
+    cbs.onReplyDone();
     await flush();
     // Trigger a tool call to inspect conversation history.
-    h._fire("event", { type: "user_transcript", text: "check" });
+    cbs.onUserTranscript("check");
     await flush();
-    h._fire("replyStarted", { replyId: "r3" });
-    h._fire("event", {
-      type: "tool_call",
-      toolCallId: "c1",
-      toolName: "check_history",
-      args: { q: "test" },
-    });
+    cbs.onReplyStarted("r3");
+    cbs.onToolCall("c1", "check_history", { q: "test" });
     // Wait for tool to execute (captures messages)
     await vi.waitFor(() => expect(capturedMessages.length).toBeGreaterThan(0));
@@ -376,27 +357,27 @@ describe("fixture replay with real executor", () => {
     const ctx = createFixtureSession(agent);
     cleanup = ctx.cleanup;
-    await ctx.session.start();
+    await ctx.start();
     ctx.replay("tool-call-sequence.json");
-    await vi.waitFor(() => expect(ctx.mockHandle.sendToolResult).toHaveBeenCalled());
+    await vi.waitFor(() => expect(ctx.fakeHandle.sendToolResult).toHaveBeenCalled());
     // The tool should have seen the user's weather question in messages
     const userMsgs = capturedMessages.filter((m) => m.role === "user");
     expect(userMsgs.some((m) => m.content.toLowerCase().includes("weather"))).toBe(true);
   });
-  // ── Audio chunks forwarded to client.playAudioChunk ────────────────────
+  // ── Audio chunks forwarded to client.audio ─────────────────────────────
-  test("reply.audio events forwarded to client.playAudioChunk", async () => {
+  test("reply.audio events forwarded to client.audio", async () => {
     const ctx = createFixtureSession(simpleAgent);
     cleanup = ctx.cleanup;
-    await ctx.session.start();
+    await ctx.start();
-    // Manually fire audio events (replay skips them, so fire directly)
+    // Fire audio events directly via callbacks (replay skips reply.audio)
     const audioBytes = new Uint8Array([10, 20, 30, 40]);
-    ctx.mockHandle._fire("audio", { audio: audioBytes });
-    ctx.mockHandle._fire("audio", { audio: new Uint8Array([50, 60]) });
+    ctx.mockCallbacks.onAudio(audioBytes);
+    ctx.mockCallbacks.onAudio(new Uint8Array([50, 60]));
     expect(ctx.client.audioChunks.length).toBe(2);
     expect(Array.from(ctx.client.audioChunks[0] ?? [])).toEqual([10, 20, 30, 40]);
@@ -422,40 +403,29 @@ describe("fixture replay with real executor", () => {
     const ctx = createFixtureSession(agent);
     cleanup = ctx.cleanup;
-    await ctx.session.start();
-    const h = ctx.mockHandle;
-    h._fire("replyStarted", { replyId: "r1" });
-    h._fire("event", {
-      type: "tool_call",
-      toolCallId: "c1",
-      toolName: "get_weather",
-      args: { city: "NYC" },
-    });
-    h._fire("event", {
-      type: "tool_call",
-      toolCallId: "c2",
-      toolName: "get_weather",
-      args: { city: "LA" },
-    });
+    await ctx.start();
+    const cbs = ctx.mockCallbacks;
+    cbs.onReplyStarted("r1");
+    cbs.onToolCall("c1", "get_weather", { city: "NYC" });
+    cbs.onToolCall("c2", "get_weather", { city: "LA" });
-    // Wait for both tool calls to execute
+    // Wait for both tool calls to be dispatched to the client
     await vi.waitFor(() => {
-      const starts = ctx.client.events.filter((e) => (e as { type: string }).type === "tool_call");
-      expect(starts.length).toBe(2);
+      expect(ctx.client.toolCallEvents.length).toBe(2);
     });
-    // Results NOT sent yet — reply_done hasn't fired
-    expect(ctx.mockHandle.sendToolResult).not.toHaveBeenCalled();
+    // Results NOT sent yet — reply.done hasn't fired
+    expect(ctx.fakeHandle.sendToolResult).not.toHaveBeenCalled();
-    // Fire reply_done — should flush both results
-    h._fire("event", { type: "reply_done" });
+    // Fire reply.done — should flush both results
+    cbs.onReplyDone();
     await vi.waitFor(() => {
-      expect(ctx.mockHandle.sendToolResult).toHaveBeenCalledTimes(2);
+      expect(ctx.fakeHandle.sendToolResult).toHaveBeenCalledTimes(2);
     });
     // Verify both results are correct
-    const calls = vi.mocked(ctx.mockHandle.sendToolResult).mock.calls as [string, string][];
+    const calls = vi.mocked(ctx.fakeHandle.sendToolResult).mock.calls as [string, string][];
     const results = calls.map(([, r]) => JSON.parse(r));
     expect(results.some((r) => r.city === "NYC")).toBe(true);
     expect(results.some((r) => r.city === "LA")).toBe(true);

package/host/transports/s2s-transport.test.ts ADDED

@@ -0,0 +1,56 @@
+import { describe, expect, test, vi } from "vitest";
+import { createS2sTransport } from "./s2s-transport.ts";
+import type { TransportCallbacks } from "./types.ts";
+function makeCallbacks(): TransportCallbacks {
+  return {
+    onReplyStarted: vi.fn(),
+    onReplyDone: vi.fn(),
+    onCancelled: vi.fn(),
+    onAudioChunk: vi.fn(),
+    onAudioDone: vi.fn(),
+    onUserTranscript: vi.fn(),
+    onAgentTranscript: vi.fn(),
+    onToolCall: vi.fn(),
+    onError: vi.fn(),
+    onSpeechStarted: vi.fn(),
+    onSpeechStopped: vi.fn(),
+  };
+}
+describe("S2sTransport", () => {
+  test("start() opens an S2S connection and sends session.update", async () => {
+    const send = vi.fn();
+    const close = vi.fn();
+    const ws = Object.assign(new EventTarget(), {
+      readyState: 0,
+      send,
+      close,
+      addEventListener: EventTarget.prototype.addEventListener as unknown as (
+        type: string,
+        listener: EventListener,
+      ) => void,
+    }) as unknown as import("../s2s.ts").S2sWebSocket;
+    setTimeout(() => {
+      (ws as unknown as { readyState: number }).readyState = 1;
+      (ws as unknown as EventTarget).dispatchEvent(new Event("open"));
+    }, 0);
+    const t = createS2sTransport({
+      apiKey: "k",
+      s2sConfig: { wssUrl: "wss://fake", inputSampleRate: 16_000, outputSampleRate: 24_000 },
+      sessionConfig: { systemPrompt: "test", tools: [] },
+      toolSchemas: [],
+      callbacks: makeCallbacks(),
+      sid: "sid-1",
+      agent: "a",
+      createWebSocket: () => ws,
+    });
+    await t.start();
+    expect(send).toHaveBeenCalled();
+    const firstSend = JSON.parse(send.mock.calls[0]?.[0] as string);
+    expect(firstSend.type).toBe("session.update");
+    await t.stop();
+    expect(close).toHaveBeenCalled();
+  });
+});

package/host/transports/s2s-transport.ts ADDED

@@ -0,0 +1,116 @@
+// Copyright 2026 the AAI authors. MIT license.
+// S2S transport — wraps connectS2s and forwards typed callbacks into the SessionCore.
+import type { Logger, S2SConfig } from "../runtime-config.ts";
+import { consoleLogger } from "../runtime-config.ts";
+import {
+  type CreateS2sWebSocket,
+  connectS2s,
+  defaultCreateS2sWebSocket,
+  type S2sHandle,
+  type S2sSessionConfig,
+  type S2sToolSchema,
+} from "../s2s.ts";
+import type { Transport, TransportCallbacks, TransportSessionConfig } from "./types.ts";
+/** @internal Exposed for testing — allows spying on connectS2s in unit tests. */
+export const _internals = { connectS2s };
+export type S2sTransportOptions = {
+  apiKey: string;
+  s2sConfig: S2SConfig;
+  sessionConfig: S2sSessionConfig;
+  toolSchemas: S2sToolSchema[];
+  callbacks: TransportCallbacks;
+  sid: string;
+  agent: string;
+  createWebSocket?: CreateS2sWebSocket;
+  logger?: Logger;
+};
+export function createS2sTransport(opts: S2sTransportOptions): Transport {
+  const log = opts.logger ?? consoleLogger;
+  const createWs = opts.createWebSocket ?? defaultCreateS2sWebSocket;
+  let handle: S2sHandle | null = null;
+  let currentReplyId: string | null = null;
+  async function start(): Promise<void> {
+    handle = await _internals.connectS2s({
+      apiKey: opts.apiKey,
+      config: opts.s2sConfig,
+      createWebSocket: createWs,
+      logger: log,
+      sid: opts.sid,
+      callbacks: {
+        onSessionReady: (providerSessionId) => opts.callbacks.onSessionReady?.(providerSessionId),
+        onReplyStarted: (replyId) => {
+          currentReplyId = replyId;
+          opts.callbacks.onReplyStarted(replyId);
+        },
+        onReplyDone: () => {
+          currentReplyId = null;
+          opts.callbacks.onReplyDone();
+        },
+        onCancelled: () => {
+          currentReplyId = null;
+          opts.callbacks.onCancelled();
+        },
+        onAudio: (bytes) => opts.callbacks.onAudioChunk(bytes),
+        onUserTranscript: opts.callbacks.onUserTranscript,
+        onAgentTranscript: opts.callbacks.onAgentTranscript,
+        onToolCall: opts.callbacks.onToolCall,
+        onSpeechStarted: opts.callbacks.onSpeechStarted,
+        onSpeechStopped: opts.callbacks.onSpeechStopped,
+        onSessionExpired: () => {
+          log.info("S2S session expired", { sid: opts.sid });
+          handle?.close();
+        },
+        onError: (err) => opts.callbacks.onError("internal", err.message),
+        onClose: (code, reason) => {
+          if (currentReplyId !== null) {
+            log.warn("S2S closed with active reply", {
+              sid: opts.sid,
+              agent: opts.agent,
+              activeReplyId: currentReplyId,
+              code,
+              reason,
+            });
+            opts.callbacks.onError("connection", `S2S closed mid-reply (code=${code})`);
+          } else {
+            log.info("S2S closed", { code, reason });
+          }
+        },
+      },
+    });
+    handle.updateSession(opts.sessionConfig);
+  }
+  async function stop(): Promise<void> {
+    handle?.close();
+    handle = null;
+  }
+  return {
+    start,
+    stop,
+    sendUserAudio(bytes) {
+      handle?.sendAudio(bytes);
+    },
+    sendToolResult(callId, result) {
+      handle?.sendToolResult(callId, result);
+    },
+    cancelReply() {
+      // AssemblyAI S2S doesn't expose an explicit cancel RPC — reply is
+      // cancelled when the user speaks. Our `onCancel` from the client is
+      // a best-effort signal.
+      currentReplyId = null;
+    },
+    updateSession(config: TransportSessionConfig) {
+      handle?.updateSession({
+        systemPrompt: config.systemPrompt,
+        tools: (config.tools ?? []) as S2sToolSchema[],
+        ...(config.greeting !== undefined ? { greeting: config.greeting } : {}),
+      });
+    },
+  };
+}

package/host/transports/types.test.ts ADDED

@@ -0,0 +1,22 @@
+import { describe, expect, test } from "vitest";
+import type { Transport, TransportCallbacks } from "./types.ts";
+describe("Transport types", () => {
+  test("file compiles", () => {
+    // Types only; runtime check is trivial.
+    const stub: Transport = {
+      start: () => Promise.resolve(),
+      stop: () => Promise.resolve(),
+      // biome-ignore lint/suspicious/noEmptyBlockStatements: intentional no-op stub
+      sendUserAudio: () => {},
+      // biome-ignore lint/suspicious/noEmptyBlockStatements: intentional no-op stub
+      sendToolResult: () => {},
+      // biome-ignore lint/suspicious/noEmptyBlockStatements: intentional no-op stub
+      cancelReply: () => {},
+    };
+    expect(stub).toBeDefined();
+    // Ensure TransportCallbacks is referenced (type-only check).
+    type _CB = TransportCallbacks;
+  });
+});

package/host/transports/types.ts ADDED

@@ -0,0 +1,51 @@
+// Copyright 2026 the AAI authors. MIT license.
+// Transport strategy — per-session provider wiring (S2S, pipeline, etc.).
+import type { SessionErrorCode } from "../../sdk/protocol.ts";
+import type { Message } from "../../sdk/types.ts";
+/**
+ * Typed callbacks into the SessionCore. One per event the transport produces.
+ * Constructed at transport-creation time; no emitter.on-style indirection.
+ */
+export type TransportCallbacks = {
+  onReplyStarted(replyId: string): void;
+  onReplyDone(): void;
+  onCancelled(): void;
+  onAudioChunk(bytes: Uint8Array): void;
+  onAudioDone(): void;
+  onUserTranscript(text: string): void;
+  onAgentTranscript(text: string, interrupted: boolean): void;
+  onToolCall(callId: string, name: string, args: Record<string, unknown>): void;
+  onError(code: SessionErrorCode, message: string): void;
+  onSpeechStarted(): void;
+  onSpeechStopped(): void;
+  onSessionReady?(providerSessionId: string): void;
+};
+/** Minimal config a transport may receive at construction time. */
+export type TransportSessionConfig = {
+  systemPrompt: string;
+  greeting?: string;
+  tools?: unknown[];
+  history?: Message[];
+};
+/**
+ * Transport abstraction — one implementation per provider strategy
+ * (see `s2s-transport.ts`, `pipeline-transport.ts`).
+ */
+export interface Transport {
+  /** Open any underlying connections and send initial session config. */
+  start(): Promise<void>;
+  /** Tear down, flush, close. Idempotent. */
+  stop(): Promise<void>;
+  /** Forward user audio to the provider. */
+  sendUserAudio(bytes: Uint8Array): void;
+  /** Forward a tool result back to the provider's reply stream. */
+  sendToolResult(callId: string, result: string): void;
+  /** Cancel the currently in-flight reply (barge-in / client cancel). */
+  cancelReply(): void;
+  /** Re-send session config (S2S only; pipeline is a no-op). */
+  updateSession?(config: TransportSessionConfig): void;
+}