npm - @copilotkit/aimock - Versions diffs - 1.7.0 - Mend

@copilotkit/aimock 1.7.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (368) hide show

package/.claude-plugin/marketplace.json +17 -0
package/.claude-plugin/plugin.json +12 -0
package/LICENSE +21 -0
package/README.md +82 -0
package/dist/_virtual/_rolldown/runtime.cjs +29 -0
package/dist/a2a-handler.cjs +203 -0
package/dist/a2a-handler.cjs.map +1 -0
package/dist/a2a-handler.js +199 -0
package/dist/a2a-handler.js.map +1 -0
package/dist/a2a-mock.cjs +292 -0
package/dist/a2a-mock.cjs.map +1 -0
package/dist/a2a-mock.d.cts +41 -0
package/dist/a2a-mock.d.cts.map +1 -0
package/dist/a2a-mock.d.ts +41 -0
package/dist/a2a-mock.d.ts.map +1 -0
package/dist/a2a-mock.js +290 -0
package/dist/a2a-mock.js.map +1 -0
package/dist/a2a-stub.cjs +4 -0
package/dist/a2a-stub.d.cts +3 -0
package/dist/a2a-stub.d.ts +3 -0
package/dist/a2a-stub.js +3 -0
package/dist/a2a-types.d.cts +68 -0
package/dist/a2a-types.d.cts.map +1 -0
package/dist/a2a-types.d.ts +68 -0
package/dist/a2a-types.d.ts.map +1 -0
package/dist/aimock-cli.cjs +112 -0
package/dist/aimock-cli.cjs.map +1 -0
package/dist/aimock-cli.d.cts +19 -0
package/dist/aimock-cli.d.cts.map +1 -0
package/dist/aimock-cli.d.ts +19 -0
package/dist/aimock-cli.d.ts.map +1 -0
package/dist/aimock-cli.js +110 -0
package/dist/aimock-cli.js.map +1 -0
package/dist/aws-event-stream.cjs +117 -0
package/dist/aws-event-stream.cjs.map +1 -0
package/dist/aws-event-stream.d.cts +38 -0
package/dist/aws-event-stream.d.cts.map +1 -0
package/dist/aws-event-stream.d.ts +38 -0
package/dist/aws-event-stream.d.ts.map +1 -0
package/dist/aws-event-stream.js +114 -0
package/dist/aws-event-stream.js.map +1 -0
package/dist/bedrock-converse.cjs +445 -0
package/dist/bedrock-converse.cjs.map +1 -0
package/dist/bedrock-converse.d.cts +50 -0
package/dist/bedrock-converse.d.cts.map +1 -0
package/dist/bedrock-converse.d.ts +50 -0
package/dist/bedrock-converse.d.ts.map +1 -0
package/dist/bedrock-converse.js +443 -0
package/dist/bedrock-converse.js.map +1 -0
package/dist/bedrock.cjs +557 -0
package/dist/bedrock.cjs.map +1 -0
package/dist/bedrock.d.cts +41 -0
package/dist/bedrock.d.cts.map +1 -0
package/dist/bedrock.d.ts +41 -0
package/dist/bedrock.d.ts.map +1 -0
package/dist/bedrock.js +553 -0
package/dist/bedrock.js.map +1 -0
package/dist/chaos.cjs +114 -0
package/dist/chaos.cjs.map +1 -0
package/dist/chaos.d.cts +27 -0
package/dist/chaos.d.cts.map +1 -0
package/dist/chaos.d.ts +27 -0
package/dist/chaos.d.ts.map +1 -0
package/dist/chaos.js +113 -0
package/dist/chaos.js.map +1 -0
package/dist/cli.cjs +268 -0
package/dist/cli.cjs.map +1 -0
package/dist/cli.d.cts +1 -0
package/dist/cli.d.ts +1 -0
package/dist/cli.js +268 -0
package/dist/cli.js.map +1 -0
package/dist/cohere.cjs +434 -0
package/dist/cohere.cjs.map +1 -0
package/dist/cohere.d.cts +34 -0
package/dist/cohere.d.cts.map +1 -0
package/dist/cohere.d.ts +34 -0
package/dist/cohere.d.ts.map +1 -0
package/dist/cohere.js +433 -0
package/dist/cohere.js.map +1 -0
package/dist/config-loader.cjs +111 -0
package/dist/config-loader.cjs.map +1 -0
package/dist/config-loader.d.cts +100 -0
package/dist/config-loader.d.cts.map +1 -0
package/dist/config-loader.d.ts +100 -0
package/dist/config-loader.d.ts.map +1 -0
package/dist/config-loader.js +107 -0
package/dist/config-loader.js.map +1 -0
package/dist/embeddings.cjs +150 -0
package/dist/embeddings.cjs.map +1 -0
package/dist/embeddings.d.cts +12 -0
package/dist/embeddings.d.cts.map +1 -0
package/dist/embeddings.d.ts +12 -0
package/dist/embeddings.d.ts.map +1 -0
package/dist/embeddings.js +150 -0
package/dist/embeddings.js.map +1 -0
package/dist/fixture-loader.cjs +269 -0
package/dist/fixture-loader.cjs.map +1 -0
package/dist/fixture-loader.d.cts +17 -0
package/dist/fixture-loader.d.cts.map +1 -0
package/dist/fixture-loader.d.ts +17 -0
package/dist/fixture-loader.d.ts.map +1 -0
package/dist/fixture-loader.js +265 -0
package/dist/fixture-loader.js.map +1 -0
package/dist/gemini.cjs +403 -0
package/dist/gemini.cjs.map +1 -0
package/dist/gemini.d.cts +10 -0
package/dist/gemini.d.cts.map +1 -0
package/dist/gemini.d.ts +10 -0
package/dist/gemini.d.ts.map +1 -0
package/dist/gemini.js +403 -0
package/dist/gemini.js.map +1 -0
package/dist/helpers.cjs +276 -0
package/dist/helpers.cjs.map +1 -0
package/dist/helpers.d.cts +39 -0
package/dist/helpers.d.cts.map +1 -0
package/dist/helpers.d.ts +39 -0
package/dist/helpers.d.ts.map +1 -0
package/dist/helpers.js +259 -0
package/dist/helpers.js.map +1 -0
package/dist/index.cjs +113 -0
package/dist/index.d.cts +42 -0
package/dist/index.d.ts +42 -0
package/dist/index.js +39 -0
package/dist/interruption.cjs +40 -0
package/dist/interruption.cjs.map +1 -0
package/dist/interruption.d.cts +15 -0
package/dist/interruption.d.cts.map +1 -0
package/dist/interruption.d.ts +15 -0
package/dist/interruption.d.ts.map +1 -0
package/dist/interruption.js +39 -0
package/dist/interruption.js.map +1 -0
package/dist/journal.cjs +65 -0
package/dist/journal.cjs.map +1 -0
package/dist/journal.d.cts +23 -0
package/dist/journal.d.cts.map +1 -0
package/dist/journal.d.ts +23 -0
package/dist/journal.d.ts.map +1 -0
package/dist/journal.js +65 -0
package/dist/journal.js.map +1 -0
package/dist/jsonrpc.cjs +91 -0
package/dist/jsonrpc.cjs.map +1 -0
package/dist/jsonrpc.d.cts +24 -0
package/dist/jsonrpc.d.cts.map +1 -0
package/dist/jsonrpc.d.ts +24 -0
package/dist/jsonrpc.d.ts.map +1 -0
package/dist/jsonrpc.js +90 -0
package/dist/jsonrpc.js.map +1 -0
package/dist/llmock.cjs +223 -0
package/dist/llmock.cjs.map +1 -0
package/dist/llmock.d.cts +70 -0
package/dist/llmock.d.cts.map +1 -0
package/dist/llmock.d.ts +70 -0
package/dist/llmock.d.ts.map +1 -0
package/dist/llmock.js +223 -0
package/dist/llmock.js.map +1 -0
package/dist/logger.cjs +29 -0
package/dist/logger.cjs.map +1 -0
package/dist/logger.d.cts +14 -0
package/dist/logger.d.cts.map +1 -0
package/dist/logger.d.ts +14 -0
package/dist/logger.d.ts.map +1 -0
package/dist/logger.js +28 -0
package/dist/logger.js.map +1 -0
package/dist/mcp-handler.cjs +189 -0
package/dist/mcp-handler.cjs.map +1 -0
package/dist/mcp-handler.js +188 -0
package/dist/mcp-handler.js.map +1 -0
package/dist/mcp-mock.cjs +169 -0
package/dist/mcp-mock.cjs.map +1 -0
package/dist/mcp-mock.d.cts +40 -0
package/dist/mcp-mock.d.cts.map +1 -0
package/dist/mcp-mock.d.ts +40 -0
package/dist/mcp-mock.d.ts.map +1 -0
package/dist/mcp-mock.js +167 -0
package/dist/mcp-mock.js.map +1 -0
package/dist/mcp-stub.cjs +4 -0
package/dist/mcp-stub.d.cts +3 -0
package/dist/mcp-stub.d.ts +3 -0
package/dist/mcp-stub.js +3 -0
package/dist/mcp-types.d.cts +65 -0
package/dist/mcp-types.d.cts.map +1 -0
package/dist/mcp-types.d.ts +65 -0
package/dist/mcp-types.d.ts.map +1 -0
package/dist/messages.cjs +489 -0
package/dist/messages.cjs.map +1 -0
package/dist/messages.d.cts +10 -0
package/dist/messages.d.cts.map +1 -0
package/dist/messages.d.ts +10 -0
package/dist/messages.d.ts.map +1 -0
package/dist/messages.js +489 -0
package/dist/messages.js.map +1 -0
package/dist/metrics.cjs +160 -0
package/dist/metrics.cjs.map +1 -0
package/dist/metrics.d.cts +24 -0
package/dist/metrics.d.cts.map +1 -0
package/dist/metrics.d.ts +24 -0
package/dist/metrics.d.ts.map +1 -0
package/dist/metrics.js +158 -0
package/dist/metrics.js.map +1 -0
package/dist/moderation.cjs +91 -0
package/dist/moderation.cjs.map +1 -0
package/dist/moderation.d.cts +23 -0
package/dist/moderation.d.cts.map +1 -0
package/dist/moderation.d.ts +23 -0
package/dist/moderation.d.ts.map +1 -0
package/dist/moderation.js +91 -0
package/dist/moderation.js.map +1 -0
package/dist/ndjson-writer.cjs +31 -0
package/dist/ndjson-writer.cjs.map +1 -0
package/dist/ndjson-writer.d.cts +17 -0
package/dist/ndjson-writer.d.cts.map +1 -0
package/dist/ndjson-writer.d.ts +17 -0
package/dist/ndjson-writer.d.ts.map +1 -0
package/dist/ndjson-writer.js +31 -0
package/dist/ndjson-writer.js.map +1 -0
package/dist/ollama.cjs +519 -0
package/dist/ollama.cjs.map +1 -0
package/dist/ollama.d.cts +34 -0
package/dist/ollama.d.cts.map +1 -0
package/dist/ollama.d.ts +34 -0
package/dist/ollama.d.ts.map +1 -0
package/dist/ollama.js +517 -0
package/dist/ollama.js.map +1 -0
package/dist/recorder.cjs +311 -0
package/dist/recorder.cjs.map +1 -0
package/dist/recorder.d.cts +23 -0
package/dist/recorder.d.cts.map +1 -0
package/dist/recorder.d.ts +23 -0
package/dist/recorder.d.ts.map +1 -0
package/dist/recorder.js +305 -0
package/dist/recorder.js.map +1 -0
package/dist/rerank.cjs +71 -0
package/dist/rerank.cjs.map +1 -0
package/dist/rerank.d.cts +22 -0
package/dist/rerank.d.cts.map +1 -0
package/dist/rerank.d.ts +22 -0
package/dist/rerank.d.ts.map +1 -0
package/dist/rerank.js +71 -0
package/dist/rerank.js.map +1 -0
package/dist/responses.cjs +637 -0
package/dist/responses.cjs.map +1 -0
package/dist/responses.d.cts +16 -0
package/dist/responses.d.cts.map +1 -0
package/dist/responses.d.ts +16 -0
package/dist/responses.d.ts.map +1 -0
package/dist/responses.js +634 -0
package/dist/responses.js.map +1 -0
package/dist/router.cjs +68 -0
package/dist/router.cjs.map +1 -0
package/dist/router.d.cts +16 -0
package/dist/router.d.cts.map +1 -0
package/dist/router.d.ts +16 -0
package/dist/router.d.ts.map +1 -0
package/dist/router.js +65 -0
package/dist/router.js.map +1 -0
package/dist/search.cjs +59 -0
package/dist/search.cjs.map +1 -0
package/dist/search.d.cts +23 -0
package/dist/search.d.cts.map +1 -0
package/dist/search.d.ts +23 -0
package/dist/search.d.ts.map +1 -0
package/dist/search.js +59 -0
package/dist/search.js.map +1 -0
package/dist/server.cjs +935 -0
package/dist/server.cjs.map +1 -0
package/dist/server.d.cts +28 -0
package/dist/server.d.cts.map +1 -0
package/dist/server.d.ts +28 -0
package/dist/server.d.ts.map +1 -0
package/dist/server.js +933 -0
package/dist/server.js.map +1 -0
package/dist/sse-writer.cjs +59 -0
package/dist/sse-writer.cjs.map +1 -0
package/dist/sse-writer.d.cts +19 -0
package/dist/sse-writer.d.cts.map +1 -0
package/dist/sse-writer.d.ts +19 -0
package/dist/sse-writer.d.ts.map +1 -0
package/dist/sse-writer.js +55 -0
package/dist/sse-writer.js.map +1 -0
package/dist/stream-collapse.cjs +496 -0
package/dist/stream-collapse.cjs.map +1 -0
package/dist/stream-collapse.d.cts +70 -0
package/dist/stream-collapse.d.cts.map +1 -0
package/dist/stream-collapse.d.ts +70 -0
package/dist/stream-collapse.d.ts.map +1 -0
package/dist/stream-collapse.js +489 -0
package/dist/stream-collapse.js.map +1 -0
package/dist/suite.cjs +46 -0
package/dist/suite.cjs.map +1 -0
package/dist/suite.d.cts +31 -0
package/dist/suite.d.cts.map +1 -0
package/dist/suite.d.ts +31 -0
package/dist/suite.d.ts.map +1 -0
package/dist/suite.js +46 -0
package/dist/suite.js.map +1 -0
package/dist/types.d.cts +243 -0
package/dist/types.d.cts.map +1 -0
package/dist/types.d.ts +243 -0
package/dist/types.d.ts.map +1 -0
package/dist/url.cjs +21 -0
package/dist/url.cjs.map +1 -0
package/dist/url.d.cts +16 -0
package/dist/url.d.cts.map +1 -0
package/dist/url.d.ts +16 -0
package/dist/url.d.ts.map +1 -0
package/dist/url.js +20 -0
package/dist/url.js.map +1 -0
package/dist/vector-handler.cjs +239 -0
package/dist/vector-handler.cjs.map +1 -0
package/dist/vector-handler.js +238 -0
package/dist/vector-handler.js.map +1 -0
package/dist/vector-mock.cjs +229 -0
package/dist/vector-mock.cjs.map +1 -0
package/dist/vector-mock.d.cts +39 -0
package/dist/vector-mock.d.cts.map +1 -0
package/dist/vector-mock.d.ts +39 -0
package/dist/vector-mock.d.ts.map +1 -0
package/dist/vector-mock.js +227 -0
package/dist/vector-mock.js.map +1 -0
package/dist/vector-stub.cjs +4 -0
package/dist/vector-stub.d.cts +3 -0
package/dist/vector-stub.d.ts +3 -0
package/dist/vector-stub.js +3 -0
package/dist/vector-types.d.cts +32 -0
package/dist/vector-types.d.cts.map +1 -0
package/dist/vector-types.d.ts +32 -0
package/dist/vector-types.d.ts.map +1 -0
package/dist/watcher.cjs +59 -0
package/dist/watcher.cjs.map +1 -0
package/dist/watcher.js +58 -0
package/dist/watcher.js.map +1 -0
package/dist/ws-framing.cjs +187 -0
package/dist/ws-framing.cjs.map +1 -0
package/dist/ws-framing.d.cts +26 -0
package/dist/ws-framing.d.cts.map +1 -0
package/dist/ws-framing.d.ts +26 -0
package/dist/ws-framing.d.ts.map +1 -0
package/dist/ws-framing.js +184 -0
package/dist/ws-framing.js.map +1 -0
package/dist/ws-gemini-live.cjs +364 -0
package/dist/ws-gemini-live.cjs.map +1 -0
package/dist/ws-gemini-live.d.cts +18 -0
package/dist/ws-gemini-live.d.cts.map +1 -0
package/dist/ws-gemini-live.d.ts +18 -0
package/dist/ws-gemini-live.d.ts.map +1 -0
package/dist/ws-gemini-live.js +364 -0
package/dist/ws-gemini-live.js.map +1 -0
package/dist/ws-realtime.cjs +435 -0
package/dist/ws-realtime.cjs.map +1 -0
package/dist/ws-realtime.d.cts +17 -0
package/dist/ws-realtime.d.cts.map +1 -0
package/dist/ws-realtime.d.ts +17 -0
package/dist/ws-realtime.d.ts.map +1 -0
package/dist/ws-realtime.js +435 -0
package/dist/ws-realtime.js.map +1 -0
package/dist/ws-responses.cjs +164 -0
package/dist/ws-responses.cjs.map +1 -0
package/dist/ws-responses.d.cts +18 -0
package/dist/ws-responses.d.cts.map +1 -0
package/dist/ws-responses.d.ts +18 -0
package/dist/ws-responses.d.ts.map +1 -0
package/dist/ws-responses.js +164 -0
package/dist/ws-responses.js.map +1 -0
package/fixtures/example-greeting.json +12 -0
package/fixtures/example-multi-turn.json +14 -0
package/fixtures/example-tool-call.json +15 -0
package/package.json +118 -0
package/skills/write-fixtures/SKILL.md +625 -0

package/skills/write-fixtures/SKILL.md ADDED Viewed

@@ -0,0 +1,625 @@
+---
+name: write-fixtures
+description: Use when writing test fixtures for @copilotkit/aimock — mock LLM responses, tool call sequences, error injection, multi-turn agent loops, embeddings, structured output, sequential responses, or debugging fixture mismatches
+---
+# Writing aimock Test Fixtures
+## What aimock Is
+aimock is a zero-dependency mock LLM server. Fixture-driven. Multi-provider (OpenAI, Anthropic, Gemini, AWS Bedrock, Azure OpenAI, Vertex AI, Ollama, Cohere). Runs a real HTTP server on a real port — works across processes, unlike MSW-style interceptors. WebSocket support for OpenAI Responses/Realtime and Gemini Live APIs. Chaos testing and Prometheus metrics.
+## Core Mental Model
+- **Fixtures** = match criteria + response
+- **First-match-wins** — order matters
+- All providers share one fixture pool (provider adapters normalize to `ChatCompletionRequest`)
+- Fixtures are live — mutations after `start()` take effect immediately
+- Sequential responses are supported via `sequenceIndex` (match count tracked per fixture group — all fixtures sharing the same non-`sequenceIndex` match fields)
+## Match Field Reference
+| Field            | Type                                      | Matches Against                                                               |
+| ---------------- | ----------------------------------------- | ----------------------------------------------------------------------------- |
+| `userMessage`    | `string`                                  | Substring of last `role: "user"` message text                                 |
+| `userMessage`    | `RegExp`                                  | Pattern test on last `role: "user"` message text                              |
+| `inputText`      | `string`                                  | Substring of embedding input text (concatenated if multiple inputs)           |
+| `inputText`      | `RegExp`                                  | Pattern test on embedding input text                                          |
+| `toolName`       | `string`                                  | Exact match on any tool in request's `tools[]` array (by `function.name`)     |
+| `toolCallId`     | `string`                                  | Exact match on `tool_call_id` of last `role: "tool"` message                  |
+| `model`          | `string`                                  | Exact match on `req.model`                                                    |
+| `model`          | `RegExp`                                  | Pattern test on `req.model`                                                   |
+| `responseFormat` | `string`                                  | Exact match on `req.response_format.type` (`"json_object"`, `"json_schema"`)  |
+| `sequenceIndex`  | `number`                                  | Matches only when this fixture's match count equals the given index (0-based) |
+| `predicate`      | `(req: ChatCompletionRequest) => boolean` | Custom function — full access to request                                      |
+**AND logic**: all specified fields must match. Empty match `{}` = catch-all.
+Multi-part content (e.g., `[{type: "text", text: "hello"}]`) is automatically extracted — `userMessage` matching works regardless of content format.
+## Response Types
+### Text
+```typescript
+{
+  content: "Hello!";
+}
+```
+### Tool Calls
+```typescript
+{
+  toolCalls: [{ name: "get_weather", arguments: '{"city":"SF"}' }];
+}
+```
+**`arguments` MUST be a JSON string**, not an object. This is the #1 mistake.
+### Embedding
+```typescript
+{
+  embedding: [0.1, 0.2, 0.3, -0.5, 0.8];
+}
+```
+The embedding vector is returned for each input in the request. If no embedding fixture matches, deterministic embeddings are auto-generated from the input text hash — you only need fixtures when you want specific vectors.
+### Error
+```typescript
+{ error: { message: "Rate limited", type: "rate_limit_error" }, status: 429 }
+```
+### Chaos (Failure Injection)
+The optional `chaos` field on a fixture enables probabilistic failure injection:
+```typescript
+{
+  chaos?: {
+    dropRate?: number;      // Probability (0-1) of returning a 500 error
+    malformedRate?: number; // Probability (0-1) of returning malformed JSON
+    disconnectRate?: number; // Probability (0-1) of disconnecting mid-stream
+  }
+}
+```
+Rates are evaluated per-request. When triggered, the chaos failure replaces the normal response.
+## Common Patterns
+### Basic text fixture
+```typescript
+mock.onMessage("hello", { content: "Hi there!" });
+```
+### Tool call → tool result → final response (3-step agent loop)
+The most common pattern. Fixture 1 triggers the tool call, fixture 2 handles the tool result.
+```typescript
+// Step 1: User asks about weather → LLM calls tool
+mock.onMessage("weather", {
+  toolCalls: [{ name: "get_weather", arguments: '{"city":"SF"}' }],
+});
+// Step 2: Tool result comes back → LLM responds with text
+mock.addFixture({
+  match: { predicate: (req) => req.messages.at(-1)?.role === "tool" },
+  response: { content: "It's 72°F in San Francisco." },
+});
+```
+**Why predicate, not userMessage?** After a tool call, the client replays the same conversation with the tool result appended. The user message hasn't changed — `userMessage: "weather"` would match the SAME fixture again, creating an infinite loop.
+### Embedding fixture
+```typescript
+// Match specific input text
+mock.onEmbedding("search query", {
+  embedding: [0.1, 0.2, 0.3, 0.4, 0.5],
+});
+// Match with regex
+mock.onEmbedding(/product.*description/, {
+  embedding: [0.9, -0.1, 0.5, 0.3, 0.2],
+});
+```
+### Structured output / JSON mode
+```typescript
+// onJsonOutput auto-sets responseFormat: "json_object" and stringifies objects
+mock.onJsonOutput("extract entities", {
+  entities: [
+    { name: "Acme Corp", type: "company" },
+    { name: "Jane Doe", type: "person" },
+  ],
+});
+// Equivalent manual form:
+mock.addFixture({
+  match: { userMessage: "extract entities", responseFormat: "json_object" },
+  response: { content: '{"entities":[...]}' },
+});
+```
+### Sequential responses (same match, different responses)
+```typescript
+// First call returns tool call, second returns text
+mock.on(
+  { userMessage: "status", sequenceIndex: 0 },
+  { toolCalls: [{ name: "check_status", arguments: "{}" }] },
+);
+mock.on({ userMessage: "status", sequenceIndex: 1 }, { content: "All systems operational." });
+```
+Match counts are tracked per fixture group and reset with `reset()` or `resetMatchCounts()`.
+### Streaming physics (realistic timing)
+```typescript
+mock.onMessage(
+  "tell me a story",
+  { content: "Once upon a time..." },
+  {
+    streamingProfile: {
+      ttft: 200, // 200ms before first token
+      tps: 30, // 30 tokens per second after that
+      jitter: 0.1, // ±10% random variance
+    },
+  },
+);
+```
+### Predicate-based routing (same user message, different context)
+Common in supervisor/orchestrator patterns where the system prompt changes:
+```typescript
+mock.addFixture({
+  match: {
+    predicate: (req) => {
+      const sys = req.messages.find((m) => m.role === "system")?.content ?? "";
+      return typeof sys === "string" && sys.includes("Flights found: false");
+    },
+  },
+  response: { toolCalls: [{ name: "search_flights", arguments: "{}" }] },
+});
+```
+### Catch-all (always add one)
+Prevents unmatched requests from returning 404 and crashing the test:
+```typescript
+mock.addFixture({
+  match: { predicate: () => true },
+  response: { content: "I understand. How can I help?" },
+});
+```
+### Tool result catch-all with prependFixture
+Must go at the front so it matches before substring-based fixtures:
+```typescript
+mock.prependFixture({
+  match: { predicate: (req) => req.messages.at(-1)?.role === "tool" },
+  response: { content: "Done!" },
+});
+```
+### Stream interruption simulation (v1.3.0+)
+```typescript
+mock.onMessage(
+  "long response",
+  { content: "This will be cut short..." },
+  {
+    truncateAfterChunks: 3, // Stop after 3 SSE chunks
+    disconnectAfterMs: 500, // Or disconnect after 500ms
+  },
+);
+```
+### Chaos testing (probabilistic failures)
+```typescript
+mock.addFixture({
+  match: { userMessage: "flaky" },
+  response: { content: "Sometimes works!" },
+  chaos: { dropRate: 0.3 },
+});
+```
+30% of requests matching this fixture will get a 500 error instead of the response. You can also use `malformedRate` (garbled JSON) or `disconnectRate` (connection dropped mid-stream).
+Server-level chaos applies to ALL requests:
+```typescript
+mock.setChaos({ dropRate: 0.1 }); // 10% of all requests fail
+mock.clearChaos(); // Remove server-level chaos
+```
+### Error injection (one-shot)
+```typescript
+mock.nextRequestError(429, { message: "Rate limited", type: "rate_limit_error" });
+// Next request gets 429, then fixture auto-removes itself
+```
+### JSON fixture files
+```json
+{
+  "fixtures": [
+    {
+      "match": { "userMessage": "hello" },
+      "response": { "content": "Hi!" }
+    },
+    {
+      "match": { "inputText": "search query" },
+      "response": { "embedding": [0.1, 0.2, 0.3] }
+    },
+    {
+      "match": { "userMessage": "status", "sequenceIndex": 0 },
+      "response": { "content": "First response" }
+    }
+  ]
+}
+```
+JSON files cannot use `RegExp` or `predicate` — those are code-only features. `streamingProfile` is supported in JSON fixture files.
+Load with `mock.loadFixtureFile("./fixtures/greetings.json")` or `mock.loadFixtureDir("./fixtures/")`.
+## API Endpoints
+All providers share the same fixture pool — write fixtures once, they work for any endpoint.
+| Endpoint                                                                                 | Provider      | Protocol  |
+| ---------------------------------------------------------------------------------------- | ------------- | --------- |
+| `POST /v1/chat/completions`                                                              | OpenAI        | HTTP      |
+| `POST /v1/responses`                                                                     | OpenAI        | HTTP + WS |
+| `POST /v1/messages`                                                                      | Anthropic     | HTTP      |
+| `POST /v1/embeddings`                                                                    | OpenAI        | HTTP      |
+| `POST /v1beta/models/{model}:{method}`                                                   | Google Gemini | HTTP      |
+| `POST /model/{modelId}/invoke`                                                           | AWS Bedrock   | HTTP      |
+| `POST /openai/deployments/{id}/chat/completions`                                         | Azure OpenAI  | HTTP      |
+| `POST /openai/deployments/{id}/embeddings`                                               | Azure OpenAI  | HTTP      |
+| `GET /health`                                                                            | —             | HTTP      |
+| `GET /ready`                                                                             | —             | HTTP      |
+| `POST /model/{modelId}/invoke-with-response-stream`                                      | AWS Bedrock   | HTTP      |
+| `POST /model/{modelId}/converse`                                                         | AWS Bedrock   | HTTP      |
+| `POST /model/{modelId}/converse-stream`                                                  | AWS Bedrock   | HTTP      |
+| `POST /v1/projects/{p}/locations/{l}/publishers/google/models/{m}:generateContent`       | Vertex AI     | HTTP      |
+| `POST /v1/projects/{p}/locations/{l}/publishers/google/models/{m}:streamGenerateContent` | Vertex AI     | HTTP      |
+| `POST /api/chat`                                                                         | Ollama        | HTTP      |
+| `POST /api/generate`                                                                     | Ollama        | HTTP      |
+| `GET /api/tags`                                                                          | Ollama        | HTTP      |
+| `POST /v2/chat`                                                                          | Cohere        | HTTP      |
+| `GET /metrics`                                                                           | —             | HTTP      |
+| `GET /v1/models`                                                                         | OpenAI-compat | HTTP      |
+| `WS /v1/responses`                                                                       | OpenAI        | WebSocket |
+| `WS /v1/realtime`                                                                        | OpenAI        | WebSocket |
+| `WS /ws/google.ai...BidiGenerateContent`                                                 | Gemini Live   | WebSocket |
+## Critical Gotchas
+1. **Order matters** — first match wins. Specific fixtures before general ones. Use `prependFixture()` to force priority.
+2. **`arguments` must be a JSON string** — `"arguments": "{\"key\":\"value\"}"` not `"arguments": {"key":"value"}`. The type system enforces this but JSON fixtures can get it wrong silently.
+3. **Latency is per-chunk, not total** — `latency: 100` means 100ms between each SSE chunk, not 100ms total response time. To simulate a stream that is interrupted rather than merely slow, use `truncateAfterChunks` and `disconnectAfterMs` instead (added in v1.3.0).
+4. **`streamingProfile` takes precedence over `latency`** — when both are set on a fixture, `streamingProfile` controls timing. Use one or the other.
+5. **Tool result messages don't change the user message** — after a tool call, the client sends the same conversation + tool result. Matching on `userMessage` will hit the SAME fixture again → infinite loop. Always use `predicate` checking `role === "tool"` for tool results.
+6. **`clearFixtures()` preserves the array reference** — uses `.length = 0`, not reassignment. The running server reads the same array object.
+7. **Journal records everything** — including 404 "no match" responses. Use `mock.getLastRequest()` to debug mismatches.
+8. **All providers share fixtures** — a fixture matching "hello" works whether the request comes via `/v1/chat/completions` (OpenAI), `/v1/messages` (Anthropic), or the Gemini, Bedrock, Azure OpenAI, Vertex AI, Ollama, or Cohere endpoints.
+9. **WebSocket uses the same fixture pool** — no special setup needed for WebSocket-based APIs (OpenAI Responses WS, Realtime, Gemini Live).
+10. **Embeddings auto-generate if no fixture matches** — deterministic vectors are generated from the input text hash. You don't need a catch-all for embedding requests.
+11. **Sequential response counts are tracked per fixture group** — a group is all fixtures sharing the same non-`sequenceIndex` match fields. The count increments after each match of any fixture in that group, and counts reset with `reset()` or `resetMatchCounts()`.
+12. **Bedrock uses Anthropic Messages format internally** — the adapter normalizes Bedrock requests to `ChatCompletionRequest`, so the same fixtures work. Bedrock supports both non-streaming (`/invoke`, `/converse`) and streaming (`/invoke-with-response-stream`, `/converse-stream`) endpoints.
+13. **Azure OpenAI routes through the same handlers** — `/openai/deployments/{id}/chat/completions` maps to the completions handler, `/openai/deployments/{id}/embeddings` maps to the embeddings handler. Fixtures work unchanged.
+14. **Ollama defaults to streaming** — opposite of OpenAI. Set `stream: false` explicitly in the request for non-streaming responses.
+15. **Ollama tool call `arguments` is an object, not a JSON string** — unlike OpenAI where `arguments` is a JSON string, Ollama sends and expects a plain object.
+16. **Bedrock streaming uses binary Event Stream format** — not SSE. The `invoke-with-response-stream` and `converse-stream` endpoints use AWS Event Stream binary encoding.
+17. **Vertex AI routes to the same handler as consumer Gemini** — the same fixtures work for both Vertex AI (`/v1/projects/.../models/{m}:generateContent`) and consumer Gemini (`/v1beta/models/{model}:generateContent`).
+18. **Cohere requires `model` field** — returns 400 if `model` is missing from the request body.
+## Mount & Composition
+### mount() API
+Mount additional mock services onto a running LLMock server. All services share one port, one health endpoint, and one request journal.
+```typescript
+const llm = new LLMock({ port: 5555 });
+llm.mount("/mcp", mcpMock); // MCP tools at /mcp
+llm.mount("/a2a", a2aMock); // A2A agents at /a2a
+llm.mount("/vector", vectorMock); // Vector DB at /vector
+await llm.start();
+```
+Any object implementing the `Mountable` interface (a `handleRequest` method that returns `boolean`) can be mounted. Path prefixes are stripped before the service sees the request — `/mcp/tools/list` arrives as `/tools/list`.
+### createMockSuite()
+Unified lifecycle for LLMock + mounted services:
+```typescript
+import { createMockSuite } from "@copilotkit/aimock";
+const suite = createMockSuite({
+  port: 0,
+  fixtures: "./fixtures",
+  services: { "/mcp": mcpMock, "/a2a": a2aMock },
+});
+await suite.start();
+// suite.llm — the LLMock instance
+// suite.url — base URL
+afterEach(() => suite.reset()); // resets everything
+afterAll(() => suite.stop());
+```
+### aimock CLI config file
+The `aimock` CLI reads a JSON config and serves all services on one port:
+```bash
+aimock --config aimock.json --port 4010
+```
+Config format:
+```json
+{
+  "llm": {
+    "fixtures": "./fixtures",
+    "latency": 0,
+    "metrics": true
+  },
+  "services": {
+    "/mcp": { "type": "mcp", "tools": "./mcp-tools.json" },
+    "/a2a": { "type": "a2a", "agents": "./a2a-agents.json" }
+  }
+}
+```
+## VectorMock
+Mock vector database server for testing RAG pipelines. Supports Pinecone, Qdrant, and ChromaDB API formats.
+```typescript
+import { VectorMock } from "@copilotkit/aimock";
+const vector = new VectorMock();
+// Create a collection and register query results
+vector.addCollection("docs", { dimension: 1536 });
+vector.onQuery("docs", [
+  { id: "doc-1", score: 0.95, metadata: { title: "Getting Started" } },
+  { id: "doc-2", score: 0.87, metadata: { title: "API Reference" } },
+]);
+// Upsert vectors
+vector.upsert("docs", [
+  { id: "v1", values: [0.1, 0.2, ...], metadata: { title: "Intro" } },
+]);
+// Dynamic query handler
+vector.onQuery("docs", (query) => {
+  return [{ id: "result", score: 1.0, metadata: { topK: query.topK } }];
+});
+// Standalone or mounted
+const url = await vector.start();
+// Or: llm.mount("/vector", vector);
+```
+### VectorMock endpoints
+| Provider | Endpoints                                                                                                                                |
+| -------- | ---------------------------------------------------------------------------------------------------------------------------------------- |
+| Pinecone | `POST /query`, `POST /vectors/upsert`, `POST /vectors/delete`, `GET /describe-index-stats`                                               |
+| Qdrant   | `POST /collections/{name}/points/search`, `PUT /collections/{name}/points`, `POST /collections/{name}/points/delete`                     |
+| ChromaDB | `POST /api/v1/collections/{id}/query`, `POST /api/v1/collections/{id}/add`, `GET /api/v1/collections`, `DELETE /api/v1/collections/{id}` |
+## Service Mocks (Search / Rerank / Moderation)
+Built-in mocks for common AI-adjacent services. Registered on the LLMock instance directly — no separate server needed.
+### Search (Tavily-compatible)
+```typescript
+// POST /search — matches request `query` field
+mock.onSearch("weather", [
+  { title: "Weather Report", url: "https://example.com", content: "Sunny today" },
+]);
+mock.onSearch(/stock\s+price/i, [
+  { title: "ACME Stock", url: "https://example.com", content: "$42", score: 0.95 },
+]);
+```
+### Rerank (Cohere-compatible)
+```typescript
+// POST /v2/rerank — matches request `query` field
+mock.onRerank("machine learning", [
+  { index: 0, relevance_score: 0.99 },
+  { index: 2, relevance_score: 0.85 },
+]);
+```
+### Moderation (OpenAI-compatible)
+```typescript
+// POST /v1/moderations — matches request `input` field
+mock.onModerate("violent", {
+  flagged: true,
+  categories: { violence: true, hate: false },
+  category_scores: { violence: 0.95, hate: 0.01 },
+});
+// Catch-all — everything passes
+mock.onModerate(/.*/, { flagged: false, categories: {} });
+```
+### Pattern matching
+All three services use the same matching logic:
+- **String patterns** — case-insensitive substring match
+- **RegExp patterns** — full regex test
+- **First match wins** — register specific patterns before catch-alls
+## Debugging Fixture Mismatches
+When a fixture doesn't match:
+1. **Inspect what the server received**: `mock.getLastRequest()` → check `body.messages` array
+2. **Check fixture order**: `mock.getFixtures()` returns fixtures in registration order
+3. **For `userMessage`**: the pattern is matched as a substring (not an exact match) against the LAST `role: "user"` message only
+4. **Check the journal**: `mock.getRequests()` shows all requests including which fixture matched (or `null` for 404)
+## E2E Test Setup Pattern
+```typescript
+import { LLMock } from "@copilotkit/aimock";
+// Setup — port: 0 picks a random available port
+const mock = new LLMock({ port: 0 });
+mock.loadFixtureDir("./fixtures");
+await mock.start();
+process.env.OPENAI_BASE_URL = `${mock.url}/v1`;
+// Per-test cleanup
+afterEach(() => mock.reset()); // clears fixtures, journal, AND match counts
+// Teardown
+afterAll(async () => await mock.stop());
+```
+### Static factory shorthand
+```typescript
+const mock = await LLMock.create({ port: 0 }); // creates + starts in one call
+```
+## API Quick Reference
+| Method                                  | Purpose                                     |
+| --------------------------------------- | ------------------------------------------- |
+| `addFixture(f)`                         | Append fixture (last priority)              |
+| `addFixtures(f[])`                      | Append multiple                             |
+| `prependFixture(f)`                     | Insert at front (highest priority)          |
+| `clearFixtures()`                       | Remove all fixtures                         |
+| `getFixtures()`                         | Read current fixture list                   |
+| `on(match, response, opts?)`            | Shorthand for `addFixture`                  |
+| `onMessage(pattern, response, opts?)`   | Match by user message                       |
+| `onEmbedding(pattern, response, opts?)` | Match by embedding input text               |
+| `onJsonOutput(pattern, json, opts?)`    | Match by user message with `responseFormat` |
+| `onToolCall(name, response, opts?)`     | Match by tool name in `tools[]`             |
+| `onToolResult(id, response, opts?)`     | Match by `tool_call_id`                     |
+| `nextRequestError(status, body?)`       | One-shot error, auto-removes                |
+| `loadFixtureFile(path)`                 | Load JSON fixture file                      |
+| `loadFixtureDir(path)`                  | Load all JSON files in directory            |
+| `start()`                               | Start server, returns URL                   |
+| `stop()`                                | Stop server                                 |
+| `reset()`                               | Clear fixtures + journal + match counts     |
+| `resetMatchCounts()`                    | Clear sequence match counts only            |
+| `getRequests()`                         | All journal entries                         |
+| `getLastRequest()`                      | Most recent journal entry                   |
+| `clearRequests()`                       | Clear journal only                          |
+| `setChaos(opts)`                        | Set server-level chaos rates                |
+| `clearChaos()`                          | Remove server-level chaos                   |
+| `onSearch(pattern, results)`            | Match search requests by query              |
+| `onRerank(pattern, results)`            | Match rerank requests by query              |
+| `onModerate(pattern, result)`           | Match moderation requests by input          |
+| `mount(path, handler)`                  | Mount a Mountable (VectorMock, etc.)        |
+| `url` / `baseUrl`                       | Server URL (throws if not started)          |
+| `port`                                  | Server port number                          |
+Sequential responses use `on()` with `sequenceIndex` in the match — there is no dedicated convenience method.
+## Record-and-Replay (VCR Mode)
+llmock supports a VCR-style record-and-replay workflow: unmatched requests are proxied to real provider APIs, and the responses are saved as standard llmock fixture files for deterministic replay.
+### CLI usage
+```bash
+# Record mode: proxy unmatched requests to real OpenAI and Anthropic APIs
+llmock --record \
+  --provider-openai https://api.openai.com \
+  --provider-anthropic https://api.anthropic.com \
+  -f ./fixtures
+# Strict mode: fail on unmatched requests (no proxying, no catch-all 404)
+llmock --strict -f ./fixtures
+```
+- `--record` enables proxy-on-miss. Requires at least one `--provider-*` flag.
+- `--strict` returns a 503 error, instead of silently returning a 404, when no fixture matches and the request cannot be proxied (no proxy is configured, or the proxy attempt fails). When `--record` is also set, the proxy is still tried first. Use this in CI to prevent unmatched requests from slipping through as silent 404s.
+- Provider flags: `--provider-openai`, `--provider-anthropic`, `--provider-gemini`, `--provider-vertexai`, `--provider-bedrock`, `--provider-azure`, `--provider-ollama`, `--provider-cohere`.
+### How it works
+1. **Existing fixtures are served first** — the router checks all loaded fixtures before considering the proxy.
+2. **Misses are proxied** — if no fixture matches and recording is enabled, the request is forwarded to the real provider API. Upstream URL path prefixes are preserved (e.g., `https://gateway.company.com/llm/v1` correctly proxies to `/llm/v1/chat/completions`).
+3. **Request headers are forwarded (auth headers NOT saved)** — client request headers are passed through to the upstream provider, with the exception of hop-by-hop headers and `host`/`content-length`/`cookie`/`accept-encoding`. Auth headers (`Authorization`, `x-api-key`, `api-key`) are forwarded upstream but stripped from the recorded fixture.
+4. **Responses are saved as standard fixtures** — recorded files land in `{fixturePath}/recorded/` and use the same JSON format as hand-written fixtures. Nothing special about them.
+5. **Streaming responses are collapsed** — SSE streams are collapsed into a single text or tool-call response for the fixture. The original streaming format is preserved in the live proxy response.
+6. **Base64 embedding decoding** — when the upstream returns base64-encoded embeddings (the default `encoding_format` in Python's openai SDK), the recorder decodes them into float arrays so fixtures contain readable numeric data instead of opaque base64 strings.
+7. **Loud logging** — every proxy hit logs at `warn` level so you can see exactly which requests are being forwarded.
+### Programmatic API
+```typescript
+const mock = new LLMock({ port: 0 });
+await mock.start();
+// Enable recording at runtime
+mock.enableRecording({
+  providers: {
+    openai: "https://api.openai.com",
+    anthropic: "https://api.anthropic.com",
+  },
+  fixturePath: "./fixtures/recorded",
+});
+// ... run tests that hit real APIs for uncovered cases ...
+// Disable recording (back to fixture-only mode)
+mock.disableRecording();
+```
+### Workflow
+1. **Bootstrap**: Run your test suite with `--record` and provider URLs. All requests that don't match existing fixtures are proxied and recorded.
+2. **Review**: Check the recorded fixtures in `{fixturePath}/recorded/`. Edit or reorganize as needed.
+3. **Lock down**: Run your test suite with `--strict` to ensure every request hits a fixture. No network calls escape.
+4. **Maintain**: When APIs change, delete stale fixtures and re-record.