ai-functions 2.1.3 → 2.3.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.turbo/turbo-build.log +1 -1
- package/CHANGELOG.md +55 -1
- package/README.md +38 -0
- package/dist/ai-promise.d.ts +3 -3
- package/dist/ai-promise.d.ts.map +1 -1
- package/dist/ai-promise.js +135 -64
- package/dist/ai-promise.js.map +1 -1
- package/dist/ai-schemas.d.ts +56 -0
- package/dist/ai-schemas.d.ts.map +1 -0
- package/dist/ai-schemas.js +53 -0
- package/dist/ai-schemas.js.map +1 -0
- package/dist/ai.d.ts +16 -242
- package/dist/ai.d.ts.map +1 -1
- package/dist/ai.js +51 -858
- package/dist/ai.js.map +1 -1
- package/dist/batch/anthropic.d.ts +6 -4
- package/dist/batch/anthropic.d.ts.map +1 -1
- package/dist/batch/anthropic.js +83 -145
- package/dist/batch/anthropic.js.map +1 -1
- package/dist/batch/bedrock.d.ts +8 -30
- package/dist/batch/bedrock.d.ts.map +1 -1
- package/dist/batch/bedrock.js +155 -338
- package/dist/batch/bedrock.js.map +1 -1
- package/dist/batch/cloudflare.d.ts +8 -20
- package/dist/batch/cloudflare.d.ts.map +1 -1
- package/dist/batch/cloudflare.js +68 -189
- package/dist/batch/cloudflare.js.map +1 -1
- package/dist/batch/google.d.ts +6 -20
- package/dist/batch/google.d.ts.map +1 -1
- package/dist/batch/google.js +70 -238
- package/dist/batch/google.js.map +1 -1
- package/dist/batch/index.d.ts +4 -1
- package/dist/batch/index.d.ts.map +1 -1
- package/dist/batch/index.js +4 -1
- package/dist/batch/index.js.map +1 -1
- package/dist/batch/memory.d.ts +1 -1
- package/dist/batch/memory.d.ts.map +1 -1
- package/dist/batch/memory.js +14 -10
- package/dist/batch/memory.js.map +1 -1
- package/dist/batch/openai.d.ts +11 -14
- package/dist/batch/openai.d.ts.map +1 -1
- package/dist/batch/openai.js +52 -156
- package/dist/batch/openai.js.map +1 -1
- package/dist/batch/provider.d.ts +111 -0
- package/dist/batch/provider.d.ts.map +1 -0
- package/dist/batch/provider.js +233 -0
- package/dist/batch/provider.js.map +1 -0
- package/dist/batch-map.d.ts.map +1 -1
- package/dist/batch-map.js +23 -17
- package/dist/batch-map.js.map +1 -1
- package/dist/batch-queue.d.ts +65 -0
- package/dist/batch-queue.d.ts.map +1 -1
- package/dist/batch-queue.js +169 -14
- package/dist/batch-queue.js.map +1 -1
- package/dist/budget.d.ts.map +1 -1
- package/dist/budget.js +27 -14
- package/dist/budget.js.map +1 -1
- package/dist/cache.d.ts +23 -0
- package/dist/cache.d.ts.map +1 -1
- package/dist/cache.js +36 -15
- package/dist/cache.js.map +1 -1
- package/dist/context.d.ts +26 -8
- package/dist/context.d.ts.map +1 -1
- package/dist/context.js +64 -62
- package/dist/context.js.map +1 -1
- package/dist/digital-objects-registry.d.ts +229 -0
- package/dist/digital-objects-registry.d.ts.map +1 -0
- package/dist/digital-objects-registry.js +617 -0
- package/dist/digital-objects-registry.js.map +1 -0
- package/dist/embeddings.d.ts +2 -2
- package/dist/embeddings.d.ts.map +1 -1
- package/dist/errors.d.ts +22 -0
- package/dist/errors.d.ts.map +1 -0
- package/dist/errors.js +35 -0
- package/dist/errors.js.map +1 -0
- package/dist/eval/runner.d.ts +8 -0
- package/dist/eval/runner.d.ts.map +1 -1
- package/dist/eval/runner.js +41 -35
- package/dist/eval/runner.js.map +1 -1
- package/dist/eval-log/in-memory.d.ts +34 -0
- package/dist/eval-log/in-memory.d.ts.map +1 -0
- package/dist/eval-log/in-memory.js +84 -0
- package/dist/eval-log/in-memory.js.map +1 -0
- package/dist/eval-log/index.d.ts +29 -0
- package/dist/eval-log/index.d.ts.map +1 -0
- package/dist/eval-log/index.js +39 -0
- package/dist/eval-log/index.js.map +1 -0
- package/dist/eval-log/types.d.ts +101 -0
- package/dist/eval-log/types.d.ts.map +1 -0
- package/dist/eval-log/types.js +16 -0
- package/dist/eval-log/types.js.map +1 -0
- package/dist/function-registry.d.ts +116 -0
- package/dist/function-registry.d.ts.map +1 -0
- package/dist/function-registry.js +546 -0
- package/dist/function-registry.js.map +1 -0
- package/dist/generate.d.ts +9 -3
- package/dist/generate.d.ts.map +1 -1
- package/dist/generate.js +18 -18
- package/dist/generate.js.map +1 -1
- package/dist/index.d.ts +18 -11
- package/dist/index.d.ts.map +1 -1
- package/dist/index.js +35 -18
- package/dist/index.js.map +1 -1
- package/dist/logger.d.ts +118 -0
- package/dist/logger.d.ts.map +1 -0
- package/dist/logger.js +187 -0
- package/dist/logger.js.map +1 -0
- package/dist/middleware/budget.d.ts +84 -0
- package/dist/middleware/budget.d.ts.map +1 -0
- package/dist/middleware/budget.js +110 -0
- package/dist/middleware/budget.js.map +1 -0
- package/dist/middleware/cache.d.ts +103 -0
- package/dist/middleware/cache.d.ts.map +1 -0
- package/dist/middleware/cache.js +228 -0
- package/dist/middleware/cache.js.map +1 -0
- package/dist/middleware/embed-cache.d.ts +99 -0
- package/dist/middleware/embed-cache.d.ts.map +1 -0
- package/dist/middleware/embed-cache.js +128 -0
- package/dist/middleware/embed-cache.js.map +1 -0
- package/dist/middleware/index.d.ts +11 -0
- package/dist/middleware/index.d.ts.map +1 -0
- package/dist/middleware/index.js +11 -0
- package/dist/middleware/index.js.map +1 -0
- package/dist/middleware/trace.d.ts +103 -0
- package/dist/middleware/trace.d.ts.map +1 -0
- package/dist/middleware/trace.js +176 -0
- package/dist/middleware/trace.js.map +1 -0
- package/dist/primitives.d.ts +120 -1
- package/dist/primitives.d.ts.map +1 -1
- package/dist/primitives.js +398 -26
- package/dist/primitives.js.map +1 -1
- package/dist/retry.d.ts +66 -1
- package/dist/retry.d.ts.map +1 -1
- package/dist/retry.js +115 -8
- package/dist/retry.js.map +1 -1
- package/dist/schema.js +2 -2
- package/dist/schema.js.map +1 -1
- package/dist/telemetry.d.ts +128 -0
- package/dist/telemetry.d.ts.map +1 -0
- package/dist/telemetry.js +285 -0
- package/dist/telemetry.js.map +1 -0
- package/dist/template.d.ts.map +1 -1
- package/dist/template.js +6 -1
- package/dist/template.js.map +1 -1
- package/dist/tool-orchestration.d.ts +66 -4
- package/dist/tool-orchestration.d.ts.map +1 -1
- package/dist/tool-orchestration.js +123 -23
- package/dist/tool-orchestration.js.map +1 -1
- package/dist/type-guards.d.ts +28 -0
- package/dist/type-guards.d.ts.map +1 -0
- package/dist/type-guards.js +29 -0
- package/dist/type-guards.js.map +1 -0
- package/dist/types.d.ts +135 -17
- package/dist/types.d.ts.map +1 -1
- package/dist/types.js +36 -1
- package/dist/types.js.map +1 -1
- package/dist/wrap-for-v3.d.ts +80 -0
- package/dist/wrap-for-v3.d.ts.map +1 -0
- package/dist/wrap-for-v3.js +89 -0
- package/dist/wrap-for-v3.js.map +1 -0
- package/examples/00-quickstart.ts +232 -0
- package/examples/01-rag-chatbot.ts +212 -0
- package/examples/02-multi-agent-research.ts +290 -0
- package/examples/03-email-classification.ts +379 -0
- package/examples/04-content-moderation.ts +400 -0
- package/examples/05-document-extraction.ts +455 -0
- package/examples/06-streaming-chat-nextjs.ts +437 -0
- package/examples/07-cloudflare-worker.ts +483 -0
- package/examples/08-batch-processing.ts +491 -0
- package/examples/09-budget-constrained.ts +527 -0
- package/examples/10-tool-orchestration.ts +565 -0
- package/examples/11-retry-resilience.ts +403 -0
- package/examples/12-caching-strategies.ts +422 -0
- package/examples/README.md +145 -0
- package/package.json +28 -25
- package/src/ai-promise.ts +226 -140
- package/src/ai-schemas.ts +122 -0
- package/src/ai.ts +69 -1176
- package/src/batch/anthropic.ts +96 -161
- package/src/batch/bedrock.ts +203 -454
- package/src/batch/cloudflare.ts +99 -282
- package/src/batch/google.ts +91 -297
- package/src/batch/index.ts +4 -1
- package/src/batch/memory.ts +15 -10
- package/src/batch/openai.ts +65 -193
- package/src/batch/provider.ts +336 -0
- package/src/batch-map.ts +29 -24
- package/src/batch-queue.ts +200 -11
- package/src/budget.ts +31 -18
- package/src/cache.ts +45 -17
- package/src/context.ts +106 -77
- package/src/digital-objects-registry.ts +750 -0
- package/src/errors.ts +37 -0
- package/src/eval/runner.ts +60 -36
- package/src/eval-log/in-memory.ts +90 -0
- package/src/eval-log/index.ts +46 -0
- package/src/eval-log/types.ts +110 -0
- package/src/function-registry.ts +671 -0
- package/src/generate.ts +33 -28
- package/src/index.ts +119 -21
- package/src/logger.ts +232 -0
- package/src/middleware/budget.ts +171 -0
- package/src/middleware/cache.ts +299 -0
- package/src/middleware/embed-cache.ts +195 -0
- package/src/middleware/index.ts +23 -0
- package/src/middleware/trace.ts +248 -0
- package/src/primitives.ts +589 -62
- package/src/retry.ts +144 -18
- package/src/schema.ts +8 -8
- package/src/telemetry.ts +403 -0
- package/src/template.ts +8 -4
- package/src/tool-orchestration.ts +213 -48
- package/src/type-guards.ts +31 -0
- package/src/types.ts +164 -25
- package/src/wrap-for-v3.ts +105 -0
- package/test/ai-promise.test.ts +1080 -0
- package/test/ai-proxy.test.ts +1 -1
- package/test/batch-autosubmit-errors.test.ts +49 -37
- package/test/batch-blog-posts.test.ts +87 -129
- package/test/core-functions.test.ts +183 -579
- package/test/decide.test.ts +154 -322
- package/test/define.test.ts +211 -8
- package/test/digital-objects-registry.test.ts +760 -0
- package/test/embedding-cache-middleware.test.ts +140 -0
- package/test/generate-core.test.ts +140 -229
- package/test/implicit-batch.test.ts +22 -65
- package/test/retry-policy-integration.test.ts +117 -0
- package/test/schema.test.ts +55 -19
- package/test/template.test.ts +1164 -0
- package/test/tool-orchestration.test.ts +270 -0
- package/test/wrap-for-v3.test.ts +612 -0
- package/vitest.config.js +6 -0
- package/vitest.config.ts +20 -0
- package/LICENSE +0 -21
- package/dist/rpc/auth.d.ts +0 -69
- package/dist/rpc/auth.d.ts.map +0 -1
- package/dist/rpc/auth.js +0 -136
- package/dist/rpc/auth.js.map +0 -1
- package/dist/rpc/client.d.ts +0 -62
- package/dist/rpc/client.d.ts.map +0 -1
- package/dist/rpc/client.js +0 -103
- package/dist/rpc/client.js.map +0 -1
- package/dist/rpc/deferred.d.ts +0 -60
- package/dist/rpc/deferred.d.ts.map +0 -1
- package/dist/rpc/deferred.js +0 -96
- package/dist/rpc/deferred.js.map +0 -1
- package/dist/rpc/index.d.ts +0 -22
- package/dist/rpc/index.d.ts.map +0 -1
- package/dist/rpc/index.js +0 -38
- package/dist/rpc/index.js.map +0 -1
- package/dist/rpc/local.d.ts +0 -42
- package/dist/rpc/local.d.ts.map +0 -1
- package/dist/rpc/local.js +0 -50
- package/dist/rpc/local.js.map +0 -1
- package/dist/rpc/server.d.ts +0 -165
- package/dist/rpc/server.d.ts.map +0 -1
- package/dist/rpc/server.js +0 -405
- package/dist/rpc/server.js.map +0 -1
- package/dist/rpc/session.d.ts +0 -32
- package/dist/rpc/session.d.ts.map +0 -1
- package/dist/rpc/session.js +0 -43
- package/dist/rpc/session.js.map +0 -1
- package/dist/rpc/transport.d.ts +0 -306
- package/dist/rpc/transport.d.ts.map +0 -1
- package/dist/rpc/transport.js +0 -731
- package/dist/rpc/transport.js.map +0 -1
- package/src/batch/anthropic.js +0 -256
- package/src/batch/bedrock.js +0 -584
- package/src/batch/cloudflare.js +0 -287
- package/src/batch/google.js +0 -359
- package/src/batch/index.js +0 -30
- package/src/batch/memory.js +0 -187
- package/src/batch/openai.js +0 -402
- package/src/eval/index.js +0 -7
- package/src/eval/models.js +0 -119
- package/src/eval/runner.js +0 -147
- package/test/schema.test.js +0 -96
|
@@ -0,0 +1,248 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* traceMiddleware — emit per-call trace events for `wrapLanguageModel`
|
|
3
|
+
*
|
|
4
|
+
* Wraps `doGenerate` / `doStream` and emits a {@link TraceEvent} on every
|
|
5
|
+
* completion. The sink is opaque (caller supplies `emit`) so this primitive
|
|
6
|
+
* works equally well piping into:
|
|
7
|
+
*
|
|
8
|
+
* - the v3 cascade-walker InvocationEvent stream (round 16+ work to add
|
|
9
|
+
* `'persona-trace'` / `'cascade-trace'` to the union),
|
|
10
|
+
* - an {@link import('../eval-log/index.js').EvalLogStore} for fixture
|
|
11
|
+
* replay,
|
|
12
|
+
* - OpenTelemetry / Datadog / Honeycomb adapters that map the event into
|
|
13
|
+
* a span.
|
|
14
|
+
*
|
|
15
|
+
* **Emit-error tolerance:** if the supplied `emit` throws, we *swallow* the
|
|
16
|
+
* error (with a one-time `console.warn`) so a flaky trace sink can never
|
|
17
|
+
* break the wrapped LLM call. This matches the Evalite v0.19 trace
|
|
18
|
+
* middleware behaviour.
|
|
19
|
+
*
|
|
20
|
+
* Composition note: install **last** so the event sees the final outcome
|
|
21
|
+
* (post-cache, post-budget). The event's `costUsd` field is best-effort —
|
|
22
|
+
* the trace middleware doesn't have direct access to the budget tracker, so
|
|
23
|
+
* the caller can pass a `getCostUsd` resolver if they want costs in the
|
|
24
|
+
* event payload.
|
|
25
|
+
*
|
|
26
|
+
* @packageDocumentation
|
|
27
|
+
*/
|
|
28
|
+
|
|
29
|
+
import type {
|
|
30
|
+
LanguageModelV3CallOptions,
|
|
31
|
+
LanguageModelV3GenerateResult,
|
|
32
|
+
LanguageModelV3Middleware,
|
|
33
|
+
LanguageModelV3StreamPart,
|
|
34
|
+
LanguageModelV3StreamResult,
|
|
35
|
+
LanguageModelV3Usage,
|
|
36
|
+
} from '@ai-sdk/provider'
|
|
37
|
+
|
|
38
|
+
// ============================================================================
|
|
39
|
+
// Types
|
|
40
|
+
// ============================================================================
|
|
41
|
+
|
|
42
|
+
/**
 * Discriminator for the originating call site. Callers inject this via the
 * `kind` option so a single sink can fan events into different downstream
 * streams (persona panel vs. cascade walker vs. ad-hoc test).
 *
 * Any string is accepted. The open-ended arm is written as
 * `string & Record<never, never>` rather than bare `string` because a bare
 * `string` absorbs the literal members, reducing the whole union to `string`
 * and losing editor completion for the well-known kinds.
 */
export type TraceEventKind =
  | 'persona-trace'
  | 'cascade-trace'
  | 'eval-trace'
  | (string & Record<never, never>)
|
|
48
|
+
|
|
49
|
+
/**
 * The record handed to the `emit` sink each time a wrapped call completes.
 *
 * Prompt and response are deliberately flattened to plain strings (rather
 * than the structured V3 prompt / content shapes) so events are cheap to
 * store. Usage is passed through untouched in its V3 shape.
 */
export interface TraceEvent {
  /** Call-site discriminator, copied from the middleware's `kind` option. */
  kind: TraceEventKind
  /** The wrapped model's `modelId`. */
  model: string
  /** Flattened prompt text, one line per message, each prefixed with its role. */
  prompt: string
  /** Flattened response text (for streams: the concatenated text deltas). */
  response: string
  /**
   * Raw V3 usage as reported by the model. `undefined` for a stream that
   * closed without a `finish` part.
   */
  usage: LanguageModelV3Usage | undefined
  /**
   * Cost in USD. Only populated when the middleware was given a
   * `getCostUsd` resolver; the middleware does not compute cost itself.
   */
  costUsd?: number
  /** Wall-clock milliseconds from just before the call until completion. */
  durationMs: number
  /** Optional caller-supplied tags for downstream filtering. */
  tags?: Record<string, string>
}
|
|
73
|
+
|
|
74
|
+
/** Configuration accepted by {@link traceMiddleware}. */
export interface TraceMiddlewareOptions {
  /**
   * Destination for trace events. May be sync or async. Anything it throws
   * (or rejects with) is caught by the middleware and reported through a
   * single `console.warn`, so an unreliable sink cannot fail the wrapped
   * LLM call.
   */
  emit: (event: TraceEvent) => void | Promise<void>
  /**
   * Value written to every event's `kind` field. When omitted the
   * middleware uses `'eval-trace'`.
   */
  kind?: TraceEventKind
  /**
   * Optional pricing hook. When present it is invoked with the model id and
   * the V3 usage (which may be `undefined`), and its return value becomes
   * `event.costUsd`. Intended for callers that already hold a pricing table
   * elsewhere (e.g. alongside a budget tracker) and want cost recorded on
   * the trace event itself.
   */
  getCostUsd?: (modelId: string, usage: LanguageModelV3Usage | undefined) => number
  /** Optional tags attached, as-is, to every emitted event. */
  tags?: Record<string, string>
}
|
|
96
|
+
|
|
97
|
+
// ============================================================================
|
|
98
|
+
// Helpers
|
|
99
|
+
// ============================================================================
|
|
100
|
+
|
|
101
|
+
/**
 * Collapse a structured V3 prompt into one newline-separated string.
 *
 * Each message becomes a single line of the form `[role] text`:
 * - system messages and any message whose content is already a string are
 *   rendered verbatim;
 * - array content is rendered part by part, keeping the text of `text`
 *   parts and replacing every other part with a `[part-type]` marker, with
 *   parts separated by a single space;
 * - messages whose content is neither a string nor an array are skipped.
 */
function stringifyPrompt(params: LanguageModelV3CallOptions): string {
  const lines: string[] = []
  for (const message of params.prompt) {
    const label = `[${message.role}]`
    if (message.role === 'system' || typeof message.content === 'string') {
      lines.push(`${label} ${message.content}`)
      continue
    }
    if (!Array.isArray(message.content)) continue

    const pieces: string[] = []
    for (const piece of message.content) {
      // Only text is kept in full; everything else is reduced to its type tag.
      pieces.push(piece.type === 'text' ? piece.text : `[${piece.type}]`)
    }
    lines.push(`${label} ${pieces.join(' ')}`)
  }
  return lines.join('\n')
}
|
|
129
|
+
|
|
130
|
+
/**
 * Collapse a V3 generate result's `content` array into one string.
 *
 * `text` parts contribute their text, `reasoning` parts contribute their
 * text prefixed with `[reasoning] `, and every other part type is reduced
 * to a `[part-type]` marker. Pieces are concatenated with no separator.
 */
function stringifyContent(content: LanguageModelV3GenerateResult['content']): string {
  return content
    .map((item) => {
      switch (item.type) {
        case 'text':
          return item.text
        case 'reasoning':
          return `[reasoning] ${item.text}`
        default:
          return `[${item.type}]`
      }
    })
    .join('')
}
|
|
144
|
+
|
|
145
|
+
// Module-wide latch: set the first time any sink fails so the warning below
// is printed at most once per process.
let _hasWarnedEmit = false

/**
 * Invoke the caller's sink without letting it fail the surrounding call.
 *
 * Awaits `emit(event)`; a synchronous throw or a rejected promise is caught
 * here and never propagated. The first failure is reported via
 * `console.warn`; all later failures are dropped silently.
 */
async function safeEmit(emit: TraceMiddlewareOptions['emit'], event: TraceEvent): Promise<void> {
  try {
    await emit(event)
    return
  } catch (err) {
    if (_hasWarnedEmit) return
    _hasWarnedEmit = true
    const detail = err instanceof Error ? err.message : String(err)
    // eslint-disable-next-line no-console
    console.warn(
      `[ai-functions/traceMiddleware] emit() threw — subsequent emit errors will be silenced. ${detail}`
    )
  }
}
|
|
162
|
+
|
|
163
|
+
// ============================================================================
|
|
164
|
+
// Middleware
|
|
165
|
+
// ============================================================================
|
|
166
|
+
|
|
167
|
+
/**
 * Build a trace middleware for `wrapLanguageModel`. Emits a
 * {@link TraceEvent} on every successful `doGenerate` / `doStream`
 * completion.
 *
 * Failure isolation: nothing supplied through `options` can break the
 * wrapped LLM call.
 * - Errors from `emit` are swallowed by `safeEmit` (one-time warn).
 * - Errors from `getCostUsd` are caught here (one-time warn per middleware
 *   instance) and the event is emitted without `costUsd`.
 *
 * Errors thrown by the model itself (`doGenerate` / `doStream`) propagate
 * unchanged and produce no event.
 *
 * Streaming: the event is emitted when the stream closes normally. The
 * response is the concatenation of `text-delta` parts and usage is taken
 * from the `finish` part. Emission is fire-and-forget so a slow sink does
 * not delay stream close.
 *
 * @param options - Sink, event kind, optional cost resolver and tags.
 * @returns A V3 language-model middleware.
 *
 * @example
 * ```ts
 * import { wrapLanguageModel } from 'ai'
 * import { traceMiddleware, getEvalLogStore } from 'ai-functions'
 *
 * const store = getEvalLogStore()
 * const model = wrapLanguageModel({
 *   model: openai('gpt-4o'),
 *   middleware: traceMiddleware({
 *     kind: 'cascade-trace',
 *     emit: (event) => store.record({ ...event, costUsd: event.costUsd ?? 0 }),
 *   }),
 * })
 * ```
 */
export function traceMiddleware(options: TraceMiddlewareOptions): LanguageModelV3Middleware {
  const { emit, kind = 'eval-trace', getCostUsd, tags } = options

  // Latch so a persistently failing cost resolver warns once, not per call.
  let hasWarnedCost = false

  /**
   * Assemble the event for one completed call. Optional keys are only set
   * when they apply, so absent values never appear as explicit `undefined`.
   */
  const buildEvent = (
    modelId: string,
    params: LanguageModelV3CallOptions,
    response: string,
    usage: LanguageModelV3Usage | undefined,
    durationMs: number
  ): TraceEvent => {
    const event: TraceEvent = {
      kind,
      model: modelId,
      prompt: stringifyPrompt(params),
      response,
      usage,
      durationMs,
    }
    if (getCostUsd !== undefined) {
      try {
        event.costUsd = getCostUsd(modelId, usage)
      } catch (err) {
        // The resolver is caller code; a bug in it must not fail a model
        // call that already succeeded. Cost is best-effort, so drop it.
        if (!hasWarnedCost) {
          hasWarnedCost = true
          // eslint-disable-next-line no-console
          console.warn(
            `[ai-functions/traceMiddleware] getCostUsd() threw — costUsd omitted; subsequent resolver errors will be silenced. ${
              err instanceof Error ? err.message : String(err)
            }`
          )
        }
      }
    }
    if (tags !== undefined) event.tags = tags
    return event
  }

  return {
    specificationVersion: 'v3',
    async wrapGenerate({ doGenerate, params, model }) {
      const start = Date.now()
      const result = await doGenerate()
      const durationMs = Date.now() - start
      const event = buildEvent(
        model.modelId,
        params,
        stringifyContent(result.content),
        result.usage,
        durationMs
      )
      await safeEmit(emit, event)
      return result
    },
    async wrapStream({ doStream, params, model }) {
      const start = Date.now()
      const result = await doStream()
      const modelId = model.modelId
      let finalUsage: LanguageModelV3Usage | undefined
      const collected: string[] = []
      const transformedStream = result.stream.pipeThrough(
        new TransformStream<LanguageModelV3StreamPart, LanguageModelV3StreamPart>({
          transform(chunk, controller) {
            // Observe only; every chunk is forwarded unchanged.
            if (chunk.type === 'text-delta') collected.push(chunk.delta)
            else if (chunk.type === 'finish') finalUsage = chunk.usage
            controller.enqueue(chunk)
          },
          flush() {
            const event = buildEvent(
              modelId,
              params,
              collected.join(''),
              finalUsage,
              Date.now() - start
            )
            // Fire-and-forget: flush() could return this promise and the
            // stream would wait for it, but we deliberately don't so a slow
            // sink never delays stream close. safeEmit never rejects.
            void safeEmit(emit, event)
          },
        })
      )
      const wrapped: LanguageModelV3StreamResult = {
        ...result,
        stream: transformedStream,
      }
      return wrapped
    },
  }
}
|