@hebo-ai/gateway 0.9.2 → 0.9.4
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/config.d.ts +2 -0
- package/dist/config.js +125 -0
- package/dist/endpoints/chat-completions/converters.d.ts +26 -0
- package/dist/endpoints/chat-completions/converters.js +525 -0
- package/dist/endpoints/chat-completions/handler.d.ts +2 -0
- package/dist/endpoints/chat-completions/handler.js +152 -0
- package/dist/endpoints/chat-completions/index.d.ts +4 -0
- package/dist/endpoints/chat-completions/index.js +4 -0
- package/dist/endpoints/chat-completions/otel.d.ts +5 -0
- package/dist/endpoints/chat-completions/otel.js +177 -0
- package/dist/endpoints/chat-completions/schema.d.ts +1170 -0
- package/dist/endpoints/chat-completions/schema.js +252 -0
- package/dist/endpoints/conversations/converters.d.ts +8 -0
- package/dist/endpoints/conversations/converters.js +29 -0
- package/dist/endpoints/conversations/handler.d.ts +2 -0
- package/dist/endpoints/conversations/handler.js +259 -0
- package/dist/endpoints/conversations/index.d.ts +3 -0
- package/dist/endpoints/conversations/index.js +3 -0
- package/dist/endpoints/conversations/schema.d.ts +1511 -0
- package/dist/endpoints/conversations/schema.js +74 -0
- package/dist/endpoints/conversations/storage/dialects/greptime.d.ts +10 -0
- package/dist/endpoints/conversations/storage/dialects/greptime.js +87 -0
- package/dist/endpoints/conversations/storage/dialects/mysql.d.ts +12 -0
- package/dist/endpoints/conversations/storage/dialects/mysql.js +118 -0
- package/dist/endpoints/conversations/storage/dialects/postgres.d.ts +16 -0
- package/dist/endpoints/conversations/storage/dialects/postgres.js +185 -0
- package/dist/endpoints/conversations/storage/dialects/sqlite.d.ts +11 -0
- package/dist/endpoints/conversations/storage/dialects/sqlite.js +176 -0
- package/dist/endpoints/conversations/storage/dialects/types.d.ts +42 -0
- package/dist/endpoints/conversations/storage/dialects/types.js +0 -0
- package/dist/endpoints/conversations/storage/dialects/utils.d.ts +25 -0
- package/dist/endpoints/conversations/storage/dialects/utils.js +80 -0
- package/dist/endpoints/conversations/storage/memory.d.ts +25 -0
- package/dist/endpoints/conversations/storage/memory.js +200 -0
- package/dist/endpoints/conversations/storage/sql.d.ts +33 -0
- package/dist/endpoints/conversations/storage/sql.js +276 -0
- package/dist/endpoints/conversations/storage/types.d.ts +39 -0
- package/dist/endpoints/conversations/storage/types.js +0 -0
- package/dist/endpoints/embeddings/converters.d.ts +10 -0
- package/dist/endpoints/embeddings/converters.js +31 -0
- package/dist/endpoints/embeddings/handler.d.ts +2 -0
- package/dist/endpoints/embeddings/handler.js +99 -0
- package/dist/endpoints/embeddings/index.d.ts +4 -0
- package/dist/endpoints/embeddings/index.js +4 -0
- package/dist/endpoints/embeddings/otel.d.ts +5 -0
- package/dist/endpoints/embeddings/otel.js +29 -0
- package/dist/endpoints/embeddings/schema.d.ts +44 -0
- package/dist/endpoints/embeddings/schema.js +29 -0
- package/dist/endpoints/models/converters.d.ts +6 -0
- package/dist/endpoints/models/converters.js +42 -0
- package/dist/endpoints/models/handler.d.ts +2 -0
- package/dist/endpoints/models/handler.js +29 -0
- package/dist/endpoints/models/index.d.ts +3 -0
- package/dist/endpoints/models/index.js +3 -0
- package/dist/endpoints/models/schema.d.ts +42 -0
- package/dist/endpoints/models/schema.js +31 -0
- package/dist/endpoints/responses/converters.d.ts +17 -0
- package/dist/endpoints/responses/converters.js +1037 -0
- package/dist/endpoints/responses/handler.d.ts +2 -0
- package/dist/endpoints/responses/handler.js +141 -0
- package/dist/endpoints/responses/index.d.ts +4 -0
- package/dist/endpoints/responses/index.js +4 -0
- package/dist/endpoints/responses/otel.d.ts +6 -0
- package/dist/endpoints/responses/otel.js +225 -0
- package/dist/endpoints/responses/schema.d.ts +2109 -0
- package/dist/endpoints/responses/schema.js +314 -0
- package/dist/endpoints/shared/converters.d.ts +56 -0
- package/dist/endpoints/shared/converters.js +180 -0
- package/dist/endpoints/shared/schema.d.ts +70 -0
- package/dist/endpoints/shared/schema.js +46 -0
- package/dist/errors/ai-sdk.d.ts +2 -0
- package/dist/errors/ai-sdk.js +52 -0
- package/dist/errors/gateway.d.ts +5 -0
- package/dist/errors/gateway.js +13 -0
- package/dist/errors/openai.d.ts +15 -0
- package/dist/errors/openai.js +40 -0
- package/dist/errors/utils.d.ts +24 -0
- package/dist/errors/utils.js +46 -0
- package/dist/gateway.d.ts +11 -0
- package/dist/gateway.js +44 -0
- package/dist/index.d.ts +11 -0
- package/dist/index.js +10 -0
- package/dist/lifecycle.d.ts +3 -0
- package/dist/lifecycle.js +114 -0
- package/dist/logger/default.d.ts +4 -0
- package/dist/logger/default.js +81 -0
- package/dist/logger/index.d.ts +11 -0
- package/dist/logger/index.js +25 -0
- package/dist/middleware/common.d.ts +12 -0
- package/dist/middleware/common.js +146 -0
- package/dist/middleware/debug.d.ts +3 -0
- package/dist/middleware/debug.js +27 -0
- package/dist/middleware/matcher.d.ts +28 -0
- package/dist/middleware/matcher.js +118 -0
- package/dist/middleware/utils.d.ts +2 -0
- package/dist/middleware/utils.js +24 -0
- package/dist/models/amazon/index.d.ts +2 -0
- package/dist/models/amazon/index.js +2 -0
- package/dist/models/amazon/middleware.d.ts +3 -0
- package/dist/models/amazon/middleware.js +69 -0
- package/dist/models/amazon/presets.d.ts +345 -0
- package/dist/models/amazon/presets.js +80 -0
- package/dist/models/anthropic/index.d.ts +2 -0
- package/dist/models/anthropic/index.js +2 -0
- package/dist/models/anthropic/middleware.d.ts +5 -0
- package/dist/models/anthropic/middleware.js +128 -0
- package/dist/models/anthropic/presets.d.ts +711 -0
- package/dist/models/anthropic/presets.js +140 -0
- package/dist/models/catalog.d.ts +4 -0
- package/dist/models/catalog.js +8 -0
- package/dist/models/cohere/index.d.ts +2 -0
- package/dist/models/cohere/index.js +2 -0
- package/dist/models/cohere/middleware.d.ts +3 -0
- package/dist/models/cohere/middleware.js +62 -0
- package/dist/models/cohere/presets.d.ts +411 -0
- package/dist/models/cohere/presets.js +134 -0
- package/dist/models/google/index.d.ts +2 -0
- package/dist/models/google/index.js +2 -0
- package/dist/models/google/middleware.d.ts +8 -0
- package/dist/models/google/middleware.js +118 -0
- package/dist/models/google/presets.d.ts +815 -0
- package/dist/models/google/presets.js +184 -0
- package/dist/models/meta/index.d.ts +1 -0
- package/dist/models/meta/index.js +1 -0
- package/dist/models/meta/presets.d.ts +483 -0
- package/dist/models/meta/presets.js +105 -0
- package/dist/models/openai/index.d.ts +2 -0
- package/dist/models/openai/index.js +2 -0
- package/dist/models/openai/middleware.d.ts +4 -0
- package/dist/models/openai/middleware.js +89 -0
- package/dist/models/openai/presets.d.ts +1319 -0
- package/dist/models/openai/presets.js +277 -0
- package/dist/models/types.d.ts +20 -0
- package/dist/models/types.js +100 -0
- package/dist/models/voyage/index.d.ts +2 -0
- package/dist/models/voyage/index.js +2 -0
- package/dist/models/voyage/middleware.d.ts +2 -0
- package/dist/models/voyage/middleware.js +19 -0
- package/dist/models/voyage/presets.d.ts +436 -0
- package/dist/models/voyage/presets.js +85 -0
- package/dist/providers/anthropic/canonical.d.ts +3 -0
- package/dist/providers/anthropic/canonical.js +9 -0
- package/dist/providers/anthropic/index.d.ts +1 -0
- package/dist/providers/anthropic/index.js +1 -0
- package/dist/providers/bedrock/canonical.d.ts +17 -0
- package/dist/providers/bedrock/canonical.js +64 -0
- package/dist/providers/bedrock/index.d.ts +2 -0
- package/dist/providers/bedrock/index.js +2 -0
- package/dist/providers/bedrock/middleware.d.ts +5 -0
- package/dist/providers/bedrock/middleware.js +133 -0
- package/dist/providers/cohere/canonical.d.ts +3 -0
- package/dist/providers/cohere/canonical.js +17 -0
- package/dist/providers/cohere/index.d.ts +1 -0
- package/dist/providers/cohere/index.js +1 -0
- package/dist/providers/groq/canonical.d.ts +3 -0
- package/dist/providers/groq/canonical.js +12 -0
- package/dist/providers/groq/index.d.ts +2 -0
- package/dist/providers/groq/index.js +2 -0
- package/dist/providers/groq/middleware.d.ts +2 -0
- package/dist/providers/groq/middleware.js +30 -0
- package/dist/providers/openai/canonical.d.ts +3 -0
- package/dist/providers/openai/canonical.js +8 -0
- package/dist/providers/openai/index.d.ts +1 -0
- package/dist/providers/openai/index.js +1 -0
- package/dist/providers/registry.d.ts +24 -0
- package/dist/providers/registry.js +103 -0
- package/dist/providers/types.d.ts +7 -0
- package/dist/providers/types.js +11 -0
- package/dist/providers/vertex/canonical.d.ts +3 -0
- package/dist/providers/vertex/canonical.js +8 -0
- package/dist/providers/vertex/index.d.ts +2 -0
- package/dist/providers/vertex/index.js +2 -0
- package/dist/providers/vertex/middleware.d.ts +2 -0
- package/dist/providers/vertex/middleware.js +47 -0
- package/dist/providers/voyage/canonical.d.ts +3 -0
- package/dist/providers/voyage/canonical.js +7 -0
- package/dist/providers/voyage/index.d.ts +1 -0
- package/dist/providers/voyage/index.js +1 -0
- package/dist/telemetry/ai-sdk.d.ts +2 -0
- package/dist/telemetry/ai-sdk.js +31 -0
- package/dist/telemetry/baggage.d.ts +1 -0
- package/dist/telemetry/baggage.js +24 -0
- package/dist/telemetry/fetch.d.ts +2 -0
- package/dist/telemetry/fetch.js +49 -0
- package/dist/telemetry/gen-ai.d.ts +7 -0
- package/dist/telemetry/gen-ai.js +112 -0
- package/dist/telemetry/http.d.ts +3 -0
- package/dist/telemetry/http.js +54 -0
- package/dist/telemetry/index.d.ts +1 -0
- package/dist/telemetry/index.js +1 -0
- package/dist/telemetry/memory.d.ts +2 -0
- package/dist/telemetry/memory.js +43 -0
- package/dist/telemetry/span.d.ts +13 -0
- package/dist/telemetry/span.js +60 -0
- package/dist/types.d.ts +231 -0
- package/dist/types.js +2 -0
- package/dist/utils/body.d.ts +19 -0
- package/dist/utils/body.js +99 -0
- package/dist/utils/env.d.ts +2 -0
- package/dist/utils/env.js +7 -0
- package/dist/utils/headers.d.ts +4 -0
- package/dist/utils/headers.js +22 -0
- package/dist/utils/preset.d.ts +10 -0
- package/dist/utils/preset.js +41 -0
- package/dist/utils/request.d.ts +2 -0
- package/dist/utils/request.js +43 -0
- package/dist/utils/response.d.ts +6 -0
- package/dist/utils/response.js +55 -0
- package/dist/utils/stream.d.ts +9 -0
- package/dist/utils/stream.js +100 -0
- package/dist/utils/url.d.ts +4 -0
- package/dist/utils/url.js +21 -0
- package/package.json +1 -1
|
@@ -0,0 +1,152 @@
|
|
|
1
|
+
import { generateText, Output, streamText, wrapLanguageModel, } from "ai";
|
|
2
|
+
import * as z from "zod/mini";
|
|
3
|
+
import { GatewayError } from "../../errors/gateway";
|
|
4
|
+
import { winterCgHandler } from "../../lifecycle";
|
|
5
|
+
import { logger } from "../../logger";
|
|
6
|
+
import { modelMiddlewareMatcher } from "../../middleware/matcher";
|
|
7
|
+
import { resolveProvider } from "../../providers/registry";
|
|
8
|
+
import { getGenAiGeneralAttributes, recordTimePerOutputToken, recordTimeToFirstToken, recordTokenUsage, } from "../../telemetry/gen-ai";
|
|
9
|
+
import { addSpanEvent, setSpanAttributes } from "../../telemetry/span";
|
|
10
|
+
import { parseRequestBody } from "../../utils/body";
|
|
11
|
+
import { prepareForwardHeaders } from "../../utils/request";
|
|
12
|
+
import { convertToTextCallOptions, toChatCompletions, toChatCompletionsStream } from "./converters";
|
|
13
|
+
import { getChatRequestAttributes, getChatResponseAttributes } from "./otel";
|
|
14
|
+
import { ChatCompletionsBodySchema, } from "./schema";
|
|
15
|
+
/**
 * Creates the chat-completions endpoint.
 *
 * The inner handler validates the request, resolves the model and provider,
 * converts the body into AI SDK call options and then runs either `streamText`
 * or `generateText`, emitting span events/attributes along the way.
 *
 * @param config Endpoint configuration. `config.hooks` may provide `before`,
 *   `after`, `resolveModelId` and `resolveProvider` callbacks.
 * @returns An object `{ handler }` where `handler` is the inner request handler
 *   passed through `winterCgHandler` together with `config`.
 */
export const chatCompletions = (config) => {
    const lifecycleHooks = config.hooks;

    const handler = async (ctx, cfg) => {
        const startedAt = performance.now();
        ctx.operation = "chat";
        setSpanAttributes({ "gen_ai.operation.name": ctx.operation });
        addSpanEvent("hebo.handler.started");

        // Only POST is accepted; a missing request object is rejected the same way.
        if (ctx.request?.method !== "POST") {
            throw new GatewayError("Method Not Allowed", 405);
        }

        // Read the raw body (size-limited via cfg.maxBodySize), then validate it.
        ctx.body = await parseRequestBody(ctx.request, cfg.maxBodySize);
        logger.trace({ requestId: ctx.requestId, body: ctx.body }, "[chat] ChatCompletionsBody");
        addSpanEvent("hebo.request.deserialized");

        const validation = ChatCompletionsBodySchema.safeParse(ctx.body);
        if (!validation.success) {
            // FUTURE: consider adding body shape to metadata
            throw new GatewayError(z.prettifyError(validation.error), 400, undefined, validation.error);
        }
        ctx.body = validation.data;
        addSpanEvent("hebo.request.parsed");

        // The `before` hook may return a replacement body; it is NOT re-validated here.
        if (lifecycleHooks?.before) {
            const replacedBody = await lifecycleHooks.before(ctx);
            ctx.body = replacedBody ?? ctx.body;
            addSpanEvent("hebo.hooks.before.completed");
        }

        // Model resolution: a hook result wins, otherwise the requested id is used as-is.
        ctx.modelId = ctx.body.model;
        const hookModelId = await lifecycleHooks?.resolveModelId?.(ctx);
        ctx.resolvedModelId = hookModelId ?? ctx.modelId;
        logger.debug(`[chat] resolved ${ctx.modelId} to ${ctx.resolvedModelId}`);
        addSpanEvent("hebo.model.resolved");

        // Provider resolution: a hook result wins, otherwise fall back to the registry.
        const providerOverride = await lifecycleHooks?.resolveProvider?.(ctx);
        ctx.provider =
            providerOverride ??
                resolveProvider({
                    providers: ctx.providers,
                    models: ctx.models,
                    modelId: ctx.resolvedModelId,
                    operation: ctx.operation,
                });
        const baseModel = ctx.provider.languageModel(ctx.resolvedModelId);
        ctx.resolvedProviderId = baseModel.provider;
        logger.debug(`[chat] using ${baseModel.provider} for ${ctx.resolvedModelId}`);
        addSpanEvent("hebo.provider.resolved");

        const signalLevel = cfg.telemetry?.signals?.gen_ai;
        const generalAttrs = getGenAiGeneralAttributes(ctx, signalLevel);
        setSpanAttributes(generalAttrs);

        // Everything except `model` and `stream` is converted into AI SDK call options.
        const { model: _unusedModel, stream: wantsStream, ...callInputs } = ctx.body;
        const callOptions = convertToTextCallOptions(callInputs);
        logger.trace({
            requestId: ctx.requestId,
            options: callOptions,
        }, "[chat] AI SDK options");
        addSpanEvent("hebo.options.prepared");
        setSpanAttributes(getChatRequestAttributes(ctx.body, signalLevel));

        // Wrap the provider model with the middleware matched for this model/provider pair.
        const wrappedModel = wrapLanguageModel({
            model: baseModel,
            middleware: modelMiddlewareMatcher.for(ctx.resolvedModelId, baseModel.provider),
        });

        // "flex" service tier gets its own timeout budget; evaluated lazily at call time.
        const pickTimeoutMs = () => ctx.body.service_tier === "flex" ? cfg.timeouts.flex : cfg.timeouts.normal;

        if (!wantsStream) {
            // ---- Non-streaming path ----
            addSpanEvent("hebo.ai-sdk.started");
            const generated = await generateText({
                model: wrappedModel,
                headers: prepareForwardHeaders(ctx.request),
                abortSignal: ctx.request.signal,
                timeout: pickTimeoutMs(),
                experimental_include: {
                    requestBody: false,
                    responseBody: false,
                },
                // Spread last so converted options take precedence over the keys above.
                ...callOptions,
            });
            logger.trace({ requestId: ctx.requestId, result: generated }, "[chat] AI SDK result");
            addSpanEvent("hebo.ai-sdk.completed");
            // Without streaming, the full call duration is reported as time-to-first-token.
            recordTimeToFirstToken(performance.now() - startedAt, generalAttrs, signalLevel);

            ctx.result = toChatCompletions(generated, ctx.resolvedModelId);
            logger.trace({ requestId: ctx.requestId, result: ctx.result }, "[chat] ChatCompletions");
            addSpanEvent("hebo.result.transformed");

            const responseAttrs = getChatResponseAttributes(ctx.result, signalLevel);
            setSpanAttributes(responseAttrs);
            recordTokenUsage(responseAttrs, generalAttrs, signalLevel);

            if (lifecycleHooks?.after) {
                const replacedResult = await lifecycleHooks.after(ctx);
                ctx.result = replacedResult ?? ctx.result;
                addSpanEvent("hebo.hooks.after.completed");
            }
            recordTimePerOutputToken(startedAt, 0, responseAttrs, generalAttrs, signalLevel);
            return ctx.result;
        }

        // ---- Streaming path ----
        addSpanEvent("hebo.ai-sdk.started");
        // Stays 0 until the first chunk arrives; also fed into the per-output-token metric.
        let firstChunkMs = 0;
        const streamed = streamText({
            model: wrappedModel,
            headers: prepareForwardHeaders(ctx.request),
            abortSignal: ctx.request.signal,
            timeout: {
                totalMs: pickTimeoutMs(),
            },
            onAbort: () => {
                throw new DOMException("The operation was aborted.", "AbortError");
            },
            // Intentionally a no-op callback (kept exactly as in the original build output).
            onError: () => { },
            onChunk: () => {
                if (firstChunkMs) {
                    return;
                }
                firstChunkMs = performance.now() - startedAt;
                recordTimeToFirstToken(firstChunkMs, generalAttrs, signalLevel);
            },
            onFinish: (finished) => {
                addSpanEvent("hebo.ai-sdk.completed");
                const finalCompletion = toChatCompletions(finished, ctx.resolvedModelId);
                logger.trace({ requestId: ctx.requestId, result: finalCompletion }, "[chat] ChatCompletions");
                addSpanEvent("hebo.result.transformed");
                const responseAttrs = getChatResponseAttributes(finalCompletion, signalLevel);
                setSpanAttributes(responseAttrs);
                recordTokenUsage(responseAttrs, generalAttrs, signalLevel);
                recordTimePerOutputToken(startedAt, firstChunkMs, responseAttrs, generalAttrs, signalLevel);
            },
            experimental_include: {
                requestBody: false,
            },
            includeRawChunks: false,
            // Spread last so converted options take precedence over the keys above.
            ...callOptions,
        });
        ctx.result = toChatCompletionsStream(streamed, ctx.resolvedModelId);
        if (lifecycleHooks?.after) {
            const replacedResult = await lifecycleHooks.after(ctx);
            ctx.result = replacedResult ?? ctx.result;
            addSpanEvent("hebo.hooks.after.completed");
        }
        return ctx.result;
    };

    return { handler: winterCgHandler(handler, config) };
};
|
|
@@ -0,0 +1,5 @@
|
|
|
1
|
+
import type { Attributes } from "@opentelemetry/api";
|
|
2
|
+
import { type TelemetrySignalLevel } from "../../types";
|
|
3
|
+
import type { ChatCompletions, ChatCompletionsBody } from "./schema";
|
|
4
|
+
/**
 * Derives span attributes describing a chat-completions request body.
 *
 * @param body The chat-completions request body.
 * @param signalLevel Telemetry signal level; optional.
 * @returns The attributes to attach to the current span.
 */
export declare const getChatRequestAttributes: (body: ChatCompletionsBody, signalLevel?: TelemetrySignalLevel) => Attributes;
|
|
5
|
+
/**
 * Derives span attributes describing a chat-completions response.
 *
 * @param completions The chat-completions response object.
 * @param signalLevel Telemetry signal level; optional.
 * @returns The attributes to attach to the current span.
 */
export declare const getChatResponseAttributes: (completions: ChatCompletions, signalLevel?: TelemetrySignalLevel) => Attributes;
|
|
@@ -0,0 +1,177 @@
|
|
|
1
|
+
import {} from "../../types";
|
|
2
|
+
import { parseDataUrl } from "../../utils/url";
|
|
3
|
+
/**
 * Converts message content into a list of telemetry text parts.
 *
 * @param content A string, an array of content parts, or anything else
 *   (e.g. `null`), which yields no parts.
 * @returns An array of `{ type: "text", content }` objects. A string becomes a
 *   single part; for arrays only entries whose `type` is `"text"` are kept.
 */
const toTextParts = (content) => {
    if (typeof content === "string") {
        return [{ type: "text", content }];
    }
    if (!Array.isArray(content)) {
        return [];
    }
    // `part?.type` tolerates null/primitive entries so that telemetry extraction
    // never throws on a malformed content array.
    return content
        .filter((part) => part?.type === "text")
        .map((part) => ({ type: "text", content: part.text }));
};
|
|
17
|
+
/**
 * Builds a telemetry part standing in for binary content.
 *
 * The payload itself is never included; `content` is always the fixed
 * placeholder string.
 *
 * @param modality Value stored under `modality` (callers in this file pass
 *   "image", "audio" or "file").
 * @param mimeType Optional MIME type; stored as `mime_type` only when truthy.
 * @returns The blob part object.
 */
const toBlobPart = (modality, mimeType) => {
    const blob = { type: "blob", modality, content: "[REDACTED_BINARY_DATA]" };
    return mimeType ? { ...blob, mime_type: mimeType } : blob;
};
|
|
27
|
+
/**
 * Builds the telemetry part for a tool message.
 *
 * @param id The tool call id the response belongs to.
 * @param content A string, or an array of parts whose `text` fields are
 *   concatenated. Any other value (e.g. `null`) produces an empty response.
 * @returns `{ type: "tool_call_response", id, response }`.
 */
const toToolResponsePart = (id, content) => {
    let response = "";
    if (typeof content === "string") {
        response = content;
    }
    else if (Array.isArray(content)) {
        // Missing text (or a null entry) contributes nothing, matching how
        // Array.prototype.join treats undefined/null elements.
        response = content.map((part) => part?.text ?? "").join("");
    }
    return { type: "tool_call_response", id, response };
};
|
|
32
|
+
/**
 * Builds the telemetry parts for an assistant message.
 *
 * Parts are emitted in a fixed order: reasoning (only when `message.reasoning`
 * is a string), then text parts from `message.content`, then one `tool_call`
 * part per entry of `message.tool_calls` (only when that is an array).
 *
 * @param message The assistant message.
 * @returns The ordered list of parts.
 */
const toAssistantParts = (message) => {
    const collected = [];
    const { reasoning } = message;
    if (typeof reasoning === "string") {
        collected.push({ type: "reasoning", content: reasoning });
    }
    collected.push(...toTextParts(message.content));
    const toolCalls = message.tool_calls;
    if (!Array.isArray(toolCalls)) {
        return collected;
    }
    for (const toolCall of toolCalls) {
        const fn = toolCall.function;
        collected.push({
            type: "tool_call",
            id: toolCall.id,
            name: fn.name,
            arguments: fn.arguments,
        });
    }
    return collected;
};
|
|
52
|
+
/**
 * Builds the telemetry parts for a user message.
 *
 * Binary payloads (data-URL images, audio, files) are replaced by blob
 * placeholders; non-data image URLs are kept as `uri` parts.
 *
 * @param content A string or an array of content parts. Any other value
 *   (e.g. `null`) yields no parts.
 * @returns The list of parts, in input order.
 */
const toUserParts = (content) => {
    if (typeof content === "string")
        return [{ type: "text", content }];
    const parts = [];
    // Same tolerance as toTextParts: non-array content produces no parts
    // instead of throwing "not iterable" during telemetry extraction.
    if (!Array.isArray(content))
        return parts;
    for (const part of content) {
        // Skip null/primitive entries; they carry no `type` to dispatch on.
        if (part === null || typeof part !== "object")
            continue;
        switch (part.type) {
            case "text":
                parts.push({ type: "text", content: part.text });
                break;
            case "image_url": {
                const url = part.image_url.url;
                // Case-insensitive "data:" scheme check; inline data is redacted.
                if (url.slice(0, 5).toLowerCase() === "data:") {
                    const { mimeType } = parseDataUrl(url);
                    parts.push(toBlobPart("image", mimeType || undefined));
                }
                else {
                    parts.push({ type: "uri", modality: "image", uri: url });
                }
                break;
            }
            case "input_audio":
                parts.push(toBlobPart("audio", `audio/${part.input_audio.format}`));
                break;
            case "file": {
                const filePart = toBlobPart("file", part.file.media_type);
                if (part.file.filename)
                    filePart["file_name"] = part.file.filename;
                parts.push(filePart);
                break;
            }
            default:
                parts.push({ type: part.type, content: "[UNHANDLED_CONTENT_PART]" });
                break;
        }
    }
    return parts;
};
|
|
89
|
+
/**
 * Converts a chat message into telemetry parts, dispatching on `message.role`.
 *
 * @param message A chat message with a `role` field.
 * @returns The parts for that message; roles other than assistant, tool, user
 *   and system produce a single "[UNHANDLED_ROLE]" placeholder part.
 */
const toMessageParts = (message) => {
    const { role } = message;
    if (role === "assistant") {
        return toAssistantParts(message);
    }
    if (role === "tool") {
        return [toToolResponsePart(message.tool_call_id, message.content)];
    }
    if (role === "user") {
        return toUserParts(message.content);
    }
    // FUTURE: remove once Langfuse supports gen_ai.system_instructions
    // https://github.com/langfuse/langfuse/issues/11607
    if (role === "system") {
        return toTextParts(message.content);
    }
    return [{ type: role, content: "[UNHANDLED_ROLE]" }];
};
|
|
105
|
+
/**
 * Derives span attributes from a chat-completions request body.
 *
 * - No signal level or "off": returns `{}`.
 * - "required": only `gen_ai.request.seed` (when `body.seed` is defined).
 * - Any other level: additionally the sampling/reasoning/stream parameters and
 *   one `gen_ai.request.metadata.<key>` attribute per own metadata entry.
 * - "full": additionally the serialized input messages and tool definitions.
 *
 * Parameters absent from the body are still written with value `undefined`.
 *
 * @param body The chat-completions request body.
 * @param signalLevel Telemetry signal level.
 * @returns The attribute map.
 */
export const getChatRequestAttributes = (body, signalLevel) => {
    if (!signalLevel || signalLevel === "off")
        return {};
    const attrs = {};
    if (body.seed !== undefined) {
        Object.assign(attrs, { "gen_ai.request.seed": body.seed });
    }
    if (signalLevel !== "required") {
        Object.assign(attrs, {
            "gen_ai.request.reasoning.enabled": body.reasoning?.enabled,
            "gen_ai.request.reasoning.effort": body.reasoning?.effort,
            "gen_ai.request.reasoning.max_tokens": body.reasoning?.max_tokens,
            "gen_ai.request.stream": body.stream,
            "gen_ai.request.frequency_penalty": body.frequency_penalty,
            "gen_ai.request.max_tokens": body.max_completion_tokens,
            "gen_ai.request.presence_penalty": body.presence_penalty,
            // A single stop string is normalized to a one-element array.
            "gen_ai.request.stop_sequences": body.stop
                ? Array.isArray(body.stop)
                    ? body.stop
                    : [body.stop]
                : undefined,
            "gen_ai.request.temperature": body.temperature,
            "gen_ai.request.top_p": body.top_p,
        });
        if (body.metadata) {
            // Own entries only: `for...in` would also copy inherited enumerable
            // properties into the span attributes.
            for (const [key, value] of Object.entries(body.metadata)) {
                attrs[`gen_ai.request.metadata.${key}`] = value;
            }
        }
    }
    if (signalLevel === "full") {
        Object.assign(attrs, {
            // FUTURE: move system instructions from messages to here
            // blocker: https://github.com/langfuse/langfuse/issues/11607
            // "gen_ai.system_instructions": inputs.messages
            //   .filter((m) => m.role === "system")
            //   .map((m) => JSON.stringify(toTextPart(m.content))),
            "gen_ai.input.messages": body.messages
                //.filter((m) => m.role !== "system")
                .map((m) => JSON.stringify({ role: m.role, parts: toMessageParts(m) })),
            "gen_ai.tool.definitions": body.tools?.map((toolDefinition) => JSON.stringify(toolDefinition)),
        });
    }
    return attrs;
};
|
|
150
|
+
/**
 * Derives span attributes from a chat-completions response.
 *
 * - No signal level or "off": returns `{}`.
 * - "required": only `gen_ai.response.id`.
 * - Any other level: additionally finish reasons, service tier and token usage.
 * - "full": additionally the serialized output messages.
 *
 * @param completions The chat-completions response object.
 * @param signalLevel Telemetry signal level.
 * @returns The attribute map.
 */
export const getChatResponseAttributes = (completions, signalLevel) => {
    const telemetryDisabled = !signalLevel || signalLevel === "off";
    if (telemetryDisabled) {
        return {};
    }
    const attrs = { "gen_ai.response.id": completions.id };
    if (signalLevel !== "required") {
        const usage = completions.usage;
        attrs["gen_ai.response.finish_reasons"] = completions.choices?.map((choice) => choice.finish_reason);
        attrs["gen_ai.response.service_tier"] = completions.service_tier;
        attrs["gen_ai.usage.total_tokens"] = usage?.total_tokens;
        attrs["gen_ai.usage.input_tokens"] = usage?.prompt_tokens;
        attrs["gen_ai.usage.cache_read.input_tokens"] = usage?.prompt_tokens_details?.cached_tokens;
        attrs["gen_ai.usage.output_tokens"] = usage?.completion_tokens;
        attrs["gen_ai.usage.reasoning.output_tokens"] = usage?.completion_tokens_details?.reasoning_tokens;
    }
    if (signalLevel === "full") {
        // Each choice is serialized to its own JSON string.
        const serializeChoice = (choice) => JSON.stringify({
            role: choice.message.role,
            parts: toMessageParts(choice.message),
            finish_reason: choice.finish_reason,
        });
        attrs["gen_ai.output.messages"] = completions.choices?.map((choice) => serializeChoice(choice));
    }
    return attrs;
};
|