@hebo-ai/gateway 0.9.2 → 0.9.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (213) hide show
  1. package/dist/config.d.ts +2 -0
  2. package/dist/config.js +125 -0
  3. package/dist/endpoints/chat-completions/converters.d.ts +26 -0
  4. package/dist/endpoints/chat-completions/converters.js +525 -0
  5. package/dist/endpoints/chat-completions/handler.d.ts +2 -0
  6. package/dist/endpoints/chat-completions/handler.js +152 -0
  7. package/dist/endpoints/chat-completions/index.d.ts +4 -0
  8. package/dist/endpoints/chat-completions/index.js +4 -0
  9. package/dist/endpoints/chat-completions/otel.d.ts +5 -0
  10. package/dist/endpoints/chat-completions/otel.js +177 -0
  11. package/dist/endpoints/chat-completions/schema.d.ts +1170 -0
  12. package/dist/endpoints/chat-completions/schema.js +252 -0
  13. package/dist/endpoints/conversations/converters.d.ts +8 -0
  14. package/dist/endpoints/conversations/converters.js +29 -0
  15. package/dist/endpoints/conversations/handler.d.ts +2 -0
  16. package/dist/endpoints/conversations/handler.js +259 -0
  17. package/dist/endpoints/conversations/index.d.ts +3 -0
  18. package/dist/endpoints/conversations/index.js +3 -0
  19. package/dist/endpoints/conversations/schema.d.ts +1511 -0
  20. package/dist/endpoints/conversations/schema.js +74 -0
  21. package/dist/endpoints/conversations/storage/dialects/greptime.d.ts +10 -0
  22. package/dist/endpoints/conversations/storage/dialects/greptime.js +87 -0
  23. package/dist/endpoints/conversations/storage/dialects/mysql.d.ts +12 -0
  24. package/dist/endpoints/conversations/storage/dialects/mysql.js +118 -0
  25. package/dist/endpoints/conversations/storage/dialects/postgres.d.ts +16 -0
  26. package/dist/endpoints/conversations/storage/dialects/postgres.js +185 -0
  27. package/dist/endpoints/conversations/storage/dialects/sqlite.d.ts +11 -0
  28. package/dist/endpoints/conversations/storage/dialects/sqlite.js +176 -0
  29. package/dist/endpoints/conversations/storage/dialects/types.d.ts +42 -0
  30. package/dist/endpoints/conversations/storage/dialects/types.js +0 -0
  31. package/dist/endpoints/conversations/storage/dialects/utils.d.ts +25 -0
  32. package/dist/endpoints/conversations/storage/dialects/utils.js +80 -0
  33. package/dist/endpoints/conversations/storage/memory.d.ts +25 -0
  34. package/dist/endpoints/conversations/storage/memory.js +200 -0
  35. package/dist/endpoints/conversations/storage/sql.d.ts +33 -0
  36. package/dist/endpoints/conversations/storage/sql.js +276 -0
  37. package/dist/endpoints/conversations/storage/types.d.ts +39 -0
  38. package/dist/endpoints/conversations/storage/types.js +0 -0
  39. package/dist/endpoints/embeddings/converters.d.ts +10 -0
  40. package/dist/endpoints/embeddings/converters.js +31 -0
  41. package/dist/endpoints/embeddings/handler.d.ts +2 -0
  42. package/dist/endpoints/embeddings/handler.js +99 -0
  43. package/dist/endpoints/embeddings/index.d.ts +4 -0
  44. package/dist/endpoints/embeddings/index.js +4 -0
  45. package/dist/endpoints/embeddings/otel.d.ts +5 -0
  46. package/dist/endpoints/embeddings/otel.js +29 -0
  47. package/dist/endpoints/embeddings/schema.d.ts +44 -0
  48. package/dist/endpoints/embeddings/schema.js +29 -0
  49. package/dist/endpoints/models/converters.d.ts +6 -0
  50. package/dist/endpoints/models/converters.js +42 -0
  51. package/dist/endpoints/models/handler.d.ts +2 -0
  52. package/dist/endpoints/models/handler.js +29 -0
  53. package/dist/endpoints/models/index.d.ts +3 -0
  54. package/dist/endpoints/models/index.js +3 -0
  55. package/dist/endpoints/models/schema.d.ts +42 -0
  56. package/dist/endpoints/models/schema.js +31 -0
  57. package/dist/endpoints/responses/converters.d.ts +17 -0
  58. package/dist/endpoints/responses/converters.js +1037 -0
  59. package/dist/endpoints/responses/handler.d.ts +2 -0
  60. package/dist/endpoints/responses/handler.js +141 -0
  61. package/dist/endpoints/responses/index.d.ts +4 -0
  62. package/dist/endpoints/responses/index.js +4 -0
  63. package/dist/endpoints/responses/otel.d.ts +6 -0
  64. package/dist/endpoints/responses/otel.js +225 -0
  65. package/dist/endpoints/responses/schema.d.ts +2109 -0
  66. package/dist/endpoints/responses/schema.js +314 -0
  67. package/dist/endpoints/shared/converters.d.ts +56 -0
  68. package/dist/endpoints/shared/converters.js +180 -0
  69. package/dist/endpoints/shared/schema.d.ts +70 -0
  70. package/dist/endpoints/shared/schema.js +46 -0
  71. package/dist/errors/ai-sdk.d.ts +2 -0
  72. package/dist/errors/ai-sdk.js +52 -0
  73. package/dist/errors/gateway.d.ts +5 -0
  74. package/dist/errors/gateway.js +13 -0
  75. package/dist/errors/openai.d.ts +15 -0
  76. package/dist/errors/openai.js +40 -0
  77. package/dist/errors/utils.d.ts +24 -0
  78. package/dist/errors/utils.js +46 -0
  79. package/dist/gateway.d.ts +11 -0
  80. package/dist/gateway.js +44 -0
  81. package/dist/index.d.ts +11 -0
  82. package/dist/index.js +10 -0
  83. package/dist/lifecycle.d.ts +3 -0
  84. package/dist/lifecycle.js +114 -0
  85. package/dist/logger/default.d.ts +4 -0
  86. package/dist/logger/default.js +81 -0
  87. package/dist/logger/index.d.ts +11 -0
  88. package/dist/logger/index.js +25 -0
  89. package/dist/middleware/common.d.ts +12 -0
  90. package/dist/middleware/common.js +146 -0
  91. package/dist/middleware/debug.d.ts +3 -0
  92. package/dist/middleware/debug.js +27 -0
  93. package/dist/middleware/matcher.d.ts +28 -0
  94. package/dist/middleware/matcher.js +118 -0
  95. package/dist/middleware/utils.d.ts +2 -0
  96. package/dist/middleware/utils.js +24 -0
  97. package/dist/models/amazon/index.d.ts +2 -0
  98. package/dist/models/amazon/index.js +2 -0
  99. package/dist/models/amazon/middleware.d.ts +3 -0
  100. package/dist/models/amazon/middleware.js +69 -0
  101. package/dist/models/amazon/presets.d.ts +345 -0
  102. package/dist/models/amazon/presets.js +80 -0
  103. package/dist/models/anthropic/index.d.ts +2 -0
  104. package/dist/models/anthropic/index.js +2 -0
  105. package/dist/models/anthropic/middleware.d.ts +5 -0
  106. package/dist/models/anthropic/middleware.js +128 -0
  107. package/dist/models/anthropic/presets.d.ts +711 -0
  108. package/dist/models/anthropic/presets.js +140 -0
  109. package/dist/models/catalog.d.ts +4 -0
  110. package/dist/models/catalog.js +8 -0
  111. package/dist/models/cohere/index.d.ts +2 -0
  112. package/dist/models/cohere/index.js +2 -0
  113. package/dist/models/cohere/middleware.d.ts +3 -0
  114. package/dist/models/cohere/middleware.js +62 -0
  115. package/dist/models/cohere/presets.d.ts +411 -0
  116. package/dist/models/cohere/presets.js +134 -0
  117. package/dist/models/google/index.d.ts +2 -0
  118. package/dist/models/google/index.js +2 -0
  119. package/dist/models/google/middleware.d.ts +8 -0
  120. package/dist/models/google/middleware.js +118 -0
  121. package/dist/models/google/presets.d.ts +815 -0
  122. package/dist/models/google/presets.js +184 -0
  123. package/dist/models/meta/index.d.ts +1 -0
  124. package/dist/models/meta/index.js +1 -0
  125. package/dist/models/meta/presets.d.ts +483 -0
  126. package/dist/models/meta/presets.js +105 -0
  127. package/dist/models/openai/index.d.ts +2 -0
  128. package/dist/models/openai/index.js +2 -0
  129. package/dist/models/openai/middleware.d.ts +4 -0
  130. package/dist/models/openai/middleware.js +89 -0
  131. package/dist/models/openai/presets.d.ts +1319 -0
  132. package/dist/models/openai/presets.js +277 -0
  133. package/dist/models/types.d.ts +20 -0
  134. package/dist/models/types.js +100 -0
  135. package/dist/models/voyage/index.d.ts +2 -0
  136. package/dist/models/voyage/index.js +2 -0
  137. package/dist/models/voyage/middleware.d.ts +2 -0
  138. package/dist/models/voyage/middleware.js +19 -0
  139. package/dist/models/voyage/presets.d.ts +436 -0
  140. package/dist/models/voyage/presets.js +85 -0
  141. package/dist/providers/anthropic/canonical.d.ts +3 -0
  142. package/dist/providers/anthropic/canonical.js +9 -0
  143. package/dist/providers/anthropic/index.d.ts +1 -0
  144. package/dist/providers/anthropic/index.js +1 -0
  145. package/dist/providers/bedrock/canonical.d.ts +17 -0
  146. package/dist/providers/bedrock/canonical.js +64 -0
  147. package/dist/providers/bedrock/index.d.ts +2 -0
  148. package/dist/providers/bedrock/index.js +2 -0
  149. package/dist/providers/bedrock/middleware.d.ts +5 -0
  150. package/dist/providers/bedrock/middleware.js +133 -0
  151. package/dist/providers/cohere/canonical.d.ts +3 -0
  152. package/dist/providers/cohere/canonical.js +17 -0
  153. package/dist/providers/cohere/index.d.ts +1 -0
  154. package/dist/providers/cohere/index.js +1 -0
  155. package/dist/providers/groq/canonical.d.ts +3 -0
  156. package/dist/providers/groq/canonical.js +12 -0
  157. package/dist/providers/groq/index.d.ts +2 -0
  158. package/dist/providers/groq/index.js +2 -0
  159. package/dist/providers/groq/middleware.d.ts +2 -0
  160. package/dist/providers/groq/middleware.js +30 -0
  161. package/dist/providers/openai/canonical.d.ts +3 -0
  162. package/dist/providers/openai/canonical.js +8 -0
  163. package/dist/providers/openai/index.d.ts +1 -0
  164. package/dist/providers/openai/index.js +1 -0
  165. package/dist/providers/registry.d.ts +24 -0
  166. package/dist/providers/registry.js +103 -0
  167. package/dist/providers/types.d.ts +7 -0
  168. package/dist/providers/types.js +11 -0
  169. package/dist/providers/vertex/canonical.d.ts +3 -0
  170. package/dist/providers/vertex/canonical.js +8 -0
  171. package/dist/providers/vertex/index.d.ts +2 -0
  172. package/dist/providers/vertex/index.js +2 -0
  173. package/dist/providers/vertex/middleware.d.ts +2 -0
  174. package/dist/providers/vertex/middleware.js +47 -0
  175. package/dist/providers/voyage/canonical.d.ts +3 -0
  176. package/dist/providers/voyage/canonical.js +7 -0
  177. package/dist/providers/voyage/index.d.ts +1 -0
  178. package/dist/providers/voyage/index.js +1 -0
  179. package/dist/telemetry/ai-sdk.d.ts +2 -0
  180. package/dist/telemetry/ai-sdk.js +31 -0
  181. package/dist/telemetry/baggage.d.ts +1 -0
  182. package/dist/telemetry/baggage.js +24 -0
  183. package/dist/telemetry/fetch.d.ts +2 -0
  184. package/dist/telemetry/fetch.js +49 -0
  185. package/dist/telemetry/gen-ai.d.ts +7 -0
  186. package/dist/telemetry/gen-ai.js +112 -0
  187. package/dist/telemetry/http.d.ts +3 -0
  188. package/dist/telemetry/http.js +54 -0
  189. package/dist/telemetry/index.d.ts +1 -0
  190. package/dist/telemetry/index.js +1 -0
  191. package/dist/telemetry/memory.d.ts +2 -0
  192. package/dist/telemetry/memory.js +43 -0
  193. package/dist/telemetry/span.d.ts +13 -0
  194. package/dist/telemetry/span.js +60 -0
  195. package/dist/types.d.ts +231 -0
  196. package/dist/types.js +2 -0
  197. package/dist/utils/body.d.ts +19 -0
  198. package/dist/utils/body.js +99 -0
  199. package/dist/utils/env.d.ts +2 -0
  200. package/dist/utils/env.js +7 -0
  201. package/dist/utils/headers.d.ts +4 -0
  202. package/dist/utils/headers.js +22 -0
  203. package/dist/utils/preset.d.ts +10 -0
  204. package/dist/utils/preset.js +41 -0
  205. package/dist/utils/request.d.ts +2 -0
  206. package/dist/utils/request.js +43 -0
  207. package/dist/utils/response.d.ts +6 -0
  208. package/dist/utils/response.js +55 -0
  209. package/dist/utils/stream.d.ts +9 -0
  210. package/dist/utils/stream.js +100 -0
  211. package/dist/utils/url.d.ts +4 -0
  212. package/dist/utils/url.js +21 -0
  213. package/package.json +1 -1
@@ -0,0 +1,152 @@
1
+ import { generateText, Output, streamText, wrapLanguageModel, } from "ai";
2
+ import * as z from "zod/mini";
3
+ import { GatewayError } from "../../errors/gateway";
4
+ import { winterCgHandler } from "../../lifecycle";
5
+ import { logger } from "../../logger";
6
+ import { modelMiddlewareMatcher } from "../../middleware/matcher";
7
+ import { resolveProvider } from "../../providers/registry";
8
+ import { getGenAiGeneralAttributes, recordTimePerOutputToken, recordTimeToFirstToken, recordTokenUsage, } from "../../telemetry/gen-ai";
9
+ import { addSpanEvent, setSpanAttributes } from "../../telemetry/span";
10
+ import { parseRequestBody } from "../../utils/body";
11
+ import { prepareForwardHeaders } from "../../utils/request";
12
+ import { convertToTextCallOptions, toChatCompletions, toChatCompletionsStream } from "./converters";
13
+ import { getChatRequestAttributes, getChatResponseAttributes } from "./otel";
14
+ import { ChatCompletionsBodySchema, } from "./schema";
15
/**
 * Builds the chat-completions endpoint.
 *
 * Returns `{ handler }`, where `handler` is the inner async function below
 * wrapped by `winterCgHandler(handler, config)`. For each request the inner
 * function:
 *   1. rejects anything that is not a POST with a 405 `GatewayError`;
 *   2. reads the body via `parseRequestBody` and validates it against
 *      `ChatCompletionsBodySchema` (400 `GatewayError` on failure);
 *   3. runs the optional `before`, `resolveModelId` and `resolveProvider` hooks;
 *   4. wraps the resolved language model with the middleware returned by
 *      `modelMiddlewareMatcher.for(...)`;
 *   5. calls `streamText` when `body.stream` is truthy, otherwise `generateText`,
 *      and converts the outcome with `toChatCompletionsStream` / `toChatCompletions`;
 *   6. runs the optional `after` hook and returns `ctx.result`.
 *
 * @param config - Gateway configuration. Only `config.hooks` is read here; the
 *   whole object is also forwarded to `winterCgHandler`.
 * @returns An object with a single `handler` property.
 */
+ export const chatCompletions = (config) => {
16
+ const hooks = config.hooks;
17
+ const handler = async (ctx, cfg) => {
18
// Reference timestamp for the latency metrics recorded further down.
+ const start = performance.now();
19
+ ctx.operation = "chat";
20
+ setSpanAttributes({ "gen_ai.operation.name": ctx.operation });
21
+ addSpanEvent("hebo.handler.started");
22
+ // Guard: enforce HTTP method early.
23
+ if (!ctx.request || ctx.request.method !== "POST") {
24
+ throw new GatewayError("Method Not Allowed", 405);
25
+ }
26
+ // Parse + validate input (handles Content-Encoding decompression + body size limits).
27
+ ctx.body = (await parseRequestBody(ctx.request, cfg.maxBodySize));
28
+ logger.trace({ requestId: ctx.requestId, body: ctx.body }, "[chat] ChatCompletionsBody");
29
+ addSpanEvent("hebo.request.deserialized");
30
+ const parsed = ChatCompletionsBodySchema.safeParse(ctx.body);
31
+ if (!parsed.success) {
32
+ // FUTURE: consider adding body shape to metadata
33
+ throw new GatewayError(z.prettifyError(parsed.error), 400, undefined, parsed.error);
34
+ }
35
+ ctx.body = parsed.data;
36
+ addSpanEvent("hebo.request.parsed");
37
// A `before` hook may return a replacement body; a nullish return keeps the validated body.
+ if (hooks?.before) {
38
+ ctx.body =
39
+ (await hooks.before(ctx)) ?? ctx.body;
40
+ addSpanEvent("hebo.hooks.before.completed");
41
+ }
42
+ // Resolve model + provider (hooks may override defaults).
43
+ ctx.modelId = ctx.body.model;
44
+ ctx.resolvedModelId =
45
+ (await hooks?.resolveModelId?.(ctx)) ?? ctx.modelId;
46
+ logger.debug(`[chat] resolved ${ctx.modelId} to ${ctx.resolvedModelId}`);
47
+ addSpanEvent("hebo.model.resolved");
48
// A nullish result from the `resolveProvider` hook falls back to the registry lookup.
+ const override = await hooks?.resolveProvider?.(ctx);
49
+ ctx.provider =
50
+ override ??
51
+ resolveProvider({
52
+ providers: ctx.providers,
53
+ models: ctx.models,
54
+ modelId: ctx.resolvedModelId,
55
+ operation: ctx.operation,
56
+ });
57
+ const languageModel = ctx.provider.languageModel(ctx.resolvedModelId);
58
+ ctx.resolvedProviderId = languageModel.provider;
59
+ logger.debug(`[chat] using ${languageModel.provider} for ${ctx.resolvedModelId}`);
60
+ addSpanEvent("hebo.provider.resolved");
61
+ const genAiSignalLevel = cfg.telemetry?.signals?.gen_ai;
62
+ const genAiGeneralAttrs = getGenAiGeneralAttributes(ctx, genAiSignalLevel);
63
+ setSpanAttributes(genAiGeneralAttrs);
64
+ // Convert inputs to AI SDK call options.
65
// `model` and `stream` are stripped; everything else goes to the converter.
+ const { model: _model, stream, ...inputs } = ctx.body;
66
+ const textOptions = convertToTextCallOptions(inputs);
67
+ logger.trace({
68
+ requestId: ctx.requestId,
69
+ options: textOptions,
70
+ }, "[chat] AI SDK options");
71
+ addSpanEvent("hebo.options.prepared");
72
+ setSpanAttributes(getChatRequestAttributes(ctx.body, genAiSignalLevel));
73
+ // Build middleware chain (model -> forward params -> provider).
74
+ const languageModelWithMiddleware = wrapLanguageModel({
75
+ model: languageModel,
76
+ middleware: modelMiddlewareMatcher.for(ctx.resolvedModelId, languageModel.provider),
77
+ });
78
+ // Execute request (streaming vs. non-streaming).
79
+ if (stream) {
80
+ addSpanEvent("hebo.ai-sdk.started");
81
// 0 doubles as the "not measured yet" sentinel checked in onChunk.
+ let ttft = 0;
82
+ const result = streamText({
83
+ model: languageModelWithMiddleware,
84
+ headers: prepareForwardHeaders(ctx.request),
85
+ abortSignal: ctx.request.signal,
86
+ timeout: {
87
+ totalMs: ctx.body.service_tier === "flex" ? cfg.timeouts.flex : cfg.timeouts.normal,
88
+ },
89
+ onAbort: () => {
90
+ throw new DOMException("The operation was aborted.", "AbortError");
91
+ },
92
// NOTE(review): deliberately empty error callback — presumably stream errors are surfaced elsewhere; confirm.
+ onError: () => { },
93
// Only the first chunk records time-to-first-token; later chunks see a non-zero ttft and skip.
+ onChunk: () => {
94
+ if (!ttft) {
95
+ ttft = performance.now() - start;
96
+ recordTimeToFirstToken(ttft, genAiGeneralAttrs, genAiSignalLevel);
97
+ }
98
+ },
99
// Response attributes and token metrics are recorded from the finish callback.
+ onFinish: (res) => {
100
+ addSpanEvent("hebo.ai-sdk.completed");
101
+ const streamResult = toChatCompletions(res, ctx.resolvedModelId);
102
+ logger.trace({ requestId: ctx.requestId, result: streamResult }, "[chat] ChatCompletions");
103
+ addSpanEvent("hebo.result.transformed");
104
+ const genAiResponseAttrs = getChatResponseAttributes(streamResult, genAiSignalLevel);
105
+ setSpanAttributes(genAiResponseAttrs);
106
+ recordTokenUsage(genAiResponseAttrs, genAiGeneralAttrs, genAiSignalLevel);
107
+ recordTimePerOutputToken(start, ttft, genAiResponseAttrs, genAiGeneralAttrs, genAiSignalLevel);
108
+ },
109
+ experimental_include: {
110
+ requestBody: false,
111
+ },
112
+ includeRawChunks: false,
113
// Spread last, so any key also present in textOptions overrides the values above.
+ ...textOptions,
114
+ });
115
+ ctx.result = toChatCompletionsStream(result, ctx.resolvedModelId);
116
// The `after` hook receives the converted stream and may replace it; a nullish return keeps it.
+ if (hooks?.after) {
117
+ ctx.result = (await hooks.after(ctx)) ?? ctx.result;
118
+ addSpanEvent("hebo.hooks.after.completed");
119
+ }
120
+ return ctx.result;
121
+ }
122
+ addSpanEvent("hebo.ai-sdk.started");
123
+ const result = await generateText({
124
+ model: languageModelWithMiddleware,
125
+ headers: prepareForwardHeaders(ctx.request),
126
+ abortSignal: ctx.request.signal,
127
+ timeout: ctx.body.service_tier === "flex" ? cfg.timeouts.flex : cfg.timeouts.normal,
128
+ experimental_include: {
129
+ requestBody: false,
130
+ responseBody: false,
131
+ },
132
// Spread last, so any key also present in textOptions overrides the values above.
+ ...textOptions,
133
+ });
134
+ logger.trace({ requestId: ctx.requestId, result }, "[chat] AI SDK result");
135
+ addSpanEvent("hebo.ai-sdk.completed");
136
// Non-streaming: the elapsed time of the whole call is reported as time-to-first-token.
+ recordTimeToFirstToken(performance.now() - start, genAiGeneralAttrs, genAiSignalLevel);
137
+ // Transform result.
138
+ ctx.result = toChatCompletions(result, ctx.resolvedModelId);
139
+ logger.trace({ requestId: ctx.requestId, result: ctx.result }, "[chat] ChatCompletions");
140
+ addSpanEvent("hebo.result.transformed");
141
+ const genAiResponseAttrs = getChatResponseAttributes(ctx.result, genAiSignalLevel);
142
+ setSpanAttributes(genAiResponseAttrs);
143
+ recordTokenUsage(genAiResponseAttrs, genAiGeneralAttrs, genAiSignalLevel);
144
+ if (hooks?.after) {
145
+ ctx.result = (await hooks.after(ctx)) ?? ctx.result;
146
+ addSpanEvent("hebo.hooks.after.completed");
147
+ }
148
// Called after the `after` hook has run; ttft is passed as 0 in the non-streaming path.
+ recordTimePerOutputToken(start, 0, genAiResponseAttrs, genAiGeneralAttrs, genAiSignalLevel);
149
+ return ctx.result;
150
+ };
151
+ return { handler: winterCgHandler(handler, config) };
152
+ };
@@ -0,0 +1,4 @@
1
+ export * from "./converters";
2
+ export * from "./handler";
3
+ export * from "./schema";
4
+ export * from "./otel";
@@ -0,0 +1,4 @@
1
+ export * from "./converters";
2
+ export * from "./handler";
3
+ export * from "./schema";
4
+ export * from "./otel";
@@ -0,0 +1,5 @@
1
+ import type { Attributes } from "@opentelemetry/api";
2
+ import { type TelemetrySignalLevel } from "../../types";
3
+ import type { ChatCompletions, ChatCompletionsBody } from "./schema";
4
/**
 * Builds span attributes describing a chat completions request.
 *
 * Returns an empty object when `signalLevel` is omitted or "off". At "required"
 * only `gen_ai.request.seed` is emitted (when the body has a seed). Any other
 * level adds the request parameters and `gen_ai.request.metadata.*`; "full"
 * additionally adds `gen_ai.input.messages` and `gen_ai.tool.definitions`.
 */
+ export declare const getChatRequestAttributes: (body: ChatCompletionsBody, signalLevel?: TelemetrySignalLevel) => Attributes;
5
/**
 * Builds span attributes describing a chat completions response.
 *
 * Returns an empty object when `signalLevel` is omitted or "off". At "required"
 * only `gen_ai.response.id` is emitted. Any other level adds finish reasons,
 * service tier and token usage; "full" additionally adds `gen_ai.output.messages`.
 */
+ export declare const getChatResponseAttributes: (completions: ChatCompletions, signalLevel?: TelemetrySignalLevel) => Attributes;
@@ -0,0 +1,177 @@
1
+ import {} from "../../types";
2
+ import { parseDataUrl } from "../../utils/url";
3
/**
 * Normalizes message content into telemetry text parts.
 *
 * A string becomes a single text part. An array contributes one text part per
 * element whose `type` is "text"; elements of any other type are dropped.
 * Every other input (for example `null`) yields an empty list.
 *
 * @param content - A string, an array of content parts, or any other value.
 * @returns An array of `{ type: "text", content }` objects.
 */
const toTextParts = (content) => {
  if (typeof content === "string") {
    return [{ type: "text", content }];
  }
  if (!Array.isArray(content)) {
    return [];
  }
  return content
    .filter((item) => item.type === "text")
    .map((item) => ({ type: "text", content: item.text }));
};
17
/**
 * Creates a placeholder part for binary content; the payload itself is never
 * included, only a fixed redaction marker.
 *
 * @param modality - Value stored in the part's `modality` field.
 * @param mimeType - Optional MIME type; `mime_type` is only set when truthy.
 * @returns A fresh, mutable `{ type: "blob", modality, content, mime_type? }` object.
 */
const toBlobPart = (modality, mimeType) => ({
  type: "blob",
  modality,
  content: "[REDACTED_BINARY_DATA]",
  ...(mimeType ? { mime_type: mimeType } : {}),
});
27
/**
 * Creates the telemetry part for a tool result message.
 *
 * @param id - Identifier of the tool call this response belongs to.
 * @param content - Either the response string, or an array of parts whose
 *   `text` fields are concatenated without a separator.
 * @returns A `{ type: "tool_call_response", id, response }` object.
 */
const toToolResponsePart = (id, content) => {
  let response = content;
  if (typeof content !== "string") {
    response = content.map((part) => part.text).join("");
  }
  return {
    type: "tool_call_response",
    id,
    response,
  };
};
32
/**
 * Converts an assistant message into telemetry parts, in this order:
 * an optional reasoning part, the text parts of `message.content`, then one
 * `tool_call` part per entry of `message.tool_calls`.
 *
 * @param message - Assistant message; `reasoning` is used only when it is a
 *   string and `tool_calls` only when it is an array.
 * @returns The concatenated list of parts.
 */
const toAssistantParts = (message) => {
  const reasoningParts =
    typeof message.reasoning === "string"
      ? [{ type: "reasoning", content: message.reasoning }]
      : [];
  const textParts = toTextParts(message.content);
  const toolCallParts = Array.isArray(message.tool_calls)
    ? message.tool_calls.map((toolCall) => ({
        type: "tool_call",
        id: toolCall.id,
        name: toolCall.function.name,
        arguments: toolCall.function.arguments,
      }))
    : [];
  return [...reasoningParts, ...textParts, ...toolCallParts];
};
52
/**
 * Converts user message content into telemetry parts.
 *
 * A string becomes a single text part. Otherwise each content part is mapped:
 *   - "text"        -> text part;
 *   - "image_url"   -> redacted blob for `data:` URLs (MIME type taken from
 *                      `parseDataUrl`), otherwise a `uri` part carrying the URL;
 *   - "input_audio" -> redacted blob with MIME type `audio/<format>`;
 *   - "file"        -> redacted blob, plus `file_name` when a filename is set;
 *   - anything else -> a part with the original type and a fixed marker.
 *
 * @param content - A string or an iterable of content parts.
 * @returns One telemetry part per input part, in input order.
 */
const toUserParts = (content) => {
  if (typeof content === "string") {
    return [{ type: "text", content }];
  }
  const convertPart = (part) => {
    if (part.type === "text") {
      return { type: "text", content: part.text };
    }
    if (part.type === "image_url") {
      const imageUrl = part.image_url.url;
      // Case-insensitive scheme check: inline data must never reach telemetry.
      const isDataUrl = imageUrl.slice(0, 5).toLowerCase() === "data:";
      if (!isDataUrl) {
        return { type: "uri", modality: "image", uri: imageUrl };
      }
      const { mimeType } = parseDataUrl(imageUrl);
      return toBlobPart("image", mimeType || undefined);
    }
    if (part.type === "input_audio") {
      return toBlobPart("audio", `audio/${part.input_audio.format}`);
    }
    if (part.type === "file") {
      const fileBlob = toBlobPart("file", part.file.media_type);
      if (part.file.filename) {
        fileBlob["file_name"] = part.file.filename;
      }
      return fileBlob;
    }
    return { type: part.type, content: "[UNHANDLED_CONTENT_PART]" };
  };
  const converted = [];
  for (const part of content) {
    converted.push(convertPart(part));
  }
  return converted;
};
89
/**
 * Dispatches a chat message to the role-specific part converter.
 *
 * @param message - Chat message with a `role` field.
 * @returns The telemetry parts for the message; unknown roles produce a single
 *   part typed with the role and a fixed marker as content.
 */
const toMessageParts = (message) => {
  const { role } = message;
  if (role === "assistant") {
    return toAssistantParts(message);
  }
  if (role === "tool") {
    return [toToolResponsePart(message.tool_call_id, message.content)];
  }
  if (role === "user") {
    return toUserParts(message.content);
  }
  // FUTURE: remove once Langfuse supports gen_ai.system_instructions
  // https://github.com/langfuse/langfuse/issues/11607
  if (role === "system") {
    return toTextParts(message.content);
  }
  return [{ type: role, content: "[UNHANDLED_ROLE]" }];
};
105
/**
 * Builds span attributes describing a chat completions request.
 *
 * Signal levels:
 *   - omitted / "off": returns an empty object;
 *   - "required": only `gen_ai.request.seed`, when the body defines a seed;
 *   - any other level: additionally the request parameters (reasoning, stream,
 *     penalties, max tokens, stop sequences, temperature, top_p) and one
 *     `gen_ai.request.metadata.<key>` attribute per own metadata entry;
 *   - "full": additionally the serialized input messages and tool definitions.
 *
 * Parameters that are absent from the body are emitted with an `undefined` value.
 *
 * @param body - Validated chat completions request body.
 * @param signalLevel - Telemetry signal level for gen_ai attributes.
 * @returns A new attributes object.
 */
export const getChatRequestAttributes = (body, signalLevel) => {
  if (!signalLevel || signalLevel === "off") {
    return {};
  }
  const attrs = {};
  if (body.seed !== undefined) {
    attrs["gen_ai.request.seed"] = body.seed;
  }
  if (signalLevel !== "required") {
    // A single stop string is reported as a one-element list.
    let stopSequences;
    if (body.stop) {
      stopSequences = Array.isArray(body.stop) ? body.stop : [body.stop];
    }
    Object.assign(attrs, {
      "gen_ai.request.reasoning.enabled": body.reasoning?.enabled,
      "gen_ai.request.reasoning.effort": body.reasoning?.effort,
      "gen_ai.request.reasoning.max_tokens": body.reasoning?.max_tokens,
      "gen_ai.request.stream": body.stream,
      "gen_ai.request.frequency_penalty": body.frequency_penalty,
      "gen_ai.request.max_tokens": body.max_completion_tokens,
      "gen_ai.request.presence_penalty": body.presence_penalty,
      "gen_ai.request.stop_sequences": stopSequences,
      "gen_ai.request.temperature": body.temperature,
      "gen_ai.request.top_p": body.top_p,
    });
    if (body.metadata) {
      // Own entries only: `for...in` would also pick up enumerable keys
      // inherited through the prototype chain and leak them into telemetry.
      for (const [key, value] of Object.entries(body.metadata)) {
        attrs[`gen_ai.request.metadata.${key}`] = value;
      }
    }
  }
  if (signalLevel === "full") {
    Object.assign(attrs, {
      // FUTURE: move system instructions out of the messages into
      // "gen_ai.system_instructions" and filter them from the list below.
      // blocker: https://github.com/langfuse/langfuse/issues/11607
      "gen_ai.input.messages": body.messages.map((m) =>
        JSON.stringify({ role: m.role, parts: toMessageParts(m) }),
      ),
      "gen_ai.tool.definitions": body.tools?.map((toolDefinition) =>
        JSON.stringify(toolDefinition),
      ),
    });
  }
  return attrs;
};
150
/**
 * Builds span attributes describing a chat completions response.
 *
 * Signal levels:
 *   - omitted / "off": returns an empty object;
 *   - "required": only `gen_ai.response.id`;
 *   - any other level: additionally finish reasons, service tier and token usage;
 *   - "full": additionally the serialized output messages.
 *
 * Fields missing from the response are emitted with an `undefined` value.
 *
 * @param completions - Chat completions response object.
 * @param signalLevel - Telemetry signal level for gen_ai attributes.
 * @returns A new attributes object.
 */
export const getChatResponseAttributes = (completions, signalLevel) => {
  if (!signalLevel || signalLevel === "off") {
    return {};
  }
  const attrs = { "gen_ai.response.id": completions.id };
  if (signalLevel === "required") {
    return attrs;
  }
  const usage = completions.usage;
  attrs["gen_ai.response.finish_reasons"] = completions.choices?.map(
    (choice) => choice.finish_reason,
  );
  attrs["gen_ai.response.service_tier"] = completions.service_tier;
  attrs["gen_ai.usage.total_tokens"] = usage?.total_tokens;
  attrs["gen_ai.usage.input_tokens"] = usage?.prompt_tokens;
  attrs["gen_ai.usage.cache_read.input_tokens"] = usage?.prompt_tokens_details?.cached_tokens;
  attrs["gen_ai.usage.output_tokens"] = usage?.completion_tokens;
  attrs["gen_ai.usage.reasoning.output_tokens"] =
    usage?.completion_tokens_details?.reasoning_tokens;
  if (signalLevel === "full") {
    attrs["gen_ai.output.messages"] = completions.choices?.map((choice) =>
      JSON.stringify({
        role: choice.message.role,
        parts: toMessageParts(choice.message),
        finish_reason: choice.finish_reason,
      }),
    );
  }
  return attrs;
};