npm - openlit - Versions diffs - 1.7.0 → 1.8.0 - Mend

openlit 1.7.0 → 1.8.0

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (74)

package/dist/instrumentation/openai/wrapper.js (changed)

@@ -61,6 +61,8 @@ class OpenAIWrapper extends base_wrapper_1.default {
     }
     static async *_chatCompletionGenerator({ args, genAIEndpoint, response, span, }) {
         let metricParams;
+        const timestamps = [];
+        const startTime = Date.now();
         try {
             const { messages } = args[0];
             let { tools } = args[0];
@@ -68,6 +70,8 @@ class OpenAIWrapper extends base_wrapper_1.default {
                 id: '0',
                 created: -1,
                 model: '',
+                system_fingerprint: '',
+                service_tier: 'auto',
                 choices: [
                     {
                         index: 0,
@@ -80,12 +84,28 @@ class OpenAIWrapper extends base_wrapper_1.default {
                     prompt_tokens: 0,
                     completion_tokens: 0,
                     total_tokens: 0,
+                    completion_tokens_details: {
+                        reasoning_tokens: 0,
+                        audio_tokens: 0,
+                    },
+                    prompt_tokens_details: {
+                        cached_tokens: 0,
+                        audio_tokens: 0,
+                    },
                 },
             };
+            let toolCalls = [];
             for await (const chunk of response) {
+                timestamps.push(Date.now());
                 result.id = chunk.id;
                 result.created = chunk.created;
                 result.model = chunk.model;
+                if (chunk.system_fingerprint) {
+                    result.system_fingerprint = chunk.system_fingerprint;
+                }
+                if (chunk.service_tier) {
+                    result.service_tier = chunk.service_tier;
+                }
                 if (chunk.choices[0]?.finish_reason) {
                     result.choices[0].finish_reason = chunk.choices[0].finish_reason;
                 }
@@ -95,11 +115,45 @@ class OpenAIWrapper extends base_wrapper_1.default {
                 if (chunk.choices[0]?.delta.content) {
                     result.choices[0].message.content += chunk.choices[0].delta.content;
                 }
+                // Improved tool calls handling for streaming
                 if (chunk.choices[0]?.delta.tool_calls) {
+                    const deltaTools = chunk.choices[0].delta.tool_calls;
+                    for (const tool of deltaTools) {
+                        const idx = tool.index || 0;
+                        // Extend array if needed
+                        while (toolCalls.length <= idx) {
+                            toolCalls.push({
+                                id: '',
+                                type: 'function',
+                                function: { name: '', arguments: '' }
+                            });
+                        }
+                        if (tool.id) {
+                            // New tool call
+                            toolCalls[idx].id = tool.id;
+                            toolCalls[idx].type = tool.type || 'function';
+                            if (tool.function?.name) {
+                                toolCalls[idx].function.name = tool.function.name;
+                            }
+                            if (tool.function?.arguments) {
+                                toolCalls[idx].function.arguments = tool.function.arguments;
+                            }
+                        }
+                        else if (tool.function?.arguments) {
+                            // Append arguments to existing tool call
+                            toolCalls[idx].function.arguments += tool.function.arguments;
+                        }
+                    }
                     tools = true;
                 }
                 yield chunk;
             }
+            if (toolCalls.length > 0) {
+                result.choices[0].message = {
+                    ...result.choices[0].message,
+                    tool_calls: toolCalls
+                };
+            }
             let promptTokens = 0;
             for (const message of messages || []) {
                 promptTokens += helpers_1.default.openaiTokens(message.content, result.model) ?? 0;
@@ -110,14 +164,25 @@ class OpenAIWrapper extends base_wrapper_1.default {
                     prompt_tokens: promptTokens,
                     completion_tokens: completionTokens,
                     total_tokens: promptTokens + completionTokens,
+                    completion_tokens_details: result.usage.completion_tokens_details,
+                    prompt_tokens_details: result.usage.prompt_tokens_details,
                 };
             }
             args[0].tools = tools;
+            // Calculate TTFT and TBT
+            const ttft = timestamps.length > 0 ? (timestamps[0] - startTime) / 1000 : 0;
+            let tbt = 0;
+            if (timestamps.length > 1) {
+                const timeDiffs = timestamps.slice(1).map((t, i) => t - timestamps[i]);
+                tbt = timeDiffs.reduce((a, b) => a + b, 0) / timeDiffs.length / 1000;
+            }
             metricParams = await OpenAIWrapper._chatCompletionCommonSetter({
                 args,
                 genAIEndpoint,
                 result,
                 span,
+                ttft,
+                tbt,
             });
             return result;
         }
@@ -132,48 +197,31 @@ class OpenAIWrapper extends base_wrapper_1.default {
             }
         }
     }
-    static async _chatCompletionCommonSetter({ args, genAIEndpoint, result, span, }) {
+    static async _chatCompletionCommonSetter({ args, genAIEndpoint, result, span, ttft = 0, tbt = 0, }) {
         const traceContent = config_1.default.traceContent;
-        const { messages, frequency_penalty = 0, max_tokens = null, n = 1, presence_penalty = 0, seed = null, temperature = 1, top_p, user, stream = false, tools, } = args[0];
+        const { messages, frequency_penalty = 0, max_tokens = null, n = 1, presence_penalty = 0, seed = null, stop = null, temperature = 1, top_p, user, stream = false, tools, } = args[0];
         // Request Params attributes : Start
         span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_TOP_P, top_p || 1);
-        span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_MAX_TOKENS, max_tokens);
+        span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_MAX_TOKENS, max_tokens || -1);
         span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_TEMPERATURE, temperature);
         span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_PRESENCE_PENALTY, presence_penalty);
         span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_FREQUENCY_PENALTY, frequency_penalty);
-        span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_SEED, seed);
+        span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_SEED, seed ? String(seed) : '');
         span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_IS_STREAM, stream);
+        if (stop) {
+            span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_STOP_SEQUENCES, Array.isArray(stop) ? stop : [stop]);
+        }
+        if (user) {
+            span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_USER, user);
+        }
         if (traceContent) {
-            // Format 'messages' into a single string
-            const messagePrompt = messages || [];
-            const formattedMessages = [];
-            for (const message of messagePrompt) {
-                const role = message.role;
-                const content = message.content;
-                if (Array.isArray(content)) {
-                    const contentStr = content
-                        .map((item) => {
-                        if ('type' in item) {
-                            return `${item.type}: ${item.text ? item.text : item.image_url}`;
-                        }
-                        else {
-                            return `text: ${item.text}`;
-                        }
-                    })
-                        .join(', ');
-                    formattedMessages.push(`${role}: ${contentStr}`);
-                }
-                else {
-                    formattedMessages.push(`${role}: ${content}`);
-                }
-            }
-            const prompt = formattedMessages.join('\n');
-            span.setAttribute(semantic_convention_1.default.GEN_AI_CONTENT_PROMPT, prompt);
+            span.setAttribute(semantic_convention_1.default.GEN_AI_INPUT_MESSAGES, helpers_1.default.buildInputMessages(messages || []));
         }
         // Request Params attributes : End
         span.setAttribute(semantic_convention_1.default.GEN_AI_OPERATION, semantic_convention_1.default.GEN_AI_OPERATION_TYPE_CHAT);
         span.setAttribute(semantic_convention_1.default.GEN_AI_RESPONSE_ID, result.id);
         const model = result.model || 'gpt-3.5-turbo';
+        const responseModel = result.model || model;
         const pricingInfo = await config_1.default.updatePricingJson(config_1.default.pricing_json);
         // Calculate cost of the operation
         const cost = helpers_1.default.getChatModelCost(model, pricingInfo, result.usage.prompt_tokens, result.usage.completion_tokens);
@@ -184,30 +232,80 @@ class OpenAIWrapper extends base_wrapper_1.default {
             cost,
             aiSystem: OpenAIWrapper.aiSystem,
         });
+        // Response model
+        span.setAttribute(semantic_convention_1.default.GEN_AI_RESPONSE_MODEL, responseModel);
+        // OpenAI-specific attributes
+        if (result.system_fingerprint) {
+            span.setAttribute(semantic_convention_1.default.GEN_AI_RESPONSE_SYSTEM_FINGERPRINT, result.system_fingerprint);
+        }
+        if (result.service_tier) {
+            span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_SERVICE_TIER, result.service_tier);
+        }
+        // Token usage
         span.setAttribute(semantic_convention_1.default.GEN_AI_USAGE_INPUT_TOKENS, result.usage.prompt_tokens);
         span.setAttribute(semantic_convention_1.default.GEN_AI_USAGE_OUTPUT_TOKENS, result.usage.completion_tokens);
         span.setAttribute(semantic_convention_1.default.GEN_AI_USAGE_TOTAL_TOKENS, result.usage.total_tokens);
-        if (result.choices[0].finish_reason) {
-            span.setAttribute(semantic_convention_1.default.GEN_AI_RESPONSE_FINISH_REASON, result.choices[0].finish_reason);
+        span.setAttribute(semantic_convention_1.default.GEN_AI_CLIENT_TOKEN_USAGE, result.usage.total_tokens);
+        // Enhanced token details
+        if (result.usage.completion_tokens_details) {
+            if (result.usage.completion_tokens_details.reasoning_tokens) {
+                span.setAttribute(semantic_convention_1.default.GEN_AI_USAGE_REASONING_TOKENS, result.usage.completion_tokens_details.reasoning_tokens);
+                span.setAttribute(semantic_convention_1.default.GEN_AI_USAGE_COMPLETION_TOKENS_DETAILS_REASONING, result.usage.completion_tokens_details.reasoning_tokens);
+            }
+            if (result.usage.completion_tokens_details.audio_tokens) {
+                span.setAttribute(semantic_convention_1.default.GEN_AI_USAGE_COMPLETION_TOKENS_DETAILS_AUDIO, result.usage.completion_tokens_details.audio_tokens);
+            }
         }
-        if (tools) {
-            span.setAttribute(semantic_convention_1.default.GEN_AI_CONTENT_COMPLETION, 'Function called with tools');
+        if (result.usage.prompt_tokens_details) {
+            if (result.usage.prompt_tokens_details.cached_tokens) {
+                span.setAttribute(semantic_convention_1.default.GEN_AI_USAGE_PROMPT_TOKENS_DETAILS_CACHE_READ, result.usage.prompt_tokens_details.cached_tokens);
+            }
+            if (result.usage.prompt_tokens_details.audio_tokens) {
+                span.setAttribute(semantic_convention_1.default.GEN_AI_USAGE_PROMPT_TOKENS_DETAILS_CACHE_WRITE, result.usage.prompt_tokens_details.audio_tokens);
+            }
         }
-        else {
-            if (traceContent) {
-                if (n === 1) {
-                    span.setAttribute(semantic_convention_1.default.GEN_AI_CONTENT_COMPLETION, result.choices[0].message.content);
-                }
-                else {
-                    let i = 0;
-                    while (i < n) {
-                        const attribute_name = `${semantic_convention_1.default.GEN_AI_CONTENT_COMPLETION}.[i]`;
-                        span.setAttribute(attribute_name, result.choices[i].message.content);
-                        i += 1;
-                    }
-                }
+        // TTFT and TBT metrics
+        if (ttft > 0) {
+            span.setAttribute(semantic_convention_1.default.GEN_AI_SERVER_TTFT, ttft);
+        }
+        if (tbt > 0) {
+            span.setAttribute(semantic_convention_1.default.GEN_AI_SERVER_TBT, tbt);
+        }
+        // Finish reason
+        if (result.choices[0].finish_reason) {
+            span.setAttribute(semantic_convention_1.default.GEN_AI_RESPONSE_FINISH_REASON, [result.choices[0].finish_reason]);
+        }
+        // Output type
+        const outputType = typeof result.choices[0].message.content === 'string'
+            ? semantic_convention_1.default.GEN_AI_OUTPUT_TYPE_TEXT
+            : semantic_convention_1.default.GEN_AI_OUTPUT_TYPE_JSON;
+        span.setAttribute(semantic_convention_1.default.GEN_AI_OUTPUT_TYPE, outputType);
+        // Tool calls handling
+        if (result.choices[0].message.tool_calls) {
+            const toolCalls = result.choices[0].message.tool_calls;
+            const toolNames = toolCalls.map((t) => t.function?.name || '').filter(Boolean);
+            const toolIds = toolCalls.map((t) => t.id || '').filter(Boolean);
+            const toolArgs = toolCalls.map((t) => t.function?.arguments || '').filter(Boolean);
+            const toolTypes = toolCalls.map((t) => t.type || '').filter(Boolean);
+            if (toolNames.length > 0) {
+                span.setAttribute(semantic_convention_1.default.GEN_AI_TOOL_NAME, toolNames.join(', '));
+            }
+            if (toolIds.length > 0) {
+                span.setAttribute(semantic_convention_1.default.GEN_AI_TOOL_CALL_ID, toolIds.join(', '));
+            }
+            if (toolArgs.length > 0) {
+                span.setAttribute(semantic_convention_1.default.GEN_AI_TOOL_CALL_ARGUMENTS, toolArgs);
+            }
+            if (toolTypes.length > 0) {
+                span.setAttribute(semantic_convention_1.default.GEN_AI_TOOL_TYPE, toolTypes.join(', '));
             }
         }
+        // Content
+        if (traceContent) {
+            const toolCalls = result.choices[0].message.tool_calls;
+            const outputJson = helpers_1.default.buildOutputMessages(result.choices[0].message.content || '', result.choices[0].finish_reason || 'stop', toolCalls);
+            span.setAttribute(semantic_convention_1.default.GEN_AI_OUTPUT_MESSAGES, outputJson);
+        }
         return {
             genAIEndpoint,
             model,
@@ -223,13 +321,7 @@ class OpenAIWrapper extends base_wrapper_1.default {
             return async function (...args) {
                 const span = tracer.startSpan(genAIEndpoint, { kind: api_1.SpanKind.CLIENT });
                 return api_1.context.with(api_1.trace.setSpan(api_1.context.active(), span), async () => {
-                    let metricParams = {
-                        genAIEndpoint,
-                        model: '',
-                        user: '',
-                        cost: 0,
-                        aiSystem: OpenAIWrapper.aiSystem,
-                    };
+                    let metricParams;
                     try {
                         const response = await originalMethod.apply(this, args);
                         const model = response.model || 'text-embedding-ada-002';
@@ -237,7 +329,7 @@ class OpenAIWrapper extends base_wrapper_1.default {
                         const cost = helpers_1.default.getEmbedModelCost(model, pricingInfo, response.usage.prompt_tokens);
                         span.setAttribute(semantic_convention_1.default.GEN_AI_OPERATION, semantic_convention_1.default.GEN_AI_OPERATION_TYPE_EMBEDDING);
                         const { dimensions, encoding_format = 'float', input, user } = args[0];
-                        // Set base span attribues
+                        // Set base span attributes
                         OpenAIWrapper.setBaseSpanAttributes(span, {
                             genAIEndpoint,
                             model,
@@ -245,15 +337,29 @@ class OpenAIWrapper extends base_wrapper_1.default {
                             cost,
                             aiSystem: OpenAIWrapper.aiSystem,
                         });
+                        // Set missing critical attributes to match Python SDK
+                        span.setAttribute(semantic_convention_1.default.SERVER_ADDRESS, 'api.openai.com');
+                        span.setAttribute(semantic_convention_1.default.SERVER_PORT, 443);
+                        span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_IS_STREAM, false);
+                        span.setAttribute(semantic_convention_1.default.GEN_AI_SERVER_TBT, 0);
+                        span.setAttribute(semantic_convention_1.default.GEN_AI_SERVER_TTFT, 0);
+                        span.setAttribute(semantic_convention_1.default.GEN_AI_SDK_VERSION, '1.7.0');
                         // Request Params attributes : Start
-                        span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_ENCODING_FORMATS, encoding_format);
-                        span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_EMBEDDING_DIMENSION, dimensions);
+                        span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_ENCODING_FORMATS, [encoding_format]);
+                        if (dimensions) {
+                            span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_EMBEDDING_DIMENSION, dimensions);
+                        }
+                        if (user) {
+                            span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_USER, user);
+                        }
                         if (traceContent) {
-                            span.setAttribute(semantic_convention_1.default.GEN_AI_CONTENT_PROMPT, input);
+                            const formattedInput = typeof input === 'string' ? input : JSON.stringify(input);
+                            span.setAttribute(semantic_convention_1.default.GEN_AI_INPUT_MESSAGES, formattedInput);
                         }
                         // Request Params attributes : End
                         span.setAttribute(semantic_convention_1.default.GEN_AI_USAGE_INPUT_TOKENS, response.usage.prompt_tokens);
                         span.setAttribute(semantic_convention_1.default.GEN_AI_USAGE_TOTAL_TOKENS, response.usage.total_tokens);
+                        span.setAttribute(semantic_convention_1.default.GEN_AI_CLIENT_TOKEN_USAGE, response.usage.prompt_tokens);
                         metricParams = {
                             genAIEndpoint,
                             model,
@@ -265,10 +371,13 @@ class OpenAIWrapper extends base_wrapper_1.default {
                     }
                     catch (e) {
                         helpers_1.default.handleException(span, e);
+                        throw e;
                     }
                     finally {
                         span.end();
-                        base_wrapper_1.default.recordMetrics(span, metricParams);
+                        if (metricParams) {
+                            base_wrapper_1.default.recordMetrics(span, metricParams);
+                        }
                     }
                 });
             };
@@ -356,7 +465,7 @@ class OpenAIWrapper extends base_wrapper_1.default {
                         span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_IMAGE_QUALITY, quality);
                         span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_IMAGE_STYLE, style);
                         if (traceContent) {
-                            span.setAttribute(semantic_convention_1.default.GEN_AI_CONTENT_PROMPT, prompt);
+                            span.setAttribute(semantic_convention_1.default.GEN_AI_INPUT_MESSAGES, prompt);
                         }
                         // Request Params attributes : End
                         let imagesCount = 0;
@@ -422,7 +531,7 @@ class OpenAIWrapper extends base_wrapper_1.default {
                         span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_IMAGE_QUALITY, quality);
                         span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_IMAGE_STYLE, style);
                         if (traceContent) {
-                            span.setAttribute(semantic_convention_1.default.GEN_AI_CONTENT_PROMPT, prompt);
+                            span.setAttribute(semantic_convention_1.default.GEN_AI_INPUT_MESSAGES, prompt);
                         }
                         // Request Params attributes : End
                         let imagesCount = 0;
@@ -486,7 +595,7 @@ class OpenAIWrapper extends base_wrapper_1.default {
                         span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_AUDIO_RESPONSE_FORMAT, response_format);
                         span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_AUDIO_SPEED, speed);
                         if (traceContent) {
-                            span.setAttribute(semantic_convention_1.default.GEN_AI_CONTENT_PROMPT, input);
+                            span.setAttribute(semantic_convention_1.default.GEN_AI_INPUT_MESSAGES, input);
                         }
                         // Request Params attributes : End
                         // Store metric parameters for use after span ends
@@ -513,6 +622,255 @@ class OpenAIWrapper extends base_wrapper_1.default {
             };
         };
     }
+    static _patchResponsesCreate(tracer) {
+        const genAIEndpoint = 'openai.resources.responses';
+        return (originalMethod) => {
+            return async function (...args) {
+                const span = tracer.startSpan(genAIEndpoint, { kind: api_1.SpanKind.CLIENT });
+                return api_1.context
+                    .with(api_1.trace.setSpan(api_1.context.active(), span), async () => {
+                    return originalMethod.apply(this, args);
+                })
+                    .then((response) => {
+                    const { stream = false } = args[0];
+                    if (stream) {
+                        return helpers_1.default.createStreamProxy(response, OpenAIWrapper._responsesGenerator({
+                            args,
+                            genAIEndpoint,
+                            response,
+                            span,
+                        }));
+                    }
+                    return OpenAIWrapper._responsesComplete({ args, genAIEndpoint, response, span });
+                })
+                    .catch((e) => {
+                    helpers_1.default.handleException(span, e);
+                    span.end();
+                });
+            };
+        };
+    }
+    static async _responsesComplete({ args, genAIEndpoint, response, span, }) {
+        let metricParams;
+        try {
+            metricParams = await OpenAIWrapper._responsesCommonSetter({
+                args,
+                genAIEndpoint,
+                result: response,
+                span,
+            });
+            return response;
+        }
+        catch (e) {
+            helpers_1.default.handleException(span, e);
+        }
+        finally {
+            span.end();
+            if (metricParams) {
+                base_wrapper_1.default.recordMetrics(span, metricParams);
+            }
+        }
+    }
+    static async *_responsesGenerator({ args, genAIEndpoint, response, span, }) {
+        let metricParams;
+        const timestamps = [];
+        const startTime = Date.now();
+        try {
+            const { input } = args[0];
+            const result = {
+                id: '',
+                model: '',
+                service_tier: 'default',
+                status: 'completed',
+                output: [],
+                usage: {
+                    input_tokens: 0,
+                    output_tokens: 0,
+                    output_tokens_details: {
+                        reasoning_tokens: 0,
+                    },
+                },
+            };
+            let llmResponse = '';
+            let responseTools = [];
+            for await (const chunk of response) {
+                timestamps.push(Date.now());
+                if (chunk.type === 'response.output_text.delta') {
+                    llmResponse += chunk.delta || '';
+                }
+                else if (chunk.type === 'response.output_item.added') {
+                    const item = chunk.item;
+                    if (item?.type === 'function_call') {
+                        responseTools.push({
+                            id: item.id,
+                            call_id: item.call_id,
+                            name: item.name,
+                            type: item.type,
+                            arguments: item.arguments || '',
+                            status: item.status,
+                        });
+                    }
+                }
+                else if (chunk.type === 'response.function_call_arguments.delta') {
+                    const itemId = chunk.item_id;
+                    const delta = chunk.delta || '';
+                    const tool = responseTools.find(t => t.id === itemId);
+                    if (tool) {
+                        tool.arguments += delta;
+                    }
+                }
+                else if (chunk.type === 'response.completed') {
+                    const responseData = chunk.response;
+                    result.id = responseData.id;
+                    result.model = responseData.model;
+                    result.status = responseData.status;
+                    const usage = responseData.usage || {};
+                    result.usage.input_tokens = usage.input_tokens || 0;
+                    result.usage.output_tokens = usage.output_tokens || 0;
+                    result.usage.output_tokens_details.reasoning_tokens =
+                        usage.output_tokens_details?.reasoning_tokens || 0;
+                }
+                yield chunk;
+            }
+            // Construct output array
+            if (llmResponse) {
+                result.output.push({
+                    type: 'message',
+                    content: [{ type: 'text', text: llmResponse }],
+                });
+            }
+            if (responseTools.length > 0) {
+                result.output.push(...responseTools);
+            }
+            // Calculate TTFT and TBT
+            const ttft = timestamps.length > 0 ? (timestamps[0] - startTime) / 1000 : 0;
+            let tbt = 0;
+            if (timestamps.length > 1) {
+                const timeDiffs = timestamps.slice(1).map((t, i) => t - timestamps[i]);
+                tbt = timeDiffs.reduce((a, b) => a + b, 0) / timeDiffs.length / 1000;
+            }
+            metricParams = await OpenAIWrapper._responsesCommonSetter({
+                args,
+                genAIEndpoint,
+                result,
+                span,
+                ttft,
+                tbt,
+            });
+            return result;
+        }
+        catch (e) {
+            helpers_1.default.handleException(span, e);
+        }
+        finally {
+            span.end();
+            if (metricParams) {
+                base_wrapper_1.default.recordMetrics(span, metricParams);
+            }
+        }
+    }
+    static async _responsesCommonSetter({ args, genAIEndpoint, result, span, ttft = 0, tbt = 0, }) {
+        const traceContent = config_1.default.traceContent;
+        const { input, temperature = 1.0, top_p = 1.0, max_output_tokens, reasoning, stream = false, } = args[0];
+        // Normalize Responses API input to messages array for buildInputMessages
+        const responsesMessages = typeof input === 'string'
+            ? [{ role: 'user', content: input }]
+            : (Array.isArray(input) ? input : []);
+        // Request Params attributes
+        span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_TEMPERATURE, temperature);
+        span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_TOP_P, top_p);
+        span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_MAX_TOKENS, max_output_tokens || -1);
+        span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_IS_STREAM, stream);
+        if (reasoning?.effort) {
+            span.setAttribute('gen_ai.request.reasoning_effort', reasoning.effort);
+        }
+        if (traceContent) {
+            span.setAttribute(semantic_convention_1.default.GEN_AI_INPUT_MESSAGES, helpers_1.default.buildInputMessages(responsesMessages));
+        }
+        span.setAttribute(semantic_convention_1.default.GEN_AI_OPERATION, semantic_convention_1.default.GEN_AI_OPERATION_TYPE_CHAT);
+        const model = result.model || 'gpt-4o';
+        const responseModel = result.model || model;
+        const pricingInfo = await config_1.default.updatePricingJson(config_1.default.pricing_json);
+        // Calculate cost
+        const inputTokens = result.usage?.input_tokens || 0;
+        const outputTokens = result.usage?.output_tokens || 0;
+        const cost = helpers_1.default.getChatModelCost(model, pricingInfo, inputTokens, outputTokens);
+        OpenAIWrapper.setBaseSpanAttributes(span, {
+            genAIEndpoint,
+            model,
+            user: '',
+            cost,
+            aiSystem: OpenAIWrapper.aiSystem,
+        });
+        // Response attributes
+        span.setAttribute(semantic_convention_1.default.GEN_AI_RESPONSE_ID, result.id);
+        span.setAttribute(semantic_convention_1.default.GEN_AI_RESPONSE_MODEL, responseModel);
+        span.setAttribute(semantic_convention_1.default.GEN_AI_RESPONSE_FINISH_REASON, [result.status || 'completed']);
+        span.setAttribute(semantic_convention_1.default.GEN_AI_OUTPUT_TYPE, semantic_convention_1.default.GEN_AI_OUTPUT_TYPE_TEXT);
+        if (result.service_tier) {
+            span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_SERVICE_TIER, result.service_tier);
+        }
+        // Token usage
+        span.setAttribute(semantic_convention_1.default.GEN_AI_USAGE_INPUT_TOKENS, inputTokens);
+        span.setAttribute(semantic_convention_1.default.GEN_AI_USAGE_OUTPUT_TOKENS, outputTokens);
+        span.setAttribute(semantic_convention_1.default.GEN_AI_USAGE_TOTAL_TOKENS, inputTokens + outputTokens);
+        span.setAttribute(semantic_convention_1.default.GEN_AI_CLIENT_TOKEN_USAGE, inputTokens + outputTokens);
+        // Reasoning tokens
+        if (result.usage?.output_tokens_details?.reasoning_tokens) {
+            span.setAttribute(semantic_convention_1.default.GEN_AI_USAGE_REASONING_TOKENS, result.usage.output_tokens_details.reasoning_tokens);
+        }
+        // TTFT and TBT metrics
+        if (ttft > 0) {
+            span.setAttribute(semantic_convention_1.default.GEN_AI_SERVER_TTFT, ttft);
+        }
+        if (tbt > 0) {
+            span.setAttribute(semantic_convention_1.default.GEN_AI_SERVER_TBT, tbt);
+        }
+        // Extract completion text from output
+        let completionText = '';
+        if (result.output && Array.isArray(result.output)) {
+            for (const item of result.output) {
+                if (item.type === 'message' && item.content) {
+                    for (const content of item.content) {
+                        if (content.type === 'text' || content.type === 'output_text') {
+                            completionText += content.text || '';
+                        }
+                    }
+                }
+            }
+        }
+        // Tool calls handling for Responses API
+        const toolCalls = result.tools || [];
+        if (toolCalls.length > 0) {
+            const toolNames = toolCalls.map((t) => t.name || '').filter(Boolean);
+            const toolIds = toolCalls.map((t) => t.call_id || '').filter(Boolean);
+            const toolArgs = toolCalls.map((t) => t.arguments || '').filter(Boolean);
+            const toolTypes = toolCalls.map((t) => t.type || '').filter(Boolean);
+            if (toolNames.length > 0) {
+                span.setAttribute(semantic_convention_1.default.GEN_AI_TOOL_NAME, toolNames.join(', '));
+            }
+            if (toolIds.length > 0) {
+                span.setAttribute(semantic_convention_1.default.GEN_AI_TOOL_CALL_ID, toolIds.join(', '));
+            }
+            if (toolArgs.length > 0) {
+                span.setAttribute(semantic_convention_1.default.GEN_AI_TOOL_CALL_ARGUMENTS, toolArgs.join(', '));
+            }
+            if (toolTypes.length > 0) {
+                span.setAttribute(semantic_convention_1.default.GEN_AI_TOOL_TYPE, toolTypes.join(', '));
+            }
+        }
+        // Content
+        if (traceContent) {
+            span.setAttribute(semantic_convention_1.default.GEN_AI_OUTPUT_MESSAGES, helpers_1.default.buildOutputMessages(completionText, result.status || 'stop'));
+        }
+        return {
+            genAIEndpoint,
+            model,
+            user: '',
+            cost,
+            aiSystem: OpenAIWrapper.aiSystem,
+        };
+    }
 }
 OpenAIWrapper.aiSystem = semantic_convention_1.default.GEN_AI_SYSTEM_OPENAI;
 exports.default = OpenAIWrapper;