npm - openlit - Versions diffs - 1.6.0 → 1.7.1 - Mend

openlit 1.6.0 → 1.7.1

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package contents as they appear in their respective public registries.

Files changed (50) hide show

package/README.md +19 -1
package/dist/helpers.js +8 -4
package/dist/helpers.js.map +1 -1
package/dist/index.d.ts +2 -2
package/dist/index.js +19 -6
package/dist/index.js.map +1 -1
package/dist/instrumentation/__tests__/anthropic-wrapper.test.d.ts +1 -0
package/dist/instrumentation/__tests__/anthropic-wrapper.test.js +92 -0
package/dist/instrumentation/__tests__/anthropic-wrapper.test.js.map +1 -0
package/dist/instrumentation/__tests__/base-wrapper.test.d.ts +1 -0
package/dist/instrumentation/__tests__/base-wrapper.test.js +175 -0
package/dist/instrumentation/__tests__/base-wrapper.test.js.map +1 -0
package/dist/instrumentation/__tests__/cohere-wrapper.test.d.ts +1 -0
package/dist/instrumentation/__tests__/cohere-wrapper.test.js +131 -0
package/dist/instrumentation/__tests__/cohere-wrapper.test.js.map +1 -0
package/dist/instrumentation/__tests__/openai-wrapper.test.d.ts +1 -0
package/dist/instrumentation/__tests__/openai-wrapper.test.js +181 -0
package/dist/instrumentation/__tests__/openai-wrapper.test.js.map +1 -0
package/dist/instrumentation/anthropic/wrapper.d.ts +7 -1
package/dist/instrumentation/anthropic/wrapper.js +16 -1
package/dist/instrumentation/anthropic/wrapper.js.map +1 -1
package/dist/instrumentation/base-wrapper.d.ts +3 -2
package/dist/instrumentation/base-wrapper.js +81 -1
package/dist/instrumentation/base-wrapper.js.map +1 -1
package/dist/instrumentation/cohere/wrapper.d.ts +7 -1
package/dist/instrumentation/cohere/wrapper.js +19 -2
package/dist/instrumentation/cohere/wrapper.js.map +1 -1
package/dist/instrumentation/ollama/wrapper.d.ts +2 -1
package/dist/instrumentation/ollama/wrapper.js +2 -2
package/dist/instrumentation/ollama/wrapper.js.map +1 -1
package/dist/instrumentation/openai/index.js +11 -0
package/dist/instrumentation/openai/index.js.map +1 -1
package/dist/instrumentation/openai/wrapper.d.ts +39 -3
package/dist/instrumentation/openai/wrapper.js +537 -26
package/dist/instrumentation/openai/wrapper.js.map +1 -1
package/dist/otel/__tests__/metrics.test.d.ts +1 -0
package/dist/otel/__tests__/metrics.test.js +51 -0
package/dist/otel/__tests__/metrics.test.js.map +1 -0
package/dist/otel/metrics.d.ts +22 -0
package/dist/otel/metrics.js +132 -0
package/dist/otel/metrics.js.map +1 -0
package/dist/{tracing.d.ts → otel/tracing.d.ts} +1 -1
package/dist/{tracing.js → otel/tracing.js} +17 -15
package/dist/otel/tracing.js.map +1 -0
package/dist/semantic-convention.d.ts +36 -0
package/dist/semantic-convention.js +53 -11
package/dist/semantic-convention.js.map +1 -1
package/dist/types.d.ts +7 -0
package/package.json +10 -11
package/dist/tracing.js.map +0 -1

package/dist/instrumentation/openai/wrapper.js CHANGED Viewed

@@ -20,7 +20,7 @@ class OpenAIWrapper extends base_wrapper_1.default {
                 })
                     .then((response) => {
                     const { stream = false } = args[0];
-                    if (!!stream) {
+                    if (stream) {
                         return helpers_1.default.createStreamProxy(response, OpenAIWrapper._chatCompletionGenerator({
                             args,
                             genAIEndpoint,
@@ -38,8 +38,9 @@ class OpenAIWrapper extends base_wrapper_1.default {
         };
     }
     static async _chatCompletion({ args, genAIEndpoint, response, span, }) {
+        let metricParams;
         try {
-            await OpenAIWrapper._chatCompletionCommonSetter({
+            metricParams = await OpenAIWrapper._chatCompletionCommonSetter({
                 args,
                 genAIEndpoint,
                 result: response,
@@ -52,9 +53,16 @@ class OpenAIWrapper extends base_wrapper_1.default {
         }
         finally {
             span.end();
+            // Record metrics after span has ended if parameters are available
+            if (metricParams) {
+                base_wrapper_1.default.recordMetrics(span, metricParams);
+            }
         }
     }
     static async *_chatCompletionGenerator({ args, genAIEndpoint, response, span, }) {
+        let metricParams;
+        const timestamps = [];
+        const startTime = Date.now();
         try {
             const { messages } = args[0];
             let { tools } = args[0];
@@ -62,6 +70,8 @@ class OpenAIWrapper extends base_wrapper_1.default {
                 id: '0',
                 created: -1,
                 model: '',
+                system_fingerprint: '',
+                service_tier: 'auto',
                 choices: [
                     {
                         index: 0,
@@ -74,12 +84,28 @@ class OpenAIWrapper extends base_wrapper_1.default {
                     prompt_tokens: 0,
                     completion_tokens: 0,
                     total_tokens: 0,
+                    completion_tokens_details: {
+                        reasoning_tokens: 0,
+                        audio_tokens: 0,
+                    },
+                    prompt_tokens_details: {
+                        cached_tokens: 0,
+                        audio_tokens: 0,
+                    },
                 },
             };
+            let toolCalls = [];
             for await (const chunk of response) {
+                timestamps.push(Date.now());
                 result.id = chunk.id;
                 result.created = chunk.created;
                 result.model = chunk.model;
+                if (chunk.system_fingerprint) {
+                    result.system_fingerprint = chunk.system_fingerprint;
+                }
+                if (chunk.service_tier) {
+                    result.service_tier = chunk.service_tier;
+                }
                 if (chunk.choices[0]?.finish_reason) {
                     result.choices[0].finish_reason = chunk.choices[0].finish_reason;
                 }
@@ -89,11 +115,45 @@ class OpenAIWrapper extends base_wrapper_1.default {
                 if (chunk.choices[0]?.delta.content) {
                     result.choices[0].message.content += chunk.choices[0].delta.content;
                 }
+                // Improved tool calls handling for streaming
                 if (chunk.choices[0]?.delta.tool_calls) {
+                    const deltaTools = chunk.choices[0].delta.tool_calls;
+                    for (const tool of deltaTools) {
+                        const idx = tool.index || 0;
+                        // Extend array if needed
+                        while (toolCalls.length <= idx) {
+                            toolCalls.push({
+                                id: '',
+                                type: 'function',
+                                function: { name: '', arguments: '' }
+                            });
+                        }
+                        if (tool.id) {
+                            // New tool call
+                            toolCalls[idx].id = tool.id;
+                            toolCalls[idx].type = tool.type || 'function';
+                            if (tool.function?.name) {
+                                toolCalls[idx].function.name = tool.function.name;
+                            }
+                            if (tool.function?.arguments) {
+                                toolCalls[idx].function.arguments = tool.function.arguments;
+                            }
+                        }
+                        else if (tool.function?.arguments) {
+                            // Append arguments to existing tool call
+                            toolCalls[idx].function.arguments += tool.function.arguments;
+                        }
+                    }
                     tools = true;
                 }
                 yield chunk;
             }
+            if (toolCalls.length > 0) {
+                result.choices[0].message = {
+                    ...result.choices[0].message,
+                    tool_calls: toolCalls
+                };
+            }
             let promptTokens = 0;
             for (const message of messages || []) {
                 promptTokens += helpers_1.default.openaiTokens(message.content, result.model) ?? 0;
@@ -104,14 +164,25 @@ class OpenAIWrapper extends base_wrapper_1.default {
                     prompt_tokens: promptTokens,
                     completion_tokens: completionTokens,
                     total_tokens: promptTokens + completionTokens,
+                    completion_tokens_details: result.usage.completion_tokens_details,
+                    prompt_tokens_details: result.usage.prompt_tokens_details,
                 };
             }
             args[0].tools = tools;
-            await OpenAIWrapper._chatCompletionCommonSetter({
+            // Calculate TTFT and TBT
+            const ttft = timestamps.length > 0 ? (timestamps[0] - startTime) / 1000 : 0;
+            let tbt = 0;
+            if (timestamps.length > 1) {
+                const timeDiffs = timestamps.slice(1).map((t, i) => t - timestamps[i]);
+                tbt = timeDiffs.reduce((a, b) => a + b, 0) / timeDiffs.length / 1000;
+            }
+            metricParams = await OpenAIWrapper._chatCompletionCommonSetter({
                 args,
                 genAIEndpoint,
                 result,
                 span,
+                ttft,
+                tbt,
             });
             return result;
         }
@@ -120,19 +191,29 @@ class OpenAIWrapper extends base_wrapper_1.default {
         }
         finally {
             span.end();
+            // Record metrics after span has ended if parameters are available
+            if (metricParams) {
+                base_wrapper_1.default.recordMetrics(span, metricParams);
+            }
         }
     }
-    static async _chatCompletionCommonSetter({ args, genAIEndpoint, result, span, }) {
+    static async _chatCompletionCommonSetter({ args, genAIEndpoint, result, span, ttft = 0, tbt = 0, }) {
         const traceContent = config_1.default.traceContent;
-        const { messages, frequency_penalty = 0, max_tokens = null, n = 1, presence_penalty = 0, seed = null, temperature = 1, top_p, user, stream = false, tools, } = args[0];
+        const { messages, frequency_penalty = 0, max_tokens = null, n = 1, presence_penalty = 0, seed = null, stop = null, temperature = 1, top_p, user, stream = false, tools, } = args[0];
         // Request Params attributes : Start
         span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_TOP_P, top_p || 1);
-        span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_MAX_TOKENS, max_tokens);
+        span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_MAX_TOKENS, max_tokens || -1);
         span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_TEMPERATURE, temperature);
         span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_PRESENCE_PENALTY, presence_penalty);
         span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_FREQUENCY_PENALTY, frequency_penalty);
-        span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_SEED, seed);
+        span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_SEED, seed ? String(seed) : '');
         span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_IS_STREAM, stream);
+        if (stop) {
+            span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_STOP_SEQUENCES, Array.isArray(stop) ? stop : [stop]);
+        }
+        if (user) {
+            span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_USER, user);
+        }
         if (traceContent) {
             // Format 'messages' into a single string
             const messagePrompt = messages || [];
@@ -164,6 +245,7 @@ class OpenAIWrapper extends base_wrapper_1.default {
         span.setAttribute(semantic_convention_1.default.GEN_AI_OPERATION, semantic_convention_1.default.GEN_AI_OPERATION_TYPE_CHAT);
         span.setAttribute(semantic_convention_1.default.GEN_AI_RESPONSE_ID, result.id);
         const model = result.model || 'gpt-3.5-turbo';
+        const responseModel = result.model || model;
         const pricingInfo = await config_1.default.updatePricingJson(config_1.default.pricing_json);
         // Calculate cost of the operation
         const cost = helpers_1.default.getChatModelCost(model, pricingInfo, result.usage.prompt_tokens, result.usage.completion_tokens);
@@ -174,30 +256,101 @@ class OpenAIWrapper extends base_wrapper_1.default {
             cost,
             aiSystem: OpenAIWrapper.aiSystem,
         });
+        // Response model
+        span.setAttribute(semantic_convention_1.default.GEN_AI_RESPONSE_MODEL, responseModel);
+        // OpenAI-specific attributes
+        if (result.system_fingerprint) {
+            span.setAttribute(semantic_convention_1.default.GEN_AI_RESPONSE_SYSTEM_FINGERPRINT, result.system_fingerprint);
+        }
+        if (result.service_tier) {
+            span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_SERVICE_TIER, result.service_tier);
+        }
+        // Token usage
         span.setAttribute(semantic_convention_1.default.GEN_AI_USAGE_INPUT_TOKENS, result.usage.prompt_tokens);
         span.setAttribute(semantic_convention_1.default.GEN_AI_USAGE_OUTPUT_TOKENS, result.usage.completion_tokens);
         span.setAttribute(semantic_convention_1.default.GEN_AI_USAGE_TOTAL_TOKENS, result.usage.total_tokens);
+        span.setAttribute(semantic_convention_1.default.GEN_AI_CLIENT_TOKEN_USAGE, result.usage.total_tokens);
+        // Enhanced token details
+        if (result.usage.completion_tokens_details) {
+            if (result.usage.completion_tokens_details.reasoning_tokens) {
+                span.setAttribute(semantic_convention_1.default.GEN_AI_USAGE_REASONING_TOKENS, result.usage.completion_tokens_details.reasoning_tokens);
+                span.setAttribute(semantic_convention_1.default.GEN_AI_USAGE_COMPLETION_TOKENS_DETAILS_REASONING, result.usage.completion_tokens_details.reasoning_tokens);
+            }
+            if (result.usage.completion_tokens_details.audio_tokens) {
+                span.setAttribute(semantic_convention_1.default.GEN_AI_USAGE_COMPLETION_TOKENS_DETAILS_AUDIO, result.usage.completion_tokens_details.audio_tokens);
+            }
+        }
+        if (result.usage.prompt_tokens_details) {
+            if (result.usage.prompt_tokens_details.cached_tokens) {
+                span.setAttribute(semantic_convention_1.default.GEN_AI_USAGE_PROMPT_TOKENS_DETAILS_CACHE_READ, result.usage.prompt_tokens_details.cached_tokens);
+            }
+            if (result.usage.prompt_tokens_details.audio_tokens) {
+                span.setAttribute(semantic_convention_1.default.GEN_AI_USAGE_PROMPT_TOKENS_DETAILS_CACHE_WRITE, result.usage.prompt_tokens_details.audio_tokens);
+            }
+        }
+        // TTFT and TBT metrics
+        if (ttft > 0) {
+            span.setAttribute(semantic_convention_1.default.GEN_AI_SERVER_TTFT, ttft);
+        }
+        if (tbt > 0) {
+            span.setAttribute(semantic_convention_1.default.GEN_AI_SERVER_TBT, tbt);
+        }
+        // Finish reason
         if (result.choices[0].finish_reason) {
-            span.setAttribute(semantic_convention_1.default.GEN_AI_RESPONSE_FINISH_REASON, result.choices[0].finish_reason);
+            span.setAttribute(semantic_convention_1.default.GEN_AI_RESPONSE_FINISH_REASON, [result.choices[0].finish_reason]);
         }
-        if (tools) {
-            span.setAttribute(semantic_convention_1.default.GEN_AI_CONTENT_COMPLETION, 'Function called with tools');
+        // Output type
+        const outputType = typeof result.choices[0].message.content === 'string'
+            ? semantic_convention_1.default.GEN_AI_OUTPUT_TYPE_TEXT
+            : semantic_convention_1.default.GEN_AI_OUTPUT_TYPE_JSON;
+        span.setAttribute(semantic_convention_1.default.GEN_AI_OUTPUT_TYPE, outputType);
+        // Tool calls handling
+        if (result.choices[0].message.tool_calls) {
+            const toolCalls = result.choices[0].message.tool_calls;
+            const toolNames = toolCalls.map((t) => t.function?.name || '').filter(Boolean);
+            const toolIds = toolCalls.map((t) => t.id || '').filter(Boolean);
+            const toolArgs = toolCalls.map((t) => t.function?.arguments || '').filter(Boolean);
+            const toolTypes = toolCalls.map((t) => t.type || '').filter(Boolean);
+            if (toolNames.length > 0) {
+                span.setAttribute(semantic_convention_1.default.GEN_AI_TOOL_NAME, toolNames.join(', '));
+            }
+            if (toolIds.length > 0) {
+                span.setAttribute(semantic_convention_1.default.GEN_AI_TOOL_CALL_ID, toolIds.join(', '));
+            }
+            if (toolArgs.length > 0) {
+                span.setAttribute(semantic_convention_1.default.GEN_AI_TOOL_CALL_ARGUMENTS, toolArgs);
+            }
+            if (toolTypes.length > 0) {
+                span.setAttribute(semantic_convention_1.default.GEN_AI_TOOL_TYPE, toolTypes.join(', '));
+            }
         }
-        else {
-            if (traceContent) {
-                if (n === 1) {
-                    span.setAttribute(semantic_convention_1.default.GEN_AI_CONTENT_COMPLETION, result.choices[0].message.content);
-                }
-                else {
-                    let i = 0;
-                    while (i < n) {
-                        const attribute_name = `${semantic_convention_1.default.GEN_AI_CONTENT_COMPLETION}.[i]`;
-                        span.setAttribute(attribute_name, result.choices[i].message.content);
-                        i += 1;
-                    }
+        // Content
+        if (traceContent) {
+            // Format completion content - use actual content or empty string if only tool calls
+            const completionContent = result.choices[0].message.content || '';
+            if (n === 1) {
+                span.setAttribute(semantic_convention_1.default.GEN_AI_CONTENT_COMPLETION, completionContent);
+            }
+            else {
+                let i = 0;
+                while (i < n) {
+                    const attribute_name = `${semantic_convention_1.default.GEN_AI_CONTENT_COMPLETION}.${i}`;
+                    span.setAttribute(attribute_name, result.choices[i].message.content || '');
+                    i += 1;
                 }
             }
+            // Add events for backward compatibility
+            span.addEvent(semantic_convention_1.default.GEN_AI_CONTENT_COMPLETION_EVENT, {
+                [semantic_convention_1.default.GEN_AI_CONTENT_COMPLETION]: completionContent,
+            });
         }
+        return {
+            genAIEndpoint,
+            model,
+            user,
+            cost,
+            aiSystem: OpenAIWrapper.aiSystem,
+        };
     }
     static _patchEmbedding(tracer) {
         const genAIEndpoint = 'openai.resources.embeddings';
@@ -206,6 +359,7 @@ class OpenAIWrapper extends base_wrapper_1.default {
             return async function (...args) {
                 const span = tracer.startSpan(genAIEndpoint, { kind: api_1.SpanKind.CLIENT });
                 return api_1.context.with(api_1.trace.setSpan(api_1.context.active(), span), async () => {
+                    let metricParams;
                     try {
                         const response = await originalMethod.apply(this, args);
                         const model = response.model || 'text-embedding-ada-002';
@@ -213,7 +367,7 @@ class OpenAIWrapper extends base_wrapper_1.default {
                         const cost = helpers_1.default.getEmbedModelCost(model, pricingInfo, response.usage.prompt_tokens);
                         span.setAttribute(semantic_convention_1.default.GEN_AI_OPERATION, semantic_convention_1.default.GEN_AI_OPERATION_TYPE_EMBEDDING);
                         const { dimensions, encoding_format = 'float', input, user } = args[0];
-                        // Set base span attribues
+                        // Set base span attributes
                         OpenAIWrapper.setBaseSpanAttributes(span, {
                             genAIEndpoint,
                             model,
@@ -221,22 +375,47 @@ class OpenAIWrapper extends base_wrapper_1.default {
                             cost,
                             aiSystem: OpenAIWrapper.aiSystem,
                         });
+                        // Set missing critical attributes to match Python SDK
+                        span.setAttribute(semantic_convention_1.default.SERVER_ADDRESS, 'api.openai.com');
+                        span.setAttribute(semantic_convention_1.default.SERVER_PORT, 443);
+                        span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_IS_STREAM, false);
+                        span.setAttribute(semantic_convention_1.default.GEN_AI_SERVER_TBT, 0);
+                        span.setAttribute(semantic_convention_1.default.GEN_AI_SERVER_TTFT, 0);
+                        span.setAttribute(semantic_convention_1.default.GEN_AI_SDK_VERSION, '1.7.0');
                         // Request Params attributes : Start
-                        span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_ENCODING_FORMATS, encoding_format);
-                        span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_EMBEDDING_DIMENSION, dimensions);
+                        span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_ENCODING_FORMATS, [encoding_format]);
+                        if (dimensions) {
+                            span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_EMBEDDING_DIMENSION, dimensions);
+                        }
+                        if (user) {
+                            span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_USER, user);
+                        }
                         if (traceContent) {
-                            span.setAttribute(semantic_convention_1.default.GEN_AI_CONTENT_PROMPT, input);
+                            const formattedInput = typeof input === 'string' ? input : JSON.stringify(input);
+                            span.setAttribute(semantic_convention_1.default.GEN_AI_CONTENT_PROMPT, formattedInput);
                         }
                         // Request Params attributes : End
                         span.setAttribute(semantic_convention_1.default.GEN_AI_USAGE_INPUT_TOKENS, response.usage.prompt_tokens);
                         span.setAttribute(semantic_convention_1.default.GEN_AI_USAGE_TOTAL_TOKENS, response.usage.total_tokens);
+                        span.setAttribute(semantic_convention_1.default.GEN_AI_CLIENT_TOKEN_USAGE, response.usage.prompt_tokens);
+                        metricParams = {
+                            genAIEndpoint,
+                            model,
+                            user,
+                            cost,
+                            aiSystem: OpenAIWrapper.aiSystem,
+                        };
                         return response;
                     }
                     catch (e) {
                         helpers_1.default.handleException(span, e);
+                        throw e;
                     }
                     finally {
                         span.end();
+                        if (metricParams) {
+                            base_wrapper_1.default.recordMetrics(span, metricParams);
+                        }
                     }
                 });
             };
@@ -248,6 +427,7 @@ class OpenAIWrapper extends base_wrapper_1.default {
             return async function (...args) {
                 const span = tracer.startSpan(genAIEndpoint, { kind: api_1.SpanKind.CLIENT });
                 return api_1.context.with(api_1.trace.setSpan(api_1.context.active(), span), async () => {
+                    let metricParams;
                     try {
                         const response = await originalMethod.apply(this, args);
                         const model = response.model || 'gpt-3.5-turbo';
@@ -271,6 +451,13 @@ class OpenAIWrapper extends base_wrapper_1.default {
                         span.setAttribute(semantic_convention_1.default.GEN_AI_RESPONSE_ID, response.id);
                         span.setAttribute(semantic_convention_1.default.GEN_AI_USAGE_INPUT_TOKENS, response.usage.prompt_tokens);
                         span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_FINETUNE_STATUS, response.status);
+                        // Store metric parameters for use after span ends
+                        metricParams = {
+                            genAIEndpoint,
+                            model,
+                            user,
+                            aiSystem: OpenAIWrapper.aiSystem,
+                        };
                         return response;
                     }
                     catch (e) {
@@ -278,6 +465,10 @@ class OpenAIWrapper extends base_wrapper_1.default {
                     }
                     finally {
                         span.end();
+                        // Record metrics after span has ended if parameters are available
+                        if (metricParams) {
+                            base_wrapper_1.default.recordMetrics(span, metricParams);
+                        }
                     }
                 });
             };
@@ -290,6 +481,7 @@ class OpenAIWrapper extends base_wrapper_1.default {
             return async function (...args) {
                 const span = tracer.startSpan(genAIEndpoint, { kind: api_1.SpanKind.CLIENT });
                 return api_1.context.with(api_1.trace.setSpan(api_1.context.active(), span), async () => {
+                    let metricParams;
                     try {
                         const response = await originalMethod.apply(this, args);
                         const { prompt, quality = 'standard', response_format = 'url', size = '1024x1024', style = 'vivid', user, } = args[0];
@@ -323,6 +515,14 @@ class OpenAIWrapper extends base_wrapper_1.default {
                                 imagesCount++;
                             }
                         }
+                        // Store metric parameters for use after span ends
+                        metricParams = {
+                            genAIEndpoint,
+                            model,
+                            user,
+                            cost,
+                            aiSystem: OpenAIWrapper.aiSystem,
+                        };
                         return response;
                     }
                     catch (e) {
@@ -330,6 +530,10 @@ class OpenAIWrapper extends base_wrapper_1.default {
                     }
                     finally {
                         span.end();
+                        // Record metrics after span has ended if parameters are available
+                        if (metricParams) {
+                            base_wrapper_1.default.recordMetrics(span, metricParams);
+                        }
                     }
                 });
             };
@@ -342,6 +546,7 @@ class OpenAIWrapper extends base_wrapper_1.default {
             return async function (...args) {
                 const span = tracer.startSpan(genAIEndpoint, { kind: api_1.SpanKind.CLIENT });
                 return api_1.context.with(api_1.trace.setSpan(api_1.context.active(), span), async () => {
+                    let metricParams;
                     try {
                         const response = await originalMethod.apply(this, args);
                         const { prompt, quality = 'standard', response_format = 'url', size = '1024x1024', style = 'vivid', user, } = args[0];
@@ -376,6 +581,14 @@ class OpenAIWrapper extends base_wrapper_1.default {
                                 imagesCount++;
                             }
                         }
+                        // Store metric parameters for use after span ends
+                        metricParams = {
+                            genAIEndpoint,
+                            model,
+                            user,
+                            cost,
+                            aiSystem: OpenAIWrapper.aiSystem,
+                        };
                         return response;
                     }
                     catch (e) {
@@ -383,6 +596,10 @@ class OpenAIWrapper extends base_wrapper_1.default {
                     }
                     finally {
                         span.end();
+                        // Record metrics after span has ended if parameters are available
+                        if (metricParams) {
+                            base_wrapper_1.default.recordMetrics(span, metricParams);
+                        }
                     }
                 });
             };
@@ -395,6 +612,7 @@ class OpenAIWrapper extends base_wrapper_1.default {
             return async function (...args) {
                 const span = tracer.startSpan(genAIEndpoint, { kind: api_1.SpanKind.CLIENT });
                 return api_1.context.with(api_1.trace.setSpan(api_1.context.active(), span), async () => {
+                    let metricParams;
                     try {
                         const response = await originalMethod.apply(this, args);
                         const { input, user, voice, response_format = 'mp3', speed = 1 } = args[0];
@@ -418,6 +636,14 @@ class OpenAIWrapper extends base_wrapper_1.default {
                             span.setAttribute(semantic_convention_1.default.GEN_AI_CONTENT_PROMPT, input);
                         }
                         // Request Params attributes : End
+                        // Store metric parameters for use after span ends
+                        metricParams = {
+                            genAIEndpoint,
+                            model,
+                            user,
+                            cost,
+                            aiSystem: OpenAIWrapper.aiSystem,
+                        };
                         return response;
                     }
                     catch (e) {
@@ -425,11 +651,296 @@ class OpenAIWrapper extends base_wrapper_1.default {
                     }
                     finally {
                         span.end();
+                        // Record metrics after span has ended if parameters are available
+                        if (metricParams) {
+                            base_wrapper_1.default.recordMetrics(span, metricParams);
+                        }
                     }
                 });
             };
         };
     }
+    static _patchResponsesCreate(tracer) {
+        const genAIEndpoint = 'openai.resources.responses';
+        return (originalMethod) => {
+            return async function (...args) {
+                const span = tracer.startSpan(genAIEndpoint, { kind: api_1.SpanKind.CLIENT });
+                return api_1.context
+                    .with(api_1.trace.setSpan(api_1.context.active(), span), async () => {
+                    return originalMethod.apply(this, args);
+                })
+                    .then((response) => {
+                    const { stream = false } = args[0];
+                    if (stream) {
+                        return helpers_1.default.createStreamProxy(response, OpenAIWrapper._responsesGenerator({
+                            args,
+                            genAIEndpoint,
+                            response,
+                            span,
+                        }));
+                    }
+                    return OpenAIWrapper._responsesComplete({ args, genAIEndpoint, response, span });
+                })
+                    .catch((e) => {
+                    helpers_1.default.handleException(span, e);
+                    span.end();
+                });
+            };
+        };
+    }
+    static async _responsesComplete({ args, genAIEndpoint, response, span, }) {
+        let metricParams;
+        try {
+            metricParams = await OpenAIWrapper._responsesCommonSetter({
+                args,
+                genAIEndpoint,
+                result: response,
+                span,
+            });
+            return response;
+        }
+        catch (e) {
+            helpers_1.default.handleException(span, e);
+        }
+        finally {
+            span.end();
+            if (metricParams) {
+                base_wrapper_1.default.recordMetrics(span, metricParams);
+            }
+        }
+    }
+    static async *_responsesGenerator({ args, genAIEndpoint, response, span, }) {
+        let metricParams;
+        const timestamps = [];
+        const startTime = Date.now();
+        try {
+            const { input } = args[0];
+            const result = {
+                id: '',
+                model: '',
+                service_tier: 'default',
+                status: 'completed',
+                output: [],
+                usage: {
+                    input_tokens: 0,
+                    output_tokens: 0,
+                    output_tokens_details: {
+                        reasoning_tokens: 0,
+                    },
+                },
+            };
+            let llmResponse = '';
+            let responseTools = [];
+            for await (const chunk of response) {
+                timestamps.push(Date.now());
+                if (chunk.type === 'response.output_text.delta') {
+                    llmResponse += chunk.delta || '';
+                }
+                else if (chunk.type === 'response.output_item.added') {
+                    const item = chunk.item;
+                    if (item?.type === 'function_call') {
+                        responseTools.push({
+                            id: item.id,
+                            call_id: item.call_id,
+                            name: item.name,
+                            type: item.type,
+                            arguments: item.arguments || '',
+                            status: item.status,
+                        });
+                    }
+                }
+                else if (chunk.type === 'response.function_call_arguments.delta') {
+                    const itemId = chunk.item_id;
+                    const delta = chunk.delta || '';
+                    const tool = responseTools.find(t => t.id === itemId);
+                    if (tool) {
+                        tool.arguments += delta;
+                    }
+                }
+                else if (chunk.type === 'response.completed') {
+                    const responseData = chunk.response;
+                    result.id = responseData.id;
+                    result.model = responseData.model;
+                    result.status = responseData.status;
+                    const usage = responseData.usage || {};
+                    result.usage.input_tokens = usage.input_tokens || 0;
+                    result.usage.output_tokens = usage.output_tokens || 0;
+                    result.usage.output_tokens_details.reasoning_tokens =
+                        usage.output_tokens_details?.reasoning_tokens || 0;
+                }
+                yield chunk;
+            }
+            // Construct output array
+            if (llmResponse) {
+                result.output.push({
+                    type: 'message',
+                    content: [{ type: 'text', text: llmResponse }],
+                });
+            }
+            if (responseTools.length > 0) {
+                result.output.push(...responseTools);
+            }
+            // Calculate TTFT and TBT
+            const ttft = timestamps.length > 0 ? (timestamps[0] - startTime) / 1000 : 0;
+            let tbt = 0;
+            if (timestamps.length > 1) {
+                const timeDiffs = timestamps.slice(1).map((t, i) => t - timestamps[i]);
+                tbt = timeDiffs.reduce((a, b) => a + b, 0) / timeDiffs.length / 1000;
+            }
+            metricParams = await OpenAIWrapper._responsesCommonSetter({
+                args,
+                genAIEndpoint,
+                result,
+                span,
+                ttft,
+                tbt,
+            });
+            return result;
+        }
+        catch (e) {
+            helpers_1.default.handleException(span, e);
+        }
+        finally {
+            span.end();
+            if (metricParams) {
+                base_wrapper_1.default.recordMetrics(span, metricParams);
+            }
+        }
+    }
+    static async _responsesCommonSetter({ args, genAIEndpoint, result, span, ttft = 0, tbt = 0, }) {
+        const traceContent = config_1.default.traceContent;
+        const { input, temperature = 1.0, top_p = 1.0, max_output_tokens, reasoning, stream = false, } = args[0];
+        // Format input for prompt
+        let prompt = '';
+        if (typeof input === 'string') {
+            prompt = input;
+        }
+        else if (Array.isArray(input)) {
+            const formattedMessages = [];
+            for (const item of input) {
+                const role = item.role || 'user';
+                const content = item.content;
+                if (typeof content === 'string') {
+                    formattedMessages.push(`${role}: ${content}`);
+                }
+                else if (Array.isArray(content)) {
+                    const contentParts = content
+                        .map((part) => {
+                        if (part.type === 'input_text') {
+                            return `text: ${part.text || ''}`;
+                        }
+                        else if (part.type === 'input_image' && part.image_url && !part.image_url.startsWith('data:')) {
+                            return `image_url: ${part.image_url}`;
+                        }
+                        return '';
+                    })
+                        .filter(Boolean)
+                        .join(', ');
+                    formattedMessages.push(`${role}: ${contentParts}`);
+                }
+            }
+            prompt = formattedMessages.join('\n');
+        }
+        // Request Params attributes
+        span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_TEMPERATURE, temperature);
+        span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_TOP_P, top_p);
+        span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_MAX_TOKENS, max_output_tokens || -1);
+        span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_IS_STREAM, stream);
+        if (reasoning?.effort) {
+            span.setAttribute('gen_ai.request.reasoning_effort', reasoning.effort);
+        }
+        if (traceContent) {
+            span.setAttribute(semantic_convention_1.default.GEN_AI_CONTENT_PROMPT, prompt);
+        }
+        span.setAttribute(semantic_convention_1.default.GEN_AI_OPERATION, semantic_convention_1.default.GEN_AI_OPERATION_TYPE_CHAT);
+        const model = result.model || 'gpt-4o';
+        const responseModel = result.model || model;
+        const pricingInfo = await config_1.default.updatePricingJson(config_1.default.pricing_json);
+        // Calculate cost
+        const inputTokens = result.usage?.input_tokens || 0;
+        const outputTokens = result.usage?.output_tokens || 0;
+        const cost = helpers_1.default.getChatModelCost(model, pricingInfo, inputTokens, outputTokens);
+        OpenAIWrapper.setBaseSpanAttributes(span, {
+            genAIEndpoint,
+            model,
+            user: '',
+            cost,
+            aiSystem: OpenAIWrapper.aiSystem,
+        });
+        // Response attributes
+        span.setAttribute(semantic_convention_1.default.GEN_AI_RESPONSE_ID, result.id);
+        span.setAttribute(semantic_convention_1.default.GEN_AI_RESPONSE_MODEL, responseModel);
+        span.setAttribute(semantic_convention_1.default.GEN_AI_RESPONSE_FINISH_REASON, [result.status || 'completed']);
+        span.setAttribute(semantic_convention_1.default.GEN_AI_OUTPUT_TYPE, semantic_convention_1.default.GEN_AI_OUTPUT_TYPE_TEXT);
+        if (result.service_tier) {
+            span.setAttribute(semantic_convention_1.default.GEN_AI_REQUEST_SERVICE_TIER, result.service_tier);
+        }
+        // Token usage
+        span.setAttribute(semantic_convention_1.default.GEN_AI_USAGE_INPUT_TOKENS, inputTokens);
+        span.setAttribute(semantic_convention_1.default.GEN_AI_USAGE_OUTPUT_TOKENS, outputTokens);
+        span.setAttribute(semantic_convention_1.default.GEN_AI_USAGE_TOTAL_TOKENS, inputTokens + outputTokens);
+        span.setAttribute(semantic_convention_1.default.GEN_AI_CLIENT_TOKEN_USAGE, inputTokens + outputTokens);
+        // Reasoning tokens
+        if (result.usage?.output_tokens_details?.reasoning_tokens) {
+            span.setAttribute(semantic_convention_1.default.GEN_AI_USAGE_REASONING_TOKENS, result.usage.output_tokens_details.reasoning_tokens);
+        }
+        // TTFT and TBT metrics
+        if (ttft > 0) {
+            span.setAttribute(semantic_convention_1.default.GEN_AI_SERVER_TTFT, ttft);
+        }
+        if (tbt > 0) {
+            span.setAttribute(semantic_convention_1.default.GEN_AI_SERVER_TBT, tbt);
+        }
+        // Extract completion text from output
+        let completionText = '';
+        if (result.output && Array.isArray(result.output)) {
+            for (const item of result.output) {
+                if (item.type === 'message' && item.content) {
+                    for (const content of item.content) {
+                        if (content.type === 'text' || content.type === 'output_text') {
+                            completionText += content.text || '';
+                        }
+                    }
+                }
+            }
+        }
+        // Tool calls handling for Responses API
+        const toolCalls = result.tools || [];
+        if (toolCalls.length > 0) {
+            const toolNames = toolCalls.map((t) => t.name || '').filter(Boolean);
+            const toolIds = toolCalls.map((t) => t.call_id || '').filter(Boolean);
+            const toolArgs = toolCalls.map((t) => t.arguments || '').filter(Boolean);
+            const toolTypes = toolCalls.map((t) => t.type || '').filter(Boolean);
+            if (toolNames.length > 0) {
+                span.setAttribute(semantic_convention_1.default.GEN_AI_TOOL_NAME, toolNames.join(', '));
+            }
+            if (toolIds.length > 0) {
+                span.setAttribute(semantic_convention_1.default.GEN_AI_TOOL_CALL_ID, toolIds.join(', '));
+            }
+            if (toolArgs.length > 0) {
+                span.setAttribute(semantic_convention_1.default.GEN_AI_TOOL_CALL_ARGUMENTS, toolArgs.join(', '));
+            }
+            if (toolTypes.length > 0) {
+                span.setAttribute(semantic_convention_1.default.GEN_AI_TOOL_TYPE, toolTypes.join(', '));
+            }
+        }
+        // Content
+        if (traceContent) {
+            // Set completion content - use actual text or empty string if only tool calls
+            span.setAttribute(semantic_convention_1.default.GEN_AI_CONTENT_COMPLETION, completionText);
+            // Add events for backward compatibility
+            span.addEvent(semantic_convention_1.default.GEN_AI_CONTENT_COMPLETION_EVENT, {
+                [semantic_convention_1.default.GEN_AI_CONTENT_COMPLETION]: completionText,
+            });
+        }
+        return {
+            genAIEndpoint,
+            model,
+            user: '',
+            cost,
+            aiSystem: OpenAIWrapper.aiSystem,
+        };
+    }
 }
 // Static provider identifier; the wrapper methods read it as
 // `OpenAIWrapper.aiSystem` when building span and metric parameters.
 OpenAIWrapper.aiSystem = semantic_convention_1.default.GEN_AI_SYSTEM_OPENAI;
 // Expose the wrapper class as this module's `default` export.
 exports.default = OpenAIWrapper;