@posthog/ai 3.2.1 → 3.3.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/CHANGELOG.md +6 -0
- package/lib/index.cjs.js +118 -18
- package/lib/index.cjs.js.map +1 -1
- package/lib/index.esm.js +118 -18
- package/lib/index.esm.js.map +1 -1
- package/lib/posthog-ai/src/utils.d.ts +5 -1
- package/package.json +1 -1
- package/src/anthropic/index.ts +12 -1
- package/src/langchain/callbacks.ts +6 -0
- package/src/openai/azure.ts +10 -1
- package/src/openai/index.ts +13 -2
- package/src/utils.ts +17 -1
- package/src/vercel/middleware.ts +93 -15
- package/tests/openai.test.ts +36 -0
package/lib/posthog-ai/src/utils.d.ts
CHANGED

@@ -49,10 +49,14 @@ export type SendEventToPosthogParams = {
     usage?: {
         inputTokens?: number;
         outputTokens?: number;
+        reasoningTokens?: any;
+        cacheReadInputTokens?: any;
+        cacheCreationInputTokens?: any;
     };
     params: (ChatCompletionCreateParamsBase | MessageCreateParams) & MonitoringParams;
     isError?: boolean;
     error?: string;
+    tools?: any;
 };
-export declare const sendEventToPosthog: ({ client, distinctId, traceId, model, provider, input, output, latency, baseURL, params, httpStatus, usage, isError, error, }: SendEventToPosthogParams) => void;
+export declare const sendEventToPosthog: ({ client, distinctId, traceId, model, provider, input, output, latency, baseURL, params, httpStatus, usage, isError, error, tools, }: SendEventToPosthogParams) => void;
 export {};
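
Note: for orientation, a caller-side sketch of the widened signature. Everything below (the client setup, IDs, token counts, and the relative import path) is illustrative rather than part of this diff, and input, output, and params are shown loosely typed because only the destructured names are visible here.

import { PostHog } from 'posthog-node'
import { sendEventToPosthog } from './utils' // internal module per src/utils.ts; path assumed

const phClient = new PostHog('<project api key>') // hypothetical client

sendEventToPosthog({
  client: phClient,
  distinctId: 'user-123',
  traceId: 'trace-abc',
  model: 'gpt-4o',
  provider: 'openai',
  input: [{ role: 'user', content: 'Hello' }],
  output: [{ role: 'assistant', content: 'Hi!' }],
  latency: 0.42,
  baseURL: 'https://api.openai.com/v1',
  params: { model: 'gpt-4o', messages: [] } as any, // sketch only
  httpStatus: 200,
  usage: {
    inputTokens: 20,
    outputTokens: 10,
    reasoningTokens: 15, // new in 3.3.0
    cacheReadInputTokens: 5, // new in 3.3.0
    cacheCreationInputTokens: 0, // new in 3.3.0
  },
  tools: [{ type: 'function', function: { name: 'get_weather' } }], // new in 3.3.0
})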
package/package.json
CHANGED
package/src/anthropic/index.ts
CHANGED

@@ -70,9 +70,16 @@ export class WrappedMessages extends AnthropicOriginal.Messages {
     if (anthropicParams.stream) {
       return parentPromise.then((value) => {
         let accumulatedContent = ''
-        const usage: {
+        const usage: {
+          inputTokens: number
+          outputTokens: number
+          cacheCreationInputTokens?: number
+          cacheReadInputTokens?: number
+        } = {
           inputTokens: 0,
           outputTokens: 0,
+          cacheCreationInputTokens: 0,
+          cacheReadInputTokens: 0,
         }
         if ('tee' in value) {
           const [stream1, stream2] = value.tee()

@@ -87,6 +94,8 @@ export class WrappedMessages extends AnthropicOriginal.Messages {
             }
             if (chunk.type == 'message_start') {
               usage.inputTokens = chunk.message.usage.input_tokens ?? 0
+              usage.cacheCreationInputTokens = chunk.message.usage.cache_creation_input_tokens ?? 0
+              usage.cacheReadInputTokens = chunk.message.usage.cache_read_input_tokens ?? 0
             }
             if ('usage' in chunk) {
               usage.outputTokens = chunk.usage.output_tokens ?? 0

@@ -156,6 +165,8 @@ export class WrappedMessages extends AnthropicOriginal.Messages {
         usage: {
           inputTokens: result.usage.input_tokens ?? 0,
           outputTokens: result.usage.output_tokens ?? 0,
+          cacheCreationInputTokens: result.usage.cache_creation_input_tokens ?? 0,
+          cacheReadInputTokens: result.usage.cache_read_input_tokens ?? 0,
         },
       })
     }
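
Note: the two new usage fields mirror Anthropic's prompt-caching counters. A minimal sketch of where they come from on a non-streaming response, assuming a recent @anthropic-ai/sdk that exposes cache_creation_input_tokens and cache_read_input_tokens on usage; the model name is illustrative.

import Anthropic from '@anthropic-ai/sdk'

const anthropic = new Anthropic({ apiKey: process.env.ANTHROPIC_API_KEY })

async function example() {
  const message = await anthropic.messages.create({
    model: 'claude-3-5-sonnet-latest', // illustrative
    max_tokens: 256,
    messages: [{ role: 'user', content: 'Hello' }],
  })

  // The same mapping the wrapper now performs before calling sendEventToPosthog
  return {
    inputTokens: message.usage.input_tokens ?? 0,
    outputTokens: message.usage.output_tokens ?? 0,
    cacheCreationInputTokens: message.usage.cache_creation_input_tokens ?? 0,
    cacheReadInputTokens: message.usage.cache_read_input_tokens ?? 0,
  }
}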

package/src/langchain/callbacks.ts
CHANGED

@@ -28,6 +28,8 @@ interface GenerationMetadata extends SpanMetadata {
   modelParams?: Record<string, any>
   /** The base URL—for example, the API base used */
   baseUrl?: string
+  /** The tools used in the generation */
+  tools?: Record<string, any>
 }

 /** A run may either be a Span or a Generation */

@@ -420,6 +422,10 @@ export class LangChainCallbackHandler extends BaseCallbackHandler {
       $ai_base_url: run.baseUrl,
     }

+    if (run.tools) {
+      eventProperties['$ai_tools'] = withPrivacyMode(this.client, this.privacyMode, run.tools)
+    }
+
     if (output instanceof Error) {
       eventProperties['$ai_http_status'] = (output as any).status || 500
       eventProperties['$ai_error'] = output.toString()
package/src/openai/azure.ts
CHANGED

@@ -86,7 +86,12 @@ export class WrappedCompletions extends AzureOpenAI.Chat.Completions {
     if (openAIParams.stream) {
       return parentPromise.then((value) => {
         let accumulatedContent = ''
-        let usage: {
+        let usage: {
+          inputTokens: number
+          outputTokens: number
+          reasoningTokens?: number
+          cacheReadInputTokens?: number
+        } = {
           inputTokens: 0,
           outputTokens: 0,
         }

@@ -105,6 +110,8 @@ export class WrappedCompletions extends AzureOpenAI.Chat.Completions {
               usage = {
                 inputTokens: chunk.usage.prompt_tokens ?? 0,
                 outputTokens: chunk.usage.completion_tokens ?? 0,
+                reasoningTokens: chunk.usage.completion_tokens_details?.reasoning_tokens ?? 0,
+                cacheReadInputTokens: chunk.usage.prompt_tokens_details?.cached_tokens ?? 0,
               }
             }
           }

@@ -176,6 +183,8 @@ export class WrappedCompletions extends AzureOpenAI.Chat.Completions {
         usage: {
           inputTokens: result.usage?.prompt_tokens ?? 0,
           outputTokens: result.usage?.completion_tokens ?? 0,
+          reasoningTokens: result.usage?.completion_tokens_details?.reasoning_tokens ?? 0,
+          cacheReadInputTokens: result.usage?.prompt_tokens_details?.cached_tokens ?? 0,
         },
       })
     }
package/src/openai/index.ts
CHANGED

@@ -88,11 +88,18 @@ export class WrappedCompletions extends OpenAIOrignal.Chat.Completions {
     return parentPromise.then((value) => {
       if ('tee' in value) {
         const [stream1, stream2] = value.tee()
-        // Use one stream for tracking
         ;(async () => {
           try {
             let accumulatedContent = ''
-            let usage
+            let usage: {
+              inputTokens?: number
+              outputTokens?: number
+              reasoningTokens?: number
+              cacheReadInputTokens?: number
+            } = {
+              inputTokens: 0,
+              outputTokens: 0,
+            }

             for await (const chunk of stream1) {
               const delta = chunk?.choices?.[0]?.delta?.content ?? ''

@@ -101,6 +108,8 @@ export class WrappedCompletions extends OpenAIOrignal.Chat.Completions {
               usage = {
                 inputTokens: chunk.usage.prompt_tokens ?? 0,
                 outputTokens: chunk.usage.completion_tokens ?? 0,
+                reasoningTokens: chunk.usage.completion_tokens_details?.reasoning_tokens ?? 0,
+                cacheReadInputTokens: chunk.usage.prompt_tokens_details?.cached_tokens ?? 0,
               }
             }
           }

@@ -165,6 +174,8 @@ export class WrappedCompletions extends OpenAIOrignal.Chat.Completions {
         usage: {
           inputTokens: result.usage?.prompt_tokens ?? 0,
           outputTokens: result.usage?.completion_tokens ?? 0,
+          reasoningTokens: result.usage?.completion_tokens_details?.reasoning_tokens ?? 0,
+          cacheReadInputTokens: result.usage?.prompt_tokens_details?.cached_tokens ?? 0,
         },
       })
     }
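
Note: both the Azure and the standard OpenAI wrapper now read the same two optional sub-objects that recent versions of the openai SDK return on usage. A minimal non-streaming sketch, assuming an SDK version that types completion_tokens_details and prompt_tokens_details; the model name is illustrative.

import OpenAI from 'openai'

const openai = new OpenAI({ apiKey: process.env.OPENAI_API_KEY })

async function example() {
  const completion = await openai.chat.completions.create({
    model: 'o3-mini', // illustrative
    messages: [{ role: 'user', content: 'Hello' }],
  })

  // Same fields the wrappers forward as reasoningTokens / cacheReadInputTokens
  return {
    inputTokens: completion.usage?.prompt_tokens ?? 0,
    outputTokens: completion.usage?.completion_tokens ?? 0,
    reasoningTokens: completion.usage?.completion_tokens_details?.reasoning_tokens ?? 0,
    cacheReadInputTokens: completion.usage?.prompt_tokens_details?.cached_tokens ?? 0,
  }
}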
package/src/utils.ts
CHANGED

@@ -118,10 +118,17 @@ export type SendEventToPosthogParams = {
   latency: number
   baseURL: string
   httpStatus: number
-  usage?: {
+  usage?: {
+    inputTokens?: number
+    outputTokens?: number
+    reasoningTokens?: any
+    cacheReadInputTokens?: any
+    cacheCreationInputTokens?: any
+  }
   params: (ChatCompletionCreateParamsBase | MessageCreateParams) & MonitoringParams
   isError?: boolean
   error?: string
+  tools?: any
 }

 export const sendEventToPosthog = ({

@@ -139,6 +146,7 @@ export const sendEventToPosthog = ({
   usage = {},
   isError = false,
   error,
+  tools,
 }: SendEventToPosthogParams): void => {
   if (client.capture) {
     let errorData = {}

@@ -159,6 +167,12 @@ export const sendEventToPosthog = ({
       }
     }

+    let additionalTokenValues = {
+      ...(usage.reasoningTokens ? { $ai_reasoning_tokens: usage.reasoningTokens } : {}),
+      ...(usage.cacheReadInputTokens ? { $ai_cache_read_input_tokens: usage.cacheReadInputTokens } : {}),
+      ...(usage.cacheCreationInputTokens ? { $ai_cache_creation_input_tokens: usage.cacheCreationInputTokens } : {}),
+    }
+
     client.capture({
       distinctId: distinctId ?? traceId,
       event: '$ai_generation',

@@ -171,11 +185,13 @@ export const sendEventToPosthog = ({
         $ai_http_status: httpStatus,
         $ai_input_tokens: usage.inputTokens ?? 0,
         $ai_output_tokens: usage.outputTokens ?? 0,
+        ...additionalTokenValues,
         $ai_latency: latency,
         $ai_trace_id: traceId,
         $ai_base_url: baseURL,
         ...params.posthogProperties,
         ...(distinctId ? {} : { $process_person_profile: false }),
+        ...(tools ? { $ai_tools: tools } : {}),
         ...errorData,
         ...costOverrideData,
       },
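
Note: the net effect on the captured $ai_generation event is that the three token properties are spread in only when the corresponding usage value is truthy, and $ai_tools only when tools is passed. A sketch of the resulting properties with illustrative values:

const exampleProperties = {
  $ai_input_tokens: 20,
  $ai_output_tokens: 10,
  // present only when the matching usage field is truthy
  $ai_reasoning_tokens: 15,
  $ai_cache_read_input_tokens: 5,
  $ai_cache_creation_input_tokens: 3,
  // present only when tools were provided by the caller
  $ai_tools: [{ type: 'function', function: { name: 'get_weather' } }],
}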
package/src/vercel/middleware.ts
CHANGED

@@ -27,8 +27,13 @@ interface CreateInstrumentationMiddlewareOptions {
 }

 interface PostHogInput {
-  content: string
   role: string
+  type?: string
+  content?:
+    | string
+    | {
+        [key: string]: any
+      }
 }

 const mapVercelParams = (params: any): Record<string, any> => {

@@ -45,18 +50,60 @@ const mapVercelParams = (params: any): Record<string, any> => {

 const mapVercelPrompt = (prompt: LanguageModelV1Prompt): PostHogInput[] => {
   return prompt.map((p) => {
-    let content =
+    let content = {}
     if (Array.isArray(p.content)) {
-      content = p.content
-
-
-
+      content = p.content.map((c) => {
+        if (c.type === 'text') {
+          return {
+            type: 'text',
+            content: c.text,
           }
-
-
-
+        } else if (c.type === 'image') {
+          return {
+            type: 'image',
+            content: {
+              // if image is a url use it, or use "none supported"
+              image: c.image instanceof URL ? c.image.toString() : 'raw images not supported',
+              mimeType: c.mimeType,
+            },
+          }
+        } else if (c.type === 'file') {
+          return {
+            type: 'file',
+            content: {
+              file: c.data instanceof URL ? c.data.toString() : 'raw files not supported',
+              mimeType: c.mimeType,
+            },
+          }
+        } else if (c.type === 'tool-call') {
+          return {
+            type: 'tool-call',
+            content: {
+              toolCallId: c.toolCallId,
+              toolName: c.toolName,
+              args: c.args,
+            },
+          }
+        } else if (c.type === 'tool-result') {
+          return {
+            type: 'tool-result',
+            content: {
+              toolCallId: c.toolCallId,
+              toolName: c.toolName,
+              result: c.result,
+              isError: c.isError,
+            },
+          }
+        }
+        return {
+          content: '',
+        }
+      })
     } else {
-      content =
+      content = {
+        type: 'text',
+        text: p.content,
+      }
     }
     return {
       role: p.role,

@@ -91,10 +138,22 @@ export const createInstrumentationMiddleware = (
       options.posthogModelOverride ?? (result.response?.modelId ? result.response.modelId : model.modelId)
     const provider = options.posthogProviderOverride ?? extractProvider(model)
     const baseURL = '' // cannot currently get baseURL from vercel
-    let content = result.text
-
-
-
+    let content = result.text || JSON.stringify(result)
+    // let tools = result.toolCalls
+    let providerMetadata = result.providerMetadata
+    let additionalTokenValues = {
+      ...(providerMetadata?.openai?.reasoningTokens
+        ? { reasoningTokens: providerMetadata.openai.reasoningTokens }
+        : {}),
+      ...(providerMetadata?.openai?.cachedPromptToken
+        ? { cacheReadInputTokens: providerMetadata.openai.cachedPromptTokens }
+        : {}),
+      ...(providerMetadata?.anthropic
+        ? {
+            cacheReadInputTokens: providerMetadata.anthropic.cacheReadInputTokens,
+            cacheCreationInputTokens: providerMetadata.anthropic.cacheCreationInputTokens,
+          }
+        : {}),
     }
     sendEventToPosthog({
       client: phClient,

@@ -111,6 +170,7 @@ export const createInstrumentationMiddleware = (
       usage: {
         inputTokens: result.usage.promptTokens,
         outputTokens: result.usage.completionTokens,
+        ...additionalTokenValues,
       },
     })

@@ -143,7 +203,13 @@ export const createInstrumentationMiddleware = (
   wrapStream: async ({ doStream, params }) => {
     const startTime = Date.now()
     let generatedText = ''
-    let usage: {
+    let usage: {
+      inputTokens?: number
+      outputTokens?: number
+      reasoningTokens?: any
+      cacheReadInputTokens?: any
+      cacheCreationInputTokens?: any
+    } = {}
     const mergedParams = {
       ...options,
       ...mapVercelParams(params),

@@ -164,6 +230,18 @@ export const createInstrumentationMiddleware = (
             inputTokens: chunk.usage?.promptTokens,
             outputTokens: chunk.usage?.completionTokens,
           }
+          if (chunk.providerMetadata?.openai?.reasoningTokens) {
+            usage.reasoningTokens = chunk.providerMetadata.openai.reasoningTokens
+          }
+          if (chunk.providerMetadata?.openai?.cachedPromptToken) {
+            usage.cacheReadInputTokens = chunk.providerMetadata.openai.cachedPromptToken
+          }
+          if (chunk.providerMetadata?.anthropic?.cacheReadInputTokens) {
+            usage.cacheReadInputTokens = chunk.providerMetadata.anthropic.cacheReadInputTokens
+          }
+          if (chunk.providerMetadata?.anthropic?.cacheCreationInputTokens) {
+            usage.cacheCreationInputTokens = chunk.providerMetadata.anthropic.cacheCreationInputTokens
+          }
         }
         controller.enqueue(chunk)
       },
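
Note: a standalone sketch of the providerMetadata-to-usage mapping the middleware performs in the non-streaming path. The metadata shape is an assumption based on this diff, not on the AI SDK's own type definitions; as in the diff above, the OpenAI cache guard checks cachedPromptToken while the value is read from cachedPromptTokens.

// Shapes assumed from the diff for illustration only.
type ProviderMetadata = {
  openai?: { reasoningTokens?: number; cachedPromptToken?: number; cachedPromptTokens?: number }
  anthropic?: { cacheReadInputTokens?: number; cacheCreationInputTokens?: number }
}

function additionalTokenValues(providerMetadata?: ProviderMetadata) {
  return {
    ...(providerMetadata?.openai?.reasoningTokens
      ? { reasoningTokens: providerMetadata.openai.reasoningTokens }
      : {}),
    ...(providerMetadata?.openai?.cachedPromptToken
      ? { cacheReadInputTokens: providerMetadata.openai.cachedPromptTokens }
      : {}),
    ...(providerMetadata?.anthropic
      ? {
          cacheReadInputTokens: providerMetadata.anthropic.cacheReadInputTokens,
          cacheCreationInputTokens: providerMetadata.anthropic.cacheCreationInputTokens,
        }
      : {}),
  }
}

// e.g. additionalTokenValues({ anthropic: { cacheReadInputTokens: 128, cacheCreationInputTokens: 0 } })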
package/tests/openai.test.ts
CHANGED

@@ -225,4 +225,40 @@ describe('PostHogOpenAI - Jest test suite', () => {
     expect(properties['$ai_stream']).toBe(false)
     expect(properties['foo']).toBe('bar')
   })
+
+  conditionalTest('reasoning and cache tokens', async () => {
+    // Set up mock response with standard token usage
+    mockOpenAiChatResponse.usage = {
+      prompt_tokens: 20,
+      completion_tokens: 10,
+      total_tokens: 30,
+      // Add the detailed token usage that OpenAI would return
+      completion_tokens_details: {
+        reasoning_tokens: 15,
+      },
+      prompt_tokens_details: {
+        cached_tokens: 5,
+      },
+    }
+
+    // Create a completion with additional token tracking
+    await client.chat.completions.create({
+      model: 'gpt-4',
+      messages: [{ role: 'user', content: 'Hello' }],
+      posthogDistinctId: 'test-id',
+      posthogProperties: { foo: 'bar' },
+    })
+
+    expect(mockPostHogClient.capture).toHaveBeenCalledTimes(1)
+    const [captureArgs] = (mockPostHogClient.capture as jest.Mock).mock.calls
+    const { properties } = captureArgs[0]
+
+    // Check standard token properties
+    expect(properties['$ai_input_tokens']).toBe(20)
+    expect(properties['$ai_output_tokens']).toBe(10)
+
+    // Check the new token properties
+    expect(properties['$ai_reasoning_tokens']).toBe(15)
+    expect(properties['$ai_cache_read_input_tokens']).toBe(5)
+  })
 })