@fallom/trace 0.1.0 → 0.1.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/README.md CHANGED
@@ -6,28 +6,27 @@ Model A/B testing and tracing for LLM applications. Zero latency, production-rea
6
6
 
7
7
  ```bash
8
8
  npm install @fallom/trace
9
-
10
- # With auto-instrumentation for your LLM provider:
11
- npm install @fallom/trace @traceloop/node-server-sdk
12
9
  ```
13
10
 
14
11
  ## Quick Start
15
12
 
16
13
  ```typescript
17
- import fallom from '@fallom/trace';
18
- import OpenAI from 'openai';
14
+ import fallom from "@fallom/trace";
15
+ import OpenAI from "openai";
16
+
17
+ // Initialize Fallom
18
+ await fallom.init({ apiKey: "your-api-key" });
19
19
 
20
- // Initialize FIRST - before importing your LLM libraries
21
- fallom.init({ apiKey: 'your-api-key' });
20
+ // Wrap your LLM client for automatic tracing
21
+ const openai = fallom.trace.wrapOpenAI(new OpenAI());
22
22
 
23
- // Set default session context for tracing
24
- fallom.trace.setSession('my-agent', sessionId);
23
+ // Set session context
24
+ fallom.trace.setSession("my-agent", sessionId);
25
25
 
26
26
  // All LLM calls are now automatically traced!
27
- const openai = new OpenAI();
28
27
  const response = await openai.chat.completions.create({
29
- model: 'gpt-4o',
30
- messages: [{ role: 'user', content: 'Hello!' }],
28
+ model: "gpt-4o",
29
+ messages: [{ role: "user", content: "Hello!" }],
31
30
  });
32
31
  ```
33
32
 
@@ -36,120 +35,112 @@ const response = await openai.chat.completions.create({
36
35
  Run A/B tests on models with zero latency. Same session always gets same model (sticky assignment).
37
36
 
38
37
  ```typescript
39
- import { models } from '@fallom/trace';
38
+ import { models } from "@fallom/trace";
40
39
 
41
40
  // Get assigned model for this session
42
- const model = await models.get('summarizer-config', sessionId);
41
+ const model = await models.get("summarizer-config", sessionId);
43
42
  // Returns: "gpt-4o" or "claude-3-5-sonnet" based on your config weights
44
43
 
45
- const agent = new Agent({ model });
46
- await agent.run(message);
47
- ```
48
-
49
- ### Version Pinning
50
-
51
- Pin to a specific config version, or use latest (default):
52
-
53
- ```typescript
54
- // Use latest version (default)
55
- const model = await models.get('my-config', sessionId);
56
-
57
- // Pin to specific version
58
- const model = await models.get('my-config', sessionId, { version: 2 });
44
+ const response = await openai.chat.completions.create({ model, ... });
59
45
  ```
60
46
 
61
47
  ### Fallback for Resilience
62
48
 
63
- Always provide a fallback so your app works even if Fallom is down:
64
-
65
49
  ```typescript
66
- const model = await models.get('my-config', sessionId, {
67
- fallback: 'gpt-4o-mini', // Used if config not found or Fallom unreachable
50
+ const model = await models.get("my-config", sessionId, {
51
+ fallback: "gpt-4o-mini", // Used if config not found or Fallom unreachable
68
52
  });
69
53
  ```
70
54
 
71
- **Resilience guarantees:**
72
- - Short timeouts (1-2 seconds max)
73
- - Background config sync (never blocks your requests)
74
- - Graceful degradation (returns fallback on any error)
75
- - Your app is never impacted by Fallom being down
76
-
77
55
  ## Tracing
78
56
 
79
- Auto-capture all LLM calls with OpenTelemetry instrumentation.
80
-
81
- > ⚠️ **Important:** Auto-tracing only works with supported LLM SDKs (OpenAI, Anthropic, etc.) - not raw HTTP requests. If you're using an OpenAI-compatible API like OpenRouter, LiteLLM, or a self-hosted model, use the OpenAI SDK with a custom `baseURL`:
82
- >
83
- > ```typescript
84
- > import OpenAI from 'openai';
85
- >
86
- > // OpenRouter, LiteLLM, vLLM, etc.
87
- > const client = new OpenAI({
88
- > baseURL: 'https://openrouter.ai/api/v1', // or your provider's URL
89
- > apiKey: 'your-provider-key',
90
- > });
91
- >
92
- > // Now this call will be auto-traced!
93
- > const response = await client.chat.completions.create({
94
- > model: 'gpt-4o',
95
- > messages: [...],
96
- > });
97
- > ```
98
-
99
- ### Automatic Tracing
57
 + Wrap your LLM client once, and all calls are automatically traced.
58
+
59
+ ### OpenAI (+ OpenRouter, Azure, LiteLLM, etc.)
100
60
 
101
61
  ```typescript
102
- import fallom from '@fallom/trace';
62
+ import OpenAI from "openai";
63
+ import fallom from "@fallom/trace";
103
64
 
104
- // Initialize before making LLM calls
105
- fallom.init();
65
+ await fallom.init({ apiKey: "your-api-key" });
106
66
 
107
- // Set session context
108
- fallom.trace.setSession('my-agent', sessionId);
67
+ // Works with any OpenAI-compatible API
68
+ const openai = fallom.trace.wrapOpenAI(
69
+ new OpenAI({
70
+ baseURL: "https://openrouter.ai/api/v1", // or Azure, LiteLLM, etc.
71
+ apiKey: "your-provider-key",
72
+ })
73
+ );
109
74
 
110
- // All LLM calls automatically traced with:
111
- // - Model, tokens, latency
112
- // - Prompts and completions
113
- // - Your config_key and session_id
75
+ fallom.trace.setSession("my-config", sessionId);
76
+
77
+ // Automatically traced!
114
78
  const response = await openai.chat.completions.create({
115
- model: 'gpt-4o',
116
- messages: [...],
79
+ model: "gpt-4o",
80
+ messages: [{ role: "user", content: "Hello!" }],
117
81
  });
118
82
  ```
119
83
 
120
- ### Async Context Propagation
121
-
122
- For proper session context across async boundaries, use `runWithSession`:
84
+ ### Anthropic (Claude)
123
85
 
124
86
  ```typescript
125
- import { trace } from '@fallom/trace';
87
+ import Anthropic from "@anthropic-ai/sdk";
88
+ import fallom from "@fallom/trace";
89
+
90
+ await fallom.init({ apiKey: "your-api-key" });
91
+
92
+ const anthropic = fallom.trace.wrapAnthropic(new Anthropic());
126
93
 
127
- await trace.runWithSession('my-agent', sessionId, async () => {
128
- // All LLM calls in here have session context
129
- await agent.run(message);
130
- await anotherAsyncOperation();
94
+ fallom.trace.setSession("my-config", sessionId);
95
+
96
+ // Automatically traced!
97
+ const response = await anthropic.messages.create({
98
+ model: "claude-3-5-sonnet-20241022",
99
+ messages: [{ role: "user", content: "Hello!" }],
131
100
  });
132
101
  ```
133
102
 
134
- ### Custom Metrics
103
+ ### Google AI (Gemini)
104
+
105
+ ```typescript
106
+ import { GoogleGenerativeAI } from "@google/generative-ai";
107
+ import fallom from "@fallom/trace";
108
+
109
+ await fallom.init({ apiKey: "your-api-key" });
110
+
111
+ const genAI = new GoogleGenerativeAI(apiKey);
112
+ const model = fallom.trace.wrapGoogleAI(
113
+ genAI.getGenerativeModel({ model: "gemini-pro" })
114
+ );
115
+
116
+ fallom.trace.setSession("my-config", sessionId);
117
+
118
+ // Automatically traced!
119
+ const response = await model.generateContent("Hello!");
120
+ ```
121
+
122
+ ## What Gets Traced
135
123
 
136
- Record business metrics that OTEL can't capture automatically:
124
+ For each LLM call, Fallom automatically captures:
125
+ - ✅ Model name
126
+ - ✅ Duration (latency)
127
+ - ✅ Token counts (prompt, completion, total)
128
+ - ✅ Input/output content (can be disabled)
129
+ - ✅ Errors
130
+ - ✅ Config key + session ID (for A/B analysis)
131
+
132
+ ## Custom Metrics
133
+
134
+ Record business metrics for your A/B tests:
137
135
 
138
136
  ```typescript
139
- import { trace } from '@fallom/trace';
137
+ import { trace } from "@fallom/trace";
140
138
 
141
- // Record custom metrics for this session
142
139
  trace.span({
143
140
  outlier_score: 0.8,
144
141
  user_satisfaction: 4,
145
142
  conversion: true,
146
143
  });
147
-
148
- // Or explicitly specify session (for batch jobs)
149
- trace.span(
150
- { outlier_score: 0.8 },
151
- { configKey: 'my-agent', sessionId: 'user123-convo456' }
152
- );
153
144
  ```
154
145
 
155
146
  ## Configuration
@@ -158,118 +149,54 @@ trace.span(
158
149
 
159
150
  ```bash
160
151
  FALLOM_API_KEY=your-api-key
161
- FALLOM_BASE_URL=https://spans.fallom.com # or http://localhost:8001 for local dev
152
+ FALLOM_BASE_URL=https://spans.fallom.com
162
153
  FALLOM_CAPTURE_CONTENT=true # set to "false" for privacy mode
163
154
  ```
164
155
 
165
- ### Initialization Options
166
-
167
- ```typescript
168
- fallom.init({
169
- apiKey: 'your-api-key', // Or use FALLOM_API_KEY env var
170
- baseUrl: 'https://spans.fallom.com', // Or use FALLOM_BASE_URL env var
171
- captureContent: true, // Set false for privacy mode
172
- });
173
- ```
174
-
175
156
  ### Privacy Mode
176
157
 
177
- For companies with strict data policies, disable prompt/completion capture:
158
+ Disable prompt/completion capture:
178
159
 
179
160
  ```typescript
180
- // Via parameter
181
161
  fallom.init({ captureContent: false });
182
-
183
- // Or via environment variable
184
- // FALLOM_CAPTURE_CONTENT=false
185
162
  ```
186
163
 
187
- In privacy mode, Fallom still tracks:
188
- - ✅ Model used
189
- - ✅ Token counts
190
- - ✅ Latency
191
- - ✅ Session/config context
192
- - ❌ Prompt content (not captured)
193
- - ❌ Completion content (not captured)
194
-
195
164
  ## API Reference
196
165
 
197
166
  ### `fallom.init(options?)`
198
167
 
199
- Initialize the SDK. Call this before making LLM calls for auto-instrumentation.
168
+ Initialize the SDK.
200
169
 
201
- | Option | Type | Default | Description |
202
- |--------|------|---------|-------------|
203
- | `apiKey` | `string` | `FALLOM_API_KEY` env | Your Fallom API key |
204
- | `baseUrl` | `string` | `https://spans.fallom.com` | API base URL |
205
- | `captureContent` | `boolean` | `true` | Capture prompt/completion text |
170
+ ### `fallom.trace.wrapOpenAI(client)`
206
171
 
207
- ### `fallom.models.get(configKey, sessionId, options?)`
208
-
209
- Get model assignment for a session.
172
 + Wrap an OpenAI client for automatic tracing. Works with any OpenAI-compatible API.
210
173
 
211
- | Parameter | Type | Description |
212
- |-----------|------|-------------|
213
- | `configKey` | `string` | Your config name from the dashboard |
214
- | `sessionId` | `string` | Unique session/conversation ID (sticky assignment) |
215
- | `options.version` | `number` | Pin to specific version (default: latest) |
216
- | `options.fallback` | `string` | Model to return if anything fails |
217
- | `options.debug` | `boolean` | Enable debug logging |
174
+ ### `fallom.trace.wrapAnthropic(client)`
218
175
 
219
- Returns: `Promise<string>` - The assigned model name
176
 + Wrap an Anthropic client for automatic tracing.
220
177
 
221
- ### `fallom.trace.setSession(configKey, sessionId)`
178
+ ### `fallom.trace.wrapGoogleAI(model)`
222
179
 
223
- Set trace context. All subsequent LLM calls will be tagged with this session.
180
 + Wrap a Google AI model for automatic tracing.
224
181
 
225
- ### `fallom.trace.runWithSession(configKey, sessionId, fn)`
182
+ ### `fallom.trace.setSession(configKey, sessionId)`
226
183
 
227
- Run a function with session context that propagates across async boundaries.
184
+ Set session context for tracing.
228
185
 
229
- ### `fallom.trace.clearSession()`
186
+ ### `fallom.models.get(configKey, sessionId, options?)`
230
187
 
231
- Clear trace context.
188
+ Get model assignment for A/B testing. Returns `Promise<string>`.
232
189
 
233
- ### `fallom.trace.span(data, options?)`
190
+ ### `fallom.trace.span(data)`
234
191
 
235
192
  Record custom business metrics.
236
193
 
237
- | Parameter | Type | Description |
238
- |-----------|------|-------------|
239
- | `data` | `Record<string, unknown>` | Metrics to record |
240
- | `options.configKey` | `string` | Optional if `setSession()` was called |
241
- | `options.sessionId` | `string` | Optional if `setSession()` was called |
242
-
243
- ### `fallom.trace.shutdown()`
244
-
245
- Gracefully shutdown the tracing SDK. Call this on process exit.
246
-
247
- ## Supported LLM Providers
248
-
249
- Auto-instrumentation available for:
250
- - OpenAI (+ OpenAI-compatible APIs: OpenRouter, LiteLLM, vLLM, Ollama, etc.)
251
- - Anthropic
252
- - Cohere
253
- - AWS Bedrock
254
- - Google Generative AI
255
- - Azure OpenAI
256
- - LangChain
257
- - And more via Traceloop
258
-
259
- Install `@traceloop/node-server-sdk` for comprehensive LLM instrumentation.
260
-
261
- **Note:** You must use the official SDK for your provider. Raw HTTP requests (e.g., `fetch()`) will not be traced. For OpenAI-compatible APIs, use the OpenAI SDK with a custom `baseURL`.
262
-
263
- ## Examples
264
-
265
- See the `../examples/` folder for complete examples:
266
- - `random-fact/` - Simple A/B testing with Hono server
267
-
268
194
  ## Requirements
269
195
 
270
196
  - Node.js >= 18.0.0
271
197
 
198
 + Works with ESM and CommonJS, and with tsx, ts-node, Bun, and compiled JavaScript.
199
+
272
200
  ## License
273
201
 
274
202
  MIT
275
-
package/dist/index.d.mts CHANGED
@@ -36,7 +36,8 @@ declare function init$2(options?: {
36
36
  apiKey?: string;
37
37
  baseUrl?: string;
38
38
  captureContent?: boolean;
39
- }): void;
39
+ debug?: boolean;
40
+ }): Promise<void>;
40
41
  /**
41
42
  * Set the current session context.
42
43
  *
@@ -111,6 +112,74 @@ declare function span(data: Record<string, unknown>, options?: {
111
112
  * Shutdown the tracing SDK gracefully.
112
113
  */
113
114
  declare function shutdown(): Promise<void>;
115
+ /**
116
+ * Wrap an OpenAI client to automatically trace all chat completions.
117
+ * Works with OpenAI, OpenRouter, Azure OpenAI, LiteLLM, and any OpenAI-compatible API.
118
+ *
119
+ * @param client - The OpenAI client instance
120
+ * @returns The same client with tracing enabled
121
+ *
122
+ * @example
123
+ * ```typescript
124
+ * import OpenAI from "openai";
125
+ * import { trace } from "@fallom/trace";
126
+ *
127
+ * const openai = trace.wrapOpenAI(new OpenAI());
128
+ *
129
+ * trace.setSession("my-config", sessionId);
130
+ * const response = await openai.chat.completions.create({...}); // Automatically traced!
131
+ * ```
132
+ */
133
+ declare function wrapOpenAI<T extends {
134
+ chat: {
135
+ completions: {
136
+ create: (...args: any[]) => Promise<any>;
137
+ };
138
+ };
139
+ }>(client: T): T;
140
+ /**
141
+ * Wrap an Anthropic client to automatically trace all message creations.
142
+ *
143
+ * @param client - The Anthropic client instance
144
+ * @returns The same client with tracing enabled
145
+ *
146
+ * @example
147
+ * ```typescript
148
+ * import Anthropic from "@anthropic-ai/sdk";
149
+ * import { trace } from "@fallom/trace";
150
+ *
151
+ * const anthropic = trace.wrapAnthropic(new Anthropic());
152
+ *
153
+ * trace.setSession("my-config", sessionId);
154
+ * const response = await anthropic.messages.create({...}); // Automatically traced!
155
+ * ```
156
+ */
157
+ declare function wrapAnthropic<T extends {
158
+ messages: {
159
+ create: (...args: any[]) => Promise<any>;
160
+ };
161
+ }>(client: T): T;
162
+ /**
163
+ * Wrap a Google Generative AI client to automatically trace all content generations.
164
+ *
165
+ * @param client - The GoogleGenerativeAI client instance
166
+ * @returns The same client with tracing enabled
167
+ *
168
+ * @example
169
+ * ```typescript
170
+ * import { GoogleGenerativeAI } from "@google/generative-ai";
171
+ * import { trace } from "@fallom/trace";
172
+ *
173
+ * const genAI = new GoogleGenerativeAI(apiKey);
174
+ * const model = trace.wrapGoogleAI(genAI.getGenerativeModel({ model: "gemini-pro" }));
175
+ *
176
+ * trace.setSession("my-config", sessionId);
177
+ * const response = await model.generateContent("Hello!"); // Automatically traced!
178
+ * ```
179
+ */
180
+ declare function wrapGoogleAI<T extends {
181
+ generateContent: (...args: any[]) => Promise<any>;
182
+ }>(model: T): T;
114
183
 
115
184
  declare const trace_clearSession: typeof clearSession;
116
185
  declare const trace_getSession: typeof getSession;
@@ -118,8 +187,11 @@ declare const trace_runWithSession: typeof runWithSession;
118
187
  declare const trace_setSession: typeof setSession;
119
188
  declare const trace_shutdown: typeof shutdown;
120
189
  declare const trace_span: typeof span;
190
+ declare const trace_wrapAnthropic: typeof wrapAnthropic;
191
+ declare const trace_wrapGoogleAI: typeof wrapGoogleAI;
192
+ declare const trace_wrapOpenAI: typeof wrapOpenAI;
121
193
  declare namespace trace {
122
- export { trace_clearSession as clearSession, trace_getSession as getSession, init$2 as init, trace_runWithSession as runWithSession, trace_setSession as setSession, trace_shutdown as shutdown, trace_span as span };
194
+ export { trace_clearSession as clearSession, trace_getSession as getSession, init$2 as init, trace_runWithSession as runWithSession, trace_setSession as setSession, trace_shutdown as shutdown, trace_span as span, trace_wrapAnthropic as wrapAnthropic, trace_wrapGoogleAI as wrapGoogleAI, trace_wrapOpenAI as wrapOpenAI };
123
195
  }
124
196
 
125
197
  /**
@@ -182,6 +254,7 @@ interface InitOptions {
182
254
  apiKey?: string;
183
255
  baseUrl?: string;
184
256
  captureContent?: boolean;
257
+ debug?: boolean;
185
258
  }
186
259
  /**
187
260
  * Initialize both trace and models at once.
@@ -205,7 +278,7 @@ interface InitOptions {
205
278
  * fallom.init({ captureContent: false });
206
279
  * ```
207
280
  */
208
- declare function init(options?: InitOptions): void;
281
+ declare function init(options?: InitOptions): Promise<void>;
209
282
 
210
283
  /**
211
284
  * Fallom - Model A/B testing and tracing for LLM applications.
package/dist/index.d.ts CHANGED
@@ -36,7 +36,8 @@ declare function init$2(options?: {
36
36
  apiKey?: string;
37
37
  baseUrl?: string;
38
38
  captureContent?: boolean;
39
- }): void;
39
+ debug?: boolean;
40
+ }): Promise<void>;
40
41
  /**
41
42
  * Set the current session context.
42
43
  *
@@ -111,6 +112,74 @@ declare function span(data: Record<string, unknown>, options?: {
111
112
  * Shutdown the tracing SDK gracefully.
112
113
  */
113
114
  declare function shutdown(): Promise<void>;
115
+ /**
116
+ * Wrap an OpenAI client to automatically trace all chat completions.
117
+ * Works with OpenAI, OpenRouter, Azure OpenAI, LiteLLM, and any OpenAI-compatible API.
118
+ *
119
+ * @param client - The OpenAI client instance
120
+ * @returns The same client with tracing enabled
121
+ *
122
+ * @example
123
+ * ```typescript
124
+ * import OpenAI from "openai";
125
+ * import { trace } from "@fallom/trace";
126
+ *
127
+ * const openai = trace.wrapOpenAI(new OpenAI());
128
+ *
129
+ * trace.setSession("my-config", sessionId);
130
+ * const response = await openai.chat.completions.create({...}); // Automatically traced!
131
+ * ```
132
+ */
133
+ declare function wrapOpenAI<T extends {
134
+ chat: {
135
+ completions: {
136
+ create: (...args: any[]) => Promise<any>;
137
+ };
138
+ };
139
+ }>(client: T): T;
140
+ /**
141
+ * Wrap an Anthropic client to automatically trace all message creations.
142
+ *
143
+ * @param client - The Anthropic client instance
144
+ * @returns The same client with tracing enabled
145
+ *
146
+ * @example
147
+ * ```typescript
148
+ * import Anthropic from "@anthropic-ai/sdk";
149
+ * import { trace } from "@fallom/trace";
150
+ *
151
+ * const anthropic = trace.wrapAnthropic(new Anthropic());
152
+ *
153
+ * trace.setSession("my-config", sessionId);
154
+ * const response = await anthropic.messages.create({...}); // Automatically traced!
155
+ * ```
156
+ */
157
+ declare function wrapAnthropic<T extends {
158
+ messages: {
159
+ create: (...args: any[]) => Promise<any>;
160
+ };
161
+ }>(client: T): T;
162
+ /**
163
+ * Wrap a Google Generative AI client to automatically trace all content generations.
164
+ *
165
+ * @param client - The GoogleGenerativeAI client instance
166
+ * @returns The same client with tracing enabled
167
+ *
168
+ * @example
169
+ * ```typescript
170
+ * import { GoogleGenerativeAI } from "@google/generative-ai";
171
+ * import { trace } from "@fallom/trace";
172
+ *
173
+ * const genAI = new GoogleGenerativeAI(apiKey);
174
+ * const model = trace.wrapGoogleAI(genAI.getGenerativeModel({ model: "gemini-pro" }));
175
+ *
176
+ * trace.setSession("my-config", sessionId);
177
+ * const response = await model.generateContent("Hello!"); // Automatically traced!
178
+ * ```
179
+ */
180
+ declare function wrapGoogleAI<T extends {
181
+ generateContent: (...args: any[]) => Promise<any>;
182
+ }>(model: T): T;
114
183
 
115
184
  declare const trace_clearSession: typeof clearSession;
116
185
  declare const trace_getSession: typeof getSession;
@@ -118,8 +187,11 @@ declare const trace_runWithSession: typeof runWithSession;
118
187
  declare const trace_setSession: typeof setSession;
119
188
  declare const trace_shutdown: typeof shutdown;
120
189
  declare const trace_span: typeof span;
190
+ declare const trace_wrapAnthropic: typeof wrapAnthropic;
191
+ declare const trace_wrapGoogleAI: typeof wrapGoogleAI;
192
+ declare const trace_wrapOpenAI: typeof wrapOpenAI;
121
193
  declare namespace trace {
122
- export { trace_clearSession as clearSession, trace_getSession as getSession, init$2 as init, trace_runWithSession as runWithSession, trace_setSession as setSession, trace_shutdown as shutdown, trace_span as span };
194
+ export { trace_clearSession as clearSession, trace_getSession as getSession, init$2 as init, trace_runWithSession as runWithSession, trace_setSession as setSession, trace_shutdown as shutdown, trace_span as span, trace_wrapAnthropic as wrapAnthropic, trace_wrapGoogleAI as wrapGoogleAI, trace_wrapOpenAI as wrapOpenAI };
123
195
  }
124
196
 
125
197
  /**
@@ -182,6 +254,7 @@ interface InitOptions {
182
254
  apiKey?: string;
183
255
  baseUrl?: string;
184
256
  captureContent?: boolean;
257
+ debug?: boolean;
185
258
  }
186
259
  /**
187
260
  * Initialize both trace and models at once.
@@ -205,7 +278,7 @@ interface InitOptions {
205
278
  * fallom.init({ captureContent: false });
206
279
  * ```
207
280
  */
208
- declare function init(options?: InitOptions): void;
281
+ declare function init(options?: InitOptions): Promise<void>;
209
282
 
210
283
  /**
211
284
  * Fallom - Model A/B testing and tracing for LLM applications.