npm - 0xtrace - Versions diffs - 1.0.1 → 1.0.2 - Mend

0xtrace 1.0.1 → 1.0.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (9) hide show

package/package.json CHANGED Viewed

@@ -1,16 +1,20 @@
 {
   "name": "0xtrace",
-"version": "1.0.1",
+  "version": "1.0.2",
   "description": "Proxy-based LLM telemetry SDK for 0xtrace",
   "type": "module",
-  "main": "index.js",
+  "main": "./dist/index.cjs",
+  "module": "./dist/index.js",
+  "exports": {
+    ".": {
+      "import": "./dist/index.js",
+      "require": "./dist/index.cjs"
+    }
+  },
+  "files": ["dist"],
   "scripts": {
-    "test": "echo \"Error: no test specified\" && exit 1",
     "build": "tsup"
   },
-  "keywords": [],
-  "author": "",
-  "license": "ISC",
   "dependencies": {
     "diff": "^9.0.0",
     "openai": "^6.38.0"
@@ -21,4 +25,4 @@
     "tsup": "^8.5.1",
     "typescript": "^6.0.3"
   }
-}
+}

package/src/core/dispatcher.ts DELETED Viewed

@@ -1,212 +0,0 @@
-// ─────────────────────────────────────────────────────────────────────────────
-// packages/sdk/src/core/dispatcher.ts
-//
-// Responsibilities:
-//   1. Accept TracePayload objects from the Tracer via a fire-and-forget API.
-//   2. Accumulate payloads in an in-memory micro-batch.
-//   3. Flush the batch to the ingest endpoint as a single POST request.
-//   4. Retry failed requests with exponential back-off (max 3 attempts).
-//   5. NEVER block the caller's thread — every send goes onto the microtask
-//      queue via Promise.resolve().then(...)
-// ─────────────────────────────────────────────────────────────────────────────
-import type { IDispatcher, TracePayload } from "./types";
-// ── Constants ────────────────────────────────────────────────────────────────
-const DEFAULT_BATCH_SIZE   = 10;    // flush after N payloads accumulate
-const DEFAULT_FLUSH_MS     = 2_000; // flush every 2 s even if batch isn't full
-const DEFAULT_TIMEOUT_MS   = 5_000; // per-request abort timeout
-const MAX_RETRY_ATTEMPTS   = 3;
-const BASE_RETRY_DELAY_MS  = 200;   // doubles on each retry (200 → 400 → 800)
-// ── Types ────────────────────────────────────────────────────────────────────
-export interface DispatcherOptions {
-  ingestUrl: string;
-  apiKey?: string;
-  timeoutMs?: number;
-  batchSize?: number;
-  flushIntervalMs?: number;
-  onError?: (error: Error, payloads: TracePayload[]) => void;
-}
-// ── Dispatcher ───────────────────────────────────────────────────────────────
-export class Dispatcher implements IDispatcher {
-  private readonly ingestUrl: string;
-  private readonly apiKey: string | undefined;
-  private readonly timeoutMs: number;
-  private readonly batchSize: number;
-  private readonly onError: (error: Error, payloads: TracePayload[]) => void;
-  /** The in-memory buffer accumulating payloads between flushes. */
-  private buffer: TracePayload[] = [];
-  /** The NodeJS/browser timer handle for the periodic flush. */
-  private flushTimer: ReturnType<typeof setInterval> | null = null;
-  /** Tracks all in-flight fetch Promises so flush() can await them. */
-  private inFlight = new Set<Promise<void>>();
-  constructor(opts: DispatcherOptions) {
-    this.ingestUrl  = opts.ingestUrl;
-    this.apiKey     = opts.apiKey;
-    this.timeoutMs  = opts.timeoutMs  ?? DEFAULT_TIMEOUT_MS;
-    this.batchSize  = opts.batchSize  ?? DEFAULT_BATCH_SIZE;
-    this.onError = opts.onError ?? ((err, payloads) => {
-      console.warn(
-        `[PromptTracer] Failed to deliver ${payloads.length} trace(s):`,
-        err.message
-      );
-    });
-    // Start the periodic flush timer.
-    const intervalMs = opts.flushIntervalMs ?? DEFAULT_FLUSH_MS;
-    this.flushTimer = setInterval(() => {
-      if (this.buffer.length > 0) {
-        this._drainBuffer();
-      }
-    }, intervalMs);
-    // Prevent the timer from keeping a Node process alive indefinitely.
-    if (typeof this.flushTimer === "object" && typeof (this.flushTimer as NodeJS.Timeout).unref === "function") {
-  (this.flushTimer as NodeJS.Timeout).unref();
-    }
-  }
-  // ── Public API ─────────────────────────────────────────────────────────────
-  /**
-   * Accepts a payload and schedules delivery non-blocking via the microtask
-   * queue. The caller returns immediately; the POST happens asynchronously.
-   */
-  send(payload: TracePayload): void {
-    // Schedule the actual buffer-push on the microtask queue so it never
-    // adds synchronous overhead to the intercepted LLM call path.
-    Promise.resolve().then(() => {
-      this.buffer.push(payload);
-      if (this.buffer.length >= this.batchSize) {
-        this._drainBuffer();
-      }
-    });
-  }
-  /**
-   * Waits for all in-flight requests and flushes any remaining buffered
-   * payloads. Call this in tests or on process shutdown.
-   *
-   * @example
-   * process.on('SIGTERM', () => tracer.flush());
-   */
-  async flush(): Promise<void> {
-    // Flush whatever is sitting in the buffer right now.
-    if (this.buffer.length > 0) {
-      this._drainBuffer();
-    }
-    // Await all in-flight POSTs.
-    if (this.inFlight.size > 0) {
-      await Promise.allSettled([...this.inFlight]);
-    }
-  }
-  /**
-   * Stops the periodic flush timer and flushes remaining payloads.
-   * Call when the Tracer instance is being torn down.
-   */
-  async destroy(): Promise<void> {
-    if (this.flushTimer !== null) {
-      clearInterval(this.flushTimer);
-      this.flushTimer = null;
-    }
-    await this.flush();
-  }
-  // ── Private ────────────────────────────────────────────────────────────────
-  /**
-   * Atomically snapshots and clears the buffer, then initiates an async
-   * POST. Multiple concurrent drains are safe — each works on its own slice.
-   */
-  private _drainBuffer(): void {
-    const batch = this.buffer.splice(0, this.buffer.length);
-    if (batch.length === 0) return;
-    const promise = this._sendWithRetry(batch, 1).finally(() => {
-      this.inFlight.delete(promise);
-    });
-    this.inFlight.add(promise);
-  }
-  /**
-   * Attempts to POST a batch to the ingest endpoint.
-   * Makes at most MAX_RETRY_ATTEMPTS attempts in total, with exponential back-off between them.
-   * Only retries on network errors or 5xx responses.
-   */
-  private async _sendWithRetry(
-    batch: TracePayload[],
-    attempt: number
-  ): Promise<void> {
-    try {
-      await this._post(batch);
-    } catch (err) {
-      const error = err instanceof Error ? err : new Error(String(err));
-      if (attempt < MAX_RETRY_ATTEMPTS) {
-        const delay = BASE_RETRY_DELAY_MS * Math.pow(2, attempt - 1);
-        await sleep(delay);
-        return this._sendWithRetry(batch, attempt + 1);
-      }
-      // All retries exhausted — surface to the error handler.
-      this.onError(error, batch);
-    }
-  }
-  /**
-   * Performs the raw HTTP POST with an AbortController timeout.
-   * Throws on network failure or non-2xx status.
-   */
-  private async _post(batch: TracePayload[]): Promise<void> {
-  const controller = new AbortController();
-  const timer = setTimeout(() => controller.abort(), this.timeoutMs);
-  const headers: Record<string, string> = {
-    "Content-Type": "application/json",
-  };
-  if (this.apiKey) {
-    headers["x-api-key"] = this.apiKey;
-  }
-  let response: Response;
-  try {
-    response = await fetch(this.ingestUrl, {
-      method:  "POST",
-      headers,
-      body:    JSON.stringify({ traces: batch }),
-      signal:  controller.signal,
-    });
-  } finally {
-    clearTimeout(timer);
-  }
-  if (!response.ok) {
-    if (response.status >= 500) {
-      throw new Error(`Ingest endpoint returned ${response.status}`);
-    }
-    console.warn(
-      `[PromptTracer] Ingest rejected batch (${response.status}). ` +
-      `Discarding ${batch.length} trace(s).`
-    );
-  }
-}
-// ── Helpers ──────────────────────────────────────────────────────────────────
-}
-function sleep(ms: number): Promise<void> {
-  return new Promise((resolve) => setTimeout(resolve, ms));
-}

package/src/core/tracer.ts DELETED Viewed

@@ -1,171 +0,0 @@
-// ─────────────────────────────────────────────────────────────────────────────
-// packages/sdk/src/core/tracer.ts
-//
-// Responsibilities:
-//   1. Own one logical "session" (a single agent run).
-//   2. Maintain a monotonic step counter across all calls in that session.
-//   3. Enrich a RawCapturePayload into a full TracePayload (ids, cost, ts).
-//   4. Hand the enriched payload to the Dispatcher non-blocking.
-//   5. Expose a flush() for clean shutdown / test assertions.
-// ─────────────────────────────────────────────────────────────────────────────
-import { Dispatcher }                            from "./dispatcher";
-import { calcCostUsd }                           from "../utils/cost";
-import type {
-  RawCapturePayload,
-  TracePayload,
-  TracerOptions,
-  IDispatcher,
-}                                                from "./types";
-// ── SDK version (keep in sync with package.json) ─────────────────────────────
-const SDK_VERSION = "0.1.0";
-// ── UUID helper ──────────────────────────────────────────────────────────────
-// crypto.randomUUID() is available in Node ≥ 14.17, modern browsers, and
-// the Edge runtime. Provide a tiny fallback for exotic environments.
-function uuid(): string {
-  if (
-    typeof crypto !== "undefined" &&
-    typeof crypto.randomUUID === "function"
-  ) {
-    return crypto.randomUUID();
-  }
-  // Fallback: RFC-4122 v4 UUID
-  return "xxxxxxxx-xxxx-4xxx-yxxx-xxxxxxxxxxxx".replace(/[xy]/g, (c) => {
-    const r = (Math.random() * 16) | 0;
-    const v = c === "x" ? r : (r & 0x3) | 0x8;
-    return v.toString(16);
-  });
-}
-// ── Tracer ────────────────────────────────────────────────────────────────────
-export class Tracer {
-  /** Groups all LLM calls in this agent run. */
-  readonly sessionId: string;
-  /** Caller-supplied arbitrary metadata attached to every payload. */
-  private readonly metadata: Record<string, string>;
-  /** Whether telemetry is active (can be disabled via options). */
-  private readonly enabled: boolean;
-  /** Delivery engine — injectable for unit-testing. */
-  private readonly dispatcher: IDispatcher;
-  /**
-   * Monotonically increasing step counter.
-   * Step 1 → first call in the session (triggers full snapshot in the DB).
-   * Step N → subsequent calls (store diff only).
-   */
-  private stepCounter = 0;
-  constructor(opts: TracerOptions, dispatcher?: IDispatcher) {
-    this.sessionId  = opts.sessionId ?? uuid();
-    this.metadata   = opts.metadata  ?? {};
-    this.enabled    = opts.enabled   ?? true;
-    // Use an injected dispatcher (useful in tests) or create the real one.
-    this.dispatcher = dispatcher ?? new Dispatcher({
-      ingestUrl:       opts.ingestUrl,
-      apiKey:    opts.apiKey,
-      timeoutMs:       opts.timeoutMs,
-      onError:         opts.onError
-        ? (err, payloads) => payloads.forEach((p) => opts.onError!(err, p))
-        : undefined,
-    });
-  }
-  // ── Public API ──────────────────────────────────────────────────────────────
-  /**
-   * The method called by every SDK wrapper after intercepting an LLM call.
-   *
-   * Design contract:
-   *   - NEVER awaited by the wrapper; fire-and-forget on microtask queue.
-   *   - Returns void so the wrapper cannot accidentally `await` it.
-   *
-   * @example
-   * // Inside wrappers/openai.ts — after receiving the result:
-   * tracer.captureAsync({ prompt, response, model, tokensIn, tokensOut, latencyMs, isStream });
-   */
-  captureAsync(raw: RawCapturePayload): void {
-    if (!this.enabled) return;
-    // Schedule enrichment + dispatch asynchronously so it never adds
-    // synchronous latency to the intercepted call path.
-    Promise.resolve().then(() => {
-      try {
-        const payload = this._enrich(raw);
-        this.dispatcher.send(payload);
-      } catch (err) {
-        // Tracer must NEVER throw into user code.
-        console.warn("[PromptTracer] Failed to enrich payload:", err);
-      }
-    });
-  }
-  /**
-   * Returns the step index the *next* call will be assigned.
-   * Useful for callers who need to know if this is step 1 (full snapshot)
-   * vs. a later step (diff only) before making the LLM call.
-   */
-  get nextStepIndex(): number {
-    return this.stepCounter + 1;
-  }
-  /**
-   * Waits for all buffered and in-flight payloads to be delivered.
-   * Call before process exit or at the end of integration tests.
-   *
-   * @example
-   * afterAll(async () => { await tracer.flush(); });
-   */
-  async flush(): Promise<void> {
-    await this.dispatcher.flush();
-  }
-  // ── Private ─────────────────────────────────────────────────────────────────
-  /**
-   * Takes a raw capture from the wrapper and enriches it with:
-   *   - a unique callId
-   *   - the session's sessionId
-   *   - a monotonic stepIndex
-   *   - ISO-8601 timestamp
-   *   - USD cost estimate
-   *   - SDK version string
-   *   - caller metadata
-   */
-  private _enrich(raw: RawCapturePayload): TracePayload {
-    this.stepCounter += 1;
-    const estimatedCostUsd = calcCostUsd({
-      model:     raw.model,
-      tokensIn:  raw.tokensIn  ?? 0,
-      tokensOut: raw.tokensOut ?? 0,
-    });
-    return {
-      // ── Core identity ───────────────────────────────────────────────────
-      callId:     uuid(),
-      sessionId:  this.sessionId,
-      stepIndex:  this.stepCounter,
-      timestamp:  new Date().toISOString(),
-      // ── Raw capture data (passed through unchanged) ──────────────────────
-      ...raw,
-      // ── Enrichment ───────────────────────────────────────────────────────
-      estimatedCostUsd,
-      sdkVersion: SDK_VERSION,
-      // Attach caller metadata under a single `metadata` key (omitted when empty) so
-      // the ingest API can index on it; the ingest schema should have a metadata JSONB col.
-      ...(Object.keys(this.metadata).length > 0
-        ? { metadata: this.metadata }
-        : {}),
-    } as TracePayload;
-  }
-}

package/src/core/types.ts DELETED Viewed

@@ -1,73 +0,0 @@
-// ─────────────────────────────────────────────────────────────────────────────
-// packages/sdk/src/core/types.ts
-// Central type contracts for the entire SDK. No runtime code lives here.
-// ─────────────────────────────────────────────────────────────────────────────
-/** A single message in an OpenAI-compatible chat conversation. */
-export interface ChatMessage {
-  role: "system" | "user" | "assistant" | "tool" | "function";
-  content: string | null;
-  name?: string;
-  tool_call_id?: string;
-}
-/** Raw data captured at the intercept point, before any enrichment. */
-export interface RawCapturePayload {
-  /** The messages array sent to the model. */
-  prompt: ChatMessage[] | readonly ChatMessage[];
-  /** The text content of the completion (reconstructed for streams). */
-  response: string;
-  /** Model string exactly as passed by the caller e.g. "gpt-4o". */
-  model: string;
-  /** Prompt tokens from usage object. Undefined for streams (not available). */
-  tokensIn: number | undefined;
-  /** Completion tokens. For streams this is an approximation (chunk count). */
-  tokensOut: number | undefined;
-  /** Wall-clock ms from request start to last byte received. */
-  latencyMs: number;
-  /** Whether the call used server-sent streaming. */
-  isStream: boolean;
-}
-/** The fully enriched payload that gets pushed to the ingest queue. */
-export interface TracePayload extends RawCapturePayload {
-  /** SDK-generated UUID for this individual LLM call. */
-  callId: string;
-  /** Session/trace ID grouping multiple calls in one agent run.
-   *  Set via TracerOptions.sessionId or auto-generated per Tracer instance. */
-  sessionId: string;
-  /** Step index within the session (1-based, incremented per capture). */
-  stepIndex: number;
-  /** ISO-8601 timestamp generated when the Tracer enriches the capture. */
-  timestamp: string;
-  /** Estimated USD cost for this call. */
-  estimatedCostUsd: number;
-  /** Version string of the SDK emitting this payload. */
-  sdkVersion: string;
-}
-/** Options passed when constructing a Tracer instance. */
-export interface TracerOptions {
-  /** Full URL of your Next.js ingest endpoint.
-   *  e.g. "https://your-app.vercel.app/api/ingest" */
-  ingestUrl: string;
-  apiKey?: string;
-  /** Optional session ID.
-   *  Groups multiple LLM calls into one logical agent run.
-   *  Auto-generated (UUID v4) if omitted. */
-  sessionId?: string;
-  /** Attach arbitrary key/value metadata to every payload (e.g. userId, env). */
-  metadata?: Record<string, string>;
-  /** Max ms to wait for the ingest POST before aborting. Default: 5000. */
-  timeoutMs?: number;
-  /** Called when the ingest POST fails. Defaults to console.warn. */
-  onError?: (error: Error, payload: TracePayload) => void;
-  /** Set false to completely disable telemetry (e.g. in unit tests). Default: true */
-  enabled?: boolean;
-}
-/** Minimal interface the Dispatcher must satisfy — useful for testing. */
-export interface IDispatcher {
-  send(payload: TracePayload): void; // non-blocking fire-and-forget
-  flush(): Promise<void>;            // drain all pending sends (use in tests / shutdown)
-}

package/src/diff.ts DELETED Viewed

@@ -1,181 +0,0 @@
-// ─────────────────────────────────────────────────────────────────────────────
-// packages/sdk/src/diff.ts
-//
-// Computes a minimal, git-style diff between two chat message arrays.
-// The ingest API uses this to decide what to store:
-//   - Step 1  → store full snapshot (no previous to diff against)
-//   - Step 2+ → store only the diff; reconstruct full array on the frontend
-//
-// Design goals:
-//   1. Deterministic — same inputs always produce same diff.
-//   2. Reversible — applyDiff(prev, computeDiff(prev, curr)) === curr
-//   3. Zero dependencies on the openai SDK — works with plain objects.
-// ─────────────────────────────────────────────────────────────────────────────
-import type { ChatMessage } from "./core/types";
-// ── Types ─────────────────────────────────────────────────────────────────────
-/** A single entry in the diff — describes ONE message's change. */
-export type DiffOperation =
-  | { op: "add";    index: number; message: ChatMessage }
-  | { op: "remove"; index: number }
-  | { op: "keep";   index: number };   // kept for position bookkeeping
-/** The payload stored in prompt_snapshots.diff_from_previous */
-export interface MessageDiff {
-  /** Only the add/remove operations (keeps are omitted to save bytes). */
-  operations: Array<
-    | { op: "add";    index: number; message: ChatMessage }
-    | { op: "remove"; index: number }
-  >;
-  /** Net token change: positive = context grew, negative = messages pruned. */
-  tokenDelta: number;
-  /** How many messages were added in this step. */
-  added: number;
-  /** How many messages were removed in this step. */
-  removed: number;
-}
-// ── Helpers ───────────────────────────────────────────────────────────────────
-/**
- * Stable string key for a message (`role::content`, null content treated as "").
- * Messages with identical role + content share a key regardless of position.
- */
-function messageKey(m: ChatMessage): string {
-  return `${m.role}::${m.content ?? ""}`;
-}
-/**
- * Rough token estimator — 1 token ≈ 4 characters (GPT rule of thumb).
- * The SDK does not run a full tokenizer to stay dependency-free.
- * The backend can re-calculate with tiktoken if needed.
- */
-export function estimateTokens(messages: readonly ChatMessage[]): number {
-  return messages.reduce((sum, m) => {
-    const chars = (m.content ?? "").length;
-    return sum + Math.ceil(chars / 4);
-  }, 0);
-}
-// ── Core diff algorithm ───────────────────────────────────────────────────────
-/**
- * Computes the minimal diff between `prev` and `curr` message arrays.
- *
- * Algorithm: O(n) set-membership comparison (not a positional diff).
- *   1. Build Sets of message keys for `prev` and `curr` for O(1) lookup.
- *   2. Walk `curr` — any message whose key is not in `prev` is an ADD.
- *   3. Walk `prev` — any message whose key is not in `curr` is a REMOVE.
- *
- * This is sufficient for 99% of real agent patterns where the context
- * array only ever has messages appended (never reordered mid-stream).
- * For adversarial reordering, swap to Myers diff.
- *
- * @example
- * const diff = computeMessageDiff(step1Messages, step2Messages);
- * // { operations: [{ op: "add", index: 3, message: {...} }], tokenDelta: 42, added: 1, removed: 0 }
- */
-export function computeMessageDiff(
-  prev: readonly ChatMessage[],
-  curr: readonly ChatMessage[]
-): MessageDiff {
-  const prevKeys = new Set(prev.map(messageKey));
-  const currKeys = new Set(curr.map(messageKey));
-  const operations: MessageDiff["operations"] = [];
-  // Detect additions — messages in curr that weren't in prev
-  curr.forEach((message, index) => {
-    if (!prevKeys.has(messageKey(message))) {
-      operations.push({ op: "add", index, message });
-    }
-  });
-  // Detect removals — messages in prev that aren't in curr
-  prev.forEach((message, index) => {
-    if (!currKeys.has(messageKey(message))) {
-      operations.push({ op: "remove", index });
-    }
-  });
-  const tokenDelta =
-    estimateTokens(curr) - estimateTokens(prev);
-  return {
-    operations,
-    tokenDelta,
-    added:   operations.filter((o) => o.op === "add").length,
-    removed: operations.filter((o) => o.op === "remove").length,
-  };
-}
-// ── Reconstruction (used by the frontend to replay diffs) ─────────────────────
-/**
- * Applies a stored diff forward onto a base message array.
- * The frontend calls this to reconstruct the full message array for step N:
- *
- *   const step1 = fullSnapshot;           // stored in DB for step 1
- *   const step2 = applyDiff(step1, diff); // reconstructed from diff
- *   const step3 = applyDiff(step2, diff); // and so on...
- *
- * @throws {Error} if the diff references an out-of-bounds index.
- */
-export function applyDiff(
-  base: readonly ChatMessage[],
-  diff: MessageDiff
-): ChatMessage[] {
-  const result = [...base];
-  // Process removes first (high-index first to avoid index shifting)
-  const removes = diff.operations
-    .filter((o): o is { op: "remove"; index: number } => o.op === "remove")
-    .sort((a, b) => b.index - a.index);
-  for (const op of removes) {
-    if (op.index >= result.length) {
-      throw new Error(
-        `[PromptTracer] applyDiff: remove index ${op.index} out of bounds (len=${result.length})`
-      );
-    }
-    result.splice(op.index, 1);
-  }
-  // Process adds (low-index first to preserve insertion order)
-  const adds = diff.operations
-    .filter(
-      (o): o is { op: "add"; index: number; message: ChatMessage } =>
-        o.op === "add"
-    )
-    .sort((a, b) => a.index - b.index);
-  for (const op of adds) {
-    result.splice(op.index, 0, op.message);
-  }
-  return result;
-}
-/**
- * Replays an ordered series of diffs from a base snapshot.
- * Use this when you need to reconstruct every step in a session at once.
- *
- * @example
- * const steps = replayDiffs(step1Snapshot, [diff2, diff3, diff4]);
- * // steps[0] === step1, steps[1] === step2, steps[2] === step3, steps[3] === step4
- */
-export function replayDiffs(
-  baseSnapshot: readonly ChatMessage[],
-  diffs: MessageDiff[]
-): ChatMessage[][] {
-  const results: ChatMessage[][] = [Array.from(baseSnapshot)];
-  for (const diff of diffs) {
-    const prev = results[results.length - 1];
-    results.push(applyDiff(prev, diff));
-  }
-  return results;
-}

package/src/index.ts DELETED Viewed

@@ -1,24 +0,0 @@
-// ─────────────────────────────────────────────────────────────────────────────
-// packages/sdk/src/index.ts
-// Public surface of the @prompt-tracer/sdk package.
-// ─────────────────────────────────────────────────────────────────────────────
-// Core
-export { Tracer }          from "./core/tracer";
-export { Dispatcher }      from "./core/dispatcher";
-// Wrappers
-export { wrapOpenAI }      from "./wrappers/openai";
-// Utilities
-export { calcCostUsd, formatCostUsd } from "./utils/cost";
-// Types — consumers can import these without `import type` gymnastics
-export type {
-  ChatMessage,
-  RawCapturePayload,
-  TracePayload,
-  TracerOptions,
-  IDispatcher,
-} from "./core/types";
-export type { DispatcherOptions } from "./core/dispatcher";

package/src/utils/cost.ts DELETED Viewed

@@ -1,104 +0,0 @@
-// ─────────────────────────────────────────────────────────────────────────────
-// packages/sdk/src/utils/cost.ts
-//
-// Calculates estimated USD cost for a single LLM call.
-// Prices are per 1 million tokens (as published by each provider).
-// Update MODEL_PRICES when providers change pricing.
-// ─────────────────────────────────────────────────────────────────────────────
-interface ModelPrice {
-  /** USD per 1M input tokens  */
-  inputPer1M:  number;
-  /** USD per 1M output tokens */
-  outputPer1M: number;
-}
-/**
- * Pricing table keyed by model string.
- * Non-exact names match the FIRST key (in insertion order) they start with, so
- * "gpt-4o-mini-2024-07-18" resolves to "gpt-4o", not "gpt-4o-mini" — NOTE(review): likely a bug.
- */
-const MODEL_PRICES: Record<string, ModelPrice> = {
-  // ── OpenAI ──────────────────────────────────────────────────────────────
-  "gpt-4o":                   { inputPer1M:  2.50, outputPer1M: 10.00 },
-  "gpt-4o-mini":              { inputPer1M:  0.15, outputPer1M:  0.60 },
-  "gpt-4-turbo":              { inputPer1M: 10.00, outputPer1M: 30.00 },
-  "gpt-4":                    { inputPer1M: 30.00, outputPer1M: 60.00 },
-  "gpt-3.5-turbo":            { inputPer1M:  0.50, outputPer1M:  1.50 },
-  "o1":                       { inputPer1M: 15.00, outputPer1M: 60.00 },
-  "o1-mini":                  { inputPer1M:  3.00, outputPer1M: 12.00 },
-  "o3-mini":                  { inputPer1M:  1.10, outputPer1M:  4.40 },
-  // ── Anthropic ───────────────────────────────────────────────────────────
-  "claude-opus-4":            { inputPer1M: 15.00, outputPer1M: 75.00 },
-  "claude-sonnet-4":          { inputPer1M:  3.00, outputPer1M: 15.00 },
-  "claude-haiku-4":           { inputPer1M:  0.80, outputPer1M:  4.00 },
-  "claude-3-5-sonnet":        { inputPer1M:  3.00, outputPer1M: 15.00 },
-  "claude-3-5-haiku":         { inputPer1M:  0.80, outputPer1M:  4.00 },
-  "claude-3-opus":            { inputPer1M: 15.00, outputPer1M: 75.00 },
-  // ── Google ──────────────────────────────────────────────────────────────
-  "gemini-1.5-pro":           { inputPer1M:  3.50, outputPer1M: 10.50 },
-  "gemini-1.5-flash":         { inputPer1M:  0.35, outputPer1M:  1.05 },
-  "gemini-2.0-flash":         { inputPer1M:  0.10, outputPer1M:  0.40 },
-};
-/** Fallback when the model string is unrecognised. */
-const UNKNOWN_PRICE: ModelPrice = { inputPer1M: 0, outputPer1M: 0 };
-// ── Helpers ───────────────────────────────────────────────────────────────────
-/**
- * Resolves a model string to its price entry.
- * Tries exact match first, then prefix match (handles dated model variants).
- */
-function resolvePrice(model: string): ModelPrice {
-  const normalised = model.toLowerCase().trim();
-  // 1. Exact match
-  if (normalised in MODEL_PRICES) return MODEL_PRICES[normalised];
-  // 2. Prefix match — e.g. "gpt-4o-2024-11-20" → "gpt-4o"
-  for (const key of Object.keys(MODEL_PRICES)) {
-    if (normalised.startsWith(key)) return MODEL_PRICES[key];
-  }
-  return UNKNOWN_PRICE;
-}
-// ── Public API ────────────────────────────────────────────────────────────────
-export interface CalcCostParams {
-  model:     string;
-  tokensIn:  number;
-  tokensOut: number;
-}
-/**
- * Returns the estimated USD cost for a single LLM call.
- * Returns 0 for unrecognised models rather than throwing, so the SDK
- * never crashes user code due to a missing pricing entry.
- *
- * @example
- * calcCostUsd({ model: "gpt-4o", tokensIn: 1000, tokensOut: 500 })
- * // → 0.00750
- */
-export function calcCostUsd({ model, tokensIn, tokensOut }: CalcCostParams): number {
-  const price = resolvePrice(model);
-  const inputCost  = (tokensIn  / 1_000_000) * price.inputPer1M;
-  const outputCost = (tokensOut / 1_000_000) * price.outputPer1M;
-  // Round to 8 decimal places to avoid floating-point noise in the DB.
-  return Math.round((inputCost + outputCost) * 1e8) / 1e8;
-}
-/**
- * Formats a USD cost as a human-readable string.
- * @example formatCostUsd(0.0075) → "$0.0075"
- * @example formatCostUsd(0.00000120) → "$0.0000012"
- */
-export function formatCostUsd(usd: number): string {
-  if (usd === 0) return "$0.00";
-  if (usd < 0.0001) return `$${usd.toFixed(8).replace(/0+$/, "")}`;
-  if (usd < 0.01)   return `$${usd.toFixed(6).replace(/0+$/, "")}`;
-  return `$${usd.toFixed(4)}`;
-}

package/src/wrappers/openai.ts DELETED Viewed

@@ -1,193 +0,0 @@
-// ─────────────────────────────────────────────────────────────────────────────
-// packages/sdk/src/wrappers/openai.ts
-//
-// Wraps an OpenAI client instance in a deeply nested Proxy that intercepts
-// `chat.completions.create`, captures telemetry, and fires it non-blocking.
-//
-// Key guarantees:
-//   1. The original OpenAI types are 100% preserved — callers see no diffs.
-//   2. Streaming responses (`stream: true`) are fully supported via an async
-//      generator that transparently yields every chunk unchanged.
-//   3. Telemetry is fired via the microtask queue — zero latency added.
-//   4. Nothing is monkey-patched; the original client is never mutated.
-// ─────────────────────────────────────────────────────────────────────────────
-import OpenAI from "openai";
-import type {
-  ChatCompletionCreateParamsNonStreaming,
-  ChatCompletionCreateParamsStreaming,
-  ChatCompletion,
-} from "openai/resources/chat/completions";
-import type { Stream } from "openai/streaming";
-import type { ChatCompletionChunk } from "openai/resources";
-import type { Tracer } from "../core/tracer";
-import type { ChatMessage } from "../core/types";
-// ── Type helpers ──────────────────────────────────────────────────────────────
-type CreateParams = // argument accepted by the intercepted `create`: either request variant
-  | ChatCompletionCreateParamsNonStreaming
-  | ChatCompletionCreateParamsStreaming; // the interceptor takes its streaming path when `params.stream === true`
-// ── Main export ───────────────────────────────────────────────────────────────
-/**
- * Builds a telemetry-capturing stand-in for an OpenAI client.
- *
- * Three nested Proxies follow the path `client.chat.completions.create`.
- * Only `create` is replaced (by the function `_makeCreateInterceptor`
- * returns); every other property at every level is forwarded untouched via
- * `Reflect.get`, and the wrapped client itself is never modified. The inner
- * proxies are rebuilt on each property access.
- *
- * @param client  The original `new OpenAI(...)` instance.
- * @param tracer  Tracer handed to the `create` interceptor.
- * @returns       A Proxy of the client, typed as `OpenAI`.
- *
- * @example
- * import OpenAI from "openai";
- * import { Tracer, wrapOpenAI } from "0xtrace";
- *
- * const openai = new OpenAI({ apiKey: process.env.OPENAI_API_KEY });
- * const tracer = new Tracer({ ingestUrl: "https://your-app.com/api/ingest" });
- * const ai     = wrapOpenAI(openai, tracer);
- *
- * const res = await ai.chat.completions.create({ model: "gpt-4o", messages });
- */
-export function wrapOpenAI(client: OpenAI, tracer: Tracer): OpenAI {
-  // Innermost layer: `.chat.completions` — swaps `create` for the interceptor.
-  const proxyCompletions = (completions: OpenAI["chat"]["completions"]) =>
-    new Proxy(completions, {
-      get(compTarget, compProp, compReceiver) {
-        return compProp === "create"
-          ? _makeCreateInterceptor(compTarget, tracer)
-          : Reflect.get(compTarget, compProp, compReceiver); // e.g. .stream() passes through
-      },
-    });
-  // Middle layer: `.chat` — only `.completions` is redirected.
-  const proxyChat = (chat: OpenAI["chat"]) =>
-    new Proxy(chat, {
-      get(chatTarget, chatProp, chatReceiver) {
-        return chatProp === "completions"
-          ? proxyCompletions(chatTarget.completions)
-          : Reflect.get(chatTarget, chatProp, chatReceiver);
-      },
-    });
-  // Outer layer: the client — only `.chat` is redirected; embeddings, images,
-  // etc. are read straight from the original client.
-  return new Proxy(client, {
-    get(target, prop, receiver) {
-      return prop === "chat"
-        ? proxyChat(target.chat)
-        : Reflect.get(target, prop, receiver);
-    },
-  });
-}
-// ── Interceptor factory ───────────────────────────────────────────────────────
-/**
- * Returns the replacement `create` function that wraps the original.
- * Extracted so the Proxy `get` handler stays readable.
- *
- * The replacement forwards both arguments of the SDK's `create` — the request
- * body and the optional per-request options — so callers that pass options
- * as the second argument keep their behaviour.
- *
- * - Streaming requests (`params.stream === true`): the SDK stream is awaited
- *   and handed to `_wrapStream`, which reports telemetry once iteration ends.
- * - All other requests: the completion is awaited, telemetry is reported via
- *   `tracer.captureAsync`, and the completion is returned unchanged.
- *
- * If the underlying call rejects, the rejection propagates to the caller and
- * no telemetry is reported for that call.
- *
- * @param compTarget  The original `client.chat.completions` resource.
- * @param tracer      Tracer that receives the captured call data.
- * @returns           An async function with the same overloads as `create`.
- */
-function _makeCreateInterceptor(
-  compTarget: OpenAI["chat"]["completions"],
-  tracer: Tracer
-) {
-  // Type of the SDK's optional second argument, derived from the SDK's own
-  // signature so no additional import is required.
-  type RequestOpts = Parameters<OpenAI["chat"]["completions"]["create"]>[1];
-  // Overloaded signature mirrors the OpenAI SDK so TypeScript callers
-  // see the correct return type based on whether `stream` is true.
-  async function create(
-    params: ChatCompletionCreateParamsNonStreaming,
-    options?: RequestOpts
-  ): Promise<ChatCompletion>;
-  async function create(
-    params: ChatCompletionCreateParamsStreaming,
-    options?: RequestOpts
-  ): Promise<Stream<ChatCompletionChunk>>;
-  async function create(params: CreateParams, options?: RequestOpts): Promise<unknown> {
-    const startMs = Date.now();
-    if (params.stream === true) {
-      // ── Streaming path ────────────────────────────────────────────────────
-      // The caller iterates the returned generator with `for await`; each
-      // chunk is passed through by `_wrapStream`.
-      const stream = await (
-        compTarget.create as (
-          p: ChatCompletionCreateParamsStreaming,
-          o?: RequestOpts
-        ) => Promise<Stream<ChatCompletionChunk>>
-      )(params as ChatCompletionCreateParamsStreaming, options);
-      return _wrapStream(stream, params, startMs, tracer);
-    }
-    // ── Non-streaming path ────────────────────────────────────────────────────
-    const result = await (
-      compTarget.create as (
-        p: ChatCompletionCreateParamsNonStreaming,
-        o?: RequestOpts
-      ) => Promise<ChatCompletion>
-    )(params as ChatCompletionCreateParamsNonStreaming, options);
-    const latencyMs = Date.now() - startMs;
-    // Hand the captured call to the tracer; the result is returned right after.
-    tracer.captureAsync({
-      prompt:    params.messages as ChatMessage[],
-      response:  result.choices[0]?.message?.content ?? "",
-      model:     params.model,
-      tokensIn:  result.usage?.prompt_tokens,
-      tokensOut: result.usage?.completion_tokens,
-      latencyMs,
-      isStream:  false,
-    });
-    return result;
-  }
-  return create;
-}
-// ── Stream wrapper ────────────────────────────────────────────────────────────
-/**
- * Wraps an OpenAI streaming response in an async generator that:
- *   1. Yields every chunk to the caller unchanged.
- *   2. Reconstructs the full text and counts chunks.
- *   3. Reports telemetry once iteration ends — after the last chunk, when the
- *      caller stops early, or when the stream throws.
- *
- * Token accounting: when the stream carries usage data (sent by the API when
- * `stream_options: { include_usage: true }` is set), the reported
- * `prompt_tokens` and `completion_tokens` are used. Without it, `tokensIn` is
- * left undefined and `tokensOut` falls back to the number of chunks received.
- *
- * @param stream   The stream returned by the original `create` call.
- * @param params   The request parameters, used for the prompt and model name.
- * @param startMs  `Date.now()` timestamp taken before the request was sent.
- * @param tracer   Tracer that receives the captured call data.
- * @returns        An async generator yielding the original chunks.
- */
-async function* _wrapStream(
-  stream: Stream<ChatCompletionChunk>,
-  params: CreateParams,
-  startMs: number,
-  tracer: Tracer
-): AsyncGenerator<ChatCompletionChunk> {
-  let fullContent = "";
-  let chunkCount  = 0;
-  let promptTokens: number | undefined;
-  let completionTokens: number | undefined;
-  try {
-    for await (const chunk of stream) {
-      // Usage is only present when `include_usage` was requested; it arrives
-      // on the closing chunk of the stream, so keep whatever is seen last.
-      if (chunk.usage?.prompt_tokens !== undefined) {
-        promptTokens = chunk.usage.prompt_tokens;
-      }
-      if (chunk.usage?.completion_tokens !== undefined) {
-        completionTokens = chunk.usage.completion_tokens;
-      }
-      const delta = chunk.choices[0]?.delta?.content ?? "";
-      fullContent += delta;
-      chunkCount  += 1;
-      yield chunk; // ← caller gets every chunk unmodified
-    }
-  } finally {
-    // `finally` runs whether the caller broke out early or read everything.
-    const latencyMs = Date.now() - startMs;
-    tracer.captureAsync({
-      prompt:    params.messages as ChatMessage[],
-      response:  fullContent,
-      model:     params.model,
-      tokensIn:  promptTokens,                   // exact if include_usage was set
-      tokensOut: completionTokens ?? chunkCount, // exact if reported; else 1 chunk ≈ 1 token
-      latencyMs,
-      isStream:  true,
-    });
-  }
-}

package/tsup.config.ts DELETED Viewed

@@ -1,7 +0,0 @@
-import { defineConfig } from 'tsup';
-export default defineConfig({
-  entry: ['src/index.ts'], // single entry point of the bundle
-  format: ['cjs', 'esm'], // build both a CommonJS and an ES module output
-  dts: false, // type declaration (.d.ts) generation is switched off
-  clean: true, // NOTE(review): per tsup docs this empties the output directory before each build — confirm
-});