npm - langwatch - Versions diffs - 0.1.1 → 0.1.4 - Mend

langwatch 0.1.1 → 0.1.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (32) hide show

package/copy-types.sh +17 -0
package/dist/{chunk-OVS4NSDE.mjs → chunk-2I4YLOQY.mjs} +184 -115
package/dist/chunk-2I4YLOQY.mjs.map +1 -0
package/dist/index.d.mts +344 -4
package/dist/index.d.ts +344 -4
package/dist/index.js +1429 -1121
package/dist/index.js.map +1 -1
package/dist/index.mjs +264 -26
package/dist/index.mjs.map +1 -1
package/dist/{utils-K-jSEpnZ.d.mts → utils-CFtM8VVg.d.mts} +107 -31
package/dist/{utils-K-jSEpnZ.d.ts → utils-CFtM8VVg.d.ts} +107 -31
package/dist/utils.d.mts +1 -2
package/dist/utils.d.ts +1 -2
package/dist/utils.js +181 -114
package/dist/utils.js.map +1 -1
package/dist/utils.mjs +1 -1
package/example/app/guardrails/page.tsx +26 -0
package/example/components/header.tsx +4 -0
package/example/lib/chat/guardrails.tsx +181 -0
package/example/lib/chat/langchain-rag.tsx +1 -1
package/example/lib/chat/langchain.tsx +1 -1
package/example/lib/chat/vercel-ai.tsx +1 -1
package/example/package-lock.json +4 -3
package/package.json +3 -4
package/src/evaluations.ts +219 -0
package/src/index.test.ts +40 -2
package/src/index.ts +182 -8
package/src/typeUtils.ts +28 -3
package/src/types.ts +6 -2
package/src/utils.ts +4 -8
package/ts-to-zod.config.js +4 -0
package/dist/chunk-OVS4NSDE.mjs.map +0 -1

package/dist/{utils-K-jSEpnZ.d.mts → utils-CFtM8VVg.d.mts} RENAMED Viewed

@@ -1,5 +1,4 @@
 import { CoreMessage } from 'ai';
-import modelPrices from 'llm-cost/model_prices_and_context_window.json';
 type ChatRole = "system" | "user" | "assistant" | "function" | "tool" | "unknown";
 interface FunctionCall {
@@ -17,6 +16,7 @@ interface ChatMessage$1 {
     function_call?: FunctionCall | null;
     tool_calls?: ToolCall[] | null;
     tool_call_id?: string | null;
+    name?: string | null;
 }
 type ChatRichContent$1 = {
     type: "text";
@@ -49,18 +49,23 @@ type Money = {
     currency: string;
     amount: number;
 };
-interface GuardrailResult {
+interface EvaluationResult {
     status: "processed" | "skipped" | "error";
-    passed: boolean;
+    passed?: boolean | null;
     score?: number | null;
+    label?: string | null;
     details?: string | null;
     cost?: Money | null;
 }
 interface TypedValueGuardrailResult {
     type: "guardrail_result";
-    value: GuardrailResult;
+    value: EvaluationResult;
+}
+interface TypedValueEvaluationResult {
+    type: "evaluation_result";
+    value: EvaluationResult;
 }
-type SpanInputOutput$1 = TypedValueText | TypedValueChatMessages | TypedValueGuardrailResult | TypedValueJson | TypedValueRaw | {
+type SpanInputOutput$1 = TypedValueText | TypedValueChatMessages | TypedValueGuardrailResult | TypedValueEvaluationResult | TypedValueJson | TypedValueRaw | {
     type: "list";
     value: SpanInputOutput$1[];
 };
@@ -75,19 +80,32 @@ interface SpanMetrics {
     tokens_estimated?: boolean | null;
     cost?: number | null;
 }
-interface SpanParams {
-    temperature?: number;
-    stream?: boolean;
-    functions?: Record<string, any>[];
-    tools?: Record<string, any>[];
-    tool_choice?: string;
-}
+type ReservedSpanParams = {
+    frequency_penalty?: number | null;
+    logit_bias?: Record<string, number> | null;
+    logprobs?: boolean | null;
+    top_logprobs?: number | null;
+    max_tokens?: number | null;
+    n?: number | null;
+    presence_penalty?: number | null;
+    seed?: number | null;
+    stop?: string | string[] | null;
+    stream?: boolean | null;
+    temperature?: number | null;
+    top_p?: number | null;
+    tools?: Record<string, any>[] | null;
+    tool_choice?: Record<string, any> | string | null;
+    parallel_tool_calls?: boolean | null;
+    functions?: Record<string, any>[] | null;
+    user?: string | null;
+};
+type SpanParams = ReservedSpanParams & Record<string, any>;
 interface SpanTimestamps {
     started_at: number;
     first_token_at?: number | null;
     finished_at: number;
 }
-type SpanTypes = "span" | "llm" | "chain" | "tool" | "agent" | "rag" | "guardrail" | "unknown";
+type SpanTypes = "span" | "llm" | "chain" | "tool" | "agent" | "rag" | "guardrail" | "evaluation" | "workflow" | "component" | "server" | "client" | "producer" | "consumer" | "task" | "unknown";
 interface BaseSpan$1 {
     span_id: string;
     parent_id?: string | null;
@@ -99,12 +117,12 @@ interface BaseSpan$1 {
     error?: ErrorCapture | null;
     timestamps: SpanTimestamps;
     metrics?: SpanMetrics | null;
+    params?: SpanParams | null;
 }
 interface LLMSpan$1 extends BaseSpan$1 {
     type: "llm";
     vendor?: string | null;
-    model?: string;
-    params?: SpanParams;
+    model?: string | null;
 }
 interface RAGChunk {
     document_id?: string | null;
@@ -131,25 +149,35 @@ type TraceOutput = {
         embeddings: number[];
     };
 };
+type PrimitiveType = string | number | boolean | null | undefined;
+type ReservedTraceMetadata = {
+    thread_id?: string | null;
+    user_id?: string | null;
+    customer_id?: string | null;
+    labels?: string[] | null;
+    topic_id?: string | null;
+    subtopic_id?: string | null;
+    sdk_version?: string | null;
+    sdk_language?: string | null;
+};
+type CustomMetadata = Record<string, PrimitiveType | PrimitiveType[] | Record<string, PrimitiveType> | Record<string, Record<string, PrimitiveType>>>;
+type TraceMetadata = ReservedTraceMetadata & CustomMetadata;
 type Trace = {
     trace_id: string;
     project_id: string;
-    metadata: {
-        thread_id?: string;
-        user_id?: string;
-        customer_id?: string;
-        labels?: string[];
-        topic_id?: string;
-        subtopic_id?: string;
-    };
+    metadata: TraceMetadata;
     timestamps: {
         started_at: number;
         inserted_at: number;
         updated_at: number;
     };
-    input: TraceInput;
+    input?: TraceInput;
     output?: TraceOutput;
-    metrics: {
+    contexts?: RAGChunk[];
+    expected_output?: {
+        value: string;
+    };
+    metrics?: {
         first_token_ms?: number | null;
         total_time_ms?: number | null;
         prompt_tokens?: number | null;
@@ -159,10 +187,39 @@ type Trace = {
     };
     error?: ErrorCapture | null;
     indexing_md5s?: string[];
+    events?: Event[];
+    evaluations?: Evaluation[];
 };
-type Experiment = {
-    experiment_id: string;
-    variant: number;
+type EvaluationStatus = "scheduled" | "in_progress" | "error" | "skipped" | "processed";
+type Evaluation = {
+    evaluation_id: string;
+    evaluator_id: string;
+    span_id?: string | null;
+    name: string;
+    type?: string | null;
+    is_guardrail?: boolean | null;
+    status: EvaluationStatus;
+    passed?: boolean | null;
+    score?: number | null;
+    label?: string | null;
+    details?: string | null;
+    error?: ErrorCapture | null;
+    retries?: number | null;
+    timestamps: {
+        inserted_at?: number | null;
+        started_at?: number | null;
+        finished_at?: number | null;
+        updated_at?: number | null;
+    };
+};
+type RESTEvaluation$1 = Omit<Evaluation, "evaluation_id" | "evaluator_id" | "status" | "timestamps" | "retries"> & {
+    evaluation_id?: string | null;
+    evaluator_id?: string | null;
+    status?: "processed" | "skipped" | "error" | null;
+    timestamps?: {
+        started_at?: number | null;
+        finished_at?: number | null;
+    } | null;
 };
 type CollectorRESTParams = {
     trace_id?: string | null | undefined;
@@ -172,7 +229,23 @@ type CollectorRESTParams = {
         thread_id?: string | null | undefined;
         customer_id?: string | null | undefined;
         labels?: string[] | null | undefined;
-        experiments?: Experiment[] | null | undefined;
+        sdk_version?: string | null | undefined;
+        sdk_language?: string | null | undefined;
+    } & CustomMetadata;
+    expected_output?: string | null;
+    evaluations?: RESTEvaluation$1[];
+};
+type Event = {
+    event_id: string;
+    event_type: string;
+    project_id: string;
+    metrics: Record<string, number>;
+    event_details: Record<string, string>;
+    trace_id: string;
+    timestamps: {
+        started_at: number;
+        inserted_at: number;
+        updated_at: number;
     };
 };
@@ -202,14 +275,17 @@ type PendingSpan<T extends BaseSpan> = Omit<T, "traceId" | "timestamps"> & {
 type BaseSpan = ConvertServerSpan<BaseSpan$1>;
 type PendingBaseSpan = PendingSpan<BaseSpan>;
 type LLMSpan = ConvertServerSpan<Omit<LLMSpan$1, "vendor" | "model">> & {
-    model: keyof typeof modelPrices | (string & NonNullable<unknown>);
+    model: string;
 };
 type PendingLLMSpan = PendingSpan<LLMSpan>;
 type RAGSpan = ConvertServerSpan<RAGSpan$1>;
 type PendingRAGSpan = PendingSpan<RAGSpan>;
+type RESTEvaluation = SnakeToCamelCaseNested<Omit<RESTEvaluation$1, "error">> & {
+    error?: RESTEvaluation$1["error"];
+};
 declare function convertFromVercelAIMessages(messages: CoreMessage[]): ChatMessage[];
 declare const captureError: (error: unknown) => ErrorCapture;
 declare const autoconvertTypedValues: (value: unknown) => SpanInputOutput;
-export { type BaseSpan as B, type CollectorRESTParams as C, type LLMSpan as L, type Metadata as M, type PendingBaseSpan as P, type RAGSpan as R, type Span as S, type PendingLLMSpan as a, type PendingRAGSpan as b, type SpanTypes as c, type ChatMessage as d, type ChatRichContent as e, type SpanInputOutput as f, convertFromVercelAIMessages as g, captureError as h, autoconvertTypedValues as i };
+export { type BaseSpan as B, type CollectorRESTParams as C, type LLMSpan as L, type Metadata as M, type PendingBaseSpan as P, type RAGChunk as R, type Span as S, type RESTEvaluation as a, type PendingLLMSpan as b, type PendingRAGSpan as c, type SpanTypes as d, type ChatMessage as e, type ChatRichContent as f, type RAGSpan as g, type SpanInputOutput as h, autoconvertTypedValues as i, captureError as j, convertFromVercelAIMessages as k };

package/dist/{utils-K-jSEpnZ.d.ts → utils-CFtM8VVg.d.ts} RENAMED Viewed

@@ -1,5 +1,4 @@
 import { CoreMessage } from 'ai';
-import modelPrices from 'llm-cost/model_prices_and_context_window.json';
 type ChatRole = "system" | "user" | "assistant" | "function" | "tool" | "unknown";
 interface FunctionCall {
@@ -17,6 +16,7 @@ interface ChatMessage$1 {
     function_call?: FunctionCall | null;
     tool_calls?: ToolCall[] | null;
     tool_call_id?: string | null;
+    name?: string | null;
 }
 type ChatRichContent$1 = {
     type: "text";
@@ -49,18 +49,23 @@ type Money = {
     currency: string;
     amount: number;
 };
-interface GuardrailResult {
+interface EvaluationResult {
     status: "processed" | "skipped" | "error";
-    passed: boolean;
+    passed?: boolean | null;
     score?: number | null;
+    label?: string | null;
     details?: string | null;
     cost?: Money | null;
 }
 interface TypedValueGuardrailResult {
     type: "guardrail_result";
-    value: GuardrailResult;
+    value: EvaluationResult;
+}
+interface TypedValueEvaluationResult {
+    type: "evaluation_result";
+    value: EvaluationResult;
 }
-type SpanInputOutput$1 = TypedValueText | TypedValueChatMessages | TypedValueGuardrailResult | TypedValueJson | TypedValueRaw | {
+type SpanInputOutput$1 = TypedValueText | TypedValueChatMessages | TypedValueGuardrailResult | TypedValueEvaluationResult | TypedValueJson | TypedValueRaw | {
     type: "list";
     value: SpanInputOutput$1[];
 };
@@ -75,19 +80,32 @@ interface SpanMetrics {
     tokens_estimated?: boolean | null;
     cost?: number | null;
 }
-interface SpanParams {
-    temperature?: number;
-    stream?: boolean;
-    functions?: Record<string, any>[];
-    tools?: Record<string, any>[];
-    tool_choice?: string;
-}
+type ReservedSpanParams = {
+    frequency_penalty?: number | null;
+    logit_bias?: Record<string, number> | null;
+    logprobs?: boolean | null;
+    top_logprobs?: number | null;
+    max_tokens?: number | null;
+    n?: number | null;
+    presence_penalty?: number | null;
+    seed?: number | null;
+    stop?: string | string[] | null;
+    stream?: boolean | null;
+    temperature?: number | null;
+    top_p?: number | null;
+    tools?: Record<string, any>[] | null;
+    tool_choice?: Record<string, any> | string | null;
+    parallel_tool_calls?: boolean | null;
+    functions?: Record<string, any>[] | null;
+    user?: string | null;
+};
+type SpanParams = ReservedSpanParams & Record<string, any>;
 interface SpanTimestamps {
     started_at: number;
     first_token_at?: number | null;
     finished_at: number;
 }
-type SpanTypes = "span" | "llm" | "chain" | "tool" | "agent" | "rag" | "guardrail" | "unknown";
+type SpanTypes = "span" | "llm" | "chain" | "tool" | "agent" | "rag" | "guardrail" | "evaluation" | "workflow" | "component" | "server" | "client" | "producer" | "consumer" | "task" | "unknown";
 interface BaseSpan$1 {
     span_id: string;
     parent_id?: string | null;
@@ -99,12 +117,12 @@ interface BaseSpan$1 {
     error?: ErrorCapture | null;
     timestamps: SpanTimestamps;
     metrics?: SpanMetrics | null;
+    params?: SpanParams | null;
 }
 interface LLMSpan$1 extends BaseSpan$1 {
     type: "llm";
     vendor?: string | null;
-    model?: string;
-    params?: SpanParams;
+    model?: string | null;
 }
 interface RAGChunk {
     document_id?: string | null;
@@ -131,25 +149,35 @@ type TraceOutput = {
         embeddings: number[];
     };
 };
+type PrimitiveType = string | number | boolean | null | undefined;
+type ReservedTraceMetadata = {
+    thread_id?: string | null;
+    user_id?: string | null;
+    customer_id?: string | null;
+    labels?: string[] | null;
+    topic_id?: string | null;
+    subtopic_id?: string | null;
+    sdk_version?: string | null;
+    sdk_language?: string | null;
+};
+type CustomMetadata = Record<string, PrimitiveType | PrimitiveType[] | Record<string, PrimitiveType> | Record<string, Record<string, PrimitiveType>>>;
+type TraceMetadata = ReservedTraceMetadata & CustomMetadata;
 type Trace = {
     trace_id: string;
     project_id: string;
-    metadata: {
-        thread_id?: string;
-        user_id?: string;
-        customer_id?: string;
-        labels?: string[];
-        topic_id?: string;
-        subtopic_id?: string;
-    };
+    metadata: TraceMetadata;
     timestamps: {
         started_at: number;
         inserted_at: number;
         updated_at: number;
     };
-    input: TraceInput;
+    input?: TraceInput;
     output?: TraceOutput;
-    metrics: {
+    contexts?: RAGChunk[];
+    expected_output?: {
+        value: string;
+    };
+    metrics?: {
         first_token_ms?: number | null;
         total_time_ms?: number | null;
         prompt_tokens?: number | null;
@@ -159,10 +187,39 @@ type Trace = {
     };
     error?: ErrorCapture | null;
     indexing_md5s?: string[];
+    events?: Event[];
+    evaluations?: Evaluation[];
 };
-type Experiment = {
-    experiment_id: string;
-    variant: number;
+type EvaluationStatus = "scheduled" | "in_progress" | "error" | "skipped" | "processed";
+type Evaluation = {
+    evaluation_id: string;
+    evaluator_id: string;
+    span_id?: string | null;
+    name: string;
+    type?: string | null;
+    is_guardrail?: boolean | null;
+    status: EvaluationStatus;
+    passed?: boolean | null;
+    score?: number | null;
+    label?: string | null;
+    details?: string | null;
+    error?: ErrorCapture | null;
+    retries?: number | null;
+    timestamps: {
+        inserted_at?: number | null;
+        started_at?: number | null;
+        finished_at?: number | null;
+        updated_at?: number | null;
+    };
+};
+type RESTEvaluation$1 = Omit<Evaluation, "evaluation_id" | "evaluator_id" | "status" | "timestamps" | "retries"> & {
+    evaluation_id?: string | null;
+    evaluator_id?: string | null;
+    status?: "processed" | "skipped" | "error" | null;
+    timestamps?: {
+        started_at?: number | null;
+        finished_at?: number | null;
+    } | null;
 };
 type CollectorRESTParams = {
     trace_id?: string | null | undefined;
@@ -172,7 +229,23 @@ type CollectorRESTParams = {
         thread_id?: string | null | undefined;
         customer_id?: string | null | undefined;
         labels?: string[] | null | undefined;
-        experiments?: Experiment[] | null | undefined;
+        sdk_version?: string | null | undefined;
+        sdk_language?: string | null | undefined;
+    } & CustomMetadata;
+    expected_output?: string | null;
+    evaluations?: RESTEvaluation$1[];
+};
+type Event = {
+    event_id: string;
+    event_type: string;
+    project_id: string;
+    metrics: Record<string, number>;
+    event_details: Record<string, string>;
+    trace_id: string;
+    timestamps: {
+        started_at: number;
+        inserted_at: number;
+        updated_at: number;
     };
 };
@@ -202,14 +275,17 @@ type PendingSpan<T extends BaseSpan> = Omit<T, "traceId" | "timestamps"> & {
 type BaseSpan = ConvertServerSpan<BaseSpan$1>;
 type PendingBaseSpan = PendingSpan<BaseSpan>;
 type LLMSpan = ConvertServerSpan<Omit<LLMSpan$1, "vendor" | "model">> & {
-    model: keyof typeof modelPrices | (string & NonNullable<unknown>);
+    model: string;
 };
 type PendingLLMSpan = PendingSpan<LLMSpan>;
 type RAGSpan = ConvertServerSpan<RAGSpan$1>;
 type PendingRAGSpan = PendingSpan<RAGSpan>;
+type RESTEvaluation = SnakeToCamelCaseNested<Omit<RESTEvaluation$1, "error">> & {
+    error?: RESTEvaluation$1["error"];
+};
 declare function convertFromVercelAIMessages(messages: CoreMessage[]): ChatMessage[];
 declare const captureError: (error: unknown) => ErrorCapture;
 declare const autoconvertTypedValues: (value: unknown) => SpanInputOutput;
-export { type BaseSpan as B, type CollectorRESTParams as C, type LLMSpan as L, type Metadata as M, type PendingBaseSpan as P, type RAGSpan as R, type Span as S, type PendingLLMSpan as a, type PendingRAGSpan as b, type SpanTypes as c, type ChatMessage as d, type ChatRichContent as e, type SpanInputOutput as f, convertFromVercelAIMessages as g, captureError as h, autoconvertTypedValues as i };
+export { type BaseSpan as B, type CollectorRESTParams as C, type LLMSpan as L, type Metadata as M, type PendingBaseSpan as P, type RAGChunk as R, type Span as S, type RESTEvaluation as a, type PendingLLMSpan as b, type PendingRAGSpan as c, type SpanTypes as d, type ChatMessage as e, type ChatRichContent as f, type RAGSpan as g, type SpanInputOutput as h, autoconvertTypedValues as i, captureError as j, convertFromVercelAIMessages as k };

package/dist/utils.d.mts CHANGED Viewed

@@ -1,3 +1,2 @@
 import 'ai';
-export { i as autoconvertTypedValues, h as captureError, g as convertFromVercelAIMessages } from './utils-K-jSEpnZ.mjs';
-import 'llm-cost/model_prices_and_context_window.json';
+export { i as autoconvertTypedValues, j as captureError, k as convertFromVercelAIMessages } from './utils-CFtM8VVg.mjs';

package/dist/utils.d.ts CHANGED Viewed

@@ -1,3 +1,2 @@
 import 'ai';
-export { i as autoconvertTypedValues, h as captureError, g as convertFromVercelAIMessages } from './utils-K-jSEpnZ.js';
-import 'llm-cost/model_prices_and_context_window.json';
+export { i as autoconvertTypedValues, j as captureError, k as convertFromVercelAIMessages } from './utils-CFtM8VVg.js';