npm - @pauly4010/evalai-sdk - Versions diffs - 1.4.1 → 1.5.5 - Mend

@pauly4010/evalai-sdk 1.4.1 → 1.5.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (95)

package/CHANGELOG.md +85 -0
package/README.md +205 -543
package/dist/assertions.d.ts +2 -2
package/dist/assertions.js +104 -71
package/dist/batch.js +12 -17
package/dist/cache.js +7 -11
package/dist/cli/api.d.ts +108 -0
package/dist/cli/api.js +130 -0
package/dist/cli/check.d.ts +28 -13
package/dist/cli/check.js +249 -142
package/dist/cli/ci-context.d.ts +6 -0
package/dist/cli/ci-context.js +110 -0
package/dist/cli/config.d.ts +30 -0
package/dist/cli/config.js +207 -0
package/dist/cli/constants.d.ts +15 -0
package/dist/cli/constants.js +18 -0
package/dist/cli/doctor.d.ts +11 -0
package/dist/cli/doctor.js +82 -0
package/dist/cli/formatters/github.d.ts +8 -0
package/dist/cli/formatters/github.js +130 -0
package/dist/cli/formatters/human.d.ts +6 -0
package/dist/cli/formatters/human.js +107 -0
package/dist/cli/formatters/json.d.ts +6 -0
package/dist/cli/formatters/json.js +10 -0
package/dist/cli/formatters/pr-comment.d.ts +12 -0
package/dist/cli/formatters/pr-comment.js +101 -0
package/dist/cli/formatters/types.d.ts +100 -0
package/dist/cli/formatters/types.js +5 -0
package/dist/cli/gate.d.ts +21 -0
package/dist/cli/gate.js +175 -0
package/dist/cli/index.d.ts +1 -0
package/dist/cli/index.js +67 -23
package/dist/cli/init.d.ts +7 -0
package/dist/cli/init.js +69 -0
package/dist/cli/policy-packs.d.ts +23 -0
package/dist/cli/policy-packs.js +83 -0
package/dist/cli/profiles.d.ts +28 -0
package/dist/cli/profiles.js +30 -0
package/dist/cli/reason-codes.d.ts +17 -0
package/dist/cli/reason-codes.js +19 -0
package/dist/cli/render/snippet.d.ts +5 -0
package/dist/cli/render/snippet.js +15 -0
package/dist/cli/render/sort.d.ts +10 -0
package/dist/cli/render/sort.js +24 -0
package/dist/cli/report/build-check-report.d.ts +19 -0
package/dist/cli/report/build-check-report.js +124 -0
package/dist/cli/share.d.ts +17 -0
package/dist/cli/share.js +83 -0
package/dist/client.d.ts +2 -2
package/dist/client.js +144 -132
package/dist/context.d.ts +1 -1
package/dist/context.js +4 -6
package/dist/errors.d.ts +2 -0
package/dist/errors.js +116 -107
package/dist/export.d.ts +6 -6
package/dist/export.js +39 -33
package/dist/index.d.ts +25 -24
package/dist/index.js +62 -56
package/dist/integrations/anthropic.d.ts +1 -1
package/dist/integrations/anthropic.js +23 -19
package/dist/integrations/openai-eval.d.ts +57 -0
package/dist/integrations/openai-eval.js +230 -0
package/dist/integrations/openai.d.ts +1 -1
package/dist/integrations/openai.js +23 -19
package/dist/local.d.ts +2 -2
package/dist/local.js +25 -25
package/dist/logger.d.ts +1 -1
package/dist/logger.js +24 -28
package/dist/matchers/index.d.ts +1 -0
package/dist/matchers/index.js +6 -0
package/dist/matchers/to-pass-gate.d.ts +29 -0
package/dist/matchers/to-pass-gate.js +35 -0
package/dist/pagination.d.ts +1 -1
package/dist/pagination.js +6 -6
package/dist/snapshot.js +24 -24
package/dist/streaming.js +11 -11
package/dist/testing.d.ts +6 -2
package/dist/testing.js +30 -12
package/dist/types.d.ts +22 -22
package/dist/types.js +13 -13
package/dist/utils/input-hash.d.ts +8 -0
package/dist/utils/input-hash.js +38 -0
package/dist/version.d.ts +7 -0
package/dist/version.js +10 -0
package/dist/workflows.d.ts +7 -7
package/dist/workflows.js +44 -44
package/package.json +102 -90
package/dist/__tests__/assertions.test.d.ts +0 -1
package/dist/__tests__/assertions.test.js +0 -288
package/dist/__tests__/client.test.d.ts +0 -1
package/dist/__tests__/client.test.js +0 -185
package/dist/__tests__/testing.test.d.ts +0 -1
package/dist/__tests__/testing.test.js +0 -230
package/dist/__tests__/workflows.test.d.ts +0 -1
package/dist/__tests__/workflows.test.js +0 -222

package/dist/types.js CHANGED Viewed

@@ -7,21 +7,21 @@ exports.SDKError = exports.EvaluationTemplates = void 0;
  */
 exports.EvaluationTemplates = {
     // Core Testing
-    UNIT_TESTING: 'unit-testing',
-    OUTPUT_QUALITY: 'output-quality',
+    UNIT_TESTING: "unit-testing",
+    OUTPUT_QUALITY: "output-quality",
     // Advanced Evaluation
-    PROMPT_OPTIMIZATION: 'prompt-optimization',
-    CHAIN_OF_THOUGHT: 'chain-of-thought',
-    LONG_CONTEXT_TESTING: 'long-context-testing',
-    MODEL_STEERING: 'model-steering',
-    REGRESSION_TESTING: 'regression-testing',
-    CONFIDENCE_CALIBRATION: 'confidence-calibration',
+    PROMPT_OPTIMIZATION: "prompt-optimization",
+    CHAIN_OF_THOUGHT: "chain-of-thought",
+    LONG_CONTEXT_TESTING: "long-context-testing",
+    MODEL_STEERING: "model-steering",
+    REGRESSION_TESTING: "regression-testing",
+    CONFIDENCE_CALIBRATION: "confidence-calibration",
     // Safety & Compliance
-    SAFETY_COMPLIANCE: 'safety-compliance',
+    SAFETY_COMPLIANCE: "safety-compliance",
     // Domain-Specific
-    RAG_EVALUATION: 'rag-evaluation',
-    CODE_GENERATION: 'code-generation',
-    SUMMARIZATION: 'summarization',
+    RAG_EVALUATION: "rag-evaluation",
+    CODE_GENERATION: "code-generation",
+    SUMMARIZATION: "summarization",
 };
 /**
  * SDK Error class with additional error details
@@ -45,7 +45,7 @@ exports.EvaluationTemplates = {
 class SDKError extends Error {
     constructor(message, code, statusCode, details) {
         super(message);
-        this.name = 'SDKError';
+        this.name = "SDKError";
         this.code = code;
         this.statusCode = statusCode;
         this.details = details;

package/dist/utils/input-hash.d.ts ADDED Viewed

@@ -0,0 +1,8 @@
+/**
+ * Input normalization and hashing for deterministic matching.
+ * Must match platform's @/lib/utils/input-hash.ts for reportToEvalAI.
+ */
+/** Normalize input for stable matching (whitespace, JSON key order). */
+export declare function normalizeInput(input: string): string;
+/** SHA-256 hash of normalized input. */
+export declare function sha256Input(s: string): string;

package/dist/utils/input-hash.js ADDED Viewed

@@ -0,0 +1,38 @@
+"use strict";
+/**
+ * Input normalization and hashing for deterministic matching.
+ * Must match platform's @/lib/utils/input-hash.ts for reportToEvalAI.
+ */
+var __importDefault = (this && this.__importDefault) || function (mod) {
+    return (mod && mod.__esModule) ? mod : { "default": mod };
+};
+Object.defineProperty(exports, "__esModule", { value: true });
+exports.normalizeInput = normalizeInput;
+exports.sha256Input = sha256Input;
+const node_crypto_1 = __importDefault(require("node:crypto"));
+function sortKeys(obj) {
+    const sorted = {};
+    for (const k of Object.keys(obj).sort()) {
+        const v = obj[k];
+        sorted[k] =
+            v != null && typeof v === "object" && !Array.isArray(v)
+                ? sortKeys(v)
+                : v;
+    }
+    return sorted;
+}
+/** Normalize input for stable matching (whitespace, JSON key order). */
+function normalizeInput(input) {
+    const s = input.trim();
+    try {
+        const obj = JSON.parse(s);
+        return JSON.stringify(sortKeys(obj));
+    }
+    catch {
+        return s.replace(/\s+/g, " ");
+    }
+}
+/** SHA-256 hash of normalized input. */
+function sha256Input(s) {
+    return node_crypto_1.default.createHash("sha256").update(normalizeInput(s), "utf8").digest("hex");
+}

package/dist/version.d.ts ADDED Viewed

@@ -0,0 +1,7 @@
+/**
+ * SDK and API spec versions for request headers.
+ * X-EvalAI-SDK-Version: SDK package version
+ * X-EvalAI-Spec-Version: OpenAPI spec version (docs/openapi.json info.version)
+ */
+export declare const SDK_VERSION = "1.5.0";
+export declare const SPEC_VERSION = "1.0.0";

package/dist/version.js ADDED Viewed

@@ -0,0 +1,10 @@
+"use strict";
+Object.defineProperty(exports, "__esModule", { value: true });
+exports.SPEC_VERSION = exports.SDK_VERSION = void 0;
+/**
+ * SDK and API spec versions for request headers.
+ * X-EvalAI-SDK-Version: SDK package version
+ * X-EvalAI-Spec-Version: OpenAPI spec version (docs/openapi.json info.version)
+ */
+exports.SDK_VERSION = "1.5.0";
+exports.SPEC_VERSION = "1.0.0";

package/dist/workflows.d.ts CHANGED Viewed

@@ -26,13 +26,13 @@
  * await tracer.endWorkflow({ resolution: 'Issue resolved' });
  * ```
  */
-import type { AIEvalClient } from './client';
+import type { AIEvalClient } from "./client";
 /**
  * Node in a workflow DAG
  */
 export interface WorkflowNode {
     id: string;
-    type: 'agent' | 'tool' | 'decision' | 'parallel' | 'human' | 'llm';
+    type: "agent" | "tool" | "decision" | "parallel" | "human" | "llm";
     name: string;
     config?: Record<string, any>;
 }
@@ -68,11 +68,11 @@ export interface WorkflowContext {
 /**
  * Workflow run status
  */
-export type WorkflowStatus = 'running' | 'completed' | 'failed' | 'cancelled';
+export type WorkflowStatus = "running" | "completed" | "failed" | "cancelled";
 /**
  * Handoff types between agents
  */
-export type HandoffType = 'delegation' | 'escalation' | 'parallel' | 'fallback';
+export type HandoffType = "delegation" | "escalation" | "parallel" | "fallback";
 /**
  * Agent handoff record
  */
@@ -95,7 +95,7 @@ export interface DecisionAlternative {
 /**
  * Decision types made by agents
  */
-export type DecisionType = 'action' | 'tool' | 'delegate' | 'respond' | 'route';
+export type DecisionType = "action" | "tool" | "delegate" | "respond" | "route";
 /**
  * Parameters for recording a decision
  */
@@ -120,11 +120,11 @@ export interface RecordDecisionParams {
 /**
  * LLM provider names
  */
-export type LLMProvider = 'openai' | 'anthropic' | 'google' | 'cohere' | 'mistral' | 'custom';
+export type LLMProvider = "openai" | "anthropic" | "google" | "cohere" | "mistral" | "custom";
 /**
  * Cost categories for tracking
  */
-export type CostCategory = 'llm' | 'tool' | 'embedding' | 'other';
+export type CostCategory = "llm" | "tool" | "embedding" | "other";
 /**
  * Parameters for recording cost
  */

package/dist/workflows.js CHANGED Viewed

@@ -67,7 +67,7 @@ class WorkflowTracer {
         this.options = {
             organizationId: options.organizationId || client.getOrganizationId() || 0,
             autoCalculateCost: options.autoCalculateCost ?? true,
-            tracePrefix: options.tracePrefix || 'workflow',
+            tracePrefix: options.tracePrefix || "workflow",
             captureFullPayloads: options.captureFullPayloads ?? true,
             debug: options.debug ?? false,
         };
@@ -92,7 +92,7 @@ class WorkflowTracer {
      */
     async startWorkflow(name, definition, metadata) {
         if (this.currentWorkflow) {
-            throw new Error('A workflow is already active. Call endWorkflow() first.');
+            throw new Error("A workflow is already active. Call endWorkflow() first.");
         }
         const traceId = `${this.options.tracePrefix}-${Date.now()}-${this.generateId()}`;
         const startedAt = new Date().toISOString();
@@ -101,7 +101,7 @@ class WorkflowTracer {
             name: `Workflow: ${name}`,
             traceId,
             organizationId: this.options.organizationId,
-            status: 'pending',
+            status: "pending",
             metadata: (0, context_1.mergeWithContext)({
                 workflowName: name,
                 definition,
@@ -122,22 +122,22 @@ class WorkflowTracer {
         this.costs = [];
         this.activeSpans.clear();
         this.spanCounter = 0;
-        this.log('Started workflow', { name, traceId: trace.id });
+        this.log("Started workflow", { name, traceId: trace.id });
         return this.currentWorkflow;
     }
     /**
      * End the current workflow
      */
-    async endWorkflow(output, status = 'completed') {
+    async endWorkflow(output, status = "completed") {
         if (!this.currentWorkflow) {
-            throw new Error('No active workflow. Call startWorkflow() first.');
+            throw new Error("No active workflow. Call startWorkflow() first.");
         }
         const durationMs = Date.now() - new Date(this.currentWorkflow.startedAt).getTime();
         // Calculate total cost
         const totalCost = this.costs.reduce((sum, cost) => sum + parseFloat(cost.totalCost), 0);
         // Update the original trace with completion data
         await this.client.traces.update(this.currentWorkflow.traceId, {
-            status: status === 'completed' ? 'success' : 'error',
+            status: status === "completed" ? "success" : "error",
             durationMs,
             metadata: (0, context_1.mergeWithContext)({
                 workflowName: this.currentWorkflow.name,
@@ -146,14 +146,14 @@ class WorkflowTracer {
                 totalCost: totalCost.toFixed(6),
                 handoffCount: this.handoffs.length,
                 decisionCount: this.decisions.length,
-                agentCount: new Set(this.handoffs.map(h => h.toAgent)).size + 1,
-                retryCount: this.costs.filter(c => c.isRetry).length,
+                agentCount: new Set(this.handoffs.map((h) => h.toAgent)).size + 1,
+                retryCount: this.costs.filter((c) => c.isRetry).length,
                 handoffs: this.handoffs,
                 decisions: this.decisions,
                 costs: this.costs,
             }),
         });
-        this.log('Ended workflow', {
+        this.log("Ended workflow", {
             name: this.currentWorkflow.name,
             status,
             durationMs,
@@ -176,7 +176,7 @@ class WorkflowTracer {
      */
     async startAgentSpan(agentName, input, parentSpanId) {
         if (!this.currentWorkflow) {
-            throw new Error('No active workflow. Call startWorkflow() first.');
+            throw new Error("No active workflow. Call startWorkflow() first.");
         }
         const spanId = `span-${++this.spanCounter}-${this.generateId()}`;
         const startTime = new Date().toISOString();
@@ -199,7 +199,7 @@ class WorkflowTracer {
                 ...(this.options.captureFullPayloads ? { input } : {}),
             }),
         });
-        this.log('Started agent span', { agentName, spanId });
+        this.log("Started agent span", { agentName, spanId });
         return spanContext;
     }
     /**
@@ -207,7 +207,7 @@ class WorkflowTracer {
      */
     async endAgentSpan(span, output, error) {
         if (!this.currentWorkflow) {
-            throw new Error('No active workflow.');
+            throw new Error("No active workflow.");
         }
         const endTime = new Date().toISOString();
         const durationMs = new Date(endTime).getTime() - new Date(span.startTime).getTime();
@@ -226,7 +226,7 @@ class WorkflowTracer {
             }),
         });
         this.activeSpans.delete(span.spanId);
-        this.log('Ended agent span', { agentName: span.agentName, spanId: span.spanId, durationMs });
+        this.log("Ended agent span", { agentName: span.agentName, spanId: span.spanId, durationMs });
     }
     // ==========================================================================
     // HANDOFFS
@@ -244,9 +244,9 @@ class WorkflowTracer {
      * );
      * ```
      */
-    async recordHandoff(fromAgent, toAgent, context, handoffType = 'delegation') {
+    async recordHandoff(fromAgent, toAgent, context, handoffType = "delegation") {
         if (!this.currentWorkflow) {
-            throw new Error('No active workflow. Call startWorkflow() first.');
+            throw new Error("No active workflow. Call startWorkflow() first.");
         }
         const handoff = {
             fromAgent,
@@ -259,7 +259,7 @@ class WorkflowTracer {
         // Also create a span for the handoff
         const spanId = `handoff-${this.handoffs.length}-${this.generateId()}`;
         await this.client.traces.createSpan(this.currentWorkflow.traceId, {
-            name: `Handoff: ${fromAgent || 'start'} → ${toAgent}`,
+            name: `Handoff: ${fromAgent || "start"} → ${toAgent}`,
             spanId,
             startTime: handoff.timestamp,
             endTime: handoff.timestamp,
@@ -271,7 +271,7 @@ class WorkflowTracer {
                 context,
             }),
         });
-        this.log('Recorded handoff', { fromAgent, toAgent, handoffType });
+        this.log("Recorded handoff", { fromAgent, toAgent, handoffType });
     }
     // ==========================================================================
     // DECISION AUDITING
@@ -297,7 +297,7 @@ class WorkflowTracer {
      */
     async recordDecision(params) {
         if (!this.currentWorkflow) {
-            throw new Error('No active workflow. Call startWorkflow() first.');
+            throw new Error("No active workflow. Call startWorkflow() first.");
         }
         this.decisions.push(params);
         // Create a span for the decision
@@ -321,7 +321,7 @@ class WorkflowTracer {
                 inputContext: params.inputContext,
             }),
         });
-        this.log('Recorded decision', {
+        this.log("Recorded decision", {
             agent: params.agent,
             type: params.type,
             chosen: params.chosen,
@@ -356,7 +356,7 @@ class WorkflowTracer {
         const costRecord = {
             ...params,
             totalTokens,
-            category: params.category || 'llm',
+            category: params.category || "llm",
             inputCost: inputCost.toFixed(6),
             outputCost: outputCost.toFixed(6),
             totalCost: totalCost.toFixed(6),
@@ -377,7 +377,7 @@ class WorkflowTracer {
                 }),
             });
         }
-        this.log('Recorded cost', {
+        this.log("Recorded cost", {
             provider: params.provider,
             model: params.model,
             totalTokens,
@@ -402,7 +402,7 @@ class WorkflowTracer {
             other: 0,
         };
         for (const cost of this.costs) {
-            const category = cost.category || 'other';
+            const category = cost.category || "other";
             breakdown[category] += parseFloat(cost.totalCost);
         }
         return breakdown;
@@ -417,23 +417,23 @@ class WorkflowTracer {
         // Default pricing (can be extended with API lookup)
         const knownPricing = {
             // OpenAI
-            'openai/gpt-4': { inputPricePerMillion: 30.00, outputPricePerMillion: 60.00 },
-            'openai/gpt-4-turbo': { inputPricePerMillion: 10.00, outputPricePerMillion: 30.00 },
-            'openai/gpt-4o': { inputPricePerMillion: 5.00, outputPricePerMillion: 15.00 },
-            'openai/gpt-4o-mini': { inputPricePerMillion: 0.15, outputPricePerMillion: 0.60 },
-            'openai/gpt-3.5-turbo': { inputPricePerMillion: 0.50, outputPricePerMillion: 1.50 },
+            "openai/gpt-4": { inputPricePerMillion: 30.0, outputPricePerMillion: 60.0 },
+            "openai/gpt-4-turbo": { inputPricePerMillion: 10.0, outputPricePerMillion: 30.0 },
+            "openai/gpt-4o": { inputPricePerMillion: 5.0, outputPricePerMillion: 15.0 },
+            "openai/gpt-4o-mini": { inputPricePerMillion: 0.15, outputPricePerMillion: 0.6 },
+            "openai/gpt-3.5-turbo": { inputPricePerMillion: 0.5, outputPricePerMillion: 1.5 },
             // Anthropic
-            'anthropic/claude-3-opus': { inputPricePerMillion: 15.00, outputPricePerMillion: 75.00 },
-            'anthropic/claude-3-sonnet': { inputPricePerMillion: 3.00, outputPricePerMillion: 15.00 },
-            'anthropic/claude-3-haiku': { inputPricePerMillion: 0.25, outputPricePerMillion: 1.25 },
-            'anthropic/claude-3.5-sonnet': { inputPricePerMillion: 3.00, outputPricePerMillion: 15.00 },
+            "anthropic/claude-3-opus": { inputPricePerMillion: 15.0, outputPricePerMillion: 75.0 },
+            "anthropic/claude-3-sonnet": { inputPricePerMillion: 3.0, outputPricePerMillion: 15.0 },
+            "anthropic/claude-3-haiku": { inputPricePerMillion: 0.25, outputPricePerMillion: 1.25 },
+            "anthropic/claude-3.5-sonnet": { inputPricePerMillion: 3.0, outputPricePerMillion: 15.0 },
             // Google
-            'google/gemini-pro': { inputPricePerMillion: 0.50, outputPricePerMillion: 1.50 },
-            'google/gemini-1.5-pro': { inputPricePerMillion: 3.50, outputPricePerMillion: 10.50 },
-            'google/gemini-1.5-flash': { inputPricePerMillion: 0.075, outputPricePerMillion: 0.30 },
+            "google/gemini-pro": { inputPricePerMillion: 0.5, outputPricePerMillion: 1.5 },
+            "google/gemini-1.5-pro": { inputPricePerMillion: 3.5, outputPricePerMillion: 10.5 },
+            "google/gemini-1.5-flash": { inputPricePerMillion: 0.075, outputPricePerMillion: 0.3 },
         };
         const key = `${provider}/${model}`;
-        return knownPricing[key] || { inputPricePerMillion: 1.00, outputPricePerMillion: 3.00 };
+        return knownPricing[key] || { inputPricePerMillion: 1.0, outputPricePerMillion: 3.0 };
     }
     /**
      * Generate a unique ID
@@ -446,7 +446,7 @@ class WorkflowTracer {
      */
     log(message, data) {
         if (this.options.debug) {
-            console.log(`[WorkflowTracer] ${message}`, data || '');
+            console.log(`[WorkflowTracer] ${message}`, data || "");
         }
     }
     /**
@@ -498,7 +498,7 @@ exports.WorkflowTracer = WorkflowTracer;
  * ```
  */
 function traceLangChainAgent(executor, tracer, options = {}) {
-    const agentName = options.agentName || 'LangChainAgent';
+    const agentName = options.agentName || "LangChainAgent";
     const originalInvoke = executor.invoke?.bind(executor);
     const originalCall = executor.call?.bind(executor);
     if (originalInvoke) {
@@ -544,7 +544,7 @@ function traceLangChainAgent(executor, tracer, options = {}) {
  * ```
  */
 function traceCrewAI(crew, tracer, options = {}) {
-    const crewName = options.crewName || 'CrewAI';
+    const crewName = options.crewName || "CrewAI";
     const originalKickoff = crew.kickoff?.bind(crew);
     if (originalKickoff) {
         crew.kickoff = async (input) => {
@@ -553,12 +553,12 @@ function traceCrewAI(crew, tracer, options = {}) {
             try {
                 const result = await originalKickoff(input);
                 await tracer.endAgentSpan(span, { output: result });
-                await tracer.endWorkflow({ result }, 'completed');
+                await tracer.endWorkflow({ result }, "completed");
                 return result;
             }
             catch (error) {
                 await tracer.endAgentSpan(span, undefined, error instanceof Error ? error.message : String(error));
-                await tracer.endWorkflow({ error: error instanceof Error ? error.message : String(error) }, 'failed');
+                await tracer.endWorkflow({ error: error instanceof Error ? error.message : String(error) }, "failed");
                 throw error;
             }
         };
@@ -576,7 +576,7 @@ function traceCrewAI(crew, tracer, options = {}) {
  * ```
  */
 function traceAutoGen(conversation, tracer, options = {}) {
-    const conversationName = options.conversationName || 'AutoGenConversation';
+    const conversationName = options.conversationName || "AutoGenConversation";
     const originalInitiateChat = conversation.initiate_chat?.bind(conversation);
     if (originalInitiateChat) {
         conversation.initiate_chat = async (...args) => {
@@ -585,12 +585,12 @@ function traceAutoGen(conversation, tracer, options = {}) {
             try {
                 const result = await originalInitiateChat(...args);
                 await tracer.endAgentSpan(span, { output: result });
-                await tracer.endWorkflow({ result }, 'completed');
+                await tracer.endWorkflow({ result }, "completed");
                 return result;
             }
             catch (error) {
                 await tracer.endAgentSpan(span, undefined, error instanceof Error ? error.message : String(error));
-                await tracer.endWorkflow({ error: error instanceof Error ? error.message : String(error) }, 'failed');
+                await tracer.endWorkflow({ error: error instanceof Error ? error.message : String(error) }, "failed");
                 throw error;
             }
         };

package/package.json CHANGED Viewed

@@ -1,90 +1,102 @@
-{
-  "name": "@pauly4010/evalai-sdk",
-  "version": "1.4.1",
-  "description": "AI Evaluation Platform SDK - Complete API Coverage with Performance Optimizations",
-  "main": "dist/index.js",
-  "module": "dist/index.js",
-  "types": "dist/index.d.ts",
-  "sideEffects": false,
-  "files": ["dist", "README.md", "CHANGELOG.md"],
-  "bin": {
-    "evalai": "./dist/cli/index.js"
-  },
-  "engines": {
-    "node": ">=16.0.0"
-  },
-  "scripts": {
-    "build": "tsc",
-    "dev": "tsc --watch",
-    "test": "vitest",
-    "prepublishOnly": "npm run build"
-  },
-  "keywords": [
-    "ai",
-    "evaluation",
-    "llm",
-    "testing",
-    "observability",
-    "tracing",
-    "monitoring",
-    "annotations",
-    "webhooks",
-    "developer-tools",
-    "openai",
-    "anthropic"
-  ],
-  "author": "EvalAI Team",
-  "license": "MIT",
-  "repository": {
-    "type": "git",
-    "url": "git+https://github.com/pauly7610/ai-evaluation-platform.git",
-    "directory": "src/packages/sdk"
-  },
-  "homepage": "https://v0-ai-evaluation-platform-nu.vercel.app",
-  "bugs": {
-    "url": "https://github.com/pauly7610/ai-evaluation-platform/issues"
-  },
-  "dependencies": {
-    "commander": "^14.0.0"
-  },
-  "peerDependencies": {
-    "openai": "^4.0.0",
-    "@anthropic-ai/sdk": "^0.20.0"
-  },
-  "peerDependenciesMeta": {
-    "openai": {
-      "optional": true
-    },
-    "@anthropic-ai/sdk": {
-      "optional": true
-    }
-  },
-  "devDependencies": {
-    "@types/node": "^20.0.0",
-    "typescript": "^5.0.0",
-    "vitest": "^1.0.0"
-  },
-  "exports": {
-    ".": {
-      "import": "./dist/index.js",
-      "require": "./dist/index.js",
-      "types": "./dist/index.d.ts"
-    },
-    "./assertions": {
-      "import": "./dist/assertions.js",
-      "types": "./dist/assertions.d.ts"
-    },
-    "./testing": {
-      "import": "./dist/testing.js",
-      "types": "./dist/testing.d.ts"
-    },
-    "./integrations/openai": {
-      "import": "./dist/integrations/openai.js",
-      "types": "./dist/integrations/openai.d.ts"
-    },
-    "./integrations/anthropic": {
-      "import": "./dist/integrations/anthropic.js",
-      "types": "./dist/integrations/anthropic.d.ts"
-    }
-  }
-}
+{
+  "name": "@pauly4010/evalai-sdk",
+  "version": "1.5.5",
+  "description": "AI Evaluation Platform SDK - Complete API Coverage with Performance Optimizations",
+  "main": "dist/index.js",
+  "module": "dist/index.js",
+  "types": "dist/index.d.ts",
+  "sideEffects": false,
+  "files": [
+    "dist",
+    "README.md",
+    "CHANGELOG.md"
+  ],
+  "bin": {
+    "evalai": "./dist/cli/index.js"
+  },
+  "engines": {
+    "node": ">=16.0.0"
+  },
+  "scripts": {
+    "build": "tsc",
+    "dev": "tsc --watch",
+    "test": "vitest",
+    "prepublishOnly": "npm run build"
+  },
+  "keywords": [
+    "ai",
+    "evaluation",
+    "llm",
+    "testing",
+    "observability",
+    "tracing",
+    "monitoring",
+    "annotations",
+    "webhooks",
+    "developer-tools",
+    "openai",
+    "anthropic"
+  ],
+  "author": "EvalAI Team",
+  "license": "MIT",
+  "repository": {
+    "type": "git",
+    "url": "git+https://github.com/pauly7610/ai-evaluation-platform.git",
+    "directory": "src/packages/sdk"
+  },
+  "homepage": "https://v0-ai-evaluation-platform-nu.vercel.app",
+  "bugs": {
+    "url": "https://github.com/pauly7610/ai-evaluation-platform/issues"
+  },
+  "dependencies": {
+    "commander": "^14.0.0"
+  },
+  "peerDependencies": {
+    "openai": "^4.0.0",
+    "@anthropic-ai/sdk": "^0.20.0"
+  },
+  "peerDependenciesMeta": {
+    "openai": {
+      "optional": true
+    },
+    "@anthropic-ai/sdk": {
+      "optional": true
+    }
+  },
+  "devDependencies": {
+    "@types/node": "^20.0.0",
+    "typescript": "^5.0.0",
+    "vitest": "^1.0.0"
+  },
+  "exports": {
+    ".": {
+      "import": "./dist/index.js",
+      "require": "./dist/index.js",
+      "types": "./dist/index.d.ts"
+    },
+    "./assertions": {
+      "import": "./dist/assertions.js",
+      "types": "./dist/assertions.d.ts"
+    },
+    "./testing": {
+      "import": "./dist/testing.js",
+      "types": "./dist/testing.d.ts"
+    },
+    "./integrations/openai": {
+      "import": "./dist/integrations/openai.js",
+      "types": "./dist/integrations/openai.d.ts"
+    },
+    "./integrations/anthropic": {
+      "import": "./dist/integrations/anthropic.js",
+      "types": "./dist/integrations/anthropic.d.ts"
+    },
+    "./integrations/openai-eval": {
+      "import": "./dist/integrations/openai-eval.js",
+      "types": "./dist/integrations/openai-eval.d.ts"
+    },
+    "./matchers": {
+      "import": "./dist/matchers/index.js",
+      "types": "./dist/matchers/index.d.ts"
+    }
+  }
+}

package/dist/__tests__/assertions.test.d.ts DELETED Viewed

@@ -1 +0,0 @@
-export {};