npm - @agentv/eval - Version diff - 0.2.1 → 0.3.0 - Mend

@agentv/eval 0.2.1 → 0.3.0

This diff compares the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (8)

package/dist/index.d.ts CHANGED

@@ -74,7 +74,7 @@ declare const TraceSummarySchema: z.ZodObject<{
     toolDurations?: Record<string, number[]> | undefined;
 }>;
 /**
- * Tool call schema for output messages.
+ * Tool call schema.
  */
 declare const ToolCallSchema: z.ZodObject<{
     tool: z.ZodString;
@@ -96,11 +96,10 @@ declare const ToolCallSchema: z.ZodObject<{
     timestamp?: string | undefined;
 }>;
 /**
- * Output message schema.
+ * Unified message schema for input, expected, and output messages.
  */
-declare const OutputMessageSchema: z.ZodObject<{
+declare const MessageSchema: z.ZodObject<{
     role: z.ZodEnum<["assistant", "user", "system", "tool"]>;
-    name: z.ZodOptional<z.ZodString>;
     content: z.ZodOptional<z.ZodUnion<[z.ZodString, z.ZodRecord<z.ZodString, z.ZodUnknown>, z.ZodArray<z.ZodRecord<z.ZodString, z.ZodUnknown>, "many">]>>;
     toolCalls: z.ZodOptional<z.ZodArray<z.ZodObject<{
         tool: z.ZodString;
@@ -121,12 +120,12 @@ declare const OutputMessageSchema: z.ZodObject<{
         id?: string | undefined;
         timestamp?: string | undefined;
     }>, "many">>;
+    name: z.ZodOptional<z.ZodString>;
     timestamp: z.ZodOptional<z.ZodString>;
     metadata: z.ZodOptional<z.ZodRecord<z.ZodString, z.ZodUnknown>>;
 }, "strip", z.ZodTypeAny, {
     role: "tool" | "assistant" | "user" | "system";
     timestamp?: string | undefined;
-    name?: string | undefined;
     content?: string | Record<string, unknown> | Record<string, unknown>[] | undefined;
     toolCalls?: {
         tool: string;
@@ -135,11 +134,11 @@ declare const OutputMessageSchema: z.ZodObject<{
         id?: string | undefined;
         timestamp?: string | undefined;
     }[] | undefined;
+    name?: string | undefined;
     metadata?: Record<string, unknown> | undefined;
 }, {
     role: "tool" | "assistant" | "user" | "system";
     timestamp?: string | undefined;
-    name?: string | undefined;
     content?: string | Record<string, unknown> | Record<string, unknown>[] | undefined;
     toolCalls?: {
         tool: string;
@@ -148,6 +147,7 @@ declare const OutputMessageSchema: z.ZodObject<{
         id?: string | undefined;
         timestamp?: string | undefined;
     }[] | undefined;
+    name?: string | undefined;
     metadata?: Record<string, unknown> | undefined;
 }>;
 /**
@@ -156,12 +156,62 @@ declare const OutputMessageSchema: z.ZodObject<{
 declare const CodeJudgeInputSchema: z.ZodObject<{
     question: z.ZodString;
     expectedOutcome: z.ZodString;
-    expectedMessages: z.ZodArray<z.ZodRecord<z.ZodString, z.ZodUnknown>, "many">;
+    expectedMessages: z.ZodArray<z.ZodObject<{
+        role: z.ZodEnum<["assistant", "user", "system", "tool"]>;
+        content: z.ZodOptional<z.ZodUnion<[z.ZodString, z.ZodRecord<z.ZodString, z.ZodUnknown>, z.ZodArray<z.ZodRecord<z.ZodString, z.ZodUnknown>, "many">]>>;
+        toolCalls: z.ZodOptional<z.ZodArray<z.ZodObject<{
+            tool: z.ZodString;
+            input: z.ZodOptional<z.ZodUnknown>;
+            output: z.ZodOptional<z.ZodUnknown>;
+            id: z.ZodOptional<z.ZodString>;
+            timestamp: z.ZodOptional<z.ZodString>;
+        }, "strip", z.ZodTypeAny, {
+            tool: string;
+            input?: unknown;
+            output?: unknown;
+            id?: string | undefined;
+            timestamp?: string | undefined;
+        }, {
+            tool: string;
+            input?: unknown;
+            output?: unknown;
+            id?: string | undefined;
+            timestamp?: string | undefined;
+        }>, "many">>;
+        name: z.ZodOptional<z.ZodString>;
+        timestamp: z.ZodOptional<z.ZodString>;
+        metadata: z.ZodOptional<z.ZodRecord<z.ZodString, z.ZodUnknown>>;
+    }, "strip", z.ZodTypeAny, {
+        role: "tool" | "assistant" | "user" | "system";
+        timestamp?: string | undefined;
+        content?: string | Record<string, unknown> | Record<string, unknown>[] | undefined;
+        toolCalls?: {
+            tool: string;
+            input?: unknown;
+            output?: unknown;
+            id?: string | undefined;
+            timestamp?: string | undefined;
+        }[] | undefined;
+        name?: string | undefined;
+        metadata?: Record<string, unknown> | undefined;
+    }, {
+        role: "tool" | "assistant" | "user" | "system";
+        timestamp?: string | undefined;
+        content?: string | Record<string, unknown> | Record<string, unknown>[] | undefined;
+        toolCalls?: {
+            tool: string;
+            input?: unknown;
+            output?: unknown;
+            id?: string | undefined;
+            timestamp?: string | undefined;
+        }[] | undefined;
+        name?: string | undefined;
+        metadata?: Record<string, unknown> | undefined;
+    }>, "many">;
     referenceAnswer: z.ZodOptional<z.ZodString>;
     candidateAnswer: z.ZodString;
     outputMessages: z.ZodOptional<z.ZodNullable<z.ZodArray<z.ZodObject<{
         role: z.ZodEnum<["assistant", "user", "system", "tool"]>;
-        name: z.ZodOptional<z.ZodString>;
         content: z.ZodOptional<z.ZodUnion<[z.ZodString, z.ZodRecord<z.ZodString, z.ZodUnknown>, z.ZodArray<z.ZodRecord<z.ZodString, z.ZodUnknown>, "many">]>>;
         toolCalls: z.ZodOptional<z.ZodArray<z.ZodObject<{
             tool: z.ZodString;
@@ -182,12 +232,12 @@ declare const CodeJudgeInputSchema: z.ZodObject<{
             id?: string | undefined;
             timestamp?: string | undefined;
         }>, "many">>;
+        name: z.ZodOptional<z.ZodString>;
         timestamp: z.ZodOptional<z.ZodString>;
         metadata: z.ZodOptional<z.ZodRecord<z.ZodString, z.ZodUnknown>>;
     }, "strip", z.ZodTypeAny, {
         role: "tool" | "assistant" | "user" | "system";
         timestamp?: string | undefined;
-        name?: string | undefined;
         content?: string | Record<string, unknown> | Record<string, unknown>[] | undefined;
         toolCalls?: {
             tool: string;
@@ -196,11 +246,11 @@ declare const CodeJudgeInputSchema: z.ZodObject<{
             id?: string | undefined;
             timestamp?: string | undefined;
         }[] | undefined;
+        name?: string | undefined;
         metadata?: Record<string, unknown> | undefined;
     }, {
         role: "tool" | "assistant" | "user" | "system";
         timestamp?: string | undefined;
-        name?: string | undefined;
         content?: string | Record<string, unknown> | Record<string, unknown>[] | undefined;
         toolCalls?: {
             tool: string;
@@ -209,19 +259,62 @@ declare const CodeJudgeInputSchema: z.ZodObject<{
             id?: string | undefined;
             timestamp?: string | undefined;
         }[] | undefined;
+        name?: string | undefined;
         metadata?: Record<string, unknown> | undefined;
     }>, "many">>>;
     guidelineFiles: z.ZodArray<z.ZodString, "many">;
     inputFiles: z.ZodArray<z.ZodString, "many">;
     inputMessages: z.ZodArray<z.ZodObject<{
-        role: z.ZodEnum<["system", "user", "assistant", "tool"]>;
-        content: z.ZodUnion<[z.ZodString, z.ZodRecord<z.ZodString, z.ZodUnknown>, z.ZodArray<z.ZodRecord<z.ZodString, z.ZodUnknown>, "many">]>;
+        role: z.ZodEnum<["assistant", "user", "system", "tool"]>;
+        content: z.ZodOptional<z.ZodUnion<[z.ZodString, z.ZodRecord<z.ZodString, z.ZodUnknown>, z.ZodArray<z.ZodRecord<z.ZodString, z.ZodUnknown>, "many">]>>;
+        toolCalls: z.ZodOptional<z.ZodArray<z.ZodObject<{
+            tool: z.ZodString;
+            input: z.ZodOptional<z.ZodUnknown>;
+            output: z.ZodOptional<z.ZodUnknown>;
+            id: z.ZodOptional<z.ZodString>;
+            timestamp: z.ZodOptional<z.ZodString>;
+        }, "strip", z.ZodTypeAny, {
+            tool: string;
+            input?: unknown;
+            output?: unknown;
+            id?: string | undefined;
+            timestamp?: string | undefined;
+        }, {
+            tool: string;
+            input?: unknown;
+            output?: unknown;
+            id?: string | undefined;
+            timestamp?: string | undefined;
+        }>, "many">>;
+        name: z.ZodOptional<z.ZodString>;
+        timestamp: z.ZodOptional<z.ZodString>;
+        metadata: z.ZodOptional<z.ZodRecord<z.ZodString, z.ZodUnknown>>;
     }, "strip", z.ZodTypeAny, {
         role: "tool" | "assistant" | "user" | "system";
-        content: string | Record<string, unknown> | Record<string, unknown>[];
+        timestamp?: string | undefined;
+        content?: string | Record<string, unknown> | Record<string, unknown>[] | undefined;
+        toolCalls?: {
+            tool: string;
+            input?: unknown;
+            output?: unknown;
+            id?: string | undefined;
+            timestamp?: string | undefined;
+        }[] | undefined;
+        name?: string | undefined;
+        metadata?: Record<string, unknown> | undefined;
     }, {
         role: "tool" | "assistant" | "user" | "system";
-        content: string | Record<string, unknown> | Record<string, unknown>[];
+        timestamp?: string | undefined;
+        content?: string | Record<string, unknown> | Record<string, unknown>[] | undefined;
+        toolCalls?: {
+            tool: string;
+            input?: unknown;
+            output?: unknown;
+            id?: string | undefined;
+            timestamp?: string | undefined;
+        }[] | undefined;
+        name?: string | undefined;
+        metadata?: Record<string, unknown> | undefined;
     }>, "many">;
     traceSummary: z.ZodOptional<z.ZodNullable<z.ZodObject<{
         eventCount: z.ZodNumber;
@@ -275,19 +368,41 @@ declare const CodeJudgeInputSchema: z.ZodObject<{
 }, "strip", z.ZodTypeAny, {
     question: string;
     expectedOutcome: string;
-    expectedMessages: Record<string, unknown>[];
+    expectedMessages: {
+        role: "tool" | "assistant" | "user" | "system";
+        timestamp?: string | undefined;
+        content?: string | Record<string, unknown> | Record<string, unknown>[] | undefined;
+        toolCalls?: {
+            tool: string;
+            input?: unknown;
+            output?: unknown;
+            id?: string | undefined;
+            timestamp?: string | undefined;
+        }[] | undefined;
+        name?: string | undefined;
+        metadata?: Record<string, unknown> | undefined;
+    }[];
     candidateAnswer: string;
     guidelineFiles: string[];
     inputFiles: string[];
     inputMessages: {
         role: "tool" | "assistant" | "user" | "system";
-        content: string | Record<string, unknown> | Record<string, unknown>[];
+        timestamp?: string | undefined;
+        content?: string | Record<string, unknown> | Record<string, unknown>[] | undefined;
+        toolCalls?: {
+            tool: string;
+            input?: unknown;
+            output?: unknown;
+            id?: string | undefined;
+            timestamp?: string | undefined;
+        }[] | undefined;
+        name?: string | undefined;
+        metadata?: Record<string, unknown> | undefined;
     }[];
     referenceAnswer?: string | undefined;
     outputMessages?: {
         role: "tool" | "assistant" | "user" | "system";
         timestamp?: string | undefined;
-        name?: string | undefined;
         content?: string | Record<string, unknown> | Record<string, unknown>[] | undefined;
         toolCalls?: {
             tool: string;
@@ -296,6 +411,7 @@ declare const CodeJudgeInputSchema: z.ZodObject<{
             id?: string | undefined;
             timestamp?: string | undefined;
         }[] | undefined;
+        name?: string | undefined;
         metadata?: Record<string, unknown> | undefined;
     }[] | null | undefined;
     traceSummary?: {
@@ -316,19 +432,41 @@ declare const CodeJudgeInputSchema: z.ZodObject<{
 }, {
     question: string;
     expectedOutcome: string;
-    expectedMessages: Record<string, unknown>[];
+    expectedMessages: {
+        role: "tool" | "assistant" | "user" | "system";
+        timestamp?: string | undefined;
+        content?: string | Record<string, unknown> | Record<string, unknown>[] | undefined;
+        toolCalls?: {
+            tool: string;
+            input?: unknown;
+            output?: unknown;
+            id?: string | undefined;
+            timestamp?: string | undefined;
+        }[] | undefined;
+        name?: string | undefined;
+        metadata?: Record<string, unknown> | undefined;
+    }[];
     candidateAnswer: string;
     guidelineFiles: string[];
     inputFiles: string[];
     inputMessages: {
         role: "tool" | "assistant" | "user" | "system";
-        content: string | Record<string, unknown> | Record<string, unknown>[];
+        timestamp?: string | undefined;
+        content?: string | Record<string, unknown> | Record<string, unknown>[] | undefined;
+        toolCalls?: {
+            tool: string;
+            input?: unknown;
+            output?: unknown;
+            id?: string | undefined;
+            timestamp?: string | undefined;
+        }[] | undefined;
+        name?: string | undefined;
+        metadata?: Record<string, unknown> | undefined;
     }[];
     referenceAnswer?: string | undefined;
     outputMessages?: {
         role: "tool" | "assistant" | "user" | "system";
         timestamp?: string | undefined;
-        name?: string | undefined;
         content?: string | Record<string, unknown> | Record<string, unknown>[] | undefined;
         toolCalls?: {
             tool: string;
@@ -337,6 +475,7 @@ declare const CodeJudgeInputSchema: z.ZodObject<{
             id?: string | undefined;
             timestamp?: string | undefined;
         }[] | undefined;
+        name?: string | undefined;
         metadata?: Record<string, unknown> | undefined;
     }[] | null | undefined;
     traceSummary?: {
@@ -363,16 +502,20 @@ declare const CodeJudgeResultSchema: z.ZodObject<{
     hits: z.ZodDefault<z.ZodOptional<z.ZodArray<z.ZodString, "many">>>;
     misses: z.ZodDefault<z.ZodOptional<z.ZodArray<z.ZodString, "many">>>;
     reasoning: z.ZodOptional<z.ZodString>;
+    /** Optional structured details for domain-specific metrics (e.g., TP/TN/FP/FN counts, alignments). */
+    details: z.ZodOptional<z.ZodRecord<z.ZodString, z.ZodUnknown>>;
 }, "strip", z.ZodTypeAny, {
     score: number;
     hits: string[];
     misses: string[];
     reasoning?: string | undefined;
+    details?: Record<string, unknown> | undefined;
 }, {
     score: number;
     hits?: string[] | undefined;
     misses?: string[] | undefined;
     reasoning?: string | undefined;
+    details?: Record<string, unknown> | undefined;
 }>;
 /**
  * Inferred types from schemas.
@@ -380,10 +523,118 @@ declare const CodeJudgeResultSchema: z.ZodObject<{
 type CodeJudgeInput = z.infer<typeof CodeJudgeInputSchema>;
 type CodeJudgeResult = z.infer<typeof CodeJudgeResultSchema>;
 type TraceSummary = z.infer<typeof TraceSummarySchema>;
-type OutputMessage = z.infer<typeof OutputMessageSchema>;
+type Message = z.infer<typeof MessageSchema>;
 type ToolCall = z.infer<typeof ToolCallSchema>;
 type TokenUsage = z.infer<typeof TokenUsageSchema>;
+/**
+ * Client for invoking configured targets from code_judge scripts.
+ *
+ * Environment variables (set automatically by AgentV when `target` config is present):
+ * - AGENTV_TARGET_PROXY_URL: The URL of the local proxy server
+ * - AGENTV_TARGET_PROXY_TOKEN: Bearer token for authentication
+ */
+/**
+ * Request to invoke the target
+ */
+interface TargetInvokeRequest {
+    readonly question: string;
+    readonly systemPrompt?: string;
+    readonly evalCaseId?: string;
+    readonly attempt?: number;
+    /** Optional target override - use a different target for this invocation */
+    readonly target?: string;
+}
+/**
+ * Response from a target invocation
+ */
+interface TargetInvokeResponse {
+    readonly outputMessages: readonly unknown[];
+    readonly rawText?: string;
+}
+/**
+ * Information about the target proxy configuration
+ */
+interface TargetInfo {
+    /** Name of the default target being used */
+    readonly targetName: string;
+    /** Maximum number of calls allowed */
+    readonly maxCalls: number;
+    /** Current number of calls made */
+    readonly callCount: number;
+    /** List of all available target names */
+    readonly availableTargets: readonly string[];
+}
+/**
+ * Target client for making target invocations
+ */
+interface TargetClient {
+    /**
+     * Invoke the configured target with a prompt.
+     * @param request - The question and optional system prompt
+     * @returns The target's response with output messages and optional raw text
+     */
+    invoke(request: TargetInvokeRequest): Promise<TargetInvokeResponse>;
+    /**
+     * Invoke the target with multiple requests in sequence.
+     * Each request counts toward the max_calls limit.
+     * @param requests - Array of target requests
+     * @returns Array of target responses
+     */
+    invokeBatch(requests: readonly TargetInvokeRequest[]): Promise<readonly TargetInvokeResponse[]>;
+    /**
+     * Get information about the target proxy configuration.
+     * Returns the default target name, max calls, current call count, and available targets.
+     */
+    getInfo(): Promise<TargetInfo>;
+}
+/**
+ * Error thrown when target proxy is not available
+ */
+declare class TargetNotAvailableError extends Error {
+    constructor(message: string);
+}
+/**
+ * Error thrown when target invocation fails
+ */
+declare class TargetInvocationError extends Error {
+    readonly statusCode?: number;
+    constructor(message: string, statusCode?: number);
+}
+/**
+ * Create a target client from environment variables.
+ *
+ * This function reads the proxy URL and token from environment variables
+ * that are automatically set by AgentV when a `target` config block is present
+ * on a `code_judge` evaluator.
+ *
+ * @returns A target client if environment variables are set, otherwise undefined
+ * @throws TargetNotAvailableError if token is missing when URL is present
+ *
+ * @example
+ * ```typescript
+ * import { createTargetClient, defineCodeJudge } from '@agentv/eval';
+ *
+ * export default defineCodeJudge(async ({ question, expectedOutcome }) => {
+ *   const target = createTargetClient();
+ *
+ *   if (!target) {
+ *     // Target not available - no target config on this evaluator
+ *     return { score: 0.5, reasoning: 'Target not available' };
+ *   }
+ *
+ *   const response = await target.invoke({
+ *     question: `Is this answer correct? Question: ${question}, Expected: ${expectedOutcome}`,
+ *     systemPrompt: 'You are an expert evaluator. Respond with JSON: { "correct": true/false }'
+ *   });
+ *
+ *   const result = JSON.parse(response.rawText ?? '{}');
+ *   return { score: result.correct ? 1.0 : 0.0 };
+ * });
+ * ```
+ */
+declare function createTargetClient(): TargetClient | undefined;
 /**
  * Handler function type for code judges.
  */
@@ -394,7 +645,7 @@ type CodeJudgeHandler = (input: CodeJudgeInput) => CodeJudgeResult | Promise<Cod
  *
  * Build custom code judges for evaluating AI agent outputs.
  *
- * @example
+ * @example Basic code judge
  * ```typescript
  * #!/usr/bin/env bun
  * import { defineCodeJudge } from '@agentv/eval';
@@ -406,6 +657,27 @@ type CodeJudgeHandler = (input: CodeJudgeInput) => CodeJudgeResult | Promise<Cod
  * }));
  * ```
  *
+ * @example Code judge with target access (requires `target` config in YAML)
+ * ```typescript
+ * #!/usr/bin/env bun
+ * import { defineCodeJudge, createTargetClient } from '@agentv/eval';
+ *
+ * export default defineCodeJudge(async ({ question }) => {
+ *   const target = createTargetClient();
+ *   if (!target) {
+ *     return { score: 0, misses: ['Target not available'] };
+ *   }
+ *
+ *   const response = await target.invoke({
+ *     question: `Evaluate: ${question}`,
+ *     systemPrompt: 'Respond with JSON: { "score": 0-1 }'
+ *   });
+ *
+ *   const result = JSON.parse(response.rawText ?? '{}');
+ *   return { score: result.score ?? 0 };
+ * });
+ * ```
+ *
  * @packageDocumentation
  */
@@ -455,4 +727,4 @@ type CodeJudgeHandler = (input: CodeJudgeInput) => CodeJudgeResult | Promise<Cod
  */
 declare function defineCodeJudge(handler: CodeJudgeHandler): void;
-export { type CodeJudgeHandler, type CodeJudgeInput, CodeJudgeInputSchema, type CodeJudgeResult, CodeJudgeResultSchema, type OutputMessage, OutputMessageSchema, type TokenUsage, TokenUsageSchema, type ToolCall, ToolCallSchema, type TraceSummary, TraceSummarySchema, defineCodeJudge };
+export { type CodeJudgeHandler, type CodeJudgeInput, CodeJudgeInputSchema, type CodeJudgeResult, CodeJudgeResultSchema, type Message, MessageSchema, type TargetClient, type TargetInfo, TargetInvocationError, type TargetInvokeRequest, type TargetInvokeResponse, TargetNotAvailableError, type TokenUsage, TokenUsageSchema, type ToolCall, ToolCallSchema, type TraceSummary, TraceSummarySchema, createTargetClient, defineCodeJudge };

package/dist/index.js CHANGED

@@ -22,29 +22,24 @@ var ToolCallSchema = z.object({
   id: z.string().optional(),
   timestamp: z.string().optional()
 });
-var OutputMessageSchema = z.object({
+var MessageSchema = z.object({
   role: z.enum(["assistant", "user", "system", "tool"]),
-  // Optional message name (e.g., agent name) used by some providers for multi-agent transcripts.
-  name: z.string().optional(),
   content: z.union([z.string(), z.record(z.unknown()), z.array(z.record(z.unknown()))]).optional(),
   toolCalls: z.array(ToolCallSchema).optional(),
+  name: z.string().optional(),
   timestamp: z.string().optional(),
   metadata: z.record(z.unknown()).optional()
 });
-var TestMessageSchema = z.object({
-  role: z.enum(["system", "user", "assistant", "tool"]),
-  content: z.union([z.string(), z.record(z.unknown()), z.array(z.record(z.unknown()))])
-});
 var CodeJudgeInputSchema = z.object({
   question: z.string(),
   expectedOutcome: z.string(),
-  expectedMessages: z.array(z.record(z.unknown())),
+  expectedMessages: z.array(MessageSchema),
   referenceAnswer: z.string().optional(),
   candidateAnswer: z.string(),
-  outputMessages: z.array(OutputMessageSchema).nullable().optional(),
+  outputMessages: z.array(MessageSchema).nullable().optional(),
   guidelineFiles: z.array(z.string()),
   inputFiles: z.array(z.string()),
-  inputMessages: z.array(TestMessageSchema),
+  inputMessages: z.array(MessageSchema),
   traceSummary: TraceSummarySchema.nullable().optional(),
   config: z.record(z.unknown()).nullable().optional()
 });
@@ -52,9 +47,119 @@ var CodeJudgeResultSchema = z.object({
   score: z.number().min(0).max(1),
   hits: z.array(z.string()).optional().default([]),
   misses: z.array(z.string()).optional().default([]),
-  reasoning: z.string().optional()
+  reasoning: z.string().optional(),
+  /** Optional structured details for domain-specific metrics (e.g., TP/TN/FP/FN counts, alignments). */
+  details: z.record(z.unknown()).optional()
 });
+// src/target-client.ts
+var TargetNotAvailableError = class extends Error {
+  constructor(message) {
+    super(message);
+    this.name = "TargetNotAvailableError";
+  }
+};
+var TargetInvocationError = class extends Error {
+  statusCode;
+  constructor(message, statusCode) {
+    super(message);
+    this.name = "TargetInvocationError";
+    this.statusCode = statusCode;
+  }
+};
+function createTargetClient() {
+  const proxyUrl = process.env.AGENTV_TARGET_PROXY_URL;
+  const proxyToken = process.env.AGENTV_TARGET_PROXY_TOKEN;
+  if (!proxyUrl) {
+    return void 0;
+  }
+  if (!proxyToken) {
+    throw new TargetNotAvailableError(
+      "AGENTV_TARGET_PROXY_URL is set but AGENTV_TARGET_PROXY_TOKEN is missing"
+    );
+  }
+  return createTargetClientInternal(proxyUrl, proxyToken);
+}
+function createTargetClientInternal(url, token) {
+  const headers = {
+    "Content-Type": "application/json",
+    Authorization: `Bearer ${token}`
+  };
+  return {
+    async invoke(request) {
+      const response = await fetch(`${url}/invoke`, {
+        method: "POST",
+        headers,
+        body: JSON.stringify({
+          question: request.question,
+          systemPrompt: request.systemPrompt,
+          evalCaseId: request.evalCaseId,
+          attempt: request.attempt,
+          target: request.target
+        })
+      });
+      if (!response.ok) {
+        const errorBody = await response.text();
+        let errorMessage;
+        try {
+          const errorJson = JSON.parse(errorBody);
+          errorMessage = errorJson.error ?? `HTTP ${response.status}`;
+        } catch {
+          errorMessage = errorBody || `HTTP ${response.status}`;
+        }
+        throw new TargetInvocationError(errorMessage, response.status);
+      }
+      return await response.json();
+    },
+    async invokeBatch(requests) {
+      const response = await fetch(`${url}/invokeBatch`, {
+        method: "POST",
+        headers,
+        body: JSON.stringify({
+          requests: requests.map((r) => ({
+            question: r.question,
+            systemPrompt: r.systemPrompt,
+            evalCaseId: r.evalCaseId,
+            attempt: r.attempt,
+            target: r.target
+          }))
+        })
+      });
+      if (!response.ok) {
+        const errorBody = await response.text();
+        let errorMessage;
+        try {
+          const errorJson = JSON.parse(errorBody);
+          errorMessage = errorJson.error ?? `HTTP ${response.status}`;
+        } catch {
+          errorMessage = errorBody || `HTTP ${response.status}`;
+        }
+        throw new TargetInvocationError(errorMessage, response.status);
+      }
+      const result = await response.json();
+      return result.responses;
+    },
+    async getInfo() {
+      const response = await fetch(`${url}/info`, {
+        method: "GET",
+        headers
+      });
+      if (!response.ok) {
+        const errorBody = await response.text();
+        let errorMessage;
+        try {
+          const errorJson = JSON.parse(errorBody);
+          errorMessage = errorJson.error ?? `HTTP ${response.status}`;
+        } catch {
+          errorMessage = errorBody || `HTTP ${response.status}`;
+        }
+        throw new TargetInvocationError(errorMessage, response.status);
+      }
+      return await response.json();
+    }
+  };
+}
 // src/index.ts
 import { z as z2 } from "zod";
@@ -134,10 +239,13 @@ function defineCodeJudge(handler) {
 export {
   CodeJudgeInputSchema,
   CodeJudgeResultSchema,
-  OutputMessageSchema,
+  MessageSchema,
+  TargetInvocationError,
+  TargetNotAvailableError,
   TokenUsageSchema,
   ToolCallSchema,
   TraceSummarySchema,
+  createTargetClient,
   defineCodeJudge,
   z2 as z
 };