npm - @agentv/core - Versions diffs - 3.6.0 → 3.8.0 - Mend

@agentv/core 3.6.0 → 3.8.0

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (14)

package/dist/{chunk-2IZOTQ25.js → chunk-3ZS3GCMI.js} +143 -3
package/dist/chunk-3ZS3GCMI.js.map +1 -0
package/dist/evaluation/validation/index.cjs +227 -39
package/dist/evaluation/validation/index.cjs.map +1 -1
package/dist/evaluation/validation/index.js +84 -5
package/dist/evaluation/validation/index.js.map +1 -1
package/dist/index.cjs +23 -22
package/dist/index.cjs.map +1 -1
package/dist/index.d.cts +6 -9
package/dist/index.d.ts +6 -9
package/dist/index.js +429 -562
package/dist/index.js.map +1 -1
package/package.json +1 -1
package/dist/chunk-2IZOTQ25.js.map +0 -1

package/dist/index.d.cts CHANGED Viewed

@@ -251,10 +251,8 @@ interface TokenUsage {
 interface TraceSummary {
     /** Total number of events in trace */
     readonly eventCount: number;
-    /** Unique tool names, sorted alphabetically */
-    readonly toolNames: readonly string[];
     /** Map of tool name to call count */
-    readonly toolCallsByName: Readonly<Record<string, number>>;
+    readonly toolCalls: Readonly<Record<string, number>>;
     /** Number of error events */
     readonly errorCount: number;
     /** Per-tool duration arrays in milliseconds (optional) */
@@ -1134,7 +1132,6 @@ interface EvaluationResult {
     readonly conversationId?: string;
     readonly score: number;
     readonly assertions: readonly AssertionEntry[];
-    readonly outputText: string;
     readonly target: string;
     /** Token usage metrics from provider (optional) */
     readonly tokenUsage?: TokenUsage;
@@ -1157,10 +1154,10 @@ interface EvaluationResult {
     readonly trace?: TraceSummary;
     /** Path to the temporary workspace directory (included on failure for debugging) */
     readonly workspacePath?: string;
-    /** Input messages or prompt string sent to the agent */
-    readonly input?: readonly Message[] | string;
-    /** Full output messages from agent execution (only included when --trace flag is set) */
-    readonly output?: readonly Message[];
+    /** Input messages sent to the agent. Always Message[] for consistent shape with output. */
+    readonly input?: readonly Message[];
+    /** Output messages from agent execution. Always present — at minimum contains the final assistant message. */
+    readonly output: readonly Message[];
     /** Captured output from workspace before_all script */
     readonly beforeAllOutput?: string;
     /** Captured output from workspace before_each script */
@@ -1202,7 +1199,7 @@ interface EvaluatorResult {
     readonly verdict?: EvaluationVerdict;
     readonly assertions: readonly AssertionEntry[];
     readonly rawRequest?: JsonObject;
-    readonly evaluatorProviderRequest?: JsonObject;
+    readonly input?: JsonObject;
     readonly scores?: readonly EvaluatorResult[];
     /** Optional structured details from code graders (e.g., TP/TN/FP/FN counts). */
     readonly details?: JsonObject;

package/dist/index.d.ts CHANGED Viewed

@@ -251,10 +251,8 @@ interface TokenUsage {
 interface TraceSummary {
     /** Total number of events in trace */
     readonly eventCount: number;
-    /** Unique tool names, sorted alphabetically */
-    readonly toolNames: readonly string[];
     /** Map of tool name to call count */
-    readonly toolCallsByName: Readonly<Record<string, number>>;
+    readonly toolCalls: Readonly<Record<string, number>>;
     /** Number of error events */
     readonly errorCount: number;
     /** Per-tool duration arrays in milliseconds (optional) */
@@ -1134,7 +1132,6 @@ interface EvaluationResult {
     readonly conversationId?: string;
     readonly score: number;
     readonly assertions: readonly AssertionEntry[];
-    readonly outputText: string;
     readonly target: string;
     /** Token usage metrics from provider (optional) */
     readonly tokenUsage?: TokenUsage;
@@ -1157,10 +1154,10 @@ interface EvaluationResult {
     readonly trace?: TraceSummary;
     /** Path to the temporary workspace directory (included on failure for debugging) */
     readonly workspacePath?: string;
-    /** Input messages or prompt string sent to the agent */
-    readonly input?: readonly Message[] | string;
-    /** Full output messages from agent execution (only included when --trace flag is set) */
-    readonly output?: readonly Message[];
+    /** Input messages sent to the agent. Always Message[] for consistent shape with output. */
+    readonly input?: readonly Message[];
+    /** Output messages from agent execution. Always present — at minimum contains the final assistant message. */
+    readonly output: readonly Message[];
     /** Captured output from workspace before_all script */
     readonly beforeAllOutput?: string;
     /** Captured output from workspace before_each script */
@@ -1202,7 +1199,7 @@ interface EvaluatorResult {
     readonly verdict?: EvaluationVerdict;
     readonly assertions: readonly AssertionEntry[];
     readonly rawRequest?: JsonObject;
-    readonly evaluatorProviderRequest?: JsonObject;
+    readonly input?: JsonObject;
     readonly scores?: readonly EvaluatorResult[];
     /** Optional structured details from code graders (e.g., TP/TN/FP/FN counts). */
     readonly details?: JsonObject;