@agentv/core 3.7.0 → 3.8.0
This diff shows the changes between two publicly available versions of this package, as released to one of the supported registries. It is provided for informational purposes only and reflects the package contents as they appear in the public registry.
- package/dist/{chunk-2IZOTQ25.js → chunk-3ZS3GCMI.js} +143 -3
- package/dist/chunk-3ZS3GCMI.js.map +1 -0
- package/dist/evaluation/validation/index.cjs +227 -39
- package/dist/evaluation/validation/index.cjs.map +1 -1
- package/dist/evaluation/validation/index.js +84 -5
- package/dist/evaluation/validation/index.js.map +1 -1
- package/dist/index.cjs +13 -11
- package/dist/index.cjs.map +1 -1
- package/dist/index.d.cts +5 -6
- package/dist/index.d.ts +5 -6
- package/dist/index.js +419 -551
- package/dist/index.js.map +1 -1
- package/package.json +1 -1
- package/dist/chunk-2IZOTQ25.js.map +0 -1
package/dist/index.d.cts
CHANGED
|
@@ -1132,7 +1132,6 @@ interface EvaluationResult {
|
|
|
1132
1132
|
readonly conversationId?: string;
|
|
1133
1133
|
readonly score: number;
|
|
1134
1134
|
readonly assertions: readonly AssertionEntry[];
|
|
1135
|
-
readonly outputText: string;
|
|
1136
1135
|
readonly target: string;
|
|
1137
1136
|
/** Token usage metrics from provider (optional) */
|
|
1138
1137
|
readonly tokenUsage?: TokenUsage;
|
|
@@ -1155,10 +1154,10 @@ interface EvaluationResult {
|
|
|
1155
1154
|
readonly trace?: TraceSummary;
|
|
1156
1155
|
/** Path to the temporary workspace directory (included on failure for debugging) */
|
|
1157
1156
|
readonly workspacePath?: string;
|
|
1158
|
-
/** Input messages
|
|
1159
|
-
readonly input?: readonly Message[]
|
|
1160
|
-
/**
|
|
1161
|
-
readonly output
|
|
1157
|
+
/** Input messages sent to the agent. Always Message[] for consistent shape with output. */
|
|
1158
|
+
readonly input?: readonly Message[];
|
|
1159
|
+
/** Output messages from agent execution. Always present — at minimum contains the final assistant message. */
|
|
1160
|
+
readonly output: readonly Message[];
|
|
1162
1161
|
/** Captured output from workspace before_all script */
|
|
1163
1162
|
readonly beforeAllOutput?: string;
|
|
1164
1163
|
/** Captured output from workspace before_each script */
|
|
@@ -1200,7 +1199,7 @@ interface EvaluatorResult {
|
|
|
1200
1199
|
readonly verdict?: EvaluationVerdict;
|
|
1201
1200
|
readonly assertions: readonly AssertionEntry[];
|
|
1202
1201
|
readonly rawRequest?: JsonObject;
|
|
1203
|
-
readonly
|
|
1202
|
+
readonly input?: JsonObject;
|
|
1204
1203
|
readonly scores?: readonly EvaluatorResult[];
|
|
1205
1204
|
/** Optional structured details from code graders (e.g., TP/TN/FP/FN counts). */
|
|
1206
1205
|
readonly details?: JsonObject;
|
package/dist/index.d.ts
CHANGED
|
@@ -1132,7 +1132,6 @@ interface EvaluationResult {
|
|
|
1132
1132
|
readonly conversationId?: string;
|
|
1133
1133
|
readonly score: number;
|
|
1134
1134
|
readonly assertions: readonly AssertionEntry[];
|
|
1135
|
-
readonly outputText: string;
|
|
1136
1135
|
readonly target: string;
|
|
1137
1136
|
/** Token usage metrics from provider (optional) */
|
|
1138
1137
|
readonly tokenUsage?: TokenUsage;
|
|
@@ -1155,10 +1154,10 @@ interface EvaluationResult {
|
|
|
1155
1154
|
readonly trace?: TraceSummary;
|
|
1156
1155
|
/** Path to the temporary workspace directory (included on failure for debugging) */
|
|
1157
1156
|
readonly workspacePath?: string;
|
|
1158
|
-
/** Input messages
|
|
1159
|
-
readonly input?: readonly Message[]
|
|
1160
|
-
/**
|
|
1161
|
-
readonly output
|
|
1157
|
+
/** Input messages sent to the agent. Always Message[] for consistent shape with output. */
|
|
1158
|
+
readonly input?: readonly Message[];
|
|
1159
|
+
/** Output messages from agent execution. Always present — at minimum contains the final assistant message. */
|
|
1160
|
+
readonly output: readonly Message[];
|
|
1162
1161
|
/** Captured output from workspace before_all script */
|
|
1163
1162
|
readonly beforeAllOutput?: string;
|
|
1164
1163
|
/** Captured output from workspace before_each script */
|
|
@@ -1200,7 +1199,7 @@ interface EvaluatorResult {
|
|
|
1200
1199
|
readonly verdict?: EvaluationVerdict;
|
|
1201
1200
|
readonly assertions: readonly AssertionEntry[];
|
|
1202
1201
|
readonly rawRequest?: JsonObject;
|
|
1203
|
-
readonly
|
|
1202
|
+
readonly input?: JsonObject;
|
|
1204
1203
|
readonly scores?: readonly EvaluatorResult[];
|
|
1205
1204
|
/** Optional structured details from code graders (e.g., TP/TN/FP/FN counts). */
|
|
1206
1205
|
readonly details?: JsonObject;
|