npm - @agentv/core - Versions diffs - 0.6.1 → 0.7.0 - Mend

@agentv/core 0.6.1 → 0.7.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (11)

package/dist/{chunk-OW3SHBIJ.js → chunk-L7I5UTJU.js} +1 -1
package/dist/{chunk-OW3SHBIJ.js.map → chunk-L7I5UTJU.js.map} +1 -1
package/dist/evaluation/validation/index.cjs.map +1 -1
package/dist/evaluation/validation/index.js +1 -1
package/dist/index.cjs +221 -242
package/dist/index.cjs.map +1 -1
package/dist/index.d.cts +11 -13
package/dist/index.d.ts +11 -13
package/dist/index.js +222 -243
package/dist/index.js.map +1 -1
package/package.json +1 -1

package/dist/index.d.cts CHANGED

@@ -99,17 +99,18 @@ type EvaluatorConfig = CodeEvaluatorConfig | LlmJudgeEvaluatorConfig;
  */
 interface EvalCase {
     readonly id: string;
-    readonly dataset: string;
+    readonly dataset?: string;
     readonly conversation_id?: string;
-    readonly task: string;
-    readonly user_segments: readonly JsonObject[];
+    readonly question: string;
+    readonly input_segments: readonly JsonObject[];
+    readonly output_segments: readonly JsonObject[];
     readonly system_message?: string;
-    readonly expected_assistant_raw: string;
+    readonly reference_answer: string;
     readonly guideline_paths: readonly string[];
     readonly guideline_patterns?: readonly string[];
     readonly file_paths: readonly string[];
     readonly code_snippets: readonly string[];
-    readonly outcome: string;
+    readonly expected_outcome: string;
     readonly evaluator?: EvaluatorKind;
     readonly evaluators?: readonly EvaluatorConfig[];
 }
@@ -118,12 +119,12 @@ interface EvalCase {
  */
 interface EvaluationResult {
     readonly eval_id: string;
-    readonly dataset: string;
+    readonly dataset?: string;
     readonly conversation_id?: string;
     readonly score: number;
     readonly hits: readonly string[];
     readonly misses: readonly string[];
-    readonly model_answer: string;
+    readonly candidate_answer: string;
     readonly expected_aspect_count: number;
     readonly target: string;
     readonly timestamp: string;
@@ -167,7 +168,7 @@ declare function loadEvalCases(evalFilePath: string, repoRoot: URL | string, opt
  * Build prompt inputs by consolidating user request context and guideline content.
  */
 declare function buildPromptInputs(testCase: EvalCase): Promise<{
-    request: string;
+    question: string;
     guidelines: string;
     systemMessage?: string;
 }>;
@@ -204,7 +205,7 @@ declare function resolveFileReference(rawValue: string, searchRoots: readonly st
 type ChatPrompt = AxChatRequest["chatPrompt"];
 type ProviderKind = "azure" | "anthropic" | "gemini" | "codex" | "cli" | "mock" | "vscode" | "vscode-insiders";
 interface ProviderRequest {
-    readonly prompt: string;
+    readonly question: string;
     readonly guidelines?: string;
     readonly guideline_patterns?: readonly string[];
     readonly chatPrompt?: ChatPrompt;
@@ -404,7 +405,7 @@ interface EvaluationContext {
     readonly provider: Provider;
     readonly attempt: number;
     readonly promptInputs: {
-        readonly request: string;
+        readonly question: string;
         readonly guidelines: string;
         readonly systemMessage?: string;
     };
@@ -442,10 +443,7 @@ declare class LlmJudgeEvaluator implements Evaluator {
     private readonly customPrompt?;
     constructor(options: LlmJudgeEvaluatorOptions);
     evaluate(context: EvaluationContext): Promise<EvaluationScore>;
-    private evaluateWithAx;
     private evaluateWithPrompt;
-    private buildJudgeForwardOptions;
-    private buildJudgeModelConfig;
 }
 interface CodeEvaluatorOptions {
     readonly script: string;

package/dist/index.d.ts CHANGED

@@ -99,17 +99,18 @@ type EvaluatorConfig = CodeEvaluatorConfig | LlmJudgeEvaluatorConfig;
  */
 interface EvalCase {
     readonly id: string;
-    readonly dataset: string;
+    readonly dataset?: string;
     readonly conversation_id?: string;
-    readonly task: string;
-    readonly user_segments: readonly JsonObject[];
+    readonly question: string;
+    readonly input_segments: readonly JsonObject[];
+    readonly output_segments: readonly JsonObject[];
     readonly system_message?: string;
-    readonly expected_assistant_raw: string;
+    readonly reference_answer: string;
     readonly guideline_paths: readonly string[];
     readonly guideline_patterns?: readonly string[];
     readonly file_paths: readonly string[];
     readonly code_snippets: readonly string[];
-    readonly outcome: string;
+    readonly expected_outcome: string;
     readonly evaluator?: EvaluatorKind;
     readonly evaluators?: readonly EvaluatorConfig[];
 }
@@ -118,12 +119,12 @@ interface EvalCase {
  */
 interface EvaluationResult {
     readonly eval_id: string;
-    readonly dataset: string;
+    readonly dataset?: string;
     readonly conversation_id?: string;
     readonly score: number;
     readonly hits: readonly string[];
     readonly misses: readonly string[];
-    readonly model_answer: string;
+    readonly candidate_answer: string;
     readonly expected_aspect_count: number;
     readonly target: string;
     readonly timestamp: string;
@@ -167,7 +168,7 @@ declare function loadEvalCases(evalFilePath: string, repoRoot: URL | string, opt
  * Build prompt inputs by consolidating user request context and guideline content.
  */
 declare function buildPromptInputs(testCase: EvalCase): Promise<{
-    request: string;
+    question: string;
     guidelines: string;
     systemMessage?: string;
 }>;
@@ -204,7 +205,7 @@ declare function resolveFileReference(rawValue: string, searchRoots: readonly st
 type ChatPrompt = AxChatRequest["chatPrompt"];
 type ProviderKind = "azure" | "anthropic" | "gemini" | "codex" | "cli" | "mock" | "vscode" | "vscode-insiders";
 interface ProviderRequest {
-    readonly prompt: string;
+    readonly question: string;
     readonly guidelines?: string;
     readonly guideline_patterns?: readonly string[];
     readonly chatPrompt?: ChatPrompt;
@@ -404,7 +405,7 @@ interface EvaluationContext {
     readonly provider: Provider;
     readonly attempt: number;
     readonly promptInputs: {
-        readonly request: string;
+        readonly question: string;
         readonly guidelines: string;
         readonly systemMessage?: string;
     };
@@ -442,10 +443,7 @@ declare class LlmJudgeEvaluator implements Evaluator {
     private readonly customPrompt?;
     constructor(options: LlmJudgeEvaluatorOptions);
     evaluate(context: EvaluationContext): Promise<EvaluationScore>;
-    private evaluateWithAx;
     private evaluateWithPrompt;
-    private buildJudgeForwardOptions;
-    private buildJudgeModelConfig;
 }
 interface CodeEvaluatorOptions {
     readonly script: string;