npm - @agentv/core - Versions diffs - 0.15.0 → 0.17.0 - Mend

@agentv/core 0.15.0 → 0.17.0

This diff shows the differences between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (15)

package/dist/{chunk-IOCVST3R.js → chunk-YCIZ33BO.js} +28 -11
package/dist/chunk-YCIZ33BO.js.map +1 -0
package/dist/evaluation/validation/index.cjs +68 -64
package/dist/evaluation/validation/index.cjs.map +1 -1
package/dist/evaluation/validation/index.js +64 -67
package/dist/evaluation/validation/index.js.map +1 -1
package/dist/index.cjs +297 -149
package/dist/index.cjs.map +1 -1
package/dist/index.d.cts +18 -5
package/dist/index.d.ts +18 -5
package/dist/index.js +251 -115
package/dist/index.js.map +1 -1
package/package.json +15 -16
package/LICENSE +0 -21
package/dist/chunk-IOCVST3R.js.map +0 -1

package/dist/index.d.cts CHANGED Viewed

@@ -101,7 +101,7 @@ interface EvalCase {
     readonly question: string;
     readonly input_messages: readonly TestMessage[];
     readonly input_segments: readonly JsonObject[];
-    readonly output_segments: readonly JsonObject[];
+    readonly expected_segments: readonly JsonObject[];
     readonly reference_answer?: string;
     readonly guideline_paths: readonly string[];
     readonly guideline_patterns?: readonly string[];
@@ -262,6 +262,17 @@ interface TargetDefinition {
     readonly retryStatusCodes?: unknown | undefined;
 }
+/**
+ * Formatting mode for segment content.
+ * - 'agent': File references only (for providers with filesystem access)
+ * - 'lm': Embedded file content with XML tags (for language model providers)
+ */
+type FormattingMode = "agent" | "lm";
+/**
+ * Extract fenced code blocks from AgentV user segments.
+ */
+declare function extractCodeBlocks(segments: readonly JsonObject[]): readonly string[];
 /**
  * Build prompt inputs by consolidating user request context and guideline content.
  */
@@ -271,12 +282,13 @@ interface PromptInputs {
     readonly chatPrompt?: ChatPrompt;
     readonly systemMessage?: string;
 }
-declare function buildPromptInputs(testCase: EvalCase): Promise<PromptInputs>;
 /**
- * Extract fenced code blocks from AgentV user segments.
+ * Build prompt inputs by consolidating user request context and guideline content.
+ *
+ * @param testCase - The evaluation test case
+ * @param mode - Formatting mode: 'agent' for file references, 'lm' for embedded content (default: 'lm')
  */
-declare function extractCodeBlocks(segments: readonly JsonObject[]): readonly string[];
+declare function buildPromptInputs(testCase: EvalCase, mode?: FormattingMode): Promise<PromptInputs>;
 /**
  * Determine whether a path references guideline content (instructions or prompts).
@@ -605,6 +617,7 @@ interface RunEvaluationOptions {
     readonly evalId?: string;
     readonly verbose?: boolean;
     readonly maxConcurrency?: number;
+    readonly evalCases?: readonly EvalCase[];
     readonly onResult?: (result: EvaluationResult) => MaybePromise<void>;
     readonly onProgress?: (event: ProgressEvent) => MaybePromise<void>;
 }

package/dist/index.d.ts CHANGED Viewed

@@ -101,7 +101,7 @@ interface EvalCase {
     readonly question: string;
     readonly input_messages: readonly TestMessage[];
     readonly input_segments: readonly JsonObject[];
-    readonly output_segments: readonly JsonObject[];
+    readonly expected_segments: readonly JsonObject[];
     readonly reference_answer?: string;
     readonly guideline_paths: readonly string[];
     readonly guideline_patterns?: readonly string[];
@@ -262,6 +262,17 @@ interface TargetDefinition {
     readonly retryStatusCodes?: unknown | undefined;
 }
+/**
+ * Formatting mode for segment content.
+ * - 'agent': File references only (for providers with filesystem access)
+ * - 'lm': Embedded file content with XML tags (for language model providers)
+ */
+type FormattingMode = "agent" | "lm";
+/**
+ * Extract fenced code blocks from AgentV user segments.
+ */
+declare function extractCodeBlocks(segments: readonly JsonObject[]): readonly string[];
 /**
  * Build prompt inputs by consolidating user request context and guideline content.
  */
@@ -271,12 +282,13 @@ interface PromptInputs {
     readonly chatPrompt?: ChatPrompt;
     readonly systemMessage?: string;
 }
-declare function buildPromptInputs(testCase: EvalCase): Promise<PromptInputs>;
 /**
- * Extract fenced code blocks from AgentV user segments.
+ * Build prompt inputs by consolidating user request context and guideline content.
+ *
+ * @param testCase - The evaluation test case
+ * @param mode - Formatting mode: 'agent' for file references, 'lm' for embedded content (default: 'lm')
  */
-declare function extractCodeBlocks(segments: readonly JsonObject[]): readonly string[];
+declare function buildPromptInputs(testCase: EvalCase, mode?: FormattingMode): Promise<PromptInputs>;
 /**
  * Determine whether a path references guideline content (instructions or prompts).
@@ -605,6 +617,7 @@ interface RunEvaluationOptions {
     readonly evalId?: string;
     readonly verbose?: boolean;
     readonly maxConcurrency?: number;
+    readonly evalCases?: readonly EvalCase[];
     readonly onResult?: (result: EvaluationResult) => MaybePromise<void>;
     readonly onProgress?: (event: ProgressEvent) => MaybePromise<void>;
 }