@agentv/core 2.5.4 → 2.5.6

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/dist/index.d.cts CHANGED
@@ -462,7 +462,7 @@ interface ChatMessage {
462
462
  readonly name?: string;
463
463
  }
464
464
  type ChatPrompt = readonly ChatMessage[];
465
- type ProviderKind = 'azure' | 'anthropic' | 'gemini' | 'codex' | 'pi-coding-agent' | 'pi-agent-sdk' | 'claude-code' | 'cli' | 'mock' | 'vscode' | 'vscode-insiders';
465
+ type ProviderKind = 'azure' | 'anthropic' | 'gemini' | 'codex' | 'copilot-cli' | 'pi-coding-agent' | 'pi-agent-sdk' | 'claude-code' | 'cli' | 'mock' | 'vscode' | 'vscode-insiders';
466
466
  interface ProviderRequest {
467
467
  readonly question: string;
468
468
  readonly systemPrompt?: string;
@@ -598,6 +598,8 @@ interface TargetDefinition {
598
598
  readonly logFormat?: string | unknown | undefined;
599
599
  readonly log_output_format?: string | unknown | undefined;
600
600
  readonly logOutputFormat?: string | unknown | undefined;
601
+ readonly system_prompt?: string | unknown | undefined;
602
+ readonly systemPrompt?: string | unknown | undefined;
601
603
  readonly response?: string | unknown | undefined;
602
604
  readonly delayMs?: number | unknown | undefined;
603
605
  readonly delayMinMs?: number | unknown | undefined;
@@ -864,6 +866,16 @@ interface CodexResolvedConfig {
864
866
  readonly logFormat?: 'summary' | 'json';
865
867
  readonly systemPrompt?: string;
866
868
  }
869
+ interface CopilotResolvedConfig {
870
+ readonly executable: string;
871
+ readonly model?: string;
872
+ readonly args?: readonly string[];
873
+ readonly cwd?: string;
874
+ readonly timeoutMs?: number;
875
+ readonly logDir?: string;
876
+ readonly logFormat?: 'summary' | 'json';
877
+ readonly systemPrompt?: string;
878
+ }
867
879
  interface PiCodingAgentResolvedConfig {
868
880
  readonly executable: string;
869
881
  readonly provider?: string;
@@ -936,6 +948,13 @@ type ResolvedTarget = {
936
948
  readonly workers?: number;
937
949
  readonly providerBatching?: boolean;
938
950
  readonly config: CodexResolvedConfig;
951
+ } | {
952
+ readonly kind: 'copilot-cli';
953
+ readonly name: string;
954
+ readonly judgeTarget?: string;
955
+ readonly workers?: number;
956
+ readonly providerBatching?: boolean;
957
+ readonly config: CopilotResolvedConfig;
939
958
  } | {
940
959
  readonly kind: 'pi-coding-agent';
941
960
  readonly name: string;
@@ -1032,6 +1051,16 @@ type ClaudeCodeLogListener = (entry: ClaudeCodeLogEntry) => void;
1032
1051
  declare function consumeClaudeCodeLogEntries(): ClaudeCodeLogEntry[];
1033
1052
  declare function subscribeToClaudeCodeLogEntries(listener: ClaudeCodeLogListener): () => void;
1034
1053
 
1054
+ type CopilotCliLogEntry = {
1055
+ readonly filePath: string;
1056
+ readonly evalCaseId?: string;
1057
+ readonly targetName: string;
1058
+ readonly attempt?: number;
1059
+ };
1060
+ type CopilotCliLogListener = (entry: CopilotCliLogEntry) => void;
1061
+ declare function consumeCopilotCliLogEntries(): CopilotCliLogEntry[];
1062
+ declare function subscribeToCopilotCliLogEntries(listener: CopilotCliLogListener): () => void;
1063
+
1035
1064
  declare function createProvider(target: ResolvedTarget): Provider;
1036
1065
  declare function resolveAndCreateProvider(definition: TargetDefinition, env?: EnvLookup): Provider;
1037
1066
 
@@ -1376,4 +1405,4 @@ type AgentKernel = {
1376
1405
  };
1377
1406
  declare function createAgentKernel(): AgentKernel;
1378
1407
 
1379
- export { type AgentKernel, type AnthropicResolvedConfig, type AssistantTestMessage, type AzureResolvedConfig, type ChildEvaluatorResult, type ClaudeCodeResolvedConfig, type CliResolvedConfig, CodeEvaluator, type CodeEvaluatorConfig, type CodeEvaluatorOptions, type CompositeAggregatorConfig, CompositeEvaluator, type CompositeEvaluatorConfig, type CompositeEvaluatorOptions, CostEvaluator, type CostEvaluatorConfig, type CostEvaluatorOptions, DEFAULT_EXPLORATION_TOOLS, type EnsureSubagentsOptions, type EnsureSubagentsResult, type EnvLookup, type EvalCase, type EvaluationCache, type EvaluationContext, type EvaluationResult, type EvaluationScore, type EvaluationVerdict, type Evaluator, type EvaluatorConfig, type EvaluatorFactory, type EvaluatorKind, type EvaluatorResult, type ExecutionMetrics, FieldAccuracyEvaluator, type FieldAccuracyEvaluatorConfig, type FieldAccuracyEvaluatorOptions, type FieldAggregationType, type FieldConfig, type FieldMatchType, type GeminiResolvedConfig, type GenerateRubricsOptions, type JsonObject, type JsonPrimitive, type JsonValue, LatencyEvaluator, type LatencyEvaluatorConfig, type LatencyEvaluatorOptions, LlmJudgeEvaluator, type LlmJudgeEvaluatorConfig, type LlmJudgeEvaluatorOptions, type MockResolvedConfig, type PiAgentSdkResolvedConfig, type PiCodingAgentResolvedConfig, type ProgressEvent, type PromptInputs, type PromptScriptConfig, type Provider, type ProviderKind, type ProviderRequest, type ProviderResponse, type ProviderTokenUsage, type ResolvedTarget, type RubricItem, type RunEvalCaseOptions, type RunEvaluationOptions, type ScoreRange, type SystemTestMessage, TEST_MESSAGE_ROLES, type TargetAccessConfig, type TargetDefinition, type TestMessage, type TestMessageContent, type TestMessageRole, type TokenUsage, TokenUsageEvaluator, type TokenUsageEvaluatorConfig, type TokenUsageEvaluatorOptions, type ToolTestMessage, ToolTrajectoryEvaluator, type ToolTrajectoryEvaluatorConfig, type ToolTrajectoryEvaluatorOptions, type ToolTrajectoryExpectedItem, type TraceSummary, type UserTestMessage, type VSCodeResolvedConfig, avgToolDurationMs, buildDirectoryChain, buildOutputSchema, buildPromptInputs, buildSearchRoots, clampScore, computeTraceSummary, consumeClaudeCodeLogEntries, consumeCodexLogEntries, consumePiLogEntries, createAgentKernel, createProvider, deepEqual, detectFormat, ensureVSCodeSubagents, executeScript, explorationRatio, extractJsonBlob, fileExists, findGitRoot, freeformEvaluationSchema, generateRubrics, getHitCount, isEvaluatorKind, isGuidelineFile, isJsonObject, isJsonValue, isNonEmptyString, isTestMessage, isTestMessageRole, listTargetNames, loadEvalCases, mergeExecutionMetrics, normalizeLineEndings, parseJsonFromText, parseJsonSafe, readJsonFile, readTargetDefinitions, readTestSuiteMetadata, readTextFile, resolveAndCreateProvider, resolveFileReference, resolveTargetDefinition, runEvalCase, runEvaluation, scoreToVerdict, subscribeToClaudeCodeLogEntries, subscribeToCodexLogEntries, subscribeToPiLogEntries, tokensPerTool };
1408
+ export { type AgentKernel, type AnthropicResolvedConfig, type AssistantTestMessage, type AzureResolvedConfig, type ChildEvaluatorResult, type ClaudeCodeResolvedConfig, type CliResolvedConfig, CodeEvaluator, type CodeEvaluatorConfig, type CodeEvaluatorOptions, type CompositeAggregatorConfig, CompositeEvaluator, type CompositeEvaluatorConfig, type CompositeEvaluatorOptions, type CopilotResolvedConfig, CostEvaluator, type CostEvaluatorConfig, type CostEvaluatorOptions, DEFAULT_EXPLORATION_TOOLS, type EnsureSubagentsOptions, type EnsureSubagentsResult, type EnvLookup, type EvalCase, type EvaluationCache, type EvaluationContext, type EvaluationResult, type EvaluationScore, type EvaluationVerdict, type Evaluator, type EvaluatorConfig, type EvaluatorFactory, type EvaluatorKind, type EvaluatorResult, type ExecutionMetrics, FieldAccuracyEvaluator, type FieldAccuracyEvaluatorConfig, type FieldAccuracyEvaluatorOptions, type FieldAggregationType, type FieldConfig, type FieldMatchType, type GeminiResolvedConfig, type GenerateRubricsOptions, type JsonObject, type JsonPrimitive, type JsonValue, LatencyEvaluator, type LatencyEvaluatorConfig, type LatencyEvaluatorOptions, LlmJudgeEvaluator, type LlmJudgeEvaluatorConfig, type LlmJudgeEvaluatorOptions, type MockResolvedConfig, type PiAgentSdkResolvedConfig, type PiCodingAgentResolvedConfig, type ProgressEvent, type PromptInputs, type PromptScriptConfig, type Provider, type ProviderKind, type ProviderRequest, type ProviderResponse, type ProviderTokenUsage, type ResolvedTarget, type RubricItem, type RunEvalCaseOptions, type RunEvaluationOptions, type ScoreRange, type SystemTestMessage, TEST_MESSAGE_ROLES, type TargetAccessConfig, type TargetDefinition, type TestMessage, type TestMessageContent, type TestMessageRole, type TokenUsage, TokenUsageEvaluator, type TokenUsageEvaluatorConfig, type TokenUsageEvaluatorOptions, type ToolTestMessage, ToolTrajectoryEvaluator, type ToolTrajectoryEvaluatorConfig, type ToolTrajectoryEvaluatorOptions, type ToolTrajectoryExpectedItem, type TraceSummary, type UserTestMessage, type VSCodeResolvedConfig, avgToolDurationMs, buildDirectoryChain, buildOutputSchema, buildPromptInputs, buildSearchRoots, clampScore, computeTraceSummary, consumeClaudeCodeLogEntries, consumeCodexLogEntries, consumeCopilotCliLogEntries, consumePiLogEntries, createAgentKernel, createProvider, deepEqual, detectFormat, ensureVSCodeSubagents, executeScript, explorationRatio, extractJsonBlob, fileExists, findGitRoot, freeformEvaluationSchema, generateRubrics, getHitCount, isEvaluatorKind, isGuidelineFile, isJsonObject, isJsonValue, isNonEmptyString, isTestMessage, isTestMessageRole, listTargetNames, loadEvalCases, mergeExecutionMetrics, normalizeLineEndings, parseJsonFromText, parseJsonSafe, readJsonFile, readTargetDefinitions, readTestSuiteMetadata, readTextFile, resolveAndCreateProvider, resolveFileReference, resolveTargetDefinition, runEvalCase, runEvaluation, scoreToVerdict, subscribeToClaudeCodeLogEntries, subscribeToCodexLogEntries, subscribeToCopilotCliLogEntries, subscribeToPiLogEntries, tokensPerTool };
package/dist/index.d.ts CHANGED
@@ -462,7 +462,7 @@ interface ChatMessage {
462
462
  readonly name?: string;
463
463
  }
464
464
  type ChatPrompt = readonly ChatMessage[];
465
- type ProviderKind = 'azure' | 'anthropic' | 'gemini' | 'codex' | 'pi-coding-agent' | 'pi-agent-sdk' | 'claude-code' | 'cli' | 'mock' | 'vscode' | 'vscode-insiders';
465
+ type ProviderKind = 'azure' | 'anthropic' | 'gemini' | 'codex' | 'copilot-cli' | 'pi-coding-agent' | 'pi-agent-sdk' | 'claude-code' | 'cli' | 'mock' | 'vscode' | 'vscode-insiders';
466
466
  interface ProviderRequest {
467
467
  readonly question: string;
468
468
  readonly systemPrompt?: string;
@@ -598,6 +598,8 @@ interface TargetDefinition {
598
598
  readonly logFormat?: string | unknown | undefined;
599
599
  readonly log_output_format?: string | unknown | undefined;
600
600
  readonly logOutputFormat?: string | unknown | undefined;
601
+ readonly system_prompt?: string | unknown | undefined;
602
+ readonly systemPrompt?: string | unknown | undefined;
601
603
  readonly response?: string | unknown | undefined;
602
604
  readonly delayMs?: number | unknown | undefined;
603
605
  readonly delayMinMs?: number | unknown | undefined;
@@ -864,6 +866,16 @@ interface CodexResolvedConfig {
864
866
  readonly logFormat?: 'summary' | 'json';
865
867
  readonly systemPrompt?: string;
866
868
  }
869
+ interface CopilotResolvedConfig {
870
+ readonly executable: string;
871
+ readonly model?: string;
872
+ readonly args?: readonly string[];
873
+ readonly cwd?: string;
874
+ readonly timeoutMs?: number;
875
+ readonly logDir?: string;
876
+ readonly logFormat?: 'summary' | 'json';
877
+ readonly systemPrompt?: string;
878
+ }
867
879
  interface PiCodingAgentResolvedConfig {
868
880
  readonly executable: string;
869
881
  readonly provider?: string;
@@ -936,6 +948,13 @@ type ResolvedTarget = {
936
948
  readonly workers?: number;
937
949
  readonly providerBatching?: boolean;
938
950
  readonly config: CodexResolvedConfig;
951
+ } | {
952
+ readonly kind: 'copilot-cli';
953
+ readonly name: string;
954
+ readonly judgeTarget?: string;
955
+ readonly workers?: number;
956
+ readonly providerBatching?: boolean;
957
+ readonly config: CopilotResolvedConfig;
939
958
  } | {
940
959
  readonly kind: 'pi-coding-agent';
941
960
  readonly name: string;
@@ -1032,6 +1051,16 @@ type ClaudeCodeLogListener = (entry: ClaudeCodeLogEntry) => void;
1032
1051
  declare function consumeClaudeCodeLogEntries(): ClaudeCodeLogEntry[];
1033
1052
  declare function subscribeToClaudeCodeLogEntries(listener: ClaudeCodeLogListener): () => void;
1034
1053
 
1054
+ type CopilotCliLogEntry = {
1055
+ readonly filePath: string;
1056
+ readonly evalCaseId?: string;
1057
+ readonly targetName: string;
1058
+ readonly attempt?: number;
1059
+ };
1060
+ type CopilotCliLogListener = (entry: CopilotCliLogEntry) => void;
1061
+ declare function consumeCopilotCliLogEntries(): CopilotCliLogEntry[];
1062
+ declare function subscribeToCopilotCliLogEntries(listener: CopilotCliLogListener): () => void;
1063
+
1035
1064
  declare function createProvider(target: ResolvedTarget): Provider;
1036
1065
  declare function resolveAndCreateProvider(definition: TargetDefinition, env?: EnvLookup): Provider;
1037
1066
 
@@ -1376,4 +1405,4 @@ type AgentKernel = {
1376
1405
  };
1377
1406
  declare function createAgentKernel(): AgentKernel;
1378
1407
 
1379
- export { type AgentKernel, type AnthropicResolvedConfig, type AssistantTestMessage, type AzureResolvedConfig, type ChildEvaluatorResult, type ClaudeCodeResolvedConfig, type CliResolvedConfig, CodeEvaluator, type CodeEvaluatorConfig, type CodeEvaluatorOptions, type CompositeAggregatorConfig, CompositeEvaluator, type CompositeEvaluatorConfig, type CompositeEvaluatorOptions, CostEvaluator, type CostEvaluatorConfig, type CostEvaluatorOptions, DEFAULT_EXPLORATION_TOOLS, type EnsureSubagentsOptions, type EnsureSubagentsResult, type EnvLookup, type EvalCase, type EvaluationCache, type EvaluationContext, type EvaluationResult, type EvaluationScore, type EvaluationVerdict, type Evaluator, type EvaluatorConfig, type EvaluatorFactory, type EvaluatorKind, type EvaluatorResult, type ExecutionMetrics, FieldAccuracyEvaluator, type FieldAccuracyEvaluatorConfig, type FieldAccuracyEvaluatorOptions, type FieldAggregationType, type FieldConfig, type FieldMatchType, type GeminiResolvedConfig, type GenerateRubricsOptions, type JsonObject, type JsonPrimitive, type JsonValue, LatencyEvaluator, type LatencyEvaluatorConfig, type LatencyEvaluatorOptions, LlmJudgeEvaluator, type LlmJudgeEvaluatorConfig, type LlmJudgeEvaluatorOptions, type MockResolvedConfig, type PiAgentSdkResolvedConfig, type PiCodingAgentResolvedConfig, type ProgressEvent, type PromptInputs, type PromptScriptConfig, type Provider, type ProviderKind, type ProviderRequest, type ProviderResponse, type ProviderTokenUsage, type ResolvedTarget, type RubricItem, type RunEvalCaseOptions, type RunEvaluationOptions, type ScoreRange, type SystemTestMessage, TEST_MESSAGE_ROLES, type TargetAccessConfig, type TargetDefinition, type TestMessage, type TestMessageContent, type TestMessageRole, type TokenUsage, TokenUsageEvaluator, type TokenUsageEvaluatorConfig, type TokenUsageEvaluatorOptions, type ToolTestMessage, ToolTrajectoryEvaluator, type ToolTrajectoryEvaluatorConfig, type ToolTrajectoryEvaluatorOptions, type ToolTrajectoryExpectedItem, type TraceSummary, type UserTestMessage, type VSCodeResolvedConfig, avgToolDurationMs, buildDirectoryChain, buildOutputSchema, buildPromptInputs, buildSearchRoots, clampScore, computeTraceSummary, consumeClaudeCodeLogEntries, consumeCodexLogEntries, consumePiLogEntries, createAgentKernel, createProvider, deepEqual, detectFormat, ensureVSCodeSubagents, executeScript, explorationRatio, extractJsonBlob, fileExists, findGitRoot, freeformEvaluationSchema, generateRubrics, getHitCount, isEvaluatorKind, isGuidelineFile, isJsonObject, isJsonValue, isNonEmptyString, isTestMessage, isTestMessageRole, listTargetNames, loadEvalCases, mergeExecutionMetrics, normalizeLineEndings, parseJsonFromText, parseJsonSafe, readJsonFile, readTargetDefinitions, readTestSuiteMetadata, readTextFile, resolveAndCreateProvider, resolveFileReference, resolveTargetDefinition, runEvalCase, runEvaluation, scoreToVerdict, subscribeToClaudeCodeLogEntries, subscribeToCodexLogEntries, subscribeToPiLogEntries, tokensPerTool };
1408
+ export { type AgentKernel, type AnthropicResolvedConfig, type AssistantTestMessage, type AzureResolvedConfig, type ChildEvaluatorResult, type ClaudeCodeResolvedConfig, type CliResolvedConfig, CodeEvaluator, type CodeEvaluatorConfig, type CodeEvaluatorOptions, type CompositeAggregatorConfig, CompositeEvaluator, type CompositeEvaluatorConfig, type CompositeEvaluatorOptions, type CopilotResolvedConfig, CostEvaluator, type CostEvaluatorConfig, type CostEvaluatorOptions, DEFAULT_EXPLORATION_TOOLS, type EnsureSubagentsOptions, type EnsureSubagentsResult, type EnvLookup, type EvalCase, type EvaluationCache, type EvaluationContext, type EvaluationResult, type EvaluationScore, type EvaluationVerdict, type Evaluator, type EvaluatorConfig, type EvaluatorFactory, type EvaluatorKind, type EvaluatorResult, type ExecutionMetrics, FieldAccuracyEvaluator, type FieldAccuracyEvaluatorConfig, type FieldAccuracyEvaluatorOptions, type FieldAggregationType, type FieldConfig, type FieldMatchType, type GeminiResolvedConfig, type GenerateRubricsOptions, type JsonObject, type JsonPrimitive, type JsonValue, LatencyEvaluator, type LatencyEvaluatorConfig, type LatencyEvaluatorOptions, LlmJudgeEvaluator, type LlmJudgeEvaluatorConfig, type LlmJudgeEvaluatorOptions, type MockResolvedConfig, type PiAgentSdkResolvedConfig, type PiCodingAgentResolvedConfig, type ProgressEvent, type PromptInputs, type PromptScriptConfig, type Provider, type ProviderKind, type ProviderRequest, type ProviderResponse, type ProviderTokenUsage, type ResolvedTarget, type RubricItem, type RunEvalCaseOptions, type RunEvaluationOptions, type ScoreRange, type SystemTestMessage, TEST_MESSAGE_ROLES, type TargetAccessConfig, type TargetDefinition, type TestMessage, type TestMessageContent, type TestMessageRole, type TokenUsage, TokenUsageEvaluator, type TokenUsageEvaluatorConfig, type TokenUsageEvaluatorOptions, type ToolTestMessage, ToolTrajectoryEvaluator, type ToolTrajectoryEvaluatorConfig, type ToolTrajectoryEvaluatorOptions, type ToolTrajectoryExpectedItem, type TraceSummary, type UserTestMessage, type VSCodeResolvedConfig, avgToolDurationMs, buildDirectoryChain, buildOutputSchema, buildPromptInputs, buildSearchRoots, clampScore, computeTraceSummary, consumeClaudeCodeLogEntries, consumeCodexLogEntries, consumeCopilotCliLogEntries, consumePiLogEntries, createAgentKernel, createProvider, deepEqual, detectFormat, ensureVSCodeSubagents, executeScript, explorationRatio, extractJsonBlob, fileExists, findGitRoot, freeformEvaluationSchema, generateRubrics, getHitCount, isEvaluatorKind, isGuidelineFile, isJsonObject, isJsonValue, isNonEmptyString, isTestMessage, isTestMessageRole, listTargetNames, loadEvalCases, mergeExecutionMetrics, normalizeLineEndings, parseJsonFromText, parseJsonSafe, readJsonFile, readTargetDefinitions, readTestSuiteMetadata, readTextFile, resolveAndCreateProvider, resolveFileReference, resolveTargetDefinition, runEvalCase, runEvaluation, scoreToVerdict, subscribeToClaudeCodeLogEntries, subscribeToCodexLogEntries, subscribeToCopilotCliLogEntries, subscribeToPiLogEntries, tokensPerTool };