@wix/evalforge-evaluator 0.88.0 → 0.89.0
This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package versions as they appear in their respective public registries.
- package/build/index.js +20 -16
- package/build/index.js.map +4 -4
- package/build/index.mjs +11 -7
- package/build/index.mjs.map +4 -4
- package/build/types/run-scenario/agents/claude-code/claude-code-adapter.d.ts +2 -1
- package/build/types/run-scenario/agents/registry.d.ts +14 -14
- package/package.json +4 -4
package/build/index.mjs
CHANGED
|
@@ -531,7 +531,7 @@ import { randomUUID as randomUUID2 } from "crypto";
|
|
|
531
531
|
// src/run-scenario/agents/registry.ts
|
|
532
532
|
var AgentAdapterRegistry = class {
|
|
533
533
|
/**
|
|
534
|
-
* Map of
|
|
534
|
+
* Map of run commands to their registered adapters.
|
|
535
535
|
* Multiple commands can map to the same adapter.
|
|
536
536
|
*/
|
|
537
537
|
adapters = /* @__PURE__ */ new Map();
|
|
@@ -560,9 +560,9 @@ var AgentAdapterRegistry = class {
|
|
|
560
560
|
}
|
|
561
561
|
}
|
|
562
562
|
/**
|
|
563
|
-
* Get an adapter by command
|
|
563
|
+
* Get an adapter by run command.
|
|
564
564
|
*
|
|
565
|
-
* @param runCommand - The command
|
|
565
|
+
* @param runCommand - The run command to look up
|
|
566
566
|
* @returns The registered adapter, or undefined if not found
|
|
567
567
|
*/
|
|
568
568
|
get(runCommand) {
|
|
@@ -571,7 +571,7 @@ var AgentAdapterRegistry = class {
|
|
|
571
571
|
/**
|
|
572
572
|
* Check if a command has a registered adapter.
|
|
573
573
|
*
|
|
574
|
-
* @param runCommand - The command
|
|
574
|
+
* @param runCommand - The run command to check
|
|
575
575
|
* @returns True if an adapter is registered for this command
|
|
576
576
|
*/
|
|
577
577
|
has(runCommand) {
|
|
@@ -588,7 +588,7 @@ var AgentAdapterRegistry = class {
|
|
|
588
588
|
/**
|
|
589
589
|
* Get all supported commands.
|
|
590
590
|
*
|
|
591
|
-
* @returns Array of all registered
|
|
591
|
+
* @returns Array of all registered run commands
|
|
592
592
|
*/
|
|
593
593
|
getSupportedCommands() {
|
|
594
594
|
return Array.from(this.adapters.keys());
|
|
@@ -638,6 +638,9 @@ function getAdapter(runCommand) {
|
|
|
638
638
|
return adapter;
|
|
639
639
|
}
|
|
640
640
|
|
|
641
|
+
// src/run-scenario/agents/claude-code/claude-code-adapter.ts
|
|
642
|
+
import { AgentRunCommand } from "@wix/evalforge-types";
|
|
643
|
+
|
|
641
644
|
// src/run-scenario/agents/claude-code/execute.ts
|
|
642
645
|
import {
|
|
643
646
|
ClaudeModel,
|
|
@@ -1659,7 +1662,7 @@ function buildLLMTraceFromSteps(steps, totalDurationMs, usage, model) {
|
|
|
1659
1662
|
var ClaudeCodeAdapter = class {
|
|
1660
1663
|
id = "claude-code";
|
|
1661
1664
|
name = "Claude Code";
|
|
1662
|
-
supportedCommands = [
|
|
1665
|
+
supportedCommands = [AgentRunCommand.CLAUDE];
|
|
1663
1666
|
/**
|
|
1664
1667
|
* Execute a skill using the Claude Code SDK.
|
|
1665
1668
|
*
|
|
@@ -2440,7 +2443,8 @@ function extractTemplateFiles(before, after) {
|
|
|
2440
2443
|
}
|
|
2441
2444
|
|
|
2442
2445
|
// src/run-scenario/run-agent-with-context.ts
|
|
2443
|
-
|
|
2446
|
+
import { AgentRunCommand as AgentRunCommand2 } from "@wix/evalforge-types";
|
|
2447
|
+
var DEFAULT_AGENT_COMMAND = AgentRunCommand2.CLAUDE;
|
|
2444
2448
|
async function runAgentWithContext(config, evalRunId2, scenario, evalData, workDir) {
|
|
2445
2449
|
const skillsGroupId = evalData.evalRun.skillsGroupId;
|
|
2446
2450
|
if (!skillsGroupId) {
|