@wix/evalforge-evaluator 0.108.0 → 0.110.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/build/index.js CHANGED
@@ -2661,6 +2661,7 @@ var ClaudeCodeAdapter = class {
2661
2661
  model: modelForSdk,
2662
2662
  temperature: modelConfig?.temperature,
2663
2663
  maxTokens: modelConfig?.maxTokens,
2664
+ maxTurns: modelConfig?.maxTurns,
2664
2665
  aiGatewayUrl,
2665
2666
  aiGatewayHeaders,
2666
2667
  traceContext,
@@ -42693,7 +42694,6 @@ var MODEL_PRICING = {
42693
42694
  CLAUDE_4_OPUS_1_0: { input: 15, output: 75 },
42694
42695
  CLAUDE_4_SONNET_1_0: { input: 3, output: 15 },
42695
42696
  // Anthropic — Claude 3.x
42696
- CLAUDE_3_7_SONNET_1_0: { input: 3, output: 15 },
42697
42697
  CLAUDE_3_5_SONNET_2_0: { input: 3, output: 15 },
42698
42698
  CLAUDE_3_5_SONNET_1_0: { input: 3, output: 15 },
42699
42699
  CLAUDE_3_HAIKU_1_0: { input: 0.25, output: 1.25 },
@@ -42811,7 +42811,7 @@ function estimateStepTimestamp(startMs, stepIndex, totalSteps) {
42811
42811
  // src/run-scenario/agents/simple-agent/execute.ts
42812
42812
  var PROVIDER_ANTHROPIC2 = "anthropic";
42813
42813
  var PROVIDER_OPENAI = "openai";
42814
- var MAX_TOOL_STEPS = 25;
42814
+ var DEFAULT_MAX_TOOL_STEPS = 25;
42815
42815
  function createModel(modelId, baseUrl, headers) {
42816
42816
  const isClaudeModel = import_evalforge_types6.AVAILABLE_CLAUDE_MODEL_IDS.includes(
42817
42817
  modelId
@@ -42894,7 +42894,7 @@ async function executeWithAiSdk(context2) {
42894
42894
  temperature: supportsThinking ? void 0 : modelConfig.temperature,
42895
42895
  maxOutputTokens: modelConfig.maxTokens,
42896
42896
  tools: mcpTools,
42897
- stopWhen: mcpTools ? stepCountIs(MAX_TOOL_STEPS) : stepCountIs(1),
42897
+ stopWhen: mcpTools ? stepCountIs(modelConfig.maxTurns ?? DEFAULT_MAX_TOOL_STEPS) : stepCountIs(1),
42898
42898
  providerOptions: providerOpts
42899
42899
  });
42900
42900
  const durationMs = Date.now() - startTime;