@wix/evalforge-evaluator 0.161.0 → 0.162.0

This diff shows the changes between publicly available versions of this package that have been released to one of the supported registries. The information in this diff is provided for informational purposes only and reflects the differences between the package versions as they appear in their respective public registries.
package/build/index.js CHANGED
@@ -3775,7 +3775,7 @@ async function executeWithAiSdk(context) {
3775
3775
  const timeoutHandle = setTimeout(() => {
3776
3776
  abortController.abort(
3777
3777
  new Error(
3778
- `Simple Agent generateText timed out after ${SDK_TIMEOUT_MS}ms (model=${modelId}, scenario=${scenario.name})`
3778
+ `Simple Agent generateText / streamText timed out after ${SDK_TIMEOUT_MS}ms (model=${modelId}, scenario=${scenario.name})`
3779
3779
  )
3780
3780
  );
3781
3781
  }, SDK_TIMEOUT_MS);
@@ -3821,7 +3821,7 @@ async function executeWithAiSdk(context) {
3821
3821
  const stepTimestamps = [];
3822
3822
  const { triggerPromptImages } = context;
3823
3823
  const hasImages = triggerPromptImages && triggerPromptImages.length > 0;
3824
- const result = await (0, import_ai.generateText)({
3824
+ const sdkParams = {
3825
3825
  ...topLevelExtras,
3826
3826
  model,
3827
3827
  abortSignal: abortController.signal,
@@ -3878,15 +3878,32 @@ async function executeWithAiSdk(context) {
3878
3878
  );
3879
3879
  }
3880
3880
  }
3881
- });
3881
+ };
3882
+ const shouldStream = !isResponsesAPI;
3883
+ let text;
3884
+ let steps;
3885
+ let rawUsage;
3886
+ if (shouldStream) {
3887
+ const stream = (0, import_ai.streamText)(sdkParams);
3888
+ [text, steps, rawUsage] = await Promise.all([
3889
+ stream.text,
3890
+ stream.steps,
3891
+ stream.usage
3892
+ ]);
3893
+ } else {
3894
+ const result = await (0, import_ai.generateText)(sdkParams);
3895
+ text = result.text;
3896
+ steps = result.steps;
3897
+ rawUsage = result.usage;
3898
+ }
3882
3899
  const durationMs = Date.now() - startTime;
3883
3900
  const usage = {
3884
- inputTokens: result.usage.inputTokens ?? 0,
3885
- outputTokens: result.usage.outputTokens ?? 0,
3886
- totalTokens: result.usage.totalTokens ?? 0
3901
+ inputTokens: rawUsage.inputTokens ?? 0,
3902
+ outputTokens: rawUsage.outputTokens ?? 0,
3903
+ totalTokens: rawUsage.totalTokens ?? 0
3887
3904
  };
3888
3905
  const llmTrace = buildLLMTrace2(
3889
- result.steps,
3906
+ steps,
3890
3907
  durationMs,
3891
3908
  usage,
3892
3909
  modelId,
@@ -3899,12 +3916,12 @@ async function executeWithAiSdk(context) {
3899
3916
  }
3900
3917
  const conversation = buildConversation3(
3901
3918
  scenario.triggerPrompt,
3902
- result.steps,
3919
+ steps,
3903
3920
  startTime,
3904
3921
  stepTimestamps
3905
3922
  );
3906
3923
  return {
3907
- outputText: result.text,
3924
+ outputText: text,
3908
3925
  durationMs,
3909
3926
  usage,
3910
3927
  llmTrace,