@m4trix/evals 0.27.0 → 0.28.0

This diff compares the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
package/dist/index.cjs CHANGED
@@ -841,7 +841,7 @@ var RunConfig = class _RunConfig {
841
841
  getDisplayLabel() {
842
842
  return this._displayName ?? this._name;
843
843
  }
844
- /** Tags from `RunConfig.define({ tags })`; surfaced as `runConfigTags` on evaluator callbacks. */
844
+ /** Tags from `RunConfig.define({ tags })`; surfaced as `meta.runConfigTags` on evaluator callbacks. */
845
845
  getTags() {
846
846
  return [...this._tags];
847
847
  }
@@ -1014,10 +1014,11 @@ var TestCase = class _TestCase {
1014
1014
  static describe(config) {
1015
1015
  const name = validateTestCaseName(config.name, "TestCase.describe");
1016
1016
  const displayName = normalizeOptionalDisplayName(config.displayName);
1017
+ const tags = config.tags !== void 0 ? [...config.tags] : [];
1017
1018
  return new _TestCase({
1018
1019
  name,
1019
1020
  displayName,
1020
- tags: config.tags,
1021
+ tags,
1021
1022
  inputSchema: config.inputSchema,
1022
1023
  input: config.input,
1023
1024
  outputSchema: config.outputSchema,
@@ -1034,7 +1035,7 @@ var TestCase = class _TestCase {
1034
1035
  return this._config.displayName ?? this._config.name;
1035
1036
  }
1036
1037
  getTags() {
1037
- return this._config.tags;
1038
+ return [...this._config.tags];
1038
1039
  }
1039
1040
  getInputSchema() {
1040
1041
  return this._config.inputSchema;
@@ -1595,11 +1596,12 @@ function processOneEvaluation(task, unit, totalEvaluations, publishEvent, persis
1595
1596
  repetitionId,
1596
1597
  repetitionIndex,
1597
1598
  repetitionCount,
1598
- runConfigName: task.runConfigName
1599
+ runConfigName: task.runConfigName,
1600
+ ...task.experimentName !== void 0 && task.experimentName !== "" ? { experimentName: task.experimentName } : {},
1601
+ testCaseTags: getTestCaseTagList(testCaseItem.testCase),
1602
+ runConfigTags: task.runConfigTags,
1603
+ evaluatorTags: getEvaluatorTagList(evaluator)
1599
1604
  },
1600
- testCaseTags: getTestCaseTagList(testCaseItem.testCase),
1601
- runConfigTags: task.runConfigTags,
1602
- evaluatorTags: getEvaluatorTagList(evaluator),
1603
1605
  logDiff,
1604
1606
  log,
1605
1607
  createError
@@ -2078,7 +2080,8 @@ var EffectRunner = class {
2078
2080
  globalEvaluationSemaphore: sem,
2079
2081
  runConfigName: job.runConfigName,
2080
2082
  runConfigTags: job.runConfigTags,
2081
- repetitions: job.repetitions
2083
+ repetitions: job.repetitions,
2084
+ experimentName: request.experimentName
2082
2085
  })
2083
2086
  );
2084
2087
  }
@@ -2113,7 +2116,8 @@ var EffectRunner = class {
2113
2116
  maxConcurrency: request.concurrency ?? this.config.maxConcurrency ?? 1,
2114
2117
  repetitions: request.repetitions,
2115
2118
  runConfigName,
2116
- runConfigTags: request.runConfigTags
2119
+ runConfigTags: request.runConfigTags,
2120
+ experimentName: request.experimentName
2117
2121
  });
2118
2122
  }
2119
2123
  async startDatasetRun(params) {
@@ -2188,7 +2192,8 @@ var EffectRunner = class {
2188
2192
  globalEvaluationSemaphore: params.globalEvaluationSemaphore,
2189
2193
  runConfigName: params.runConfigName,
2190
2194
  runConfigTags,
2191
- repetitions
2195
+ repetitions,
2196
+ experimentName: params.experimentName
2192
2197
  })
2193
2198
  );
2194
2199
  return snapshot;