@m4trix/evals 0.27.0 → 0.28.0
This diff compares the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
- package/README.md +5 -2
- package/dist/cli-simple.cjs +36 -15
- package/dist/cli-simple.cjs.map +1 -1
- package/dist/cli-simple.js +36 -15
- package/dist/cli-simple.js.map +1 -1
- package/dist/cli.cjs +11 -7
- package/dist/cli.cjs.map +1 -1
- package/dist/cli.js +11 -7
- package/dist/cli.js.map +1 -1
- package/dist/index.cjs +15 -10
- package/dist/index.cjs.map +1 -1
- package/dist/index.d.ts +35 -14
- package/dist/index.js +15 -10
- package/dist/index.js.map +1 -1
- package/package.json +1 -1
package/dist/index.cjs
CHANGED
|
@@ -841,7 +841,7 @@ var RunConfig = class _RunConfig {
|
|
|
841
841
|
getDisplayLabel() {
|
|
842
842
|
return this._displayName ?? this._name;
|
|
843
843
|
}
|
|
844
|
-
/** Tags from `RunConfig.define({ tags })`; surfaced as `runConfigTags` on evaluator callbacks. */
|
|
844
|
+
/** Tags from `RunConfig.define({ tags })`; surfaced as `meta.runConfigTags` on evaluator callbacks. */
|
|
845
845
|
getTags() {
|
|
846
846
|
return [...this._tags];
|
|
847
847
|
}
|
|
@@ -1014,10 +1014,11 @@ var TestCase = class _TestCase {
|
|
|
1014
1014
|
static describe(config) {
|
|
1015
1015
|
const name = validateTestCaseName(config.name, "TestCase.describe");
|
|
1016
1016
|
const displayName = normalizeOptionalDisplayName(config.displayName);
|
|
1017
|
+
const tags = config.tags !== void 0 ? [...config.tags] : [];
|
|
1017
1018
|
return new _TestCase({
|
|
1018
1019
|
name,
|
|
1019
1020
|
displayName,
|
|
1020
|
-
tags
|
|
1021
|
+
tags,
|
|
1021
1022
|
inputSchema: config.inputSchema,
|
|
1022
1023
|
input: config.input,
|
|
1023
1024
|
outputSchema: config.outputSchema,
|
|
@@ -1034,7 +1035,7 @@ var TestCase = class _TestCase {
|
|
|
1034
1035
|
return this._config.displayName ?? this._config.name;
|
|
1035
1036
|
}
|
|
1036
1037
|
getTags() {
|
|
1037
|
-
return this._config.tags;
|
|
1038
|
+
return [...this._config.tags];
|
|
1038
1039
|
}
|
|
1039
1040
|
getInputSchema() {
|
|
1040
1041
|
return this._config.inputSchema;
|
|
@@ -1595,11 +1596,12 @@ function processOneEvaluation(task, unit, totalEvaluations, publishEvent, persis
|
|
|
1595
1596
|
repetitionId,
|
|
1596
1597
|
repetitionIndex,
|
|
1597
1598
|
repetitionCount,
|
|
1598
|
-
runConfigName: task.runConfigName
|
|
1599
|
+
runConfigName: task.runConfigName,
|
|
1600
|
+
...task.experimentName !== void 0 && task.experimentName !== "" ? { experimentName: task.experimentName } : {},
|
|
1601
|
+
testCaseTags: getTestCaseTagList(testCaseItem.testCase),
|
|
1602
|
+
runConfigTags: task.runConfigTags,
|
|
1603
|
+
evaluatorTags: getEvaluatorTagList(evaluator)
|
|
1599
1604
|
},
|
|
1600
|
-
testCaseTags: getTestCaseTagList(testCaseItem.testCase),
|
|
1601
|
-
runConfigTags: task.runConfigTags,
|
|
1602
|
-
evaluatorTags: getEvaluatorTagList(evaluator),
|
|
1603
1605
|
logDiff,
|
|
1604
1606
|
log,
|
|
1605
1607
|
createError
|
|
@@ -2078,7 +2080,8 @@ var EffectRunner = class {
|
|
|
2078
2080
|
globalEvaluationSemaphore: sem,
|
|
2079
2081
|
runConfigName: job.runConfigName,
|
|
2080
2082
|
runConfigTags: job.runConfigTags,
|
|
2081
|
-
repetitions: job.repetitions
|
|
2083
|
+
repetitions: job.repetitions,
|
|
2084
|
+
experimentName: request.experimentName
|
|
2082
2085
|
})
|
|
2083
2086
|
);
|
|
2084
2087
|
}
|
|
@@ -2113,7 +2116,8 @@ var EffectRunner = class {
|
|
|
2113
2116
|
maxConcurrency: request.concurrency ?? this.config.maxConcurrency ?? 1,
|
|
2114
2117
|
repetitions: request.repetitions,
|
|
2115
2118
|
runConfigName,
|
|
2116
|
-
runConfigTags: request.runConfigTags
|
|
2119
|
+
runConfigTags: request.runConfigTags,
|
|
2120
|
+
experimentName: request.experimentName
|
|
2117
2121
|
});
|
|
2118
2122
|
}
|
|
2119
2123
|
async startDatasetRun(params) {
|
|
@@ -2188,7 +2192,8 @@ var EffectRunner = class {
|
|
|
2188
2192
|
globalEvaluationSemaphore: params.globalEvaluationSemaphore,
|
|
2189
2193
|
runConfigName: params.runConfigName,
|
|
2190
2194
|
runConfigTags,
|
|
2191
|
-
repetitions
|
|
2195
|
+
repetitions,
|
|
2196
|
+
experimentName: params.experimentName
|
|
2192
2197
|
})
|
|
2193
2198
|
);
|
|
2194
2199
|
return snapshot;
|