@m4trix/evals 0.29.0 → 0.31.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
- package/README.md +1 -1
- package/dist/cli-simple.cjs +19 -6
- package/dist/cli-simple.cjs.map +1 -1
- package/dist/cli-simple.js +19 -6
- package/dist/cli-simple.js.map +1 -1
- package/dist/cli.cjs +9 -1
- package/dist/cli.cjs.map +1 -1
- package/dist/cli.js +9 -1
- package/dist/cli.js.map +1 -1
- package/dist/index.cjs +7 -0
- package/dist/index.cjs.map +1 -1
- package/dist/index.d.ts +15 -0
- package/dist/index.js +7 -0
- package/dist/index.js.map +1 -1
- package/package.json +1 -1
package/dist/index.cjs
CHANGED
|
@@ -1591,6 +1591,8 @@ function processOneEvaluation(task, unit, totalEvaluations, publishEvent, persis
|
|
|
1591
1591
|
output,
|
|
1592
1592
|
meta: {
|
|
1593
1593
|
triggerId: task.triggerId,
|
|
1594
|
+
triggerTimestamp: task.triggerTimestamp,
|
|
1595
|
+
triggeredAt: new Date(task.triggerTimestamp).toISOString(),
|
|
1594
1596
|
runId: evaluatorRunId,
|
|
1595
1597
|
datasetName: task.dataset.getDisplayLabel(),
|
|
1596
1598
|
testCaseId: testCaseItem.id,
|
|
@@ -2071,6 +2073,7 @@ var EffectRunner = class {
|
|
|
2071
2073
|
const globalConcurrency = Math.max(1, request.globalConcurrency);
|
|
2072
2074
|
const sem = effect.Effect.unsafeMakeSemaphore(globalConcurrency);
|
|
2073
2075
|
const triggerId = request.triggerId ?? `trg-${crypto.randomUUID()}`;
|
|
2076
|
+
const triggerTimestamp = request.triggerTimestamp ?? Date.now();
|
|
2074
2077
|
const snapshots = [];
|
|
2075
2078
|
for (const job of request.jobs) {
|
|
2076
2079
|
snapshots.push(
|
|
@@ -2078,6 +2081,7 @@ var EffectRunner = class {
|
|
|
2078
2081
|
datasetId: job.datasetId,
|
|
2079
2082
|
evaluatorIds: job.evaluatorIds,
|
|
2080
2083
|
triggerId,
|
|
2084
|
+
triggerTimestamp,
|
|
2081
2085
|
maxConcurrency: this.config.maxConcurrency ?? 1,
|
|
2082
2086
|
globalEvaluationSemaphore: sem,
|
|
2083
2087
|
runConfigName: job.runConfigName,
|
|
@@ -2115,6 +2119,7 @@ var EffectRunner = class {
|
|
|
2115
2119
|
datasetId: request.datasetId,
|
|
2116
2120
|
evaluatorIds: request.evaluatorIds,
|
|
2117
2121
|
triggerId: request.triggerId,
|
|
2122
|
+
triggerTimestamp: request.triggerTimestamp ?? Date.now(),
|
|
2118
2123
|
maxConcurrency: request.concurrency ?? this.config.maxConcurrency ?? 1,
|
|
2119
2124
|
repetitions: request.repetitions,
|
|
2120
2125
|
runConfigName,
|
|
@@ -2142,6 +2147,7 @@ var EffectRunner = class {
|
|
|
2142
2147
|
const totalEvaluations = selectedTestCases.length * repetitions;
|
|
2143
2148
|
const runConfigTags = [...params.runConfigTags ?? []];
|
|
2144
2149
|
const triggerId = params.triggerId ?? `trg-${crypto.randomUUID()}`;
|
|
2150
|
+
const triggerTimestamp = params.triggerTimestamp ?? Date.now();
|
|
2145
2151
|
const runId = `run-${crypto.randomUUID()}`;
|
|
2146
2152
|
const artifactPath = createArtifactPath(this.config.artifactDirectory, params.datasetId, runId);
|
|
2147
2153
|
const snapshot = {
|
|
@@ -2185,6 +2191,7 @@ var EffectRunner = class {
|
|
|
2185
2191
|
effect.Queue.offer(this.runQueue, {
|
|
2186
2192
|
runId,
|
|
2187
2193
|
triggerId,
|
|
2194
|
+
triggerTimestamp,
|
|
2188
2195
|
datasetId: params.datasetId,
|
|
2189
2196
|
dataset: dataset.dataset,
|
|
2190
2197
|
evaluators: selectedEvaluators,
|