@ls-stack/agent-eval 0.29.0 → 0.30.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/{app-D6-msfKP.mjs → app-CbOZBHju.mjs} +4 -4
- package/dist/apps/web/dist/assets/{index-BCr6J8Uj.js → index-DEikHy2a.js} +35 -35
- package/dist/apps/web/dist/index.html +1 -1
- package/dist/bin.mjs +1 -1
- package/dist/{cli-CIc_gBNM.mjs → cli-CiFOqMwS.mjs} +3 -3
- package/dist/index.d.mts +133 -109
- package/dist/index.mjs +3 -3
- package/dist/runChild.mjs +1 -1
- package/dist/{runOrchestration-CIARrLs6.mjs → runOrchestration-CO3Vf0cQ.mjs} +35 -9
- package/dist/{runner-Bq1f9B9d.mjs → runner-4pF_Qrc9.mjs} +1 -1
- package/dist/{runner-1F8MeY5V.mjs → runner-CXHkf7ih.mjs} +2 -2
- package/dist/src-BiPLv9ya.mjs +3 -0
- package/package.json +1 -1
- package/skills/agent-eval/SKILL.md +8 -5
- package/dist/src-CkWT1iSu.mjs +0 -3
package/dist/index.mjs
CHANGED
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
import { $ as defaultConfigKeySchema, $n as incrementEvalOutput, $t as cacheEntryWithDebugKeySchema, A as createRunRequestSchema, An as buildTraceTree, At as runLogPhaseSchema, B as getEvalDisplayStatus, Bn as repoFile, Bt as manualInputTextFieldSchema, Cn as columnKindSchema, Ct as evalStatAggregateSchema, Dn as repoFileRefSchema, Dt as runLogEntrySchema, En as numberDisplayOptionsSchema, Et as evalSummarySchema, F as extractApiCalls, Fn as hashCacheKeySync, Ft as manualInputJsonFieldSchema, G as runSummarySchema, Gn as advanceEvalTime, Gt as evalChartConfigSchema, H as deriveStatusFromCaseRows, Hn as readManualInputFile, Ht as evalChartAxisSchema, I as extractLlmCalls, In as deserializeCacheRecording, It as manualInputMultilineFieldSchema, J as agentEvalsConfigSchema, Jn as evalAssert, Jt as evalChartTypeSchema, K as DEFAULT_API_CALLS_CONFIG, Kn as appendToEvalOutput, Kt as evalChartMetricSchema, L as applyDerivedCallAttributes, Ln as deserializeCacheValue, Lt as manualInputNumberFieldSchema, M as sseEnvelopeSchema, Mn as evalSpan, Mt as manualInputBooleanFieldSchema, N as extractCacheEntries, Nn as evalTracer, Nt as manualInputDescriptorSchema, O as configReloadStateSchema, On as runArtifactRefSchema, Ot as runLogLevelSchema, P as extractCacheHits, Pn as hashCacheKey, Pt as manualInputFieldDescriptorSchema, Q as apiCallsConfigSchema, Qn as getEvalStartTime, Qt as cacheEntrySchema, R as getNestedAttribute, Rn as serializeCacheRecording, Rt as manualInputSelectFieldSchema, Sn as columnFormatSchema, St as evalFreshnessStatusSchema, Tn as jsonCellSchema, Tt as evalStatsConfigSchema, U as deriveStatusFromChildStatuses, Un as evalExpect, Ut as evalChartBuiltinMetricSchema, V as deriveScopedSummaryFromCases, Vn as manualInputFileValueSchema, Vt as evalChartAggregateSchema, W as runManifestSchema, Wn as EvalAssertionError, Wt as evalChartColorSchema, X as apiCallMetricPlacementSchema, Xn as getCurrentScope, Xt as cacheDebugKeyEntrySchema, Y as apiCallMetricFormatSchema, 
Yn as evalLog, Yt as evalChartsConfigSchema, Z as apiCallMetricSchema, Zn as getEvalCaseInput, Zt as cacheDebugKeyFileSchema, _n as traceSpanKindSchema, _t as getCaseRowEvalKey, an as cacheRecordingSchema, ar as runInExistingEvalScope, at as llmCallMetricSchema, bn as cellValueSchema, bt as caseRowSchema, cn as spanCacheOptionsSchema, cr as startEvalBackgroundJob, ct as llmCallsConfigSchema, dn as traceAttributeDisplayInputSchema, dt as resolveLlmCallsConfig, en as cacheFileSchema, er as isInEvalScope, et as evalColumnOverrideSchema, fn as traceAttributeDisplayPlacementSchema, ft as runLogsConfigSchema, gn as traceSpanErrorSchema, gt as getCaseRowCaseKey, hn as traceDisplayInputConfigSchema, ht as buildEvalKey, in as cacheRecordingOpSchema, ir as runInEvalScope, it as llmCallMetricPlacementSchema, j as updateManualScoreRequestSchema, jn as captureEvalSpanError, jt as scoreTraceSchema, k as configReloadStatusSchema, kn as z, kt as runLogLocationSchema, ln as traceCacheRefSchema, lr as defineEval, lt as removeDefaultConfigSchema, mn as traceDisplayConfigSchema, mt as buildCaseKey, nn as cacheModeSchema, nr as nextEvalId, nt as evalDeriveConfigSchema, on as cacheStatusSchema, or as setEvalOutput, ot as llmCallPricingRateSchema, pn as traceAttributeDisplaySchema, pt as trialSelectionModeSchema, q as DEFAULT_LLM_CALLS_CONFIG, qt as evalChartTooltipExtraSchema, rn as cacheOperationTypeSchema, rr as runInEvalRuntimeScope, rt as llmCallMetricFormatSchema, sn as serializedCacheSpanSchema, sr as setScopeCacheContext, st as llmCallPricingSchema, tn as cacheListItemSchema, tr as mergeEvalOutput, tt as evalColumnsSchema, un as traceAttributeDisplayFormatSchema, ur as getEvalRegistry, ut as resolveApiCallsConfig, vn as traceSpanSchema, vt as assertionFailureSchema, wn as fileRefSchema, wt as evalStatItemSchema, xn as columnDefSchema, xt as discoveryIssueSchema, yn as traceSpanWarningSchema, yt as caseDetailSchema, z as getEvalTitle, zn as serializeCacheValue, zt as 
manualInputSelectOptionSchema } from "./runOrchestration-CIARrLs6.mjs";
|
|
2
|
-
import { a as materializeManualInputFiles, i as isManualInputFileValue, n as createRunner, o as stageManualInputFile, r as cleanupStagedManualInputFiles, s as stageManualInputFileFromPath, t as runCli } from "./cli-CIc_gBNM.mjs";
|
|
3
|
-
import "./src-CkWT1iSu.mjs";
|
|
1
|
+
import { $ as defaultConfigKeySchema, $n as incrementEvalOutput, $t as cacheEntryWithDebugKeySchema, A as createRunRequestSchema, An as buildTraceTree, At as runLogPhaseSchema, B as getEvalDisplayStatus, Bn as repoFile, Bt as manualInputTextFieldSchema, Cn as columnKindSchema, Ct as evalStatAggregateSchema, Dn as repoFileRefSchema, Dt as runLogEntrySchema, En as numberDisplayOptionsSchema, Et as evalSummarySchema, F as extractApiCalls, Fn as hashCacheKeySync, Ft as manualInputJsonFieldSchema, G as runSummarySchema, Gn as advanceEvalTime, Gt as evalChartConfigSchema, H as deriveStatusFromCaseRows, Hn as readManualInputFile, Ht as evalChartAxisSchema, I as extractLlmCalls, In as deserializeCacheRecording, It as manualInputMultilineFieldSchema, J as agentEvalsConfigSchema, Jn as evalAssert, Jt as evalChartTypeSchema, K as DEFAULT_API_CALLS_CONFIG, Kn as appendToEvalOutput, Kt as evalChartMetricSchema, L as applyDerivedCallAttributes, Ln as deserializeCacheValue, Lt as manualInputNumberFieldSchema, M as sseEnvelopeSchema, Mn as evalSpan, Mt as manualInputBooleanFieldSchema, N as extractCacheEntries, Nn as evalTracer, Nt as manualInputDescriptorSchema, O as configReloadStateSchema, On as runArtifactRefSchema, Ot as runLogLevelSchema, P as extractCacheHits, Pn as hashCacheKey, Pt as manualInputFieldDescriptorSchema, Q as apiCallsConfigSchema, Qn as getEvalStartTime, Qt as cacheEntrySchema, R as getNestedAttribute, Rn as serializeCacheRecording, Rt as manualInputSelectFieldSchema, Sn as columnFormatSchema, St as evalFreshnessStatusSchema, Tn as jsonCellSchema, Tt as evalStatsConfigSchema, U as deriveStatusFromChildStatuses, Un as evalExpect, Ut as evalChartBuiltinMetricSchema, V as deriveScopedSummaryFromCases, Vn as manualInputFileValueSchema, Vt as evalChartAggregateSchema, W as runManifestSchema, Wn as EvalAssertionError, Wt as evalChartColorSchema, X as apiCallMetricPlacementSchema, Xn as getCurrentScope, Xt as cacheDebugKeyEntrySchema, Y as apiCallMetricFormatSchema, 
Yn as evalLog, Yt as evalChartsConfigSchema, Z as apiCallMetricSchema, Zn as getEvalCaseInput, Zt as cacheDebugKeyFileSchema, _n as traceSpanKindSchema, _t as getCaseRowEvalKey, an as cacheRecordingSchema, ar as runInExistingEvalScope, at as llmCallMetricSchema, bn as cellValueSchema, bt as caseRowSchema, cn as spanCacheOptionsSchema, cr as startEvalBackgroundJob, ct as llmCallsConfigSchema, dn as traceAttributeDisplayInputSchema, dt as resolveLlmCallsConfig, en as cacheFileSchema, er as isInEvalScope, et as evalColumnOverrideSchema, fn as traceAttributeDisplayPlacementSchema, ft as runLogsConfigSchema, gn as traceSpanErrorSchema, gt as getCaseRowCaseKey, hn as traceDisplayInputConfigSchema, ht as buildEvalKey, in as cacheRecordingOpSchema, ir as runInEvalScope, it as llmCallMetricPlacementSchema, j as updateManualScoreRequestSchema, jn as captureEvalSpanError, jt as scoreTraceSchema, k as configReloadStatusSchema, kn as z, kt as runLogLocationSchema, ln as traceCacheRefSchema, lr as defineEval, lt as removeDefaultConfigSchema, mn as traceDisplayConfigSchema, mt as buildCaseKey, nn as cacheModeSchema, nr as nextEvalId, nt as evalDeriveConfigSchema, on as cacheStatusSchema, or as setEvalOutput, ot as llmCallPricingRateSchema, pn as traceAttributeDisplaySchema, pt as trialSelectionModeSchema, q as DEFAULT_LLM_CALLS_CONFIG, qt as evalChartTooltipExtraSchema, rn as cacheOperationTypeSchema, rr as runInEvalRuntimeScope, rt as llmCallMetricFormatSchema, sn as serializedCacheSpanSchema, sr as setScopeCacheContext, st as llmCallPricingSchema, tn as cacheListItemSchema, tr as mergeEvalOutput, tt as evalColumnsSchema, un as traceAttributeDisplayFormatSchema, ur as getEvalRegistry, ut as resolveApiCallsConfig, vn as traceSpanSchema, vt as assertionFailureSchema, wn as fileRefSchema, wt as evalStatItemSchema, xn as columnDefSchema, xt as discoveryIssueSchema, yn as traceSpanWarningSchema, yt as caseDetailSchema, z as getEvalTitle, zn as serializeCacheValue, zt as 
manualInputSelectOptionSchema } from "./runOrchestration-CO3Vf0cQ.mjs";
|
|
2
|
+
import { a as materializeManualInputFiles, i as isManualInputFileValue, n as createRunner, o as stageManualInputFile, r as cleanupStagedManualInputFiles, s as stageManualInputFileFromPath, t as runCli } from "./cli-CiFOqMwS.mjs";
|
|
3
|
+
import "./src-BiPLv9ya.mjs";
|
|
4
4
|
export { DEFAULT_API_CALLS_CONFIG, DEFAULT_LLM_CALLS_CONFIG, EvalAssertionError, advanceEvalTime, agentEvalsConfigSchema, apiCallMetricFormatSchema, apiCallMetricPlacementSchema, apiCallMetricSchema, apiCallsConfigSchema, appendToEvalOutput, applyDerivedCallAttributes, assertionFailureSchema, buildCaseKey, buildEvalKey, buildTraceTree, cacheDebugKeyEntrySchema, cacheDebugKeyFileSchema, cacheEntrySchema, cacheEntryWithDebugKeySchema, cacheFileSchema, cacheListItemSchema, cacheModeSchema, cacheOperationTypeSchema, cacheRecordingOpSchema, cacheRecordingSchema, cacheStatusSchema, captureEvalSpanError, caseDetailSchema, caseRowSchema, cellValueSchema, cleanupStagedManualInputFiles, columnDefSchema, columnFormatSchema, columnKindSchema, configReloadStateSchema, configReloadStatusSchema, createRunRequestSchema, createRunner, defaultConfigKeySchema, defineEval, deriveScopedSummaryFromCases, deriveStatusFromCaseRows, deriveStatusFromChildStatuses, deserializeCacheRecording, deserializeCacheValue, discoveryIssueSchema, evalAssert, evalChartAggregateSchema, evalChartAxisSchema, evalChartBuiltinMetricSchema, evalChartColorSchema, evalChartConfigSchema, evalChartMetricSchema, evalChartTooltipExtraSchema, evalChartTypeSchema, evalChartsConfigSchema, evalColumnOverrideSchema, evalColumnsSchema, evalDeriveConfigSchema, evalExpect, evalFreshnessStatusSchema, evalLog, evalSpan, evalStatAggregateSchema, evalStatItemSchema, evalStatsConfigSchema, evalSummarySchema, evalTracer, extractApiCalls, extractCacheEntries, extractCacheHits, extractLlmCalls, fileRefSchema, getCaseRowCaseKey, getCaseRowEvalKey, getCurrentScope, getEvalCaseInput, getEvalDisplayStatus, getEvalRegistry, getEvalStartTime, getEvalTitle, getNestedAttribute, hashCacheKey, hashCacheKeySync, incrementEvalOutput, isInEvalScope, isManualInputFileValue, jsonCellSchema, llmCallMetricFormatSchema, llmCallMetricPlacementSchema, llmCallMetricSchema, llmCallPricingRateSchema, llmCallPricingSchema, llmCallsConfigSchema, 
manualInputBooleanFieldSchema, manualInputDescriptorSchema, manualInputFieldDescriptorSchema, manualInputFileValueSchema, manualInputJsonFieldSchema, manualInputMultilineFieldSchema, manualInputNumberFieldSchema, manualInputSelectFieldSchema, manualInputSelectOptionSchema, manualInputTextFieldSchema, materializeManualInputFiles, mergeEvalOutput, nextEvalId, numberDisplayOptionsSchema, readManualInputFile, removeDefaultConfigSchema, repoFile, repoFileRefSchema, resolveApiCallsConfig, resolveLlmCallsConfig, runArtifactRefSchema, runCli, runInEvalRuntimeScope, runInEvalScope, runInExistingEvalScope, runLogEntrySchema, runLogLevelSchema, runLogLocationSchema, runLogPhaseSchema, runLogsConfigSchema, runManifestSchema, runSummarySchema, scoreTraceSchema, serializeCacheRecording, serializeCacheValue, serializedCacheSpanSchema, setEvalOutput, setScopeCacheContext, spanCacheOptionsSchema, sseEnvelopeSchema, stageManualInputFile, stageManualInputFileFromPath, startEvalBackgroundJob, traceAttributeDisplayFormatSchema, traceAttributeDisplayInputSchema, traceAttributeDisplayPlacementSchema, traceAttributeDisplaySchema, traceCacheRefSchema, traceDisplayConfigSchema, traceDisplayInputConfigSchema, traceSpanErrorSchema, traceSpanKindSchema, traceSpanSchema, traceSpanWarningSchema, trialSelectionModeSchema, updateManualScoreRequestSchema, z };
|
package/dist/runChild.mjs
CHANGED
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
import { A as createRunRequestSchema, C as loadConfig, D as createFsCacheStore, G as runSummarySchema, Nt as manualInputDescriptorSchema, Tt as evalStatsConfigSchema, W as runManifestSchema, Yt as evalChartsConfigSchema, ht as buildEvalKey, qn as configureEvalRunLogs, r as getTargetEvals$1, t as executeRun, x as parseEvalDiscovery, xn as columnDefSchema } from "./runOrchestration-CIARrLs6.mjs";
|
|
1
|
+
import { A as createRunRequestSchema, C as loadConfig, D as createFsCacheStore, G as runSummarySchema, Nt as manualInputDescriptorSchema, Tt as evalStatsConfigSchema, W as runManifestSchema, Yt as evalChartsConfigSchema, ht as buildEvalKey, qn as configureEvalRunLogs, r as getTargetEvals$1, t as executeRun, x as parseEvalDiscovery, xn as columnDefSchema } from "./runOrchestration-CO3Vf0cQ.mjs";
|
|
2
2
|
import { createHash } from "node:crypto";
|
|
3
3
|
import { readFile } from "node:fs/promises";
|
|
4
4
|
import { relative } from "node:path";
|
|
@@ -3219,6 +3219,8 @@ const llmCallMetricPlacementSchema = z.enum(["header", "body"]);
|
|
|
3219
3219
|
/** Where an API-call metric is rendered inside the API calls tab. */
|
|
3220
3220
|
const apiCallMetricPlacementSchema = llmCallMetricPlacementSchema;
|
|
3221
3221
|
const callDerivedAttributeSchema = z.custom((value) => typeof value === "function", { message: "Expected a derived attribute function" });
|
|
3222
|
+
const callDerivedAttributesFnSchema = z.custom((value) => typeof value === "function", { message: "Expected a derived attributes function" });
|
|
3223
|
+
const callDerivedAttributesConfigSchema = z.union([z.record(z.string().min(1), callDerivedAttributeSchema), callDerivedAttributesFnSchema]);
|
|
3222
3224
|
/**
|
|
3223
3225
|
* Schema for a single user-defined metric attached to LLM call rows.
|
|
3224
3226
|
*
|
|
@@ -3345,10 +3347,11 @@ const llmCallsConfigSchema = z.object({
|
|
|
3345
3347
|
/**
|
|
3346
3348
|
* Derived attributes persisted onto every matching LLM span before
|
|
3347
3349
|
* `deriveFromTracing`, default outputs, trace display, and call metrics read
|
|
3348
|
-
* the trace.
|
|
3349
|
-
*
|
|
3350
|
+
* the trace. Use a keyed map for one-off fields, or one callback returning a
|
|
3351
|
+
* path/value object for multiple fields. Keys are dot-paths under
|
|
3352
|
+
* `span.attributes`; return `undefined` to skip one span or one returned key.
|
|
3350
3353
|
*/
|
|
3351
|
-
derivedAttributes:
|
|
3354
|
+
derivedAttributes: callDerivedAttributesConfigSchema.optional(),
|
|
3352
3355
|
/**
|
|
3353
3356
|
* Model-keyed pricing registry used to calculate LLM-call costs from token
|
|
3354
3357
|
* counts. Built-in LLM cost fields are only derived from this registry.
|
|
@@ -3380,11 +3383,12 @@ const apiCallsConfigSchema = z.object({
|
|
|
3380
3383
|
}).optional(),
|
|
3381
3384
|
/**
|
|
3382
3385
|
* Derived attributes persisted onto every matching API span before trace
|
|
3383
|
-
* display and call metrics read the trace.
|
|
3384
|
-
*
|
|
3385
|
-
*
|
|
3386
|
+
* display and call metrics read the trace. Use a keyed map for one-off
|
|
3387
|
+
* fields, or one callback returning a path/value object for multiple fields.
|
|
3388
|
+
* Keys are dot-paths under `span.attributes`; return `undefined` to skip one
|
|
3389
|
+
* span or one returned key.
|
|
3386
3390
|
*/
|
|
3387
|
-
derivedAttributes:
|
|
3391
|
+
derivedAttributes: callDerivedAttributesConfigSchema.optional(),
|
|
3388
3392
|
/** Custom user-defined metrics surfaced on each API call. */
|
|
3389
3393
|
metrics: z.array(apiCallMetricSchema).optional()
|
|
3390
3394
|
});
|
|
@@ -3444,7 +3448,9 @@ const DEFAULT_API_CALLS_CONFIG = {
|
|
|
3444
3448
|
metrics: []
|
|
3445
3449
|
};
|
|
3446
3450
|
function resolveDerivedAttributes(input) {
|
|
3447
|
-
|
|
3451
|
+
if (input === void 0) return [];
|
|
3452
|
+
if (typeof input === "function") return [{ computeMany: input }];
|
|
3453
|
+
return Object.entries(input).map(([path, compute]) => ({
|
|
3448
3454
|
path,
|
|
3449
3455
|
compute
|
|
3450
3456
|
}));
|
|
@@ -3809,11 +3815,31 @@ function mergeNestedAttribute$1(value, path, attributeValue) {
|
|
|
3809
3815
|
function applyDerivedAttributesForKind(params) {
|
|
3810
3816
|
let attributes = params.span.attributes;
|
|
3811
3817
|
for (const derivedAttribute of params.derivedAttributes) {
|
|
3812
|
-
if (derivedAttribute.compute === void 0) continue;
|
|
3813
3818
|
const span = {
|
|
3814
3819
|
...params.span,
|
|
3815
3820
|
attributes
|
|
3816
3821
|
};
|
|
3822
|
+
if (derivedAttribute.computeMany !== void 0) {
|
|
3823
|
+
const values = (() => {
|
|
3824
|
+
try {
|
|
3825
|
+
return derivedAttribute.computeMany({
|
|
3826
|
+
attributes,
|
|
3827
|
+
span,
|
|
3828
|
+
get: (path) => getNestedAttribute(attributes, path)
|
|
3829
|
+
});
|
|
3830
|
+
} catch {
|
|
3831
|
+
return;
|
|
3832
|
+
}
|
|
3833
|
+
})();
|
|
3834
|
+
if (!isRecord$3(values)) continue;
|
|
3835
|
+
for (const [path, value] of Object.entries(values)) {
|
|
3836
|
+
if (value === void 0) continue;
|
|
3837
|
+
attributes = mergeNestedAttribute$1(attributes, path, value);
|
|
3838
|
+
}
|
|
3839
|
+
continue;
|
|
3840
|
+
}
|
|
3841
|
+
if (derivedAttribute.path === void 0) continue;
|
|
3842
|
+
if (derivedAttribute.compute === void 0) continue;
|
|
3817
3843
|
const value = (() => {
|
|
3818
3844
|
try {
|
|
3819
3845
|
return derivedAttribute.compute({
|
|
@@ -1,2 +1,2 @@
|
|
|
1
|
-
import { n as initRunner, t as getRunnerInstance } from "./runner-1F8MeY5V.mjs";
|
|
1
|
+
import { n as initRunner, t as getRunnerInstance } from "./runner-CXHkf7ih.mjs";
|
|
2
2
|
export { getRunnerInstance, initRunner };
|
|
@@ -1,5 +1,5 @@
|
|
|
1
|
-
import { n as createRunner } from "./cli-CIc_gBNM.mjs";
|
|
2
|
-
import "./src-CkWT1iSu.mjs";
|
|
1
|
+
import { n as createRunner } from "./cli-CiFOqMwS.mjs";
|
|
2
|
+
import "./src-BiPLv9ya.mjs";
|
|
3
3
|
//#region ../../apps/server/src/runner.ts
|
|
4
4
|
let runnerInstance = null;
|
|
5
5
|
function getRunnerInstance() {
|
package/package.json
CHANGED
|
@@ -345,8 +345,10 @@ See `EvalScoreDef` / `EvalManualScoreDef` in the types for the full shape
|
|
|
345
345
|
persist computed values back onto matching LLM spans before trace consumers
|
|
346
346
|
run, and add entries to `metrics` to surface arbitrary user metrics
|
|
347
347
|
(`format: 'string' | 'number' | 'duration' | 'json' | 'boolean'`,
|
|
348
|
-
`placements: ['header' | 'body']`). `derivedAttributes`
|
|
349
|
-
|
|
348
|
+
`placements: ['header' | 'body']`). `derivedAttributes` can be a keyed map
|
|
349
|
+
for one-off fields or one callback that returns multiple path/value pairs.
|
|
350
|
+
Derived keys are dot-paths under `span.attributes`; return `undefined` to
|
|
351
|
+
skip one span or one returned key. For saved runs,
|
|
350
352
|
the case drawer more menu can recalculate configured LLM/API derived
|
|
351
353
|
attributes for one case and persist the updated trace artifacts without
|
|
352
354
|
re-running the eval.
|
|
@@ -374,9 +376,10 @@ cacheCreationInputTokens` so cache details are not double-counted.
|
|
|
374
376
|
and `'fetch'` spans with `method`, `url`, `statusCode`, `request`,
|
|
375
377
|
`response`, `requestBody`, `responseBody`, `headers`, `durationMs`, and
|
|
376
378
|
`error` read from conventional attribute paths. Override `kinds` or
|
|
377
|
-
`attributes.<field>` for external tracers, add `derivedAttributes`
|
|
378
|
-
|
|
379
|
-
formats and placements as
|
|
379
|
+
`attributes.<field>` for external tracers, add `derivedAttributes` as a
|
|
380
|
+
keyed map or object-returning callback for computed persisted API span
|
|
381
|
+
attributes, and add `metrics` with the same formats and placements as
|
|
382
|
+
LLM-call metrics.
|
|
380
383
|
- `runLogs` (in `agent-evals.config.ts`) controls case log capture. Use
|
|
381
384
|
`runLogs: { captureConsole: false }` to keep console output in the terminal
|
|
382
385
|
without persisting console calls to case details. Manual `evalLog(...)` calls
|
package/dist/src-CkWT1iSu.mjs
DELETED