@absolutejs/absolute 0.19.0-beta.532 → 0.19.0-beta.534

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -1194,6 +1194,7 @@ export type RAGEvaluationSuiteRun = {
1194
1194
  finishedAt: number;
1195
1195
  elapsedMs: number;
1196
1196
  response: RAGEvaluationResponse;
1197
+ traceSummary?: RAGRetrievalTraceComparisonSummary;
1197
1198
  metadata?: Record<string, unknown>;
1198
1199
  };
1199
1200
  export type RAGEvaluationHistoryStore = {
@@ -1231,6 +1232,19 @@ export type RAGEvaluationRunDiff = {
1231
1232
  failedCases: number;
1232
1233
  partialCases: number;
1233
1234
  };
1235
+ traceSummaryDelta?: {
1236
+ modesChanged: boolean;
1237
+ vectorCases: number;
1238
+ lexicalCases: number;
1239
+ transformedCases: number;
1240
+ variantCases: number;
1241
+ averageFinalCount: number;
1242
+ averageVectorCount: number;
1243
+ averageLexicalCount: number;
1244
+ averageCandidateTopK: number;
1245
+ averageLexicalTopK: number;
1246
+ stageCounts: Partial<Record<RAGRetrievalTraceStage, number>>;
1247
+ };
1234
1248
  };
1235
1249
  export type RAGEvaluationHistory = {
1236
1250
  suiteId: string;
@@ -1241,6 +1255,10 @@ export type RAGEvaluationHistory = {
1241
1255
  previousRun?: RAGEvaluationSuiteRun;
1242
1256
  diff?: RAGEvaluationRunDiff;
1243
1257
  };
1258
/**
 * A single labelled value: a `label` string paired with a `value` string.
 *
 * NOTE(review): this appears to match the `{ label, value }` rows assembled by
 * the `build*Rows` helpers added in the same release — confirm against their
 * declared return types.
 */
+ export type RAGLabelValueRow = {
1259
+ label: string;
1260
+ value: string;
1261
+ };
1244
1262
  export type RAGEvaluationLeaderboardEntry = {
1245
1263
  runId: string;
1246
1264
  suiteId: string;
@@ -1777,6 +1777,23 @@ var buildTraceStageCounts = (traces) => {
1777
1777
  }
1778
1778
  return counts;
1779
1779
  };
1780
/**
 * Computes per-stage count differences between two stage-count maps.
 *
 * Every stage present in either map is considered; a stage missing from one
 * side counts as 0 there. Stages whose difference is exactly 0 are omitted
 * from the result.
 *
 * @param current Stage counts of the newer side.
 * @param previous Stage counts of the older side.
 * @returns An object mapping stage name to `current - previous`.
 */
var diffTraceStageCounts = ({ current, previous }) => {
  // The Set removes stages that appear on both sides while keeping first-seen order.
  const uniqueStages = new Set(
    Object.keys(current).concat(Object.keys(previous))
  );
  const deltas = {};
  uniqueStages.forEach((name) => {
    const change = (current[name] ?? 0) - (previous[name] ?? 0);
    if (change === 0) {
      return;
    }
    deltas[name] = change;
  });
  return deltas;
};
1780
1797
  var roundTraceAverage = (value, total) => total > 0 ? Number((value / total).toFixed(2)) : 0;
1781
1798
  var summarizeRetrievalTraces = (traces) => {
1782
1799
  if (traces.length === 0) {
@@ -2138,6 +2155,166 @@ var buildGroundingCaseSnapshots = ({
2138
2155
  });
2139
2156
  };
2140
2157
  var getStatusRank = (status) => status === "pass" ? 2 : status === "partial" ? 1 : 0;
2158
/**
 * Formats a numeric delta with an explicit sign, fixed decimals and an
 * optional unit suffix.
 *
 * The sign is taken from the rounded text rather than the raw number, so a
 * negative value that rounds to zero (for example floating-point noise left
 * over from subtracting two averages) is shown as "+0.0" instead of "-0.0".
 * This matches how an exact zero is rendered.
 *
 * @param value Delta to format.
 * @param decimals Fraction digits passed to `toFixed` (default 0).
 * @param suffix Text appended after the number, e.g. "%" or "ms" (default "").
 * @returns The signed, fixed-precision string.
 */
var formatSignedDelta = (value, decimals = 0, suffix = "") => {
  const rounded = value.toFixed(decimals);
  // `toFixed` keeps the minus sign when a negative value rounds to zero.
  const roundsToZero = Number(rounded) === 0;
  const digits = roundsToZero ? (0).toFixed(decimals) : rounded;
  const sign = roundsToZero || value > 0 ? "+" : "";
  return `${sign}${digits}${suffix}`;
};
2159
/**
 * Builds a one-line summary of an evaluation response: passed/total cases,
 * average F1 to three decimals and average latency in milliseconds to one
 * decimal, separated by middle dots.
 *
 * @param response Evaluation response; reads `totalCases` and
 *   `summary.{passedCases, averageF1, averageLatencyMs}`.
 * @returns The summary string.
 */
var formatEvaluationSummary = (response) => {
  const { passedCases, averageF1, averageLatencyMs } = response.summary;
  const segments = [
    `${passedCases}/${response.totalCases} pass`,
    `f1 ${averageF1.toFixed(3)}`,
    `latency ${averageLatencyMs.toFixed(1)}ms`
  ];
  return segments.join(" \xB7 ");
};
2160
/**
 * Joins case display names into a comma-separated list.
 *
 * Each entry is shown by its `label`, falling back to `caseId` only when the
 * label is null or undefined. An empty list yields "none".
 *
 * @param cases Entries exposing `label` and/or `caseId`.
 * @returns The joined names, or "none".
 */
var formatHistoryCaseLabels = (cases) => {
  if (!(cases.length > 0)) {
    return "none";
  }
  const toDisplayName = (entry) => entry.label ?? entry.caseId;
  return cases.map(toDisplayName).join(", ");
};
2161
/**
 * Renders a list of retrieval modes as "a / b / c", or "n/a" when the list
 * is empty.
 *
 * @param modes Mode names to join.
 * @returns The joined modes, or "n/a".
 */
var formatTraceModes = (modes) => {
  if (!(modes.length > 0)) {
    return "n/a";
  }
  return modes.join(" / ");
};
2162
/**
 * Summarizes the three stages with the highest counts as
 * "stage count · stage count · stage count".
 *
 * @param stageCounts Object mapping stage name to a numeric count.
 * @returns The summary, or "n/a" when there are no stages.
 */
var formatTraceStageSummary = (stageCounts) => {
  const byCountDescending = (left, right) => right[1] - left[1];
  const labels = Object.entries(stageCounts)
    .sort(byCountDescending)
    .slice(0, 3)
    .map(([name, total]) => `${name} ${total}`);
  if (labels.length === 0) {
    return "n/a";
  }
  return labels.join(" \xB7 ");
};
2166
/**
 * Renders two values as "count/total".
 *
 * @param count Numerator to display.
 * @param total Denominator to display.
 * @returns The two values joined by a slash.
 */
var formatTraceRatio = (count, total) => {
  const numerator = `${count}`;
  const denominator = `${total}`;
  return numerator + "/" + denominator;
};
2167
/**
 * Renders a count delta with an explicit "+" for zero and positive values;
 * negative values keep their own minus sign.
 *
 * @param value Delta to display.
 * @returns The signed string, e.g. "+3", "+0" or "-2".
 */
var formatTraceCountDelta = (value) => {
  const sign = value >= 0 ? "+" : "";
  return sign + `${value}`;
};
2168
/**
 * Builds label/value rows describing one comparison entry's trace summary.
 *
 * When the entry has no `traceSummary`, a single "Trace: Unavailable" row is
 * returned. Otherwise the rows cover modes, the average final/vector/lexical
 * counts (one decimal), transformed and variant cases as ratios of
 * `totalCases`, the two average top-K values, and the top stages.
 *
 * @param entry Comparison entry; only `entry.traceSummary` is read.
 * @returns An array of `{ label, value }` rows.
 */
var buildRAGComparisonTraceSummaryRows = (entry) => {
  const summary = entry.traceSummary;
  if (!summary) {
    return [{ label: "Trace", value: "Unavailable" }];
  }
  const oneDecimal = (amount) => amount.toFixed(1);
  const ofTotalCases = (matched) => formatTraceRatio(matched, summary.totalCases);
  // Listed as [label, value] pairs in display order, then expanded into row objects.
  const pairs = [
    ["Modes", formatTraceModes(summary.modes)],
    ["Avg final", oneDecimal(summary.averageFinalCount)],
    ["Avg vector", oneDecimal(summary.averageVectorCount)],
    ["Avg lexical", oneDecimal(summary.averageLexicalCount)],
    ["Transforms", ofTotalCases(summary.transformedCases)],
    ["Variants", ofTotalCases(summary.variantCases)],
    [
      "TopK",
      `${oneDecimal(summary.averageCandidateTopK)} / ${oneDecimal(summary.averageLexicalTopK)}`
    ],
    ["Stages", formatTraceStageSummary(summary.stageCounts)]
  ];
  return pairs.map(([label, value]) => ({ label, value }));
};
2196
/**
 * Builds label/value rows comparing one entry's trace summary with the
 * leader's.
 *
 * Short-circuits, in this order:
 *  - the entry has no trace summary: one "Trace" row;
 *  - the leader is missing or has no trace summary: one "Baseline" row;
 *  - the entry is the leader itself: one "Baseline: Leader strategy" row.
 *
 * Otherwise the rows are: the leader's label, a modes row (only when the
 * formatted modes differ), the final/vector/lexical average deltas (one
 * decimal), the transformed-case delta, and a "Stage delta" row (only when at
 * least one stage count differs).
 *
 * @param entry Entry being described.
 * @param leader Baseline entry to compare against; may be undefined.
 * @returns An array of `{ label, value }` rows.
 */
var buildRAGComparisonTraceDiffRows = (entry, leader) => {
  const own = entry.traceSummary;
  if (!own) {
    return [{ label: "Trace", value: "Unavailable for comparison" }];
  }
  const baseline = leader?.traceSummary;
  if (!baseline) {
    return [{ label: "Baseline", value: "Leader trace unavailable" }];
  }
  if (entry === leader) {
    return [{ label: "Baseline", value: "Leader strategy" }];
  }

  // Leader stages come first, followed by stages only the entry has.
  const stageNames = Object.keys({
    ...baseline.stageCounts,
    ...own.stageCounts
  });
  const stageChanges = [];
  for (const stage of stageNames) {
    const change = (own.stageCounts[stage] ?? 0) - (baseline.stageCounts[stage] ?? 0);
    if (change !== 0) {
      stageChanges.push(`${stage} ${formatTraceCountDelta(change)}`);
    }
  }
  // Only the first three changed stages are shown.
  const stageText = stageChanges.slice(0, 3).join(" \xB7 ");

  const ownModes = formatTraceModes(own.modes);
  const baselineModes = formatTraceModes(baseline.modes);
  const averageDelta = (mine, theirs) => formatSignedDelta(mine - theirs, 1);

  return [
    { label: "Baseline", value: leader.label },
    ...(ownModes !== baselineModes
      ? [{ label: "Modes vs leader", value: `${ownModes} vs ${baselineModes}` }]
      : []),
    {
      label: "Final delta",
      value: averageDelta(own.averageFinalCount, baseline.averageFinalCount)
    },
    {
      label: "Vector delta",
      value: averageDelta(own.averageVectorCount, baseline.averageVectorCount)
    },
    {
      label: "Lexical delta",
      value: averageDelta(own.averageLexicalCount, baseline.averageLexicalCount)
    },
    {
      label: "Transform delta",
      value: formatTraceCountDelta(own.transformedCases - baseline.transformedCases)
    },
    ...(stageText ? [{ label: "Stage delta", value: stageText }] : [])
  ];
};
2243
/**
 * Builds label/value rows summarizing an evaluation history.
 *
 * Without a `latestRun` (or without a history at all) a single "History"
 * placeholder row is returned. Otherwise rows are appended in this order:
 *  1. the run count and the latest run's summary;
 *  2. the latest run's trace line, when it has a trace summary;
 *  3. the previous run's summary, when there is one;
 *  4. if there is no diff, a "History diff" hint row and nothing further;
 *  5. the passing-rate, F1 and latency deltas plus improved/regressed cases;
 *  6. when the diff has a trace summary delta: mode shift, the trace deltas
 *     and, if any stage changed, the per-stage deltas.
 *
 * @param history Evaluation history; may be null or undefined.
 * @returns An array of `{ label, value }` rows.
 */
var buildRAGEvaluationHistoryRows = (history) => {
  const latest = history?.latestRun;
  if (!latest) {
    return [
      { label: "History", value: "No persisted benchmark runs yet." }
    ];
  }

  const rows = [];
  const addRow = (label, value) => {
    rows.push({ label, value });
  };
  const describeRun = (run) => `${run.label} \xB7 ${formatEvaluationSummary(run.response)}`;

  addRow("Runs recorded", String(history.runs.length));
  addRow("Latest", describeRun(latest));

  const latestTrace = latest.traceSummary;
  if (latestTrace) {
    addRow(
      "Latest trace",
      [
        formatTraceModes(latestTrace.modes),
        `final ${latestTrace.averageFinalCount.toFixed(1)}`,
        `vector ${latestTrace.averageVectorCount.toFixed(1)}`,
        `lexical ${latestTrace.averageLexicalCount.toFixed(1)}`
      ].join(" \xB7 ")
    );
  }

  if (history.previousRun) {
    addRow("Previous", describeRun(history.previousRun));
  }

  const runDiff = history.diff;
  if (!runDiff) {
    // With no diff available there is nothing further to report.
    addRow("History diff", "Run the benchmark again to diff regressions over time.");
    return rows;
  }

  const summaryDelta = runDiff.summaryDelta;
  addRow("Passing delta", formatSignedDelta(summaryDelta.passingRate, 1, "%"));
  addRow("Average F1 delta", formatSignedDelta(summaryDelta.averageF1, 3));
  addRow("Latency delta", formatSignedDelta(summaryDelta.averageLatencyMs, 1, "ms"));
  addRow("Improved", formatHistoryCaseLabels(runDiff.improvedCases));
  addRow("Regressed", formatHistoryCaseLabels(runDiff.regressedCases));

  const traceDelta = runDiff.traceSummaryDelta;
  if (!traceDelta) {
    return rows;
  }

  addRow("Trace mode shift", traceDelta.modesChanged ? "changed" : "stable");
  addRow("Trace final delta", formatSignedDelta(traceDelta.averageFinalCount, 1));
  addRow("Trace vector delta", formatSignedDelta(traceDelta.averageVectorCount, 1));
  addRow("Trace lexical delta", formatSignedDelta(traceDelta.averageLexicalCount, 1));
  addRow("Trace transform delta", formatTraceCountDelta(traceDelta.transformedCases));
  addRow("Trace variant delta", formatTraceCountDelta(traceDelta.variantCases));

  const stageText = Object.entries(traceDelta.stageCounts ?? {})
    .map(([stage, change]) => `${stage} ${formatTraceCountDelta(change)}`)
    .join(", ");
  if (stageText) {
    addRow("Trace stage delta", stageText);
  }
  return rows;
};
2141
2318
  var buildRAGEvaluationRunDiff = ({
2142
2319
  current,
2143
2320
  previous
@@ -2161,6 +2338,22 @@ var buildRAGEvaluationRunDiff = ({
2161
2338
  passingRate: current.response.passingRate - (previous?.response.passingRate ?? 0),
2162
2339
  partialCases: current.response.summary.partialCases - (previous?.response.summary.partialCases ?? 0)
2163
2340
  },
2341
+ traceSummaryDelta: current.traceSummary || previous?.traceSummary ? {
2342
+ averageCandidateTopK: (current.traceSummary?.averageCandidateTopK ?? 0) - (previous?.traceSummary?.averageCandidateTopK ?? 0),
2343
+ averageFinalCount: (current.traceSummary?.averageFinalCount ?? 0) - (previous?.traceSummary?.averageFinalCount ?? 0),
2344
+ averageLexicalCount: (current.traceSummary?.averageLexicalCount ?? 0) - (previous?.traceSummary?.averageLexicalCount ?? 0),
2345
+ averageLexicalTopK: (current.traceSummary?.averageLexicalTopK ?? 0) - (previous?.traceSummary?.averageLexicalTopK ?? 0),
2346
+ averageVectorCount: (current.traceSummary?.averageVectorCount ?? 0) - (previous?.traceSummary?.averageVectorCount ?? 0),
2347
+ lexicalCases: (current.traceSummary?.lexicalCases ?? 0) - (previous?.traceSummary?.lexicalCases ?? 0),
2348
+ modesChanged: (current.traceSummary?.modes ?? []).join("|") !== (previous?.traceSummary?.modes ?? []).join("|"),
2349
+ stageCounts: diffTraceStageCounts({
2350
+ current: current.traceSummary?.stageCounts ?? {},
2351
+ previous: previous?.traceSummary?.stageCounts ?? {}
2352
+ }),
2353
+ transformedCases: (current.traceSummary?.transformedCases ?? 0) - (previous?.traceSummary?.transformedCases ?? 0),
2354
+ variantCases: (current.traceSummary?.variantCases ?? 0) - (previous?.traceSummary?.variantCases ?? 0),
2355
+ vectorCases: (current.traceSummary?.vectorCases ?? 0) - (previous?.traceSummary?.vectorCases ?? 0)
2356
+ } : undefined,
2164
2357
  unchangedCases
2165
2358
  };
2166
2359
  };
@@ -2534,7 +2727,8 @@ var compareRAGRerankers = async ({
2534
2727
  label: entry.label,
2535
2728
  response: entry.response,
2536
2729
  startedAt: 0,
2537
- suiteId: suite.id
2730
+ suiteId: suite.id,
2731
+ traceSummary: entry.traceSummary
2538
2732
  })));
2539
2733
  return {
2540
2734
  entries,
@@ -2619,7 +2813,8 @@ var compareRAGRetrievalStrategies = async ({
2619
2813
  label: entry.label,
2620
2814
  response: entry.response,
2621
2815
  startedAt: 0,
2622
- suiteId: suite.id
2816
+ suiteId: suite.id,
2817
+ traceSummary: entry.traceSummary
2623
2818
  })));
2624
2819
  return {
2625
2820
  entries,
@@ -3402,5 +3597,5 @@ export {
3402
3597
  AIStreamKey
3403
3598
  };
3404
3599
 
3405
- //# debugId=28BD639F9F0C6C1364756E2164756E21
3600
+ //# debugId=49142334D6D3EC2564756E2164756E21
3406
3601
  //# sourceMappingURL=index.js.map