@absolutejs/absolute 0.19.0-beta.532 → 0.19.0-beta.534

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package versions as they appear in their respective public registries.
@@ -1753,6 +1753,23 @@ var buildTraceStageCounts = (traces) => {
1753
1753
  }
1754
1754
  return counts;
1755
1755
  };
1756
/**
 * Computes the per-stage difference between two stage-count maps.
 *
 * Every key found in either map is considered; a missing (null/undefined)
 * count is treated as 0. Only stages whose difference is non-zero appear in
 * the result, keyed by stage name with `current - previous` as the value.
 *
 * @param {{ current: Object, previous: Object }} params - The two stage-count maps.
 * @returns {Object} Map of stage name to non-zero delta.
 */
var diffTraceStageCounts = ({ current, previous }) => {
  // A Set keeps first-seen order: stages of `current` first, then stages
  // that only exist in `previous`.
  const stageNames = new Set(Object.keys(current).concat(Object.keys(previous)));
  return [...stageNames].reduce((changes, stageName) => {
    const difference = (current[stageName] ?? 0) - (previous[stageName] ?? 0);
    if (difference !== 0) {
      changes[stageName] = difference;
    }
    return changes;
  }, {});
};
1756
1773
  var roundTraceAverage = (value, total) => total > 0 ? Number((value / total).toFixed(2)) : 0;
1757
1774
  var summarizeRetrievalTraces = (traces) => {
1758
1775
  if (traces.length === 0) {
@@ -2114,6 +2131,166 @@ var buildGroundingCaseSnapshots = ({
2114
2131
  });
2115
2132
  };
2116
2133
  var getStatusRank = (status) => status === "pass" ? 2 : status === "partial" ? 1 : 0;
2134
/**
 * Formats a numeric delta with an explicit sign, a fixed number of decimals
 * and an optional suffix, e.g. `+1.5ms` or `-0.250`.
 *
 * The sign is derived from the value after rounding to `decimals`, so a
 * small negative that rounds to zero (for example -0.04 at one decimal)
 * is rendered like an exact zero ("+0.0") instead of "-0.0".
 *
 * @param {number} value - The delta to format.
 * @param {number} [decimals=0] - Number of fraction digits passed to `toFixed`.
 * @param {string} [suffix=""] - Text appended after the number.
 * @returns {string} The signed, formatted delta.
 */
var formatSignedDelta = (value, decimals = 0, suffix = "") => {
  const fixed = value.toFixed(decimals);
  const rounded = Number(fixed);
  // `toFixed` keeps the minus sign on values that round to zero; re-render
  // a plain zero in that case so the output never reads "-0.0".
  const digits = rounded === 0 ? (0).toFixed(decimals) : fixed;
  // NaN compares false here and is emitted without a sign, as before.
  const sign = rounded >= 0 ? "+" : "";
  return `${sign}${digits}${suffix}`;
};
2135
/**
 * Builds a one-line summary of an evaluation response: passed/total cases,
 * average F1 (three decimals) and average latency in ms (one decimal).
 *
 * @param {Object} response - Object exposing `totalCases` and a `summary`
 *   with `passedCases`, `averageF1` and `averageLatencyMs`.
 * @returns {string} The segments joined with a middle dot.
 */
var formatEvaluationSummary = (response) => {
  const passSegment = `${response.summary.passedCases}/${response.totalCases} pass`;
  const f1Segment = `f1 ${response.summary.averageF1.toFixed(3)}`;
  const latencySegment = `latency ${response.summary.averageLatencyMs.toFixed(1)}ms`;
  return [passSegment, f1Segment, latencySegment].join(" \xB7 ");
};
2136
/**
 * Renders a list of cases as a comma-separated string.
 *
 * Each case is shown by its `label`, falling back to `caseId` when the label
 * is null or undefined. An empty list renders as "none".
 *
 * @param {Array<Object>} cases - Cases carrying `label` and/or `caseId`.
 * @returns {string} The joined names, or "none".
 */
var formatHistoryCaseLabels = (cases) => {
  if (!(cases.length > 0)) {
    return "none";
  }
  const displayNames = cases.map((item) => item.label ?? item.caseId);
  return displayNames.join(", ");
};
2137
/**
 * Joins trace mode names with " / ", or returns "n/a" for an empty list.
 *
 * @param {Array<string>} modes - Mode names to display.
 * @returns {string} The joined modes or the "n/a" placeholder.
 */
var formatTraceModes = (modes) => {
  if (modes.length > 0) {
    return modes.join(" / ");
  }
  return "n/a";
};
2138
/**
 * Summarizes a stage-count map as its three largest entries.
 *
 * Entries are ordered by count, highest first, and rendered as
 * "<stage> <count>" joined with a middle dot. An empty map yields "n/a".
 *
 * @param {Object} stageCounts - Map of stage name to count.
 * @returns {string} The top-three summary or "n/a".
 */
var formatTraceStageSummary = (stageCounts) => {
  // Object.entries returns a fresh array, so sorting it in place is safe.
  const ranked = Object.entries(stageCounts);
  ranked.sort((a, b) => b[1] - a[1]);
  const labels = ranked.slice(0, 3).map(([name, total]) => `${name} ${total}`);
  if (labels.length > 0) {
    return labels.join(" \xB7 ");
  }
  return "n/a";
};
2142
/**
 * Renders a count against a total as "<count>/<total>".
 *
 * @param {number} count - Numerator shown before the slash.
 * @param {number} total - Denominator shown after the slash.
 * @returns {string} The "count/total" text.
 */
var formatTraceRatio = (count, total) => {
  const ratio = `${count}/${total}`;
  return ratio;
};
2143
/**
 * Renders a count delta with an explicit "+" for zero and positive values.
 * Negative values keep their own minus sign.
 *
 * @param {number} value - The delta to display.
 * @returns {string} The signed delta, e.g. "+3", "+0" or "-2".
 */
var formatTraceCountDelta = (value) => {
  let sign = "";
  if (value >= 0) {
    sign = "+";
  }
  return `${sign}${value}`;
};
2144
/**
 * Builds label/value display rows describing an entry's trace summary.
 *
 * When `entry.traceSummary` is missing, a single "Trace: Unavailable" row is
 * returned. Otherwise the rows cover modes, the average final/vector/lexical
 * counts, transformed and variant case ratios, the average candidate and
 * lexical top-K, and the stage summary.
 *
 * @param {Object} entry - Comparison entry that may carry `traceSummary`.
 * @returns {Array<{label: string, value: string}>} Rows in display order.
 */
var buildRAGComparisonTraceSummaryRows = (entry) => {
  const summary = entry.traceSummary;
  if (!summary) {
    return [{ label: "Trace", value: "Unavailable" }];
  }
  const row = (label, value) => ({ label, value });
  const oneDecimal = (amount) => amount.toFixed(1);
  return [
    row("Modes", formatTraceModes(summary.modes)),
    row("Avg final", oneDecimal(summary.averageFinalCount)),
    row("Avg vector", oneDecimal(summary.averageVectorCount)),
    row("Avg lexical", oneDecimal(summary.averageLexicalCount)),
    row("Transforms", formatTraceRatio(summary.transformedCases, summary.totalCases)),
    row("Variants", formatTraceRatio(summary.variantCases, summary.totalCases)),
    row(
      "TopK",
      `${oneDecimal(summary.averageCandidateTopK)} / ${oneDecimal(summary.averageLexicalTopK)}`
    ),
    row("Stages", formatTraceStageSummary(summary.stageCounts))
  ];
};
2172
/**
 * Builds label/value rows comparing an entry's trace summary with the
 * leader's trace summary.
 *
 * Short-circuits, in this order, with a single row when: the entry has no
 * trace summary, the leader has no trace summary, or the entry is the leader
 * itself. Otherwise it reports the baseline label, a modes row when the
 * formatted modes differ, the final/vector/lexical/transform deltas, and at
 * most three non-zero per-stage deltas.
 *
 * @param {Object} entry - Entry being compared; may carry `traceSummary`.
 * @param {Object} [leader] - Baseline entry; may carry `traceSummary` and `label`.
 * @returns {Array<{label: string, value: string}>} Rows in display order.
 */
var buildRAGComparisonTraceDiffRows = (entry, leader) => {
  const ownTrace = entry.traceSummary;
  if (!ownTrace) {
    return [{ label: "Trace", value: "Unavailable for comparison" }];
  }
  const baselineTrace = leader?.traceSummary;
  if (!baselineTrace) {
    return [{ label: "Baseline", value: "Leader trace unavailable" }];
  }
  if (entry === leader) {
    return [{ label: "Baseline", value: "Leader strategy" }];
  }

  // Leader stages come first in the merged key order, then entry-only stages.
  const stageNames = Object.keys({
    ...baselineTrace.stageCounts,
    ...ownTrace.stageCounts
  });
  const stageChanges = [];
  for (const stageName of stageNames) {
    const difference = (ownTrace.stageCounts[stageName] ?? 0) - (baselineTrace.stageCounts[stageName] ?? 0);
    if (difference !== 0) {
      stageChanges.push(`${stageName} ${formatTraceCountDelta(difference)}`);
    }
  }
  // Only the first three changed stages are shown.
  const stageDelta = stageChanges.slice(0, 3).join(" \xB7 ");

  const rows = [];
  const addRow = (label, value) => {
    rows.push({ label, value });
  };

  addRow("Baseline", leader.label);

  const ownModes = formatTraceModes(ownTrace.modes);
  const baselineModes = formatTraceModes(baselineTrace.modes);
  if (ownModes !== baselineModes) {
    addRow("Modes vs leader", `${ownModes} vs ${baselineModes}`);
  }

  addRow(
    "Final delta",
    formatSignedDelta(ownTrace.averageFinalCount - baselineTrace.averageFinalCount, 1)
  );
  addRow(
    "Vector delta",
    formatSignedDelta(ownTrace.averageVectorCount - baselineTrace.averageVectorCount, 1)
  );
  addRow(
    "Lexical delta",
    formatSignedDelta(ownTrace.averageLexicalCount - baselineTrace.averageLexicalCount, 1)
  );
  addRow(
    "Transform delta",
    formatTraceCountDelta(ownTrace.transformedCases - baselineTrace.transformedCases)
  );

  if (stageDelta) {
    addRow("Stage delta", stageDelta);
  }
  return rows;
};
2219
/**
 * Builds label/value rows describing persisted evaluation history.
 *
 * Without a latest run, a single placeholder row is returned. Otherwise the
 * rows cover the run count, the latest run (plus its trace summary when
 * present) and the previous run when present. If `history.diff` is missing
 * a hint row is appended and the function returns; when it is present the
 * summary deltas and improved/regressed cases are appended, followed by the
 * trace deltas when `diff.traceSummaryDelta` exists.
 *
 * @param {Object} [history] - History object with `runs`, `latestRun`,
 *   and optional `previousRun` / `diff`.
 * @returns {Array<{label: string, value: string}>} Rows in display order.
 */
var buildRAGEvaluationHistoryRows = (history) => {
  const latest = history?.latestRun;
  if (!latest) {
    return [
      { label: "History", value: "No persisted benchmark runs yet." }
    ];
  }

  const rows = [];
  const addRow = (label, value) => {
    rows.push({ label, value });
  };

  addRow("Runs recorded", String(history.runs.length));
  addRow("Latest", `${latest.label} \xB7 ${formatEvaluationSummary(latest.response)}`);

  const latestTrace = latest.traceSummary;
  if (latestTrace) {
    const traceSegments = [
      formatTraceModes(latestTrace.modes),
      `final ${latestTrace.averageFinalCount.toFixed(1)}`,
      `vector ${latestTrace.averageVectorCount.toFixed(1)}`,
      `lexical ${latestTrace.averageLexicalCount.toFixed(1)}`
    ];
    addRow("Latest trace", traceSegments.join(" \xB7 "));
  }

  const previous = history.previousRun;
  if (previous) {
    addRow("Previous", `${previous.label} \xB7 ${formatEvaluationSummary(previous.response)}`);
  }

  const runDiff = history.diff;
  if (!runDiff) {
    addRow("History diff", "Run the benchmark again to diff regressions over time.");
    return rows;
  }

  const summaryDelta = runDiff.summaryDelta;
  addRow("Passing delta", formatSignedDelta(summaryDelta.passingRate, 1, "%"));
  addRow("Average F1 delta", formatSignedDelta(summaryDelta.averageF1, 3));
  addRow("Latency delta", formatSignedDelta(summaryDelta.averageLatencyMs, 1, "ms"));
  addRow("Improved", formatHistoryCaseLabels(runDiff.improvedCases));
  addRow("Regressed", formatHistoryCaseLabels(runDiff.regressedCases));

  const traceDelta = runDiff.traceSummaryDelta;
  if (!traceDelta) {
    return rows;
  }

  addRow("Trace mode shift", traceDelta.modesChanged ? "changed" : "stable");
  addRow("Trace final delta", formatSignedDelta(traceDelta.averageFinalCount, 1));
  addRow("Trace vector delta", formatSignedDelta(traceDelta.averageVectorCount, 1));
  addRow("Trace lexical delta", formatSignedDelta(traceDelta.averageLexicalCount, 1));
  addRow("Trace transform delta", formatTraceCountDelta(traceDelta.transformedCases));
  addRow("Trace variant delta", formatTraceCountDelta(traceDelta.variantCases));

  // The stage row is omitted entirely when there are no stage changes.
  const stageDelta = Object.entries(traceDelta.stageCounts ?? {})
    .map(([stageName, change]) => `${stageName} ${formatTraceCountDelta(change)}`)
    .join(", ");
  if (stageDelta) {
    addRow("Trace stage delta", stageDelta);
  }
  return rows;
};
2117
2294
  var buildRAGEvaluationRunDiff = ({
2118
2295
  current,
2119
2296
  previous
@@ -2137,6 +2314,22 @@ var buildRAGEvaluationRunDiff = ({
2137
2314
  passingRate: current.response.passingRate - (previous?.response.passingRate ?? 0),
2138
2315
  partialCases: current.response.summary.partialCases - (previous?.response.summary.partialCases ?? 0)
2139
2316
  },
2317
+ traceSummaryDelta: current.traceSummary || previous?.traceSummary ? {
2318
+ averageCandidateTopK: (current.traceSummary?.averageCandidateTopK ?? 0) - (previous?.traceSummary?.averageCandidateTopK ?? 0),
2319
+ averageFinalCount: (current.traceSummary?.averageFinalCount ?? 0) - (previous?.traceSummary?.averageFinalCount ?? 0),
2320
+ averageLexicalCount: (current.traceSummary?.averageLexicalCount ?? 0) - (previous?.traceSummary?.averageLexicalCount ?? 0),
2321
+ averageLexicalTopK: (current.traceSummary?.averageLexicalTopK ?? 0) - (previous?.traceSummary?.averageLexicalTopK ?? 0),
2322
+ averageVectorCount: (current.traceSummary?.averageVectorCount ?? 0) - (previous?.traceSummary?.averageVectorCount ?? 0),
2323
+ lexicalCases: (current.traceSummary?.lexicalCases ?? 0) - (previous?.traceSummary?.lexicalCases ?? 0),
2324
+ modesChanged: (current.traceSummary?.modes ?? []).join("|") !== (previous?.traceSummary?.modes ?? []).join("|"),
2325
+ stageCounts: diffTraceStageCounts({
2326
+ current: current.traceSummary?.stageCounts ?? {},
2327
+ previous: previous?.traceSummary?.stageCounts ?? {}
2328
+ }),
2329
+ transformedCases: (current.traceSummary?.transformedCases ?? 0) - (previous?.traceSummary?.transformedCases ?? 0),
2330
+ variantCases: (current.traceSummary?.variantCases ?? 0) - (previous?.traceSummary?.variantCases ?? 0),
2331
+ vectorCases: (current.traceSummary?.vectorCases ?? 0) - (previous?.traceSummary?.vectorCases ?? 0)
2332
+ } : undefined,
2140
2333
  unchangedCases
2141
2334
  };
2142
2335
  };
@@ -2510,7 +2703,8 @@ var compareRAGRerankers = async ({
2510
2703
  label: entry.label,
2511
2704
  response: entry.response,
2512
2705
  startedAt: 0,
2513
- suiteId: suite.id
2706
+ suiteId: suite.id,
2707
+ traceSummary: entry.traceSummary
2514
2708
  })));
2515
2709
  return {
2516
2710
  entries,
@@ -2595,7 +2789,8 @@ var compareRAGRetrievalStrategies = async ({
2595
2789
  label: entry.label,
2596
2790
  response: entry.response,
2597
2791
  startedAt: 0,
2598
- suiteId: suite.id
2792
+ suiteId: suite.id,
2793
+ traceSummary: entry.traceSummary
2599
2794
  })));
2600
2795
  return {
2601
2796
  entries,
@@ -3626,5 +3821,5 @@ export {
3626
3821
  AIStreamProvider
3627
3822
  };
3628
3823
 
3629
- //# debugId=A3847C62324D17B964756E2164756E21
3824
+ //# debugId=7AF88C780C340EF364756E2164756E21
3630
3825
  //# sourceMappingURL=index.js.map