@absolutejs/absolute 0.19.0-beta.533 → 0.19.0-beta.534

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -1255,6 +1255,10 @@ export type RAGEvaluationHistory = {
1255
1255
  previousRun?: RAGEvaluationSuiteRun;
1256
1256
  diff?: RAGEvaluationRunDiff;
1257
1257
  };
1258
/**
 * A single row made of a `label` and a `value`, both plain strings.
 *
 * NOTE(review): this looks like the element shape of the `{ label, value }`
 * arrays returned by the row-builder functions added in the same release —
 * confirm against the builders' declared return types.
 */
+ export type RAGLabelValueRow = {
1259
+ label: string;
1260
+ value: string;
1261
+ };
1258
1262
  export type RAGEvaluationLeaderboardEntry = {
1259
1263
  runId: string;
1260
1264
  suiteId: string;
@@ -2155,6 +2155,166 @@ var buildGroundingCaseSnapshots = ({
2155
2155
  });
2156
2156
  };
2157
2157
  var getStatusRank = (status) => status === "pass" ? 2 : status === "partial" ? 1 : 0;
2158
/**
 * Formats a numeric delta with an explicit sign, a fixed number of decimals
 * and an optional unit suffix (for example "+1.5ms" or "-0.250").
 *
 * The sign is taken from the *rounded* value rather than the raw input, so a
 * tiny negative delta that rounds to zero is rendered as "+0.0" instead of
 * the misleading "-0.0" that `toFixed` produces on its own. This keeps every
 * zero-valued delta looking the same regardless of floating-point noise.
 *
 * @param value - The delta to format; must be a number.
 * @param decimals - Digits after the decimal point (passed to `toFixed`). Defaults to 0.
 * @param suffix - Text appended after the number. Defaults to "".
 * @returns The signed, fixed-precision string. NaN is returned unsigned ("NaN" + suffix).
 */
var formatSignedDelta = (value, decimals = 0, suffix = "") => {
  const fixed = value.toFixed(decimals);
  // NaN carries no sign; leave it unsigned exactly as before.
  if (Number.isNaN(value)) {
    return `${fixed}${suffix}`;
  }
  // A genuinely negative result already carries its "-" from toFixed.
  const roundsToZero = Number(fixed) === 0;
  if (value < 0 && !roundsToZero) {
    return `${fixed}${suffix}`;
  }
  // Zero or positive after rounding: drop any "-" left by toFixed ("-0.0") and prefix "+".
  const magnitude = fixed.startsWith("-") ? fixed.slice(1) : fixed;
  return `+${magnitude}${suffix}`;
};
2159
/**
 * Builds a one-line summary of an evaluation response in the form
 * "<passed>/<total> pass · f1 <x.xxx> · latency <y.y>ms".
 *
 * @param response - Object exposing `totalCases` and a `summary` with
 *   `passedCases`, `averageF1` and `averageLatencyMs`.
 * @returns The three summary segments joined with a middle dot.
 */
var formatEvaluationSummary = (response) => {
  const { summary, totalCases } = response;
  const segments = [
    `${summary.passedCases}/${totalCases} pass`,
    `f1 ${summary.averageF1.toFixed(3)}`,
    `latency ${summary.averageLatencyMs.toFixed(1)}ms`
  ];
  return segments.join(" \xB7 ");
};
2160
/**
 * Renders a list of cases as a comma-separated string of display names.
 *
 * @param cases - Entries exposing an optional `label` and a `caseId`.
 * @returns Each entry's `label` (or `caseId` when the label is null/undefined)
 *   joined by ", ", or "none" when the list has no entries.
 */
var formatHistoryCaseLabels = (cases) => {
  const hasCases = cases.length > 0;
  if (!hasCases) {
    return "none";
  }
  const displayNames = cases.map((item) => {
    // Only null/undefined labels fall back to the id; an empty label is kept.
    return item.label ?? item.caseId;
  });
  return displayNames.join(", ");
};
2161
/**
 * Joins a list of modes into a single display string.
 *
 * @param modes - Array of mode values.
 * @returns The modes separated by " / ", or "n/a" when the list is empty.
 */
var formatTraceModes = (modes) => {
  const hasModes = modes.length > 0;
  if (hasModes) {
    return modes.join(" / ");
  }
  return "n/a";
};
2162
/**
 * Summarises the three highest-count stages as "<stage> <count>" fragments.
 *
 * @param stageCounts - Object mapping a stage name to its numeric count.
 * @returns Up to three fragments, ordered by descending count and joined with
 *   a middle dot, or "n/a" when the object has no entries.
 */
var formatTraceStageSummary = (stageCounts) => {
  // Object.entries returns a fresh array, so sorting in place leaves the input untouched.
  const ranked = Object.entries(stageCounts);
  ranked.sort(([, countA], [, countB]) => countB - countA);
  const fragments = [];
  for (const [stage, count] of ranked.slice(0, 3)) {
    fragments.push(`${stage} ${count}`);
  }
  if (fragments.length > 0) {
    return fragments.join(" \xB7 ");
  }
  return "n/a";
};
2166
/**
 * Renders a "count out of total" pair as "<count>/<total>".
 *
 * @param count - Numerator to display.
 * @param total - Denominator to display.
 * @returns The two values separated by a slash; no division is performed.
 */
var formatTraceRatio = (count, total) => {
  const ratioText = `${count}/${total}`;
  return ratioText;
};
2167
/**
 * Formats a count difference with an explicit leading sign.
 *
 * @param value - The difference to display.
 * @returns The value prefixed with "+" when it is zero or positive; negative
 *   values keep their own "-" and receive no extra prefix.
 */
var formatTraceCountDelta = (value) => {
  let prefix = "";
  if (value >= 0) {
    prefix = "+";
  }
  return `${prefix}${value}`;
};
2168
/**
 * Builds the label/value rows that describe one entry's trace summary.
 *
 * @param entry - Object with an optional `traceSummary`.
 * @returns A single "Trace: Unavailable" row when the entry has no trace
 *   summary; otherwise eight rows (Modes, Avg final, Avg vector, Avg lexical,
 *   Transforms, Variants, TopK, Stages) in that order.
 */
var buildRAGComparisonTraceSummaryRows = (entry) => {
  const { traceSummary } = entry;
  if (!traceSummary) {
    return [{ label: "Trace", value: "Unavailable" }];
  }
  const oneDecimal = (amount) => amount.toFixed(1);
  const { totalCases } = traceSummary;
  // Ordered [label, value] pairs; converted to row objects at the end.
  const pairs = [
    ["Modes", formatTraceModes(traceSummary.modes)],
    ["Avg final", oneDecimal(traceSummary.averageFinalCount)],
    ["Avg vector", oneDecimal(traceSummary.averageVectorCount)],
    ["Avg lexical", oneDecimal(traceSummary.averageLexicalCount)],
    ["Transforms", formatTraceRatio(traceSummary.transformedCases, totalCases)],
    ["Variants", formatTraceRatio(traceSummary.variantCases, totalCases)],
    [
      "TopK",
      `${oneDecimal(traceSummary.averageCandidateTopK)} / ${oneDecimal(traceSummary.averageLexicalTopK)}`
    ],
    ["Stages", formatTraceStageSummary(traceSummary.stageCounts)]
  ];
  return pairs.map(([label, value]) => ({ label, value }));
};
2196
/**
 * Builds label/value rows comparing an entry's trace summary with the leader's.
 *
 * Short-circuits, in this order, with a single explanatory row when:
 * the entry has no trace summary, the leader (or its trace summary) is
 * missing, or the entry is the leader itself.
 *
 * @param entry - Object with an optional `traceSummary`.
 * @param leader - Baseline object (may be null/undefined) with `label` and
 *   an optional `traceSummary`.
 * @returns Rows starting with the baseline label, then an optional modes
 *   comparison, the final/vector/lexical/transform deltas, and an optional
 *   stage delta row listing at most three non-zero stage differences.
 */
var buildRAGComparisonTraceDiffRows = (entry, leader) => {
  const ownTrace = entry.traceSummary;
  if (!ownTrace) {
    return [{ label: "Trace", value: "Unavailable for comparison" }];
  }
  const baselineTrace = leader?.traceSummary;
  if (!baselineTrace) {
    return [{ label: "Baseline", value: "Leader trace unavailable" }];
  }
  if (entry === leader) {
    return [{ label: "Baseline", value: "Leader strategy" }];
  }

  // Union of stage names; leader keys come first, then any only the entry has.
  const stageNames = Object.keys({
    ...baselineTrace.stageCounts,
    ...ownTrace.stageCounts
  });
  const stageChanges = [];
  for (const stage of stageNames) {
    const ownCount = ownTrace.stageCounts[stage] ?? 0;
    const baselineCount = baselineTrace.stageCounts[stage] ?? 0;
    const difference = ownCount - baselineCount;
    if (difference !== 0) {
      stageChanges.push(`${stage} ${formatTraceCountDelta(difference)}`);
    }
  }
  const stageDelta = stageChanges.slice(0, 3).join(" \xB7 ");

  const rows = [{ label: "Baseline", value: leader.label }];

  const ownModes = formatTraceModes(ownTrace.modes);
  const baselineModes = formatTraceModes(baselineTrace.modes);
  if (ownModes !== baselineModes) {
    rows.push({
      label: "Modes vs leader",
      value: `${ownModes} vs ${baselineModes}`
    });
  }

  const averagedFields = [
    ["Final delta", "averageFinalCount"],
    ["Vector delta", "averageVectorCount"],
    ["Lexical delta", "averageLexicalCount"]
  ];
  for (const [label, field] of averagedFields) {
    rows.push({
      label,
      value: formatSignedDelta(ownTrace[field] - baselineTrace[field], 1)
    });
  }
  rows.push({
    label: "Transform delta",
    value: formatTraceCountDelta(ownTrace.transformedCases - baselineTrace.transformedCases)
  });

  // An empty string means no stage differed, so the row is omitted.
  if (stageDelta) {
    rows.push({ label: "Stage delta", value: stageDelta });
  }
  return rows;
};
2243
/**
 * Builds label/value rows describing an evaluation history.
 *
 * @param history - Optional object with `runs`, `latestRun`, and optional
 *   `previousRun` / `diff` members.
 * @returns A single placeholder row when there is no latest run. Otherwise:
 *   the run count and latest-run summary, optional latest-trace and
 *   previous-run rows, and then either a hint row (when no diff exists) or
 *   the summary deltas, improved/regressed case lists, and — when the diff
 *   carries a trace summary delta — the trace delta rows.
 */
var buildRAGEvaluationHistoryRows = (history) => {
  const latest = history?.latestRun;
  if (!latest) {
    return [
      { label: "History", value: "No persisted benchmark runs yet." }
    ];
  }

  const rows = [];
  const addRow = (label, value) => {
    rows.push({ label, value });
  };

  addRow("Runs recorded", String(history.runs.length));
  addRow("Latest", `${latest.label} \xB7 ${formatEvaluationSummary(latest.response)}`);

  const latestTrace = latest.traceSummary;
  if (latestTrace) {
    const traceParts = [
      formatTraceModes(latestTrace.modes),
      `final ${latestTrace.averageFinalCount.toFixed(1)}`,
      `vector ${latestTrace.averageVectorCount.toFixed(1)}`,
      `lexical ${latestTrace.averageLexicalCount.toFixed(1)}`
    ];
    addRow("Latest trace", traceParts.join(" \xB7 "));
  }

  const previous = history.previousRun;
  if (previous) {
    addRow("Previous", `${previous.label} \xB7 ${formatEvaluationSummary(previous.response)}`);
  }

  const { diff } = history;
  if (!diff) {
    // Without a diff there is nothing further to report.
    addRow("History diff", "Run the benchmark again to diff regressions over time.");
    return rows;
  }

  const { summaryDelta, traceSummaryDelta } = diff;
  addRow("Passing delta", formatSignedDelta(summaryDelta.passingRate, 1, "%"));
  addRow("Average F1 delta", formatSignedDelta(summaryDelta.averageF1, 3));
  addRow("Latency delta", formatSignedDelta(summaryDelta.averageLatencyMs, 1, "ms"));
  addRow("Improved", formatHistoryCaseLabels(diff.improvedCases));
  addRow("Regressed", formatHistoryCaseLabels(diff.regressedCases));

  if (traceSummaryDelta) {
    addRow("Trace mode shift", traceSummaryDelta.modesChanged ? "changed" : "stable");
    addRow("Trace final delta", formatSignedDelta(traceSummaryDelta.averageFinalCount, 1));
    addRow("Trace vector delta", formatSignedDelta(traceSummaryDelta.averageVectorCount, 1));
    addRow("Trace lexical delta", formatSignedDelta(traceSummaryDelta.averageLexicalCount, 1));
    addRow("Trace transform delta", formatTraceCountDelta(traceSummaryDelta.transformedCases));
    addRow("Trace variant delta", formatTraceCountDelta(traceSummaryDelta.variantCases));

    // stageCounts may be absent on the delta; treat that as "no stages".
    const stageEntries = Object.entries(traceSummaryDelta.stageCounts ?? {});
    const stageDelta = stageEntries
      .map(([stage, count]) => `${stage} ${formatTraceCountDelta(count)}`)
      .join(", ");
    if (stageDelta) {
      addRow("Trace stage delta", stageDelta);
    }
  }
  return rows;
};
2158
2318
  var buildRAGEvaluationRunDiff = ({
2159
2319
  current,
2160
2320
  previous
@@ -3437,5 +3597,5 @@ export {
3437
3597
  AIStreamKey
3438
3598
  };
3439
3599
 
3440
- //# debugId=D6FF5517CF2D735064756E2164756E21
3600
+ //# debugId=49142334D6D3EC2564756E2164756E21
3441
3601
  //# sourceMappingURL=index.js.map