@absolutejs/absolute 0.19.0-beta.532 → 0.19.0-beta.534
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/ai/client/index.js +198 -3
- package/dist/ai/client/index.js.map +3 -3
- package/dist/ai/index.js +201 -3
- package/dist/ai/index.js.map +3 -3
- package/dist/react/ai/index.js +198 -3
- package/dist/react/ai/index.js.map +3 -3
- package/dist/src/ai/index.d.ts +1 -1
- package/dist/src/ai/rag/index.d.ts +1 -1
- package/dist/src/ai/rag/quality.d.ts +4 -1
- package/dist/src/vue/ai/useRAG.d.ts +48 -0
- package/dist/src/vue/ai/useRAGEvaluate.d.ts +48 -0
- package/dist/svelte/ai/index.js +198 -3
- package/dist/svelte/ai/index.js.map +3 -3
- package/dist/types/ai.d.ts +18 -0
- package/dist/vue/ai/index.js +198 -3
- package/dist/vue/ai/index.js.map +3 -3
- package/package.json +7 -7
package/dist/types/ai.d.ts
CHANGED
|
@@ -1194,6 +1194,7 @@ export type RAGEvaluationSuiteRun = {
|
|
|
1194
1194
|
finishedAt: number;
|
|
1195
1195
|
elapsedMs: number;
|
|
1196
1196
|
response: RAGEvaluationResponse;
|
|
1197
|
+
traceSummary?: RAGRetrievalTraceComparisonSummary;
|
|
1197
1198
|
metadata?: Record<string, unknown>;
|
|
1198
1199
|
};
|
|
1199
1200
|
export type RAGEvaluationHistoryStore = {
|
|
@@ -1231,6 +1232,19 @@ export type RAGEvaluationRunDiff = {
|
|
|
1231
1232
|
failedCases: number;
|
|
1232
1233
|
partialCases: number;
|
|
1233
1234
|
};
|
|
1235
|
+
traceSummaryDelta?: {
|
|
1236
|
+
modesChanged: boolean;
|
|
1237
|
+
vectorCases: number;
|
|
1238
|
+
lexicalCases: number;
|
|
1239
|
+
transformedCases: number;
|
|
1240
|
+
variantCases: number;
|
|
1241
|
+
averageFinalCount: number;
|
|
1242
|
+
averageVectorCount: number;
|
|
1243
|
+
averageLexicalCount: number;
|
|
1244
|
+
averageCandidateTopK: number;
|
|
1245
|
+
averageLexicalTopK: number;
|
|
1246
|
+
stageCounts: Partial<Record<RAGRetrievalTraceStage, number>>;
|
|
1247
|
+
};
|
|
1234
1248
|
};
|
|
1235
1249
|
export type RAGEvaluationHistory = {
|
|
1236
1250
|
suiteId: string;
|
|
@@ -1241,6 +1255,10 @@ export type RAGEvaluationHistory = {
|
|
|
1241
1255
|
previousRun?: RAGEvaluationSuiteRun;
|
|
1242
1256
|
diff?: RAGEvaluationRunDiff;
|
|
1243
1257
|
};
|
|
1258
|
+
export type RAGLabelValueRow = {
|
|
1259
|
+
label: string;
|
|
1260
|
+
value: string;
|
|
1261
|
+
};
|
|
1244
1262
|
export type RAGEvaluationLeaderboardEntry = {
|
|
1245
1263
|
runId: string;
|
|
1246
1264
|
suiteId: string;
|
package/dist/vue/ai/index.js
CHANGED
|
@@ -1777,6 +1777,23 @@ var buildTraceStageCounts = (traces) => {
|
|
|
1777
1777
|
}
|
|
1778
1778
|
return counts;
|
|
1779
1779
|
};
|
|
1780
|
+
var diffTraceStageCounts = ({
|
|
1781
|
+
current,
|
|
1782
|
+
previous
|
|
1783
|
+
}) => {
|
|
1784
|
+
const next = {};
|
|
1785
|
+
const stages = new Set([
|
|
1786
|
+
...Object.keys(current),
|
|
1787
|
+
...Object.keys(previous)
|
|
1788
|
+
]);
|
|
1789
|
+
for (const stage of stages) {
|
|
1790
|
+
const delta = (current[stage] ?? 0) - (previous[stage] ?? 0);
|
|
1791
|
+
if (delta !== 0) {
|
|
1792
|
+
next[stage] = delta;
|
|
1793
|
+
}
|
|
1794
|
+
}
|
|
1795
|
+
return next;
|
|
1796
|
+
};
|
|
1780
1797
|
var roundTraceAverage = (value, total) => total > 0 ? Number((value / total).toFixed(2)) : 0;
|
|
1781
1798
|
var summarizeRetrievalTraces = (traces) => {
|
|
1782
1799
|
if (traces.length === 0) {
|
|
@@ -2138,6 +2155,166 @@ var buildGroundingCaseSnapshots = ({
|
|
|
2138
2155
|
});
|
|
2139
2156
|
};
|
|
2140
2157
|
var getStatusRank = (status) => status === "pass" ? 2 : status === "partial" ? 1 : 0;
|
|
2158
|
+
var formatSignedDelta = (value, decimals = 0, suffix = "") => `${value >= 0 ? "+" : ""}${value.toFixed(decimals)}${suffix}`;
|
|
2159
|
+
var formatEvaluationSummary = (response) => `${response.summary.passedCases}/${response.totalCases} pass \xB7 f1 ${response.summary.averageF1.toFixed(3)} \xB7 latency ${response.summary.averageLatencyMs.toFixed(1)}ms`;
|
|
2160
|
+
var formatHistoryCaseLabels = (cases) => cases.length > 0 ? cases.map((entry) => entry.label ?? entry.caseId).join(", ") : "none";
|
|
2161
|
+
var formatTraceModes = (modes) => modes.length > 0 ? modes.join(" / ") : "n/a";
|
|
2162
|
+
var formatTraceStageSummary = (stageCounts) => {
|
|
2163
|
+
const topStages = Object.entries(stageCounts).sort((left, right) => right[1] - left[1]).slice(0, 3);
|
|
2164
|
+
return topStages.length > 0 ? topStages.map(([stage, count]) => `${stage} ${count}`).join(" \xB7 ") : "n/a";
|
|
2165
|
+
};
|
|
2166
|
+
var formatTraceRatio = (count, total) => `${count}/${total}`;
|
|
2167
|
+
var formatTraceCountDelta = (value) => `${value >= 0 ? "+" : ""}${value}`;
|
|
2168
|
+
var buildRAGComparisonTraceSummaryRows = (entry) => {
|
|
2169
|
+
const trace = entry.traceSummary;
|
|
2170
|
+
if (!trace) {
|
|
2171
|
+
return [{ label: "Trace", value: "Unavailable" }];
|
|
2172
|
+
}
|
|
2173
|
+
return [
|
|
2174
|
+
{ label: "Modes", value: formatTraceModes(trace.modes) },
|
|
2175
|
+
{ label: "Avg final", value: trace.averageFinalCount.toFixed(1) },
|
|
2176
|
+
{ label: "Avg vector", value: trace.averageVectorCount.toFixed(1) },
|
|
2177
|
+
{ label: "Avg lexical", value: trace.averageLexicalCount.toFixed(1) },
|
|
2178
|
+
{
|
|
2179
|
+
label: "Transforms",
|
|
2180
|
+
value: formatTraceRatio(trace.transformedCases, trace.totalCases)
|
|
2181
|
+
},
|
|
2182
|
+
{
|
|
2183
|
+
label: "Variants",
|
|
2184
|
+
value: formatTraceRatio(trace.variantCases, trace.totalCases)
|
|
2185
|
+
},
|
|
2186
|
+
{
|
|
2187
|
+
label: "TopK",
|
|
2188
|
+
value: `${trace.averageCandidateTopK.toFixed(1)} / ${trace.averageLexicalTopK.toFixed(1)}`
|
|
2189
|
+
},
|
|
2190
|
+
{
|
|
2191
|
+
label: "Stages",
|
|
2192
|
+
value: formatTraceStageSummary(trace.stageCounts)
|
|
2193
|
+
}
|
|
2194
|
+
];
|
|
2195
|
+
};
|
|
2196
|
+
var buildRAGComparisonTraceDiffRows = (entry, leader) => {
|
|
2197
|
+
const trace = entry.traceSummary;
|
|
2198
|
+
if (!trace) {
|
|
2199
|
+
return [{ label: "Trace", value: "Unavailable for comparison" }];
|
|
2200
|
+
}
|
|
2201
|
+
const leaderTrace = leader?.traceSummary;
|
|
2202
|
+
if (!leaderTrace) {
|
|
2203
|
+
return [{ label: "Baseline", value: "Leader trace unavailable" }];
|
|
2204
|
+
}
|
|
2205
|
+
if (entry === leader) {
|
|
2206
|
+
return [{ label: "Baseline", value: "Leader strategy" }];
|
|
2207
|
+
}
|
|
2208
|
+
const stageDelta = Object.keys({
|
|
2209
|
+
...leaderTrace.stageCounts,
|
|
2210
|
+
...trace.stageCounts
|
|
2211
|
+
}).map((stage) => {
|
|
2212
|
+
const typedStage = stage;
|
|
2213
|
+
const delta = (trace.stageCounts[typedStage] ?? 0) - (leaderTrace.stageCounts[typedStage] ?? 0);
|
|
2214
|
+
return delta === 0 ? null : `${typedStage} ${formatTraceCountDelta(delta)}`;
|
|
2215
|
+
}).filter((value) => Boolean(value)).slice(0, 3).join(" \xB7 ");
|
|
2216
|
+
const rows = [
|
|
2217
|
+
{ label: "Baseline", value: leader.label }
|
|
2218
|
+
];
|
|
2219
|
+
if (formatTraceModes(trace.modes) !== formatTraceModes(leaderTrace.modes)) {
|
|
2220
|
+
rows.push({
|
|
2221
|
+
label: "Modes vs leader",
|
|
2222
|
+
value: `${formatTraceModes(trace.modes)} vs ${formatTraceModes(leaderTrace.modes)}`
|
|
2223
|
+
});
|
|
2224
|
+
}
|
|
2225
|
+
rows.push({
|
|
2226
|
+
label: "Final delta",
|
|
2227
|
+
value: formatSignedDelta(trace.averageFinalCount - leaderTrace.averageFinalCount, 1)
|
|
2228
|
+
}, {
|
|
2229
|
+
label: "Vector delta",
|
|
2230
|
+
value: formatSignedDelta(trace.averageVectorCount - leaderTrace.averageVectorCount, 1)
|
|
2231
|
+
}, {
|
|
2232
|
+
label: "Lexical delta",
|
|
2233
|
+
value: formatSignedDelta(trace.averageLexicalCount - leaderTrace.averageLexicalCount, 1)
|
|
2234
|
+
}, {
|
|
2235
|
+
label: "Transform delta",
|
|
2236
|
+
value: formatTraceCountDelta(trace.transformedCases - leaderTrace.transformedCases)
|
|
2237
|
+
});
|
|
2238
|
+
if (stageDelta) {
|
|
2239
|
+
rows.push({ label: "Stage delta", value: stageDelta });
|
|
2240
|
+
}
|
|
2241
|
+
return rows;
|
|
2242
|
+
};
|
|
2243
|
+
var buildRAGEvaluationHistoryRows = (history) => {
|
|
2244
|
+
if (!history?.latestRun) {
|
|
2245
|
+
return [
|
|
2246
|
+
{ label: "History", value: "No persisted benchmark runs yet." }
|
|
2247
|
+
];
|
|
2248
|
+
}
|
|
2249
|
+
const rows = [
|
|
2250
|
+
{ label: "Runs recorded", value: String(history.runs.length) },
|
|
2251
|
+
{
|
|
2252
|
+
label: "Latest",
|
|
2253
|
+
value: `${history.latestRun.label} \xB7 ${formatEvaluationSummary(history.latestRun.response)}`
|
|
2254
|
+
}
|
|
2255
|
+
];
|
|
2256
|
+
if (history.latestRun.traceSummary) {
|
|
2257
|
+
rows.push({
|
|
2258
|
+
label: "Latest trace",
|
|
2259
|
+
value: `${formatTraceModes(history.latestRun.traceSummary.modes)} \xB7 final ${history.latestRun.traceSummary.averageFinalCount.toFixed(1)} \xB7 vector ${history.latestRun.traceSummary.averageVectorCount.toFixed(1)} \xB7 lexical ${history.latestRun.traceSummary.averageLexicalCount.toFixed(1)}`
|
|
2260
|
+
});
|
|
2261
|
+
}
|
|
2262
|
+
if (history.previousRun) {
|
|
2263
|
+
rows.push({
|
|
2264
|
+
label: "Previous",
|
|
2265
|
+
value: `${history.previousRun.label} \xB7 ${formatEvaluationSummary(history.previousRun.response)}`
|
|
2266
|
+
});
|
|
2267
|
+
}
|
|
2268
|
+
if (!history.diff) {
|
|
2269
|
+
rows.push({
|
|
2270
|
+
label: "History diff",
|
|
2271
|
+
value: "Run the benchmark again to diff regressions over time."
|
|
2272
|
+
});
|
|
2273
|
+
return rows;
|
|
2274
|
+
}
|
|
2275
|
+
rows.push({
|
|
2276
|
+
label: "Passing delta",
|
|
2277
|
+
value: formatSignedDelta(history.diff.summaryDelta.passingRate, 1, "%")
|
|
2278
|
+
}, {
|
|
2279
|
+
label: "Average F1 delta",
|
|
2280
|
+
value: formatSignedDelta(history.diff.summaryDelta.averageF1, 3)
|
|
2281
|
+
}, {
|
|
2282
|
+
label: "Latency delta",
|
|
2283
|
+
value: formatSignedDelta(history.diff.summaryDelta.averageLatencyMs, 1, "ms")
|
|
2284
|
+
}, {
|
|
2285
|
+
label: "Improved",
|
|
2286
|
+
value: formatHistoryCaseLabels(history.diff.improvedCases)
|
|
2287
|
+
}, {
|
|
2288
|
+
label: "Regressed",
|
|
2289
|
+
value: formatHistoryCaseLabels(history.diff.regressedCases)
|
|
2290
|
+
});
|
|
2291
|
+
if (history.diff.traceSummaryDelta) {
|
|
2292
|
+
rows.push({
|
|
2293
|
+
label: "Trace mode shift",
|
|
2294
|
+
value: history.diff.traceSummaryDelta.modesChanged ? "changed" : "stable"
|
|
2295
|
+
}, {
|
|
2296
|
+
label: "Trace final delta",
|
|
2297
|
+
value: formatSignedDelta(history.diff.traceSummaryDelta.averageFinalCount, 1)
|
|
2298
|
+
}, {
|
|
2299
|
+
label: "Trace vector delta",
|
|
2300
|
+
value: formatSignedDelta(history.diff.traceSummaryDelta.averageVectorCount, 1)
|
|
2301
|
+
}, {
|
|
2302
|
+
label: "Trace lexical delta",
|
|
2303
|
+
value: formatSignedDelta(history.diff.traceSummaryDelta.averageLexicalCount, 1)
|
|
2304
|
+
}, {
|
|
2305
|
+
label: "Trace transform delta",
|
|
2306
|
+
value: formatTraceCountDelta(history.diff.traceSummaryDelta.transformedCases)
|
|
2307
|
+
}, {
|
|
2308
|
+
label: "Trace variant delta",
|
|
2309
|
+
value: formatTraceCountDelta(history.diff.traceSummaryDelta.variantCases)
|
|
2310
|
+
});
|
|
2311
|
+
const stageDelta = Object.entries(history.diff.traceSummaryDelta.stageCounts ?? {}).map(([stage, count]) => `${stage} ${formatTraceCountDelta(count)}`).join(", ");
|
|
2312
|
+
if (stageDelta) {
|
|
2313
|
+
rows.push({ label: "Trace stage delta", value: stageDelta });
|
|
2314
|
+
}
|
|
2315
|
+
}
|
|
2316
|
+
return rows;
|
|
2317
|
+
};
|
|
2141
2318
|
var buildRAGEvaluationRunDiff = ({
|
|
2142
2319
|
current,
|
|
2143
2320
|
previous
|
|
@@ -2161,6 +2338,22 @@ var buildRAGEvaluationRunDiff = ({
|
|
|
2161
2338
|
passingRate: current.response.passingRate - (previous?.response.passingRate ?? 0),
|
|
2162
2339
|
partialCases: current.response.summary.partialCases - (previous?.response.summary.partialCases ?? 0)
|
|
2163
2340
|
},
|
|
2341
|
+
traceSummaryDelta: current.traceSummary || previous?.traceSummary ? {
|
|
2342
|
+
averageCandidateTopK: (current.traceSummary?.averageCandidateTopK ?? 0) - (previous?.traceSummary?.averageCandidateTopK ?? 0),
|
|
2343
|
+
averageFinalCount: (current.traceSummary?.averageFinalCount ?? 0) - (previous?.traceSummary?.averageFinalCount ?? 0),
|
|
2344
|
+
averageLexicalCount: (current.traceSummary?.averageLexicalCount ?? 0) - (previous?.traceSummary?.averageLexicalCount ?? 0),
|
|
2345
|
+
averageLexicalTopK: (current.traceSummary?.averageLexicalTopK ?? 0) - (previous?.traceSummary?.averageLexicalTopK ?? 0),
|
|
2346
|
+
averageVectorCount: (current.traceSummary?.averageVectorCount ?? 0) - (previous?.traceSummary?.averageVectorCount ?? 0),
|
|
2347
|
+
lexicalCases: (current.traceSummary?.lexicalCases ?? 0) - (previous?.traceSummary?.lexicalCases ?? 0),
|
|
2348
|
+
modesChanged: (current.traceSummary?.modes ?? []).join("|") !== (previous?.traceSummary?.modes ?? []).join("|"),
|
|
2349
|
+
stageCounts: diffTraceStageCounts({
|
|
2350
|
+
current: current.traceSummary?.stageCounts ?? {},
|
|
2351
|
+
previous: previous?.traceSummary?.stageCounts ?? {}
|
|
2352
|
+
}),
|
|
2353
|
+
transformedCases: (current.traceSummary?.transformedCases ?? 0) - (previous?.traceSummary?.transformedCases ?? 0),
|
|
2354
|
+
variantCases: (current.traceSummary?.variantCases ?? 0) - (previous?.traceSummary?.variantCases ?? 0),
|
|
2355
|
+
vectorCases: (current.traceSummary?.vectorCases ?? 0) - (previous?.traceSummary?.vectorCases ?? 0)
|
|
2356
|
+
} : undefined,
|
|
2164
2357
|
unchangedCases
|
|
2165
2358
|
};
|
|
2166
2359
|
};
|
|
@@ -2534,7 +2727,8 @@ var compareRAGRerankers = async ({
|
|
|
2534
2727
|
label: entry.label,
|
|
2535
2728
|
response: entry.response,
|
|
2536
2729
|
startedAt: 0,
|
|
2537
|
-
suiteId: suite.id
|
|
2730
|
+
suiteId: suite.id,
|
|
2731
|
+
traceSummary: entry.traceSummary
|
|
2538
2732
|
})));
|
|
2539
2733
|
return {
|
|
2540
2734
|
entries,
|
|
@@ -2619,7 +2813,8 @@ var compareRAGRetrievalStrategies = async ({
|
|
|
2619
2813
|
label: entry.label,
|
|
2620
2814
|
response: entry.response,
|
|
2621
2815
|
startedAt: 0,
|
|
2622
|
-
suiteId: suite.id
|
|
2816
|
+
suiteId: suite.id,
|
|
2817
|
+
traceSummary: entry.traceSummary
|
|
2623
2818
|
})));
|
|
2624
2819
|
return {
|
|
2625
2820
|
entries,
|
|
@@ -3402,5 +3597,5 @@ export {
|
|
|
3402
3597
|
AIStreamKey
|
|
3403
3598
|
};
|
|
3404
3599
|
|
|
3405
|
-
//# debugId=
|
|
3600
|
+
//# debugId=49142334D6D3EC2564756E2164756E21
|
|
3406
3601
|
//# sourceMappingURL=index.js.map
|