@absolutejs/absolute 0.19.0-beta.533 → 0.19.0-beta.534
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/ai/client/index.js +161 -1
- package/dist/ai/client/index.js.map +3 -3
- package/dist/ai/index.js +164 -1
- package/dist/ai/index.js.map +3 -3
- package/dist/angular/index.js +2 -2
- package/dist/angular/index.js.map +1 -1
- package/dist/angular/server.js +2 -2
- package/dist/angular/server.js.map +1 -1
- package/dist/build.js +2 -2
- package/dist/build.js.map +1 -1
- package/dist/index.js +2 -2
- package/dist/index.js.map +1 -1
- package/dist/react/ai/index.js +161 -1
- package/dist/react/ai/index.js.map +3 -3
- package/dist/src/ai/index.d.ts +1 -1
- package/dist/src/ai/rag/index.d.ts +1 -1
- package/dist/src/ai/rag/quality.d.ts +4 -1
- package/dist/svelte/ai/index.js +161 -1
- package/dist/svelte/ai/index.js.map +3 -3
- package/dist/types/ai.d.ts +4 -0
- package/dist/vue/ai/index.js +161 -1
- package/dist/vue/ai/index.js.map +3 -3
- package/package.json +7 -7
package/dist/types/ai.d.ts
CHANGED
|
@@ -1255,6 +1255,10 @@ export type RAGEvaluationHistory = {
|
|
|
1255
1255
|
previousRun?: RAGEvaluationSuiteRun;
|
|
1256
1256
|
diff?: RAGEvaluationRunDiff;
|
|
1257
1257
|
};
|
|
1258
|
+
/**
 * A row made of two strings: a `label` and a `value`.
 * NOTE(review): presumably the row shape returned by the `build*Rows`
 * formatting helpers in the AI bundles — confirm against `quality.d.ts`.
 */
export type RAGLabelValueRow = {
|
|
1259
|
+
label: string;
|
|
1260
|
+
value: string;
|
|
1261
|
+
};
|
|
1258
1262
|
export type RAGEvaluationLeaderboardEntry = {
|
|
1259
1263
|
runId: string;
|
|
1260
1264
|
suiteId: string;
|
package/dist/vue/ai/index.js
CHANGED
|
@@ -2155,6 +2155,166 @@ var buildGroundingCaseSnapshots = ({
|
|
|
2155
2155
|
});
|
|
2156
2156
|
};
|
|
2157
2157
|
/**
 * Ranks an evaluation status so statuses can be compared numerically.
 *
 * @param {string} status - Status string to rank.
 * @returns {number} 2 for "pass", 1 for "partial", 0 for anything else.
 */
var getStatusRank = (status) => {
  if (status === "pass") {
    return 2;
  }
  if (status === "partial") {
    return 1;
  }
  return 0;
};
|
|
2158
|
+
/**
 * Formats a numeric delta with an explicit leading sign.
 *
 * The sign is decided from the ROUNDED value, so a tiny negative delta that
 * rounds to zero is rendered like an exact zero ("+0.0") instead of "-0.0".
 *
 * @param {number} value - Delta to format.
 * @param {number} [decimals=0] - Number of fraction digits passed to `toFixed`.
 * @param {string} [suffix=""] - Text appended after the number (e.g. "%", "ms").
 * @returns {string} Non-negative values are prefixed with "+"; negative values
 *   keep the "-" produced by `toFixed`. NaN is rendered without a sign.
 */
var formatSignedDelta = (value, decimals = 0, suffix = "") => {
  const fixed = value.toFixed(decimals);
  // `toFixed` keeps the minus sign when a negative input rounds to zero.
  const roundsToZero = Number(fixed) === 0;
  const digits = roundsToZero && fixed.startsWith("-") ? fixed.slice(1) : fixed;
  const sign = value >= 0 || roundsToZero ? "+" : "";
  return `${sign}${digits}${suffix}`;
};
|
|
2159
|
+
/**
 * Builds a one-line summary of an evaluation response.
 *
 * @param {object} response - Object exposing `totalCases` and a `summary` with
 *   `passedCases`, `averageF1` and `averageLatencyMs`.
 * @returns {string} Text shaped like "3/4 pass · f1 0.500 · latency 12.3ms".
 */
var formatEvaluationSummary = (response) => {
  const passRatio = `${response.summary.passedCases}/${response.totalCases}`;
  const f1 = response.summary.averageF1.toFixed(3);
  const latency = response.summary.averageLatencyMs.toFixed(1);
  return `${passRatio} pass \xB7 f1 ${f1} \xB7 latency ${latency}ms`;
};
|
|
2160
|
+
/**
 * Joins the display names of a list of cases into a comma-separated string.
 *
 * @param {Array<{label?: string, caseId: string}>} cases - Cases to list.
 * @returns {string} Each case's `label` (or its `caseId` when the label is
 *   null/undefined) joined by ", "; "none" when the list has no entries.
 */
var formatHistoryCaseLabels = (cases) => {
  if (!(cases.length > 0)) {
    return "none";
  }
  const names = cases.map((item) => item.label ?? item.caseId);
  return names.join(", ");
};
|
|
2161
|
+
/**
 * Renders a list of trace modes as a single string.
 *
 * @param {string[]} modes - Mode names to render.
 * @returns {string} The modes joined by " / ", or "n/a" when the list is empty.
 */
var formatTraceModes = (modes) => {
  if (!(modes.length > 0)) {
    return "n/a";
  }
  return modes.join(" / ");
};
|
|
2162
|
+
/**
 * Summarizes the three stages with the highest counts.
 *
 * A missing (null/undefined) map is treated as empty, matching how
 * `buildRAGEvaluationHistoryRows` treats stage counts as optional.
 *
 * @param {Record<string, number> | null | undefined} stageCounts - Map of
 *   stage name to count.
 * @returns {string} Up to three "stage count" pairs, highest count first,
 *   joined by " · "; "n/a" when there are no stages.
 */
var formatTraceStageSummary = (stageCounts) => {
  const topStages = Object.entries(stageCounts ?? {})
    .sort(([, leftCount], [, rightCount]) => rightCount - leftCount)
    .slice(0, 3);
  if (topStages.length === 0) {
    return "n/a";
  }
  return topStages.map(([stage, count]) => `${stage} ${count}`).join(" \xB7 ");
};
|
|
2166
|
+
/**
 * Renders a "count out of total" pair.
 *
 * @param {number} count - Numerator.
 * @param {number} total - Denominator.
 * @returns {string} The two values separated by "/", e.g. "3/10".
 */
var formatTraceRatio = (count, total) => {
  const ratio = `${count}/${total}`;
  return ratio;
};
|
|
2167
|
+
/**
 * Renders a count delta with an explicit sign.
 *
 * @param {number} value - Delta to render.
 * @returns {string} The value prefixed with "+" when it is zero or positive;
 *   negative values are rendered as-is.
 */
var formatTraceCountDelta = (value) => {
  const prefix = value >= 0 ? "+" : "";
  return `${prefix}${value}`;
};
|
|
2168
|
+
/**
 * Builds label/value rows describing an entry's trace summary.
 *
 * @param {object} entry - Comparison entry; its `traceSummary` is read.
 * @returns {Array<{label: string, value: string}>} A single
 *   "Trace: Unavailable" row when the entry has no trace summary; otherwise
 *   eight rows (modes, average counts, transform/variant ratios, top-k values
 *   and stage summary).
 */
var buildRAGComparisonTraceSummaryRows = (entry) => {
  const summary = entry.traceSummary;
  if (!summary) {
    return [{ label: "Trace", value: "Unavailable" }];
  }
  const oneDecimal = (amount) => amount.toFixed(1);
  // Listed in display order; each tuple becomes one { label, value } row.
  const pairs = [
    ["Modes", formatTraceModes(summary.modes)],
    ["Avg final", oneDecimal(summary.averageFinalCount)],
    ["Avg vector", oneDecimal(summary.averageVectorCount)],
    ["Avg lexical", oneDecimal(summary.averageLexicalCount)],
    ["Transforms", formatTraceRatio(summary.transformedCases, summary.totalCases)],
    ["Variants", formatTraceRatio(summary.variantCases, summary.totalCases)],
    [
      "TopK",
      `${oneDecimal(summary.averageCandidateTopK)} / ${oneDecimal(summary.averageLexicalTopK)}`
    ],
    ["Stages", formatTraceStageSummary(summary.stageCounts)]
  ];
  return pairs.map(([label, value]) => ({ label, value }));
};
|
|
2196
|
+
/**
 * Builds label/value rows comparing an entry's trace summary with the
 * leader's.
 *
 * @param {object} entry - Entry being compared; its `traceSummary` is read.
 * @param {object} [leader] - Baseline entry; its `traceSummary` and `label`
 *   are read.
 * @returns {Array<{label: string, value: string}>} A single explanatory row
 *   when the entry has no trace, the leader has no trace, or the entry is the
 *   leader itself. Otherwise: a baseline row, an optional modes row (only when
 *   the formatted modes differ), four delta rows, and an optional stage-delta
 *   row listing at most three stages whose counts differ.
 */
var buildRAGComparisonTraceDiffRows = (entry, leader) => {
  const ownTrace = entry.traceSummary;
  if (!ownTrace) {
    return [{ label: "Trace", value: "Unavailable for comparison" }];
  }
  const baseTrace = leader?.traceSummary;
  if (!baseTrace) {
    return [{ label: "Baseline", value: "Leader trace unavailable" }];
  }
  if (entry === leader) {
    return [{ label: "Baseline", value: "Leader strategy" }];
  }

  // Union of stage names: the leader's keys first, then any only the entry has.
  const stageNames = Object.keys({
    ...baseTrace.stageCounts,
    ...ownTrace.stageCounts
  });
  const stageChanges = [];
  for (const stageName of stageNames) {
    const difference = (ownTrace.stageCounts[stageName] ?? 0) - (baseTrace.stageCounts[stageName] ?? 0);
    if (difference !== 0) {
      stageChanges.push(`${stageName} ${formatTraceCountDelta(difference)}`);
    }
  }
  const stageDelta = stageChanges.slice(0, 3).join(" \xB7 ");

  const baselineLabel = leader.label;
  const ownModes = formatTraceModes(ownTrace.modes);
  const baseModes = formatTraceModes(baseTrace.modes);

  return [
    { label: "Baseline", value: baselineLabel },
    ...(ownModes !== baseModes
      ? [{ label: "Modes vs leader", value: `${ownModes} vs ${baseModes}` }]
      : []),
    {
      label: "Final delta",
      value: formatSignedDelta(ownTrace.averageFinalCount - baseTrace.averageFinalCount, 1)
    },
    {
      label: "Vector delta",
      value: formatSignedDelta(ownTrace.averageVectorCount - baseTrace.averageVectorCount, 1)
    },
    {
      label: "Lexical delta",
      value: formatSignedDelta(ownTrace.averageLexicalCount - baseTrace.averageLexicalCount, 1)
    },
    {
      label: "Transform delta",
      value: formatTraceCountDelta(ownTrace.transformedCases - baseTrace.transformedCases)
    },
    ...(stageDelta ? [{ label: "Stage delta", value: stageDelta }] : [])
  ];
};
|
|
2243
|
+
/**
 * Builds label/value rows summarizing an evaluation history.
 *
 * @param {object} [history] - History object; `latestRun`, `runs`,
 *   `previousRun` and `diff` are read.
 * @returns {Array<{label: string, value: string}>} A single placeholder row
 *   when there is no latest run. Otherwise rows for the run count and latest
 *   run, optional rows for the latest trace and previous run, then either a
 *   hint row (no diff available) or the summary deltas followed by optional
 *   trace-summary deltas.
 */
var buildRAGEvaluationHistoryRows = (history) => {
  const latest = history?.latestRun;
  if (!latest) {
    return [
      { label: "History", value: "No persisted benchmark runs yet." }
    ];
  }

  const rows = [];
  const addRow = (label, value) => {
    rows.push({ label, value });
  };

  addRow("Runs recorded", String(history.runs.length));
  addRow("Latest", `${latest.label} \xB7 ${formatEvaluationSummary(latest.response)}`);

  const latestTrace = latest.traceSummary;
  if (latestTrace) {
    addRow(
      "Latest trace",
      `${formatTraceModes(latestTrace.modes)} \xB7 final ${latestTrace.averageFinalCount.toFixed(1)} \xB7 vector ${latestTrace.averageVectorCount.toFixed(1)} \xB7 lexical ${latestTrace.averageLexicalCount.toFixed(1)}`
    );
  }

  const previous = history.previousRun;
  if (previous) {
    addRow("Previous", `${previous.label} \xB7 ${formatEvaluationSummary(previous.response)}`);
  }

  const runDiff = history.diff;
  if (!runDiff) {
    addRow("History diff", "Run the benchmark again to diff regressions over time.");
    return rows;
  }

  addRow("Passing delta", formatSignedDelta(runDiff.summaryDelta.passingRate, 1, "%"));
  addRow("Average F1 delta", formatSignedDelta(runDiff.summaryDelta.averageF1, 3));
  addRow("Latency delta", formatSignedDelta(runDiff.summaryDelta.averageLatencyMs, 1, "ms"));
  addRow("Improved", formatHistoryCaseLabels(runDiff.improvedCases));
  addRow("Regressed", formatHistoryCaseLabels(runDiff.regressedCases));

  const traceDelta = runDiff.traceSummaryDelta;
  if (!traceDelta) {
    return rows;
  }

  addRow("Trace mode shift", traceDelta.modesChanged ? "changed" : "stable");
  addRow("Trace final delta", formatSignedDelta(traceDelta.averageFinalCount, 1));
  addRow("Trace vector delta", formatSignedDelta(traceDelta.averageVectorCount, 1));
  addRow("Trace lexical delta", formatSignedDelta(traceDelta.averageLexicalCount, 1));
  addRow("Trace transform delta", formatTraceCountDelta(traceDelta.transformedCases));
  addRow("Trace variant delta", formatTraceCountDelta(traceDelta.variantCases));

  // Stage counts are optional on the delta; an absent map yields no row.
  const stageParts = [];
  for (const [stage, count] of Object.entries(traceDelta.stageCounts ?? {})) {
    stageParts.push(`${stage} ${formatTraceCountDelta(count)}`);
  }
  const stageDelta = stageParts.join(", ");
  if (stageDelta) {
    addRow("Trace stage delta", stageDelta);
  }
  return rows;
};
|
|
2158
2318
|
var buildRAGEvaluationRunDiff = ({
|
|
2159
2319
|
current,
|
|
2160
2320
|
previous
|
|
@@ -3437,5 +3597,5 @@ export {
|
|
|
3437
3597
|
AIStreamKey
|
|
3438
3598
|
};
|
|
3439
3599
|
|
|
3440
|
-
//# debugId=
|
|
3600
|
+
//# debugId=49142334D6D3EC2564756E2164756E21
|
|
3441
3601
|
//# sourceMappingURL=index.js.map
|