@absolutejs/absolute 0.19.0-beta.537 → 0.19.0-beta.539
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/ai/client/index.js +132 -1
- package/dist/ai/client/index.js.map +3 -3
- package/dist/ai/index.js +136 -1
- package/dist/ai/index.js.map +3 -3
- package/dist/react/ai/index.js +132 -1
- package/dist/react/ai/index.js.map +3 -3
- package/dist/src/ai/index.d.ts +1 -1
- package/dist/src/ai/rag/index.d.ts +1 -1
- package/dist/src/ai/rag/quality.d.ts +5 -1
- package/dist/svelte/ai/index.js +132 -1
- package/dist/svelte/ai/index.js.map +3 -3
- package/dist/types/ai.d.ts +17 -0
- package/dist/vue/ai/index.js +132 -1
- package/dist/vue/ai/index.js.map +3 -3
- package/package.json +7 -7
package/dist/src/ai/index.d.ts
CHANGED
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
export { aiChat } from '../plugins/aiChat';
|
|
2
2
|
export { streamAI } from './streamAI';
|
|
3
3
|
export { ragChat } from './rag';
|
|
4
|
-
export { buildRAGAnswerGroundingCaseDifficultyLeaderboard, buildRAGAnswerGroundingCaseDifficultyRunDiff, buildRAGAnswerGroundingEvaluationResponse, buildRAGAnswerGroundingEvaluationLeaderboard, buildRAGAnswerGroundingEvaluationRunDiff, buildRAGContext, buildRAGComparisonTraceDiffRows, buildRAGComparisonTraceSummaryRows, buildRAGEvaluationCaseTracePresentations, buildRAGEvaluationLeaderboard, buildRAGEvaluationHistoryRows, buildRAGEvaluationResponse, buildRAGEvaluationRunDiff, compareRAGRetrievalStrategies, compareRAGRerankers, createRAGFileAnswerGroundingCaseDifficultyHistoryStore, createRAGFileAnswerGroundingEvaluationHistoryStore, createRAGBunS3SyncClient, createRAGFileEvaluationHistoryStore, createRAGEvaluationSuite, createRAGDirectorySyncSource, createRAGEmailSyncSource, createRAGGmailEmailSyncClient, createRAGFileSyncStateStore, createRAGGraphEmailSyncClient, createRAGIMAPEmailSyncClient, createRAGStaticEmailSyncClient, createRAGStorageSyncSource, evaluateRAGAnswerGrounding, evaluateRAGAnswerGroundingCase, evaluateRAGCollection, executeDryRunRAGEvaluation, loadRAGAnswerGroundingCaseDifficultyHistory, loadRAGAnswerGroundingEvaluationHistory, loadRAGEvaluationHistory, persistRAGAnswerGroundingCaseDifficultyRun, persistRAGAnswerGroundingEvaluationRun, persistRAGEvaluationSuiteRun, runRAGEvaluationSuite, summarizeRAGEvaluationCase, summarizeRAGRerankerComparison, buildRAGCitations, buildRAGCitationReferenceMap, buildRAGLexicalHaystack, buildRAGGroundedAnswer, buildRAGGroundingReferences, buildRAGRetrievalTracePresentation, buildRAGSourceGroups, buildRAGSourceSummaries, buildRAGUpsertInputFromDirectory, buildRAGUpsertInputFromDocuments, createBuiltinArchiveExpander, createEmailExtractor, createEPUBExtractor, createLegacyDocumentExtractor, createRAGPDFOCRExtractor, createRAGArchiveExpander, createRAGArchiveFileExtractor, createOfficeDocumentExtractor, createPDFFileExtractor, createRAGCollection, createRAGEmbeddingProvider, createRAGFileExtractor, 
createRAGImageOCRExtractor, createHeuristicRAGReranker, createHeuristicRAGQueryTransform, createRAGHTMXConfig, createRAGMediaFileExtractor, createRAGMediaTranscriber, createRAGSyncManager, createRAGSyncScheduler, createRAGOCRProvider, createRAGUrlSyncSource, createRAGQueryTransform, createRAGReranker, formatRAGTraceValue, fuseRAGQueryResults, createTextFileExtractor, createRAGHTMXWorkflowRenderConfig, alibabaEmbeddings, anthropicOCR, deepseekEmbeddings, geminiEmbeddings, geminiOCR, getLatestAssistantMessage, getLatestRAGSources, buildRAGStreamProgress, googleEmbeddings, ingestDocuments, ingestRAGDocuments, loadRAGDocumentFile, loadRAGDocumentsFromDirectory, loadRAGDocumentFromURL, loadRAGDocumentsFromURLs, metaEmbeddings, mistralaiEmbeddings, moonshotEmbeddings, ollamaEmbeddings, ollamaOCR, ollamaTranscriber, openaiCompatibleEmbeddings, openaiCompatibleOCR, openaiCompatibleTranscriber, openaiEmbeddings, openaiOCR, openaiTranscriber, prepareRAGDirectoryDocuments, buildRAGUpsertInputFromUploads, loadRAGDocumentUpload, loadRAGDocumentsFromUploads, buildRAGUpsertInputFromURLs, prepareRAGDocument, prepareRAGDocumentFile, prepareRAGDocuments, ragPlugin, resolveRAGQueryTransform, resolveRAGEmbeddingProvider, resolveRAGHybridSearchOptions, resolveRAGReranker, resolveRAGStreamStage, searchDocuments, scoreRAGLexicalMatch, applyRAGReranking, applyRAGQueryTransform, validateRAGEmbeddingDimensions, xaiEmbeddings } from './rag';
|
|
4
|
+
export { buildRAGAnswerGroundingCaseDifficultyLeaderboard, buildRAGAnswerGroundingCaseSnapshotPresentations, buildRAGAnswerGroundingHistoryPresentation, buildRAGAnswerGroundingHistoryRows, buildRAGAnswerGroundingCaseDifficultyRunDiff, buildRAGAnswerGroundingEvaluationResponse, buildRAGAnswerGroundingEvaluationLeaderboard, buildRAGAnswerGroundingEvaluationRunDiff, buildRAGContext, buildRAGComparisonTraceDiffRows, buildRAGComparisonTraceSummaryRows, buildRAGEvaluationCaseTracePresentations, buildRAGEvaluationHistoryPresentation, buildRAGEvaluationLeaderboard, buildRAGEvaluationHistoryRows, buildRAGEvaluationResponse, buildRAGEvaluationRunDiff, compareRAGRetrievalStrategies, compareRAGRerankers, createRAGFileAnswerGroundingCaseDifficultyHistoryStore, createRAGFileAnswerGroundingEvaluationHistoryStore, createRAGBunS3SyncClient, createRAGFileEvaluationHistoryStore, createRAGEvaluationSuite, createRAGDirectorySyncSource, createRAGEmailSyncSource, createRAGGmailEmailSyncClient, createRAGFileSyncStateStore, createRAGGraphEmailSyncClient, createRAGIMAPEmailSyncClient, createRAGStaticEmailSyncClient, createRAGStorageSyncSource, evaluateRAGAnswerGrounding, evaluateRAGAnswerGroundingCase, evaluateRAGCollection, executeDryRunRAGEvaluation, loadRAGAnswerGroundingCaseDifficultyHistory, loadRAGAnswerGroundingEvaluationHistory, loadRAGEvaluationHistory, persistRAGAnswerGroundingCaseDifficultyRun, persistRAGAnswerGroundingEvaluationRun, persistRAGEvaluationSuiteRun, runRAGEvaluationSuite, summarizeRAGEvaluationCase, summarizeRAGRerankerComparison, buildRAGCitations, buildRAGCitationReferenceMap, buildRAGLexicalHaystack, buildRAGGroundedAnswer, buildRAGGroundingReferences, buildRAGRetrievalTracePresentation, buildRAGSourceGroups, buildRAGSourceSummaries, buildRAGUpsertInputFromDirectory, buildRAGUpsertInputFromDocuments, createBuiltinArchiveExpander, createEmailExtractor, createEPUBExtractor, createLegacyDocumentExtractor, createRAGPDFOCRExtractor, createRAGArchiveExpander, 
createRAGArchiveFileExtractor, createOfficeDocumentExtractor, createPDFFileExtractor, createRAGCollection, createRAGEmbeddingProvider, createRAGFileExtractor, createRAGImageOCRExtractor, createHeuristicRAGReranker, createHeuristicRAGQueryTransform, createRAGHTMXConfig, createRAGMediaFileExtractor, createRAGMediaTranscriber, createRAGSyncManager, createRAGSyncScheduler, createRAGOCRProvider, createRAGUrlSyncSource, createRAGQueryTransform, createRAGReranker, formatRAGTraceValue, fuseRAGQueryResults, createTextFileExtractor, createRAGHTMXWorkflowRenderConfig, alibabaEmbeddings, anthropicOCR, deepseekEmbeddings, geminiEmbeddings, geminiOCR, getLatestAssistantMessage, getLatestRAGSources, buildRAGStreamProgress, googleEmbeddings, ingestDocuments, ingestRAGDocuments, loadRAGDocumentFile, loadRAGDocumentsFromDirectory, loadRAGDocumentFromURL, loadRAGDocumentsFromURLs, metaEmbeddings, mistralaiEmbeddings, moonshotEmbeddings, ollamaEmbeddings, ollamaOCR, ollamaTranscriber, openaiCompatibleEmbeddings, openaiCompatibleOCR, openaiCompatibleTranscriber, openaiEmbeddings, openaiOCR, openaiTranscriber, prepareRAGDirectoryDocuments, buildRAGUpsertInputFromUploads, loadRAGDocumentUpload, loadRAGDocumentsFromUploads, buildRAGUpsertInputFromURLs, prepareRAGDocument, prepareRAGDocumentFile, prepareRAGDocuments, ragPlugin, resolveRAGQueryTransform, resolveRAGEmbeddingProvider, resolveRAGHybridSearchOptions, resolveRAGReranker, resolveRAGStreamStage, searchDocuments, scoreRAGLexicalMatch, applyRAGReranking, applyRAGQueryTransform, validateRAGEmbeddingDimensions, xaiEmbeddings } from './rag';
|
|
5
5
|
export { createInMemoryRAGStore } from './rag/adapters/inMemory';
|
|
6
6
|
export { createSQLiteRAGStore } from './rag/adapters/sqlite';
|
|
7
7
|
export { resolveAbsoluteSQLiteVec, resolveAbsoluteSQLiteVecExtensionPath } from './rag/resolveAbsoluteSQLiteVec';
|
|
@@ -10,7 +10,7 @@ export { createRAGGmailEmailSyncClient, createRAGGraphEmailSyncClient, createRAG
|
|
|
10
10
|
export { buildRAGUpsertInputFromDirectory, buildRAGUpsertInputFromDocuments, buildRAGUpsertInputFromUploads, createBuiltinArchiveExpander, createEmailExtractor, createEPUBExtractor, createLegacyDocumentExtractor, createRAGPDFOCRExtractor, createRAGArchiveExpander, createRAGArchiveFileExtractor, createOfficeDocumentExtractor, createPDFFileExtractor, createRAGFileExtractor, createRAGImageOCRExtractor, createRAGMediaFileExtractor, createRAGMediaTranscriber, createRAGOCRProvider, createTextFileExtractor, loadRAGDocumentFromURL, loadRAGDocumentUpload, loadRAGDocumentsFromUploads, buildRAGUpsertInputFromURLs, loadRAGDocumentFile, loadRAGDocumentsFromDirectory, loadRAGDocumentsFromURLs, prepareRAGDirectoryDocuments, prepareRAGDocument, prepareRAGDocumentFile, prepareRAGDocuments } from './ingestion';
|
|
11
11
|
export { buildRAGAnswerWorkflowState, buildRAGCitations, buildRAGCitationReferenceMap, buildRAGGroundedAnswer, buildRAGGroundingReferences, buildRAGRetrievalTracePresentation, buildRAGSourceGroups, buildRAGSourceSummaries, buildRAGStreamProgress, formatRAGTraceValue, getLatestAssistantMessage, getLatestRAGSources, resolveRAGStreamStage } from './presentation';
|
|
12
12
|
export { buildRAGContext } from './types';
|
|
13
|
-
export { buildRAGAnswerGroundingCaseDifficultyLeaderboard, buildRAGAnswerGroundingCaseDifficultyRunDiff, buildRAGAnswerGroundingEvaluationResponse, buildRAGAnswerGroundingEvaluationLeaderboard, buildRAGAnswerGroundingEvaluationRunDiff, buildRAGComparisonTraceDiffRows, buildRAGComparisonTraceSummaryRows, buildRAGEvaluationCaseTracePresentations, buildRAGEvaluationLeaderboard, buildRAGEvaluationHistoryRows, buildRAGEvaluationResponse, buildRAGEvaluationRunDiff, compareRAGRetrievalStrategies, compareRAGRerankers, createRAGFileAnswerGroundingCaseDifficultyHistoryStore, createRAGFileAnswerGroundingEvaluationHistoryStore, createRAGFileEvaluationHistoryStore, createRAGEvaluationSuite, evaluateRAGAnswerGrounding, evaluateRAGAnswerGroundingCase, evaluateRAGCollection, executeDryRunRAGEvaluation, loadRAGAnswerGroundingCaseDifficultyHistory, loadRAGAnswerGroundingEvaluationHistory, loadRAGEvaluationHistory, persistRAGAnswerGroundingCaseDifficultyRun, persistRAGAnswerGroundingEvaluationRun, persistRAGEvaluationSuiteRun, runRAGEvaluationSuite, summarizeRAGEvaluationCase, summarizeRAGRerankerComparison } from './quality';
|
|
13
|
+
export { buildRAGAnswerGroundingCaseDifficultyLeaderboard, buildRAGAnswerGroundingCaseSnapshotPresentations, buildRAGAnswerGroundingHistoryPresentation, buildRAGAnswerGroundingHistoryRows, buildRAGAnswerGroundingCaseDifficultyRunDiff, buildRAGAnswerGroundingEvaluationResponse, buildRAGAnswerGroundingEvaluationLeaderboard, buildRAGAnswerGroundingEvaluationRunDiff, buildRAGComparisonTraceDiffRows, buildRAGComparisonTraceSummaryRows, buildRAGEvaluationCaseTracePresentations, buildRAGEvaluationHistoryPresentation, buildRAGEvaluationLeaderboard, buildRAGEvaluationHistoryRows, buildRAGEvaluationResponse, buildRAGEvaluationRunDiff, compareRAGRetrievalStrategies, compareRAGRerankers, createRAGFileAnswerGroundingCaseDifficultyHistoryStore, createRAGFileAnswerGroundingEvaluationHistoryStore, createRAGFileEvaluationHistoryStore, createRAGEvaluationSuite, evaluateRAGAnswerGrounding, evaluateRAGAnswerGroundingCase, evaluateRAGCollection, executeDryRunRAGEvaluation, loadRAGAnswerGroundingCaseDifficultyHistory, loadRAGAnswerGroundingEvaluationHistory, loadRAGEvaluationHistory, persistRAGAnswerGroundingCaseDifficultyRun, persistRAGAnswerGroundingEvaluationRun, persistRAGEvaluationSuiteRun, runRAGEvaluationSuite, summarizeRAGEvaluationCase, summarizeRAGRerankerComparison } from './quality';
|
|
14
14
|
export { createRAGBunS3SyncClient, createRAGDirectorySyncSource, createRAGEmailSyncSource, createRAGFileSyncStateStore, createRAGStaticEmailSyncClient, createRAGStorageSyncSource, createRAGSyncManager, createRAGSyncScheduler, createRAGUrlSyncSource } from './sync';
|
|
15
15
|
export type { RAGStreamProgress, RAGStreamProgressState } from './presentation';
|
|
16
16
|
export { createRAGCollection, ingestDocuments, ingestRAGDocuments, searchDocuments } from './collection';
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
import type { RAGAnswerGroundingCaseDifficultyHistory, RAGAnswerGroundingCaseDifficultyHistoryStore, RAGAnswerGroundingCaseDifficultyRun, RAGAnswerGroundingCaseDifficultyRunDiff, RAGAnswerGroundingEvaluationCase, RAGAnswerGroundingEvaluationCaseDifficultyEntry, RAGAnswerGroundingEvaluationCaseResult, RAGAnswerGroundingEvaluationHistory, RAGAnswerGroundingEvaluationLeaderboardEntry, RAGAnswerGroundingEvaluationHistoryStore, RAGAnswerGroundingEvaluationInput, RAGAnswerGroundingEvaluationResponse, RAGAnswerGroundingEvaluationRun, RAGAnswerGroundingEvaluationRunDiff, RAGCollection, RAGEvaluationCase, RAGEvaluationCaseTracePresentation, RAGEvaluationCaseTraceSnapshot, RAGEvaluationCaseResult, RAGEvaluationHistory, RAGEvaluationHistoryStore, RAGEvaluationInput, RAGEvaluationLeaderboardEntry, RAGEvaluationResponse, RAGEvaluationRunDiff, RAGLabelValueRow, RAGEvaluationSuite, RAGEvaluationSuiteRun, RAGRetrievalCandidate, RAGRetrievalComparison, RAGRetrievalComparisonEntry, RAGRetrievalTraceComparisonSummary, RAGRetrievalComparisonSummary, RAGRerankerCandidate, RAGRerankerComparison, RAGRerankerComparisonEntry, RAGRerankerComparisonSummary, RAGRerankerProviderLike } from '../../../types/ai';
|
|
1
|
+
import type { RAGAnswerGroundingCaseDifficultyHistory, RAGAnswerGroundingCaseDifficultyHistoryStore, RAGAnswerGroundingCaseDifficultyRun, RAGAnswerGroundingCaseDifficultyRunDiff, RAGAnswerGroundingEvaluationCase, RAGAnswerGroundingEvaluationCaseDifficultyEntry, RAGAnswerGroundingCaseSnapshotPresentation, RAGAnswerGroundingEvaluationCaseResult, RAGAnswerGroundingEvaluationHistory, RAGAnswerGroundingHistoryPresentation, RAGAnswerGroundingEvaluationLeaderboardEntry, RAGAnswerGroundingEvaluationHistoryStore, RAGAnswerGroundingEvaluationInput, RAGAnswerGroundingEvaluationResponse, RAGAnswerGroundingEvaluationRun, RAGAnswerGroundingEvaluationRunDiff, RAGCollection, RAGEvaluationCase, RAGEvaluationCaseTracePresentation, RAGEvaluationCaseTraceSnapshot, RAGEvaluationCaseResult, RAGEvaluationHistoryPresentation, RAGEvaluationHistory, RAGEvaluationHistoryStore, RAGEvaluationInput, RAGEvaluationLeaderboardEntry, RAGEvaluationResponse, RAGEvaluationRunDiff, RAGLabelValueRow, RAGEvaluationSuite, RAGEvaluationSuiteRun, RAGRetrievalCandidate, RAGRetrievalComparison, RAGRetrievalComparisonEntry, RAGRetrievalTraceComparisonSummary, RAGRetrievalComparisonSummary, RAGRerankerCandidate, RAGRerankerComparison, RAGRerankerComparisonEntry, RAGRerankerComparisonSummary, RAGRerankerProviderLike } from '../../../types/ai';
|
|
2
2
|
export declare const buildRAGEvaluationLeaderboard: (runs: RAGEvaluationSuiteRun[]) => RAGEvaluationLeaderboardEntry[];
|
|
3
3
|
export declare const buildRAGAnswerGroundingEvaluationLeaderboard: (runs: RAGAnswerGroundingEvaluationRun[]) => RAGAnswerGroundingEvaluationLeaderboardEntry[];
|
|
4
4
|
export declare const buildRAGAnswerGroundingCaseDifficultyLeaderboard: (entries: Array<{
|
|
@@ -13,6 +13,7 @@ export declare const buildRAGComparisonTraceSummaryRows: (entry: RAGRerankerComp
|
|
|
13
13
|
export declare const buildRAGComparisonTraceDiffRows: (entry: RAGRerankerComparisonEntry | RAGRetrievalComparisonEntry, leader?: RAGRerankerComparisonEntry | RAGRetrievalComparisonEntry) => RAGLabelValueRow[];
|
|
14
14
|
export declare const buildRAGEvaluationHistoryRows: (history?: RAGEvaluationHistory) => RAGLabelValueRow[];
|
|
15
15
|
export declare const buildRAGEvaluationCaseTracePresentations: (history?: RAGEvaluationHistory) => RAGEvaluationCaseTracePresentation[];
|
|
16
|
+
/**
 * Builds the presentation model for a retrieval-evaluation history.
 * `history` is optional; the bundled implementation shown in this diff returns
 * an object with `caseTraces`, `rows` and `summary`.
 */
export declare const buildRAGEvaluationHistoryPresentation: (history?: RAGEvaluationHistory) => RAGEvaluationHistoryPresentation;
|
|
16
17
|
export declare const buildRAGEvaluationRunDiff: ({ current, previous }: {
|
|
17
18
|
current: RAGEvaluationSuiteRun;
|
|
18
19
|
previous?: RAGEvaluationSuiteRun;
|
|
@@ -21,6 +22,9 @@ export declare const buildRAGAnswerGroundingEvaluationRunDiff: ({ current, previ
|
|
|
21
22
|
current: RAGAnswerGroundingEvaluationRun;
|
|
22
23
|
previous?: RAGAnswerGroundingEvaluationRun;
|
|
23
24
|
}) => RAGAnswerGroundingEvaluationRunDiff;
|
|
25
|
+
/**
 * Builds the list of case-snapshot presentations for an answer-grounding
 * evaluation history. `history` is optional.
 */
export declare const buildRAGAnswerGroundingCaseSnapshotPresentations: (history?: RAGAnswerGroundingEvaluationHistory) => RAGAnswerGroundingCaseSnapshotPresentation[];
|
|
26
|
+
/**
 * Builds label/value rows describing an answer-grounding evaluation history.
 * `history` is optional.
 */
export declare const buildRAGAnswerGroundingHistoryRows: (history?: RAGAnswerGroundingEvaluationHistory) => RAGLabelValueRow[];
|
|
27
|
+
/**
 * Builds the presentation model for an answer-grounding evaluation history.
 * `history` is optional; the bundled implementation shown in this diff returns
 * an object with `caseSnapshots`, `rows` and `summary`.
 */
export declare const buildRAGAnswerGroundingHistoryPresentation: (history?: RAGAnswerGroundingEvaluationHistory) => RAGAnswerGroundingHistoryPresentation;
|
|
24
28
|
export declare const createRAGFileEvaluationHistoryStore: (path: string) => RAGEvaluationHistoryStore;
|
|
25
29
|
export declare const createRAGFileAnswerGroundingEvaluationHistoryStore: (path: string) => RAGAnswerGroundingEvaluationHistoryStore;
|
|
26
30
|
export declare const createRAGFileAnswerGroundingCaseDifficultyHistoryStore: (path: string) => RAGAnswerGroundingCaseDifficultyHistoryStore;
|
package/dist/svelte/ai/index.js
CHANGED
|
@@ -2314,8 +2314,11 @@ var buildEvaluationCaseTraceSnapshots = ({
|
|
|
2314
2314
|
};
|
|
2315
2315
|
/**
 * Ranks an evaluation status so statuses can be compared numerically:
 * "pass" → 2, "partial" → 1, any other value → 0.
 */
var getStatusRank = (status) => {
  switch (status) {
    case "pass":
      return 2;
    case "partial":
      return 1;
    default:
      return 0;
  }
};
|
|
2316
2316
|
/**
 * Formats a numeric delta with an explicit leading "+" when the value is >= 0.
 *
 * @param {number} value - Delta to format.
 * @param {number} [decimals=0] - Fraction digits handed to `toFixed`.
 * @param {string} [suffix=""] - Text appended after the number.
 * @returns {string} The signed, fixed-precision text.
 */
var formatSignedDelta = (value, decimals = 0, suffix = "") => {
  // Negative values already get their "-" from toFixed, so only add "+".
  const sign = value >= 0 ? "+" : "";
  const magnitude = value.toFixed(decimals);
  return `${sign}${magnitude}${suffix}`;
};
|
|
2317
|
+
/**
 * Renders a number with one decimal place followed by "%".
 * The value is printed as given; no scaling is applied here.
 */
var formatEvaluationPassingRate = (value) => {
  const rounded = value.toFixed(1);
  return `${rounded}%`;
};
|
|
2317
2318
|
/**
 * Builds the one-line summary of an evaluation response:
 * passed/total cases, average F1 (3 decimals) and average latency in ms (1 decimal).
 */
var formatEvaluationSummary = (response) => {
  const { summary } = response;
  const segments = [
    `${summary.passedCases}/${response.totalCases} pass`,
    `f1 ${summary.averageF1.toFixed(3)}`,
    `latency ${summary.averageLatencyMs.toFixed(1)}ms`
  ];
  return segments.join(" \xB7 ");
};
|
|
2319
|
+
/**
 * Builds the one-line summary of an answer-grounding evaluation response from
 * its `summary`: pass count, grounded / partial / ungrounded counts, resolved
 * citation percentage and citation F1.
 */
var formatGroundingHistorySummaryValue = (response) => {
  const { summary } = response;
  // The resolved-citation rate is multiplied by 100 before being shown as a percentage.
  const resolvedPercent = (summary.averageResolvedCitationRate * 100).toFixed(1);
  const segments = [
    `${summary.passedCases}/${summary.totalCases} pass`,
    `grounded ${summary.groundedCases}`,
    `partial ${summary.partialCases}`,
    `ungrounded ${summary.ungroundedCases}`,
    `resolved citations ${resolvedPercent}%`,
    `citation f1 ${summary.averageCitationF1.toFixed(3)}`
  ];
  return segments.join(" \xB7 ");
};
|
|
2318
2320
|
/**
 * Joins the display names of the given cases with ", ".
 * Each case contributes its `label`, falling back to `caseId` when the label
 * is null or undefined. An empty list yields "none".
 */
var formatHistoryCaseLabels = (cases) => {
  if (cases.length > 0) {
    const names = cases.map(({ label, caseId }) => label ?? caseId);
    return names.join(", ");
  }
  return "none";
};
|
|
2321
|
+
/**
 * Lists grounding-history cases as a comma-separated string, using each
 * case's `label` when present and its `caseId` otherwise.
 * Returns "none" for an empty list.
 */
var formatGroundingHistoryCaseLabels = (cases) => {
  const hasCases = cases.length > 0;
  if (!hasCases) {
    return "none";
  }
  const displayNames = cases.map((item) => item.label ?? item.caseId);
  return displayNames.join(", ");
};
|
|
2319
2322
|
/**
 * Joins trace modes with " / "; an empty list is shown as "n/a".
 */
var formatTraceModes = (modes) => {
  if (modes.length > 0) {
    return modes.join(" / ");
  }
  return "n/a";
};
|
|
2320
2323
|
var formatTraceStageSummary = (stageCounts) => {
|
|
2321
2324
|
const topStages = Object.entries(stageCounts).sort((left, right) => right[1] - left[1]).slice(0, 3);
|
|
@@ -2538,6 +2541,11 @@ var buildRAGEvaluationCaseTracePresentations = (history) => {
|
|
|
2538
2541
|
};
|
|
2539
2542
|
});
|
|
2540
2543
|
};
|
|
2544
|
+
/**
 * Assembles the presentation object for a retrieval-evaluation history.
 *
 * @param history - Evaluation history; may be undefined.
 * @returns An object with `caseTraces` (from
 *   buildRAGEvaluationCaseTracePresentations), `rows` (from
 *   buildRAGEvaluationHistoryRows) and `summary` (the latest run's label, or a
 *   placeholder sentence when there is no latest run).
 */
var buildRAGEvaluationHistoryPresentation = (history) => {
  const caseTraces = buildRAGEvaluationCaseTracePresentations(history);
  const rows = buildRAGEvaluationHistoryRows(history);
  const latestRun = history?.latestRun;
  const summary = latestRun ? latestRun.label : "No persisted benchmark runs yet.";
  return { caseTraces, rows, summary };
};
|
|
2541
2549
|
var buildRAGEvaluationRunDiff = ({
|
|
2542
2550
|
current,
|
|
2543
2551
|
previous
|
|
@@ -2606,6 +2614,129 @@ var buildRAGAnswerGroundingEvaluationRunDiff = ({
|
|
|
2606
2614
|
unchangedCases
|
|
2607
2615
|
};
|
|
2608
2616
|
};
|
|
2617
|
+
/**
 * Turns the case snapshots of an answer-grounding history into display
 * records, one per snapshot.
 *
 * @param history - Answer-grounding evaluation history; may be undefined.
 * @returns An array of `{ answerChange, caseId, label, rows, summary }`
 *   objects. `label` falls back to the snapshot's `caseId`; `rows` is a fixed
 *   list of label/value pairs; `summary` is a one-line digest. Returns an
 *   empty array when there is no history or no snapshots.
 */
var buildRAGAnswerGroundingCaseSnapshotPresentations = (history) => {
  // Chain through caseSnapshots too, so a history object without that field
  // yields an empty list instead of a TypeError.
  // NOTE(review): presumably older history objects can lack caseSnapshots — confirm.
  const snapshots = history?.caseSnapshots;
  if (!snapshots?.length) {
    return [];
  }
  // Shared formatters for the repeated "list or none" / "text or n/a" rows.
  const formatList = (values) => values.length > 0 ? values.join(", ") : "none";
  const formatText = (text) => text && text.trim().length > 0 ? text : "n/a";
  return snapshots.map((entry) => {
    const label = entry.label ?? entry.caseId;
    const resolved = `${entry.resolvedCitationCount}/${entry.citationCount}`;
    return {
      answerChange: entry.answerChange,
      caseId: entry.caseId,
      label,
      rows: [
        { label: "Query", value: formatText(entry.query) },
        { label: "Answer change", value: entry.answerChange },
        { label: "Coverage", value: entry.coverage },
        { label: "Resolved citations", value: resolved },
        {
          label: "Resolved citation rate",
          value: entry.resolvedCitationRate.toFixed(3)
        },
        { label: "Citation F1", value: entry.citationF1.toFixed(3) },
        { label: "Reference count", value: String(entry.referenceCount) },
        { label: "Cited IDs", value: formatList(entry.citedIds) },
        { label: "Matched IDs", value: formatList(entry.matchedIds) },
        { label: "Missing IDs", value: formatList(entry.missingIds) },
        { label: "Extra IDs", value: formatList(entry.extraIds) },
        {
          label: "Unresolved refs",
          value: formatList(entry.ungroundedReferenceNumbers)
        },
        { label: "Answer", value: formatText(entry.answer) },
        { label: "Previous answer", value: formatText(entry.previousAnswer) }
      ],
      summary: `${entry.answerChange} \xB7 ${entry.coverage} \xB7 resolved ${resolved} \xB7 refs ${entry.referenceCount}`
    };
  });
};
|
|
2680
|
+
/**
 * Builds the label/value rows that describe an answer-grounding evaluation
 * history.
 *
 * @param history - Answer-grounding evaluation history; may be undefined.
 * @returns An array of `{ label, value }` rows. Without a latest run a single
 *   placeholder row is returned. Otherwise the rows cover: run count, latest
 *   run, previous run (if any), best leaderboard entry (if any), answer drift
 *   (if there are case snapshots) and either a hint to re-run (no diff yet) or
 *   the diff deltas plus improved / regressed case labels.
 */
var buildRAGAnswerGroundingHistoryRows = (history) => {
  if (!history?.latestRun) {
    return [{ label: "History", value: "No persisted provider runs yet." }];
  }
  const rows = [
    { label: "Runs recorded", value: String(history.runs.length) },
    {
      label: "Latest",
      value: `${history.latestRun.label} \xB7 ${formatGroundingHistorySummaryValue(history.latestRun.response)}`
    }
  ];
  if (history.previousRun) {
    rows.push({
      label: "Previous",
      value: `${history.previousRun.label} \xB7 ${formatGroundingHistorySummaryValue(history.previousRun.response)}`
    });
  }
  const leader = history.leaderboard[0];
  if (leader) {
    // The resolved-citation rate is scaled by 100 here, matching how the same
    // rate is rendered in the run summary and in the "Resolved citation delta"
    // row below; previously it was printed unscaled with a "%" suffix.
    // NOTE(review): assumes leaderboard entries carry the same 0-1 fraction as
    // the response summary — confirm against the leaderboard builder.
    rows.push({
      label: "Best recorded",
      value: `#${leader.rank} \xB7 ${leader.label} \xB7 passing ${formatEvaluationPassingRate(leader.passingRate)} \xB7 citation f1 ${leader.averageCitationF1.toFixed(3)} \xB7 resolved ${formatEvaluationPassingRate(leader.averageResolvedCitationRate * 100)}`
    });
  }
  if (history.caseSnapshots.length > 0) {
    const changedAnswers = history.caseSnapshots.filter((entry) => entry.answerChange === "changed").length;
    rows.push({
      label: "Answer drift",
      value: `${changedAnswers}/${history.caseSnapshots.length} changed`
    });
  }
  if (!history.diff) {
    rows.push({
      label: "History diff",
      value: "Run the provider comparison again to diff grounding regressions over time."
    });
    return rows;
  }
  const { summaryDelta } = history.diff;
  rows.push({
    label: "Passing delta",
    // passingRate deltas are printed as-is with a "%" suffix (no scaling).
    value: formatSignedDelta(summaryDelta.passingRate, 1, "%")
  }, {
    label: "Citation F1 delta",
    value: formatSignedDelta(summaryDelta.averageCitationF1, 3)
  }, {
    label: "Resolved citation delta",
    value: formatSignedDelta(summaryDelta.averageResolvedCitationRate * 100, 1, "%")
  }, {
    label: "Improved",
    value: formatGroundingHistoryCaseLabels(history.diff.improvedCases)
  }, {
    label: "Regressed",
    value: formatGroundingHistoryCaseLabels(history.diff.regressedCases)
  });
  return rows;
};
|
|
2735
|
+
/**
 * Assembles the presentation object for an answer-grounding history.
 *
 * @param history - Answer-grounding evaluation history; may be undefined.
 * @returns An object with `caseSnapshots` (from
 *   buildRAGAnswerGroundingCaseSnapshotPresentations), `rows` (from
 *   buildRAGAnswerGroundingHistoryRows) and `summary` (the latest run's label,
 *   or a placeholder sentence when there is no latest run).
 */
var buildRAGAnswerGroundingHistoryPresentation = (history) => {
  const caseSnapshots = buildRAGAnswerGroundingCaseSnapshotPresentations(history);
  const rows = buildRAGAnswerGroundingHistoryRows(history);
  const latestRun = history?.latestRun;
  const summary = latestRun ? latestRun.label : "No persisted provider runs yet.";
  return { caseSnapshots, rows, summary };
};
|
|
2609
2740
|
var createRAGFileEvaluationHistoryStore = (path) => ({
|
|
2610
2741
|
listRuns: async ({ limit, suiteId } = {}) => {
|
|
2611
2742
|
let parsed = [];
|
|
@@ -3843,5 +3974,5 @@ export {
|
|
|
3843
3974
|
createAIStream
|
|
3844
3975
|
};
|
|
3845
3976
|
|
|
3846
|
-
//# debugId=
|
|
3977
|
+
//# debugId=12110AF3399232C164756E2164756E21
|
|
3847
3978
|
//# sourceMappingURL=index.js.map
|