@fllf/agent-sdk 0.1.2 → 0.1.3
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/CHANGELOG.md +169 -0
- package/README.md +824 -198
- package/dist/agent/Agent.d.ts +16 -5
- package/dist/agent/Agent.d.ts.map +1 -1
- package/dist/agent/Agent.js +283 -2
- package/dist/agent/Agent.js.map +1 -1
- package/dist/agent/index.d.ts +1 -1
- package/dist/agent/index.d.ts.map +1 -1
- package/dist/agent/types.d.ts +27 -3
- package/dist/agent/types.d.ts.map +1 -1
- package/dist/config/config.d.ts +22 -3
- package/dist/config/config.d.ts.map +1 -1
- package/dist/config/config.js +194 -47
- package/dist/config/config.js.map +1 -1
- package/dist/config/index.d.ts +1 -1
- package/dist/config/index.d.ts.map +1 -1
- package/dist/errors.d.ts +74 -0
- package/dist/errors.d.ts.map +1 -0
- package/dist/errors.js +186 -0
- package/dist/errors.js.map +1 -0
- package/dist/executors/base-executor.d.ts +14 -0
- package/dist/executors/base-executor.d.ts.map +1 -0
- package/dist/executors/base-executor.js +31 -0
- package/dist/executors/base-executor.js.map +1 -0
- package/dist/executors/base.d.ts +36 -5
- package/dist/executors/base.d.ts.map +1 -1
- package/dist/executors/chat-request-builder.d.ts +10 -0
- package/dist/executors/chat-request-builder.d.ts.map +1 -0
- package/dist/executors/chat-request-builder.js +96 -0
- package/dist/executors/chat-request-builder.js.map +1 -0
- package/dist/executors/index.d.ts +4 -1
- package/dist/executors/index.d.ts.map +1 -1
- package/dist/executors/index.js +6 -1
- package/dist/executors/index.js.map +1 -1
- package/dist/executors/rag-executor.js +1 -1
- package/dist/executors/rag-executor.js.map +1 -1
- package/dist/executors/simple-chat-executor.d.ts +4 -2
- package/dist/executors/simple-chat-executor.d.ts.map +1 -1
- package/dist/executors/simple-chat-executor.js +59 -57
- package/dist/executors/simple-chat-executor.js.map +1 -1
- package/dist/executors/tool-calling-executor.d.ts +20 -2
- package/dist/executors/tool-calling-executor.d.ts.map +1 -1
- package/dist/executors/tool-calling-executor.js +189 -91
- package/dist/executors/tool-calling-executor.js.map +1 -1
- package/dist/history/base.d.ts +55 -2
- package/dist/history/base.d.ts.map +1 -1
- package/dist/history/base.js +49 -0
- package/dist/history/base.js.map +1 -1
- package/dist/history/compression.d.ts +49 -0
- package/dist/history/compression.d.ts.map +1 -0
- package/dist/history/compression.js +53 -0
- package/dist/history/compression.js.map +1 -0
- package/dist/history/context-window.d.ts +33 -0
- package/dist/history/context-window.d.ts.map +1 -0
- package/dist/history/context-window.js +68 -0
- package/dist/history/context-window.js.map +1 -0
- package/dist/history/in-memory.d.ts +6 -4
- package/dist/history/in-memory.d.ts.map +1 -1
- package/dist/history/in-memory.js +25 -39
- package/dist/history/in-memory.js.map +1 -1
- package/dist/history/index.d.ts +9 -2
- package/dist/history/index.d.ts.map +1 -1
- package/dist/history/index.js +18 -1
- package/dist/history/index.js.map +1 -1
- package/dist/history/postgres/index.d.ts +4 -0
- package/dist/history/postgres/index.d.ts.map +1 -0
- package/dist/history/postgres/index.js +20 -0
- package/dist/history/postgres/index.js.map +1 -0
- package/dist/history/postgres/postgres-message-history-store.d.ts +35 -0
- package/dist/history/postgres/postgres-message-history-store.d.ts.map +1 -0
- package/dist/history/postgres/postgres-message-history-store.js +195 -0
- package/dist/history/postgres/postgres-message-history-store.js.map +1 -0
- package/dist/history/postgres/schema.d.ts +18 -0
- package/dist/history/postgres/schema.d.ts.map +1 -0
- package/dist/history/postgres/schema.js +46 -0
- package/dist/history/postgres/schema.js.map +1 -0
- package/dist/history/postgres/sql.d.ts +29 -0
- package/dist/history/postgres/sql.d.ts.map +1 -0
- package/dist/history/postgres/sql.js +102 -0
- package/dist/history/postgres/sql.js.map +1 -0
- package/dist/history/postgres/types.d.ts +20 -0
- package/dist/history/postgres/types.d.ts.map +1 -0
- package/dist/history/postgres/types.js +3 -0
- package/dist/history/postgres/types.js.map +1 -0
- package/dist/history/tool-pairing.d.ts +11 -0
- package/dist/history/tool-pairing.d.ts.map +1 -0
- package/dist/history/tool-pairing.js +52 -0
- package/dist/history/tool-pairing.js.map +1 -0
- package/dist/index.d.ts +2 -0
- package/dist/index.d.ts.map +1 -1
- package/dist/index.js +2 -0
- package/dist/index.js.map +1 -1
- package/dist/llm/LLM.d.ts +1 -0
- package/dist/llm/LLM.d.ts.map +1 -1
- package/dist/llm/LLM.js +136 -26
- package/dist/llm/LLM.js.map +1 -1
- package/dist/llm/errors.d.ts +11 -1
- package/dist/llm/errors.d.ts.map +1 -1
- package/dist/llm/errors.js +50 -1
- package/dist/llm/errors.js.map +1 -1
- package/dist/llm/factory.d.ts +14 -2
- package/dist/llm/factory.d.ts.map +1 -1
- package/dist/llm/factory.js +48 -9
- package/dist/llm/factory.js.map +1 -1
- package/dist/llm/index.d.ts +8 -3
- package/dist/llm/index.d.ts.map +1 -1
- package/dist/llm/index.js +10 -1
- package/dist/llm/index.js.map +1 -1
- package/dist/llm/providers/anthropic.d.ts +14 -0
- package/dist/llm/providers/anthropic.d.ts.map +1 -0
- package/dist/llm/providers/anthropic.js +336 -0
- package/dist/llm/providers/anthropic.js.map +1 -0
- package/dist/llm/providers/openai-compatible.d.ts +7 -0
- package/dist/llm/providers/openai-compatible.d.ts.map +1 -1
- package/dist/llm/providers/openai-compatible.js +151 -47
- package/dist/llm/providers/openai-compatible.js.map +1 -1
- package/dist/llm/stream-accumulator.d.ts +17 -0
- package/dist/llm/stream-accumulator.d.ts.map +1 -0
- package/dist/llm/stream-accumulator.js +83 -0
- package/dist/llm/stream-accumulator.js.map +1 -0
- package/dist/llm/tool-arguments.d.ts +6 -0
- package/dist/llm/tool-arguments.d.ts.map +1 -0
- package/dist/llm/tool-arguments.js +20 -0
- package/dist/llm/tool-arguments.js.map +1 -0
- package/dist/llm/types.d.ts +76 -4
- package/dist/llm/types.d.ts.map +1 -1
- package/dist/messages/content.d.ts +36 -0
- package/dist/messages/content.d.ts.map +1 -0
- package/dist/messages/content.js +70 -0
- package/dist/messages/content.js.map +1 -0
- package/dist/messages/index.d.ts +4 -2
- package/dist/messages/index.d.ts.map +1 -1
- package/dist/messages/index.js +10 -1
- package/dist/messages/index.js.map +1 -1
- package/dist/messages/message.d.ts +11 -9
- package/dist/messages/message.d.ts.map +1 -1
- package/dist/messages/message.js +69 -4
- package/dist/messages/message.js.map +1 -1
- package/dist/messages/types.d.ts +12 -0
- package/dist/messages/types.d.ts.map +1 -1
- package/dist/observability/collecting-observer.d.ts +8 -0
- package/dist/observability/collecting-observer.d.ts.map +1 -0
- package/dist/observability/collecting-observer.js +15 -0
- package/dist/observability/collecting-observer.js.map +1 -0
- package/dist/observability/index.d.ts +1 -0
- package/dist/observability/index.d.ts.map +1 -1
- package/dist/observability/index.js +3 -1
- package/dist/observability/index.js.map +1 -1
- package/dist/observability/observer.d.ts.map +1 -1
- package/dist/observability/observer.js +14 -1
- package/dist/observability/observer.js.map +1 -1
- package/dist/observability/types.d.ts +16 -1
- package/dist/observability/types.d.ts.map +1 -1
- package/dist/rag/chunking/auto-chunker.d.ts +7 -0
- package/dist/rag/chunking/auto-chunker.d.ts.map +1 -1
- package/dist/rag/chunking/auto-chunker.js +13 -0
- package/dist/rag/chunking/auto-chunker.js.map +1 -1
- package/dist/rag/chunking/chunker.d.ts.map +1 -1
- package/dist/rag/chunking/chunker.js +29 -5
- package/dist/rag/chunking/chunker.js.map +1 -1
- package/dist/rag/chunking/index.d.ts +2 -0
- package/dist/rag/chunking/index.d.ts.map +1 -1
- package/dist/rag/chunking/index.js +2 -0
- package/dist/rag/chunking/index.js.map +1 -1
- package/dist/rag/chunking/markdown-chunker.d.ts.map +1 -1
- package/dist/rag/chunking/markdown-chunker.js.map +1 -1
- package/dist/rag/chunking/qa-pair-chunker.d.ts +23 -0
- package/dist/rag/chunking/qa-pair-chunker.d.ts.map +1 -0
- package/dist/rag/chunking/qa-pair-chunker.js +162 -0
- package/dist/rag/chunking/qa-pair-chunker.js.map +1 -0
- package/dist/rag/chunking/semantic-chunker.d.ts +19 -0
- package/dist/rag/chunking/semantic-chunker.d.ts.map +1 -0
- package/dist/rag/chunking/semantic-chunker.js +291 -0
- package/dist/rag/chunking/semantic-chunker.js.map +1 -0
- package/dist/rag/embeddings/embedder.d.ts.map +1 -1
- package/dist/rag/embeddings/embedder.js +6 -0
- package/dist/rag/embeddings/embedder.js.map +1 -1
- package/dist/rag/generation/context-builder.d.ts +7 -0
- package/dist/rag/generation/context-builder.d.ts.map +1 -1
- package/dist/rag/generation/context-builder.js +4 -1
- package/dist/rag/generation/context-builder.js.map +1 -1
- package/dist/rag/ingestion/metadata.d.ts +6 -1
- package/dist/rag/ingestion/metadata.d.ts.map +1 -1
- package/dist/rag/ingestion/metadata.js +6 -2
- package/dist/rag/ingestion/metadata.js.map +1 -1
- package/dist/rag/pipeline.d.ts.map +1 -1
- package/dist/rag/pipeline.js +34 -11
- package/dist/rag/pipeline.js.map +1 -1
- package/dist/rag/retrieval/index.d.ts +1 -0
- package/dist/rag/retrieval/index.d.ts.map +1 -1
- package/dist/rag/retrieval/index.js +1 -0
- package/dist/rag/retrieval/index.js.map +1 -1
- package/dist/rag/retrieval/parent-child-expanding-retriever.d.ts +31 -0
- package/dist/rag/retrieval/parent-child-expanding-retriever.d.ts.map +1 -0
- package/dist/rag/retrieval/parent-child-expanding-retriever.js +194 -0
- package/dist/rag/retrieval/parent-child-expanding-retriever.js.map +1 -0
- package/dist/rag/stores/in-memory-keyword-store.d.ts.map +1 -1
- package/dist/rag/stores/in-memory-keyword-store.js +3 -8
- package/dist/rag/stores/in-memory-keyword-store.js.map +1 -1
- package/dist/rag/stores/keyword-tokenizer.d.ts +4 -0
- package/dist/rag/stores/keyword-tokenizer.d.ts.map +1 -0
- package/dist/rag/stores/keyword-tokenizer.js +113 -0
- package/dist/rag/stores/keyword-tokenizer.js.map +1 -0
- package/dist/rag/stores/postgres/pg-vector-store.d.ts.map +1 -1
- package/dist/rag/stores/postgres/pg-vector-store.js +21 -8
- package/dist/rag/stores/postgres/pg-vector-store.js.map +1 -1
- package/dist/rag/stores/postgres/postgres-document-store.d.ts.map +1 -1
- package/dist/rag/stores/postgres/postgres-document-store.js +26 -13
- package/dist/rag/stores/postgres/postgres-document-store.js.map +1 -1
- package/dist/rag/stores/postgres/postgres-keyword-store.d.ts.map +1 -1
- package/dist/rag/stores/postgres/postgres-keyword-store.js +43 -43
- package/dist/rag/stores/postgres/postgres-keyword-store.js.map +1 -1
- package/dist/rag/stores/postgres/sql.d.ts +22 -0
- package/dist/rag/stores/postgres/sql.d.ts.map +1 -1
- package/dist/rag/stores/postgres/sql.js +42 -0
- package/dist/rag/stores/postgres/sql.js.map +1 -1
- package/dist/rag/stores/types.d.ts +5 -0
- package/dist/rag/stores/types.d.ts.map +1 -1
- package/dist/rag/types.d.ts +6 -0
- package/dist/rag/types.d.ts.map +1 -1
- package/dist/testing/agent.d.ts +11 -0
- package/dist/testing/agent.d.ts.map +1 -0
- package/dist/testing/agent.js +45 -0
- package/dist/testing/agent.js.map +1 -0
- package/dist/testing/history-contract.d.ts +12 -0
- package/dist/testing/history-contract.d.ts.map +1 -0
- package/dist/testing/history-contract.js +111 -0
- package/dist/testing/history-contract.js.map +1 -0
- package/dist/testing/index.d.ts +11 -0
- package/dist/testing/index.d.ts.map +1 -0
- package/dist/testing/index.js +16 -0
- package/dist/testing/index.js.map +1 -0
- package/dist/testing/models.d.ts +34 -0
- package/dist/testing/models.d.ts.map +1 -0
- package/dist/testing/models.js +74 -0
- package/dist/testing/models.js.map +1 -0
- package/dist/testing/tool-schema.d.ts +6 -0
- package/dist/testing/tool-schema.d.ts.map +1 -0
- package/dist/testing/tool-schema.js +29 -0
- package/dist/testing/tool-schema.js.map +1 -0
- package/dist/testing/tools.d.ts +21 -0
- package/dist/testing/tools.d.ts.map +1 -0
- package/dist/testing/tools.js +43 -0
- package/dist/testing/tools.js.map +1 -0
- package/dist/tools/base.d.ts +38 -7
- package/dist/tools/base.d.ts.map +1 -1
- package/dist/tools/base.js +238 -11
- package/dist/tools/base.js.map +1 -1
- package/dist/tools/builtin/advancedSearchTool.d.ts.map +1 -1
- package/dist/tools/builtin/advancedSearchTool.js +30 -4
- package/dist/tools/builtin/advancedSearchTool.js.map +1 -1
- package/dist/tools/builtin/ragSearchTool.d.ts +6 -3
- package/dist/tools/builtin/ragSearchTool.d.ts.map +1 -1
- package/dist/tools/builtin/ragSearchTool.js +8 -6
- package/dist/tools/builtin/ragSearchTool.js.map +1 -1
- package/dist/tools/executor.d.ts +30 -2
- package/dist/tools/executor.d.ts.map +1 -1
- package/dist/tools/executor.js +83 -15
- package/dist/tools/executor.js.map +1 -1
- package/dist/tools/index.d.ts +3 -1
- package/dist/tools/index.d.ts.map +1 -1
- package/dist/tools/registry.d.ts +15 -3
- package/dist/tools/registry.d.ts.map +1 -1
- package/dist/tools/registry.js +21 -2
- package/dist/tools/registry.js.map +1 -1
- package/package.json +58 -4
|
@@ -0,0 +1,291 @@
|
|
|
1
|
+
"use strict";
|
|
2
|
+
Object.defineProperty(exports, "__esModule", { value: true });
|
|
3
|
+
exports.SemanticChunker = void 0;
|
|
4
|
+
const embeddings_1 = require("../embeddings");
|
|
5
|
+
const chunker_1 = require("./chunker");
|
|
6
|
+
const DEFAULT_SIMILARITY_THRESHOLD = 0.72;
|
|
7
|
+
/**
 * Characters that always terminate a sentence, regardless of what follows.
 * The ASCII period is intentionally absent; it is handled separately because
 * it also appears inside numbers, abbreviations and identifiers.
 *
 * NOTE(review): the listing this file was recovered from showed '!' and '?'
 * twice, which looks like the fullwidth forms having been width-normalised.
 * They are written as escapes here so they survive such normalisation -
 * confirm against the TypeScript source.
 */
const SENTENCE_ENDINGS = new Set([
    '\u3002', // ideographic full stop
    '!',
    '?',
    '\uFF01', // fullwidth exclamation mark
    '\uFF1F', // fullwidth question mark
]);
|
|
8
|
+
/**
 * Chunker that splits a document into sentence-level units, embeds every
 * unit, and starts a new chunk where the similarity between neighbouring
 * units drops below a threshold (or where the chunk would grow too long).
 */
class SemanticChunker {
    embedder;
    similarityThreshold;
    maxChunkLength;
    minChunkLength;
    overlapLength;
    /**
     * @param options - Must carry `embedder`; `similarityThreshold`,
     *   `maxChunkLength`, `minChunkLength` and `overlapLength` are optional
     *   and are normalised / defaulted here.
     */
    constructor(options) {
        this.embedder = options.embedder;
        this.similarityThreshold = normalizeSimilarityThreshold(options.similarityThreshold, DEFAULT_SIMILARITY_THRESHOLD);
        const maxLength = toPositiveInteger(options.maxChunkLength, chunker_1.DEFAULT_MAX_CHUNK_LENGTH);
        this.maxChunkLength = maxLength;
        // The minimum can never exceed the maximum.
        const requestedMinimum = toPositiveInteger(options.minChunkLength, chunker_1.DEFAULT_MIN_CHUNK_LENGTH);
        this.minChunkLength = Math.min(requestedMinimum, maxLength);
        // The overlap is capped strictly below the maximum chunk length.
        const requestedOverlap = normalizeNonNegativeInteger(options.overlapLength, 0);
        const overlapCeiling = Math.max(maxLength - 1, 0);
        this.overlapLength = Math.min(requestedOverlap, overlapCeiling);
    }
    /**
     * Splits one document into chunks.
     *
     * @param document - Object whose `content` string is chunked; it is also
     *   forwarded unchanged to `createChunk`.
     * @returns A promise of the array of values produced by `createChunk`,
     *   one per semantic group (empty when the document yields no units).
     */
    async chunk(document) {
        const units = createSemanticUnits(document.content, this.maxChunkLength);
        if (units.length === 0) {
            return [];
        }
        const unitTexts = units.map((unit) => unit.content);
        const embeddings = await this.embedder.embedDocuments(unitTexts);
        // Sanity-check the embedder output through the shared embedding helpers
        // before any similarity is computed from it.
        (0, embeddings_1.assertEmbeddingBatchSize)(embeddings, units.length);
        embeddings.forEach((embedding, index) => {
            (0, embeddings_1.assertEmbeddingDimensions)(embedding, this.embedder.dimensions, `semantic unit ${index} embedding`);
        });
        const groupingOptions = {
            maxChunkLength: this.maxChunkLength,
            minChunkLength: this.minChunkLength,
            overlapLength: this.overlapLength,
            similarityThreshold: this.similarityThreshold,
        };
        const groups = createSemanticGroups(units, embeddings, groupingOptions);
        return groups.map((group, index) => {
            // A chunk spans from the first unit's start to the last unit's end.
            const firstUnit = group.units[0];
            const lastUnit = group.units.at(-1);
            const startOffset = firstUnit?.startOffset ?? 0;
            const endOffset = lastUnit?.endOffset ?? startOffset;
            const extra = createSemanticExtra({
                embedder: this.embedder,
                group,
                similarityThreshold: this.similarityThreshold,
            });
            return (0, chunker_1.createChunk)({
                document,
                content: document.content.slice(startOffset, endOffset),
                kind: 'text',
                chunkIndex: index,
                startOffset,
                endOffset,
                extra,
            });
        });
    }
    /**
     * Chunks several documents by delegating to the shared
     * `chunkManyDocuments` helper with this chunker instance.
     *
     * @param documents - Documents to chunk.
     */
    async chunkMany(documents) {
        const chunks = await (0, chunker_1.chunkManyDocuments)(this, documents);
        return chunks;
    }
}
|
|
59
|
+
exports.SemanticChunker = SemanticChunker;
|
|
60
|
+
/**
 * Breaks text into the units that get embedded individually.
 *
 * Paragraphs that fit within `maxChunkLength` are split into sentences (the
 * paragraph itself is used when no sentence is produced). Longer paragraphs
 * are cut by `splitTextSegments`, with the segment offsets shifted from
 * paragraph-relative to text-relative.
 *
 * @param text - Full document text.
 * @param maxChunkLength - Upper bound used to decide how a paragraph is split.
 * @returns Array of `{ content, startOffset, endOffset }` units in text order.
 */
function createSemanticUnits(text, maxChunkLength) {
    const collected = [];
    for (const paragraph of splitParagraphs(text)) {
        const isOversized = paragraph.content.length > maxChunkLength;
        if (isOversized) {
            const segments = (0, chunker_1.splitTextSegments)(paragraph.content, {
                maxChunkLength,
                minChunkLength: Math.min(chunker_1.DEFAULT_MIN_CHUNK_LENGTH, maxChunkLength),
                overlapLength: 0,
            });
            for (const segment of segments) {
                const shifted = {
                    content: segment.content,
                    startOffset: paragraph.startOffset + segment.startOffset,
                    endOffset: paragraph.startOffset + segment.endOffset,
                };
                collected.push(shifted);
            }
            continue;
        }
        const sentences = splitSentences(paragraph.content, paragraph.startOffset);
        if (sentences.length > 0) {
            collected.push(...sentences);
        }
        else {
            collected.push(paragraph);
        }
    }
    return collected;
}
|
|
82
|
+
/**
 * Splits text into paragraphs separated by blank lines.
 *
 * A separator is a newline, optional whitespace, and another newline. Each
 * paragraph is trimmed and reported with offsets into the original `text`;
 * whitespace-only ranges are skipped.
 *
 * Splitting on the separator (instead of matching paragraph bodies with a
 * lookahead) keeps the last paragraph when the text ends in a newline or
 * spaces, and still splits when a line before the blank line ends in
 * spaces or a carriage return.
 *
 * @param {string} text - Text to split.
 * @returns {{content: string, startOffset: number, endOffset: number}[]}
 *   Paragraphs in document order; `text.slice(startOffset, endOffset)`
 *   equals `content`.
 */
function splitParagraphs(text) {
    const paragraphs = [];
    // Trims the half-open range [rangeStart, rangeEnd) and records it if non-empty.
    const appendParagraph = (rangeStart, rangeEnd) => {
        const raw = text.slice(rangeStart, rangeEnd);
        const content = raw.trim();
        if (content.length === 0) {
            return;
        }
        const startOffset = rangeStart + (raw.length - raw.trimStart().length);
        paragraphs.push({
            content,
            startOffset,
            endOffset: startOffset + content.length,
        });
    };
    let cursor = 0;
    for (const separator of text.matchAll(/\n\s*\n/g)) {
        const separatorStart = separator.index ?? cursor;
        appendParagraph(cursor, separatorStart);
        cursor = separatorStart + separator[0].length;
    }
    // Whatever follows the last separator is the final paragraph.
    appendParagraph(cursor, text.length);
    return paragraphs;
}
|
|
100
|
+
/**
 * Splits a paragraph into sentence units.
 *
 * A sentence ends at a character accepted by `isSentenceEnding`. Any
 * sentence-ending characters that follow directly (for example "?!" or
 * "!!!") are kept with that sentence, so a run of terminators never
 * becomes a unit made only of punctuation. Text after the last terminator
 * becomes a final unit.
 *
 * @param {string} paragraph - Paragraph text.
 * @param {number} paragraphStartOffset - Offset of the paragraph within the
 *   document; added to every unit offset.
 * @returns {{content: string, startOffset: number, endOffset: number}[]}
 *   Sentence units in order, trimmed of surrounding whitespace.
 */
function splitSentences(paragraph, paragraphStartOffset) {
    const units = [];
    let start = 0;
    let index = 0;
    while (index < paragraph.length) {
        if (!isSentenceEnding(paragraph, index, paragraph[index])) {
            index += 1;
            continue;
        }
        let end = index + 1;
        // Absorb the rest of a terminator run into the current sentence.
        while (end < paragraph.length && SENTENCE_ENDINGS.has(paragraph[end])) {
            end += 1;
        }
        appendUnit(units, paragraph, paragraphStartOffset, start, end);
        start = skipWhitespace(paragraph, end);
        index = end;
    }
    appendUnit(units, paragraph, paragraphStartOffset, start, paragraph.length);
    return units;
}
|
|
115
|
+
/**
 * Appends the whitespace-trimmed slice `text[start, end)` to `units`,
 * unless trimming leaves nothing.
 *
 * @param units - Array that receives the new unit (mutated in place).
 * @param text - Text the range refers to.
 * @param baseOffset - Added to the trimmed positions to form the unit offsets.
 * @param start - Inclusive start of the range within `text`.
 * @param end - Exclusive end of the range within `text`.
 */
function appendUnit(units, text, baseOffset, start, end) {
    const { start: from, end: to } = trimRange(text, start, end);
    const nothingLeft = from >= to;
    if (nothingLeft) {
        return;
    }
    const unit = {
        content: text.slice(from, to),
        startOffset: baseOffset + from,
        endOffset: baseOffset + to,
    };
    units.push(unit);
}
|
|
126
|
+
/**
 * Walks the units in order and partitions them into groups.
 *
 * Before a unit is added, the open group is closed when it already spans at
 * least `minChunkLength` and either
 *  - the similarity between the previous and current unit embeddings is
 *    below `similarityThreshold`, or
 *  - the span from the group's first unit to the current unit would exceed
 *    `maxChunkLength`.
 * The next group is seeded with overlap units taken from the closed one and
 * remembers the similarity measured at the break.
 *
 * @param units - Units with `startOffset` / `endOffset`.
 * @param embeddings - Embedding per unit, index-aligned with `units`.
 * @param options - `{ maxChunkLength, minChunkLength, overlapLength, similarityThreshold }`.
 * @returns Array of groups as produced by `createGroup`.
 */
function createSemanticGroups(units, embeddings, options) {
    const finished = [];
    let open = [];
    let openedAtSimilarity;
    for (let position = 0; position < units.length; position += 1) {
        const unit = units[position];
        const before = position > 0 ? embeddings[position - 1] : undefined;
        const here = embeddings[position];
        let similarity;
        if (before !== undefined && here !== undefined) {
            similarity = cosineSimilarity(before, here);
        }
        if (open.length > 0) {
            const longEnough = getGroupLength(open) >= options.minChunkLength;
            const topicShift = similarity !== undefined && similarity < options.similarityThreshold;
            const wouldOverflow = getRangeLength(open[0], unit) > options.maxChunkLength;
            if (longEnough && (topicShift || wouldOverflow)) {
                finished.push(createGroup(open, openedAtSimilarity));
                open = createOverlapUnits(open, options.overlapLength, unit, options.maxChunkLength);
                openedAtSimilarity = similarity;
            }
        }
        open.push(unit);
    }
    // Flush whatever is still open after the last unit.
    if (open.length > 0) {
        finished.push(createGroup(open, openedAtSimilarity));
    }
    return finished;
}
|
|
154
|
+
/**
 * Builds a group record from a list of units.
 *
 * @param units - Units belonging to the group; copied so later changes to
 *   the caller's array do not affect the group.
 * @param breakSimilarity - Similarity measured at the break that opened this
 *   group; the property is omitted entirely when this is `undefined`.
 * @returns `{ units }` or `{ units, breakSimilarity }`.
 */
function createGroup(units, breakSimilarity) {
    const members = Array.from(units);
    if (breakSimilarity === undefined) {
        return { units: members };
    }
    return { units: members, breakSimilarity };
}
|
|
163
|
+
/**
 * Picks trailing units of a closed group to repeat at the start of the next.
 *
 * Units are taken from the end backwards and kept while
 *  - the span they cover stays within `overlapLength`, and
 *  - the span from the earliest kept unit to `nextUnit` stays within
 *    `maxChunkLength`.
 *
 * @param units - Units of the group that was just closed.
 * @param overlapLength - Maximum span of the overlap; `<= 0` disables it.
 * @param nextUnit - Unit that will follow the overlap in the new group.
 * @param maxChunkLength - Maximum span allowed for overlap plus `nextUnit`.
 * @returns Overlap units in document order (possibly empty).
 */
function createOverlapUnits(units, overlapLength, nextUnit, maxChunkLength) {
    const overlap = [];
    if (overlapLength <= 0) {
        return overlap;
    }
    let cursor = units.length;
    while (cursor > 0) {
        cursor -= 1;
        const candidate = units[cursor];
        if (candidate === undefined) {
            continue;
        }
        const widened = [candidate, ...overlap];
        const overBudget = getGroupLength(widened) > overlapLength;
        if (overBudget || getRangeLength(candidate, nextUnit) > maxChunkLength) {
            break;
        }
        overlap.unshift(candidate);
    }
    return overlap;
}
|
|
184
|
+
/**
 * Assembles the `extra` metadata attached to a semantic chunk.
 *
 * @param input - `{ embedder, group, similarityThreshold }`; reads
 *   `embedder.model`, `group.units.length` and `group.breakSimilarity`.
 * @returns Metadata object; `breakSimilarity` is present only when the
 *   group carries one.
 */
function createSemanticExtra(input) {
    const { embedder, group, similarityThreshold } = input;
    const metadata = {
        strategy: 'semantic',
        experimental: true,
        embeddingModel: embedder.model,
        similarityThreshold,
        unitCount: group.units.length,
    };
    const { breakSimilarity } = group;
    return breakSimilarity === undefined
        ? metadata
        : { ...metadata, breakSimilarity };
}
|
|
197
|
+
/**
 * Cosine similarity of two numeric vectors.
 *
 * Missing components are treated as 0, and the loop covers the longer of
 * the two vectors so that the result does not depend on argument order
 * when the lengths differ.
 *
 * @param {ArrayLike<number>} left - First vector.
 * @param {ArrayLike<number>} right - Second vector.
 * @returns {number} `dot / (|left| * |right|)`, or 0 when either vector has
 *   zero magnitude.
 */
function cosineSimilarity(left, right) {
    const dimensions = Math.max(left.length, right.length);
    let dot = 0;
    let leftMagnitude = 0;
    let rightMagnitude = 0;
    for (let index = 0; index < dimensions; index += 1) {
        const leftValue = left[index] ?? 0;
        const rightValue = right[index] ?? 0;
        dot += leftValue * rightValue;
        leftMagnitude += leftValue * leftValue;
        rightMagnitude += rightValue * rightValue;
    }
    // A zero vector has no direction; report "no similarity" instead of NaN.
    if (leftMagnitude === 0 || rightMagnitude === 0) {
        return 0;
    }
    return dot / (Math.sqrt(leftMagnitude) * Math.sqrt(rightMagnitude));
}
|
|
213
|
+
/**
 * Span covered by a list of units, from the start of the first to the end
 * of the last.
 *
 * @param units - Units in document order.
 * @returns The span length, or 0 when the first or last entry is missing.
 */
function getGroupLength(units) {
    const head = units[0];
    const tail = units.at(-1);
    return head !== undefined && tail !== undefined
        ? getRangeLength(head, tail)
        : 0;
}
|
|
221
|
+
/**
 * Distance from the start of `first` to the end of `last`.
 *
 * @param first - Unit providing `startOffset`; may be `undefined`.
 * @param last - Unit providing `endOffset` (and `content` for the fallback).
 * @returns `last.endOffset - first.startOffset`, or the length of
 *   `last.content` when `first` is `undefined`.
 */
function getRangeLength(first, last) {
    if (first !== undefined) {
        return last.endOffset - first.startOffset;
    }
    return last.content.length;
}
|
|
224
|
+
/**
 * Decides whether the character at `index` terminates a sentence.
 *
 * Characters listed in `SENTENCE_ENDINGS` always do. An ASCII period does
 * only when it is the last character of the text or is followed by
 * whitespace; a period between two ASCII letters/digits never does.
 *
 * @param text - Text being scanned.
 * @param index - Position of `character` within `text`.
 * @param character - The character at `index`; `undefined` yields `false`.
 * @returns `true` when a sentence ends at `index`.
 */
function isSentenceEnding(text, index, character) {
    if (character === undefined) {
        return false;
    }
    const listedTerminator = SENTENCE_ENDINGS.has(character);
    if (listedTerminator || character !== '.') {
        return listedTerminator;
    }
    const before = text[index - 1];
    const after = text[index + 1];
    // Period inside a token such as "3.14" or "example.com". The check below
    // would reject these as well, since an alphanumeric is not whitespace.
    const insideToken = isAsciiAlphanumeric(before) && isAsciiAlphanumeric(after);
    if (insideToken) {
        return false;
    }
    if (after === undefined) {
        return true;
    }
    return /\s/.test(after);
}
|
|
241
|
+
/**
 * Tests whether a value contains an ASCII letter or digit.
 *
 * @param value - String to test (callers in this file pass a single
 *   character), or `undefined`.
 * @returns `false` for `undefined`; otherwise whether `[A-Za-z0-9]` matches.
 */
function isAsciiAlphanumeric(value) {
    if (value === undefined) {
        return false;
    }
    return /[A-Za-z0-9]/.test(value);
}
|
|
244
|
+
/**
 * Counts the whitespace characters at the start of a string.
 *
 * @param text - String to inspect.
 * @returns Length of the leading whitespace run (0 when there is none).
 */
function countLeadingWhitespace(text) {
    const [prefix = ''] = text.match(/^\s*/) ?? [];
    return prefix.length;
}
|
|
248
|
+
/**
 * Counts the whitespace characters at the end of a string.
 *
 * @param text - String to inspect.
 * @returns Length of the trailing whitespace run (0 when there is none).
 */
function countTrailingWhitespace(text) {
    const [suffix = ''] = text.match(/\s*$/) ?? [];
    return suffix.length;
}
|
|
252
|
+
/**
 * Advances past whitespace starting at `start`.
 *
 * @param text - Text to scan.
 * @param start - Position to begin at.
 * @returns Index of the first non-whitespace character at or after `start`,
 *   `text.length` when only whitespace remains, or `start` itself when it
 *   is already at or beyond the end of the text.
 */
function skipWhitespace(text, start) {
    let position = start;
    for (; position < text.length; position += 1) {
        const isBlank = /\s/.test(text[position] ?? '');
        if (!isBlank) {
            break;
        }
    }
    return position;
}
|
|
259
|
+
/**
 * Shrinks the half-open range `[start, end)` so that it neither begins nor
 * ends on whitespace.
 *
 * @param text - Text the range refers to.
 * @param start - Inclusive start position.
 * @param end - Exclusive end position.
 * @returns `{ start, end }` of the trimmed range; the two are equal when the
 *   range holds only whitespace.
 */
function trimRange(text, start, end) {
    const isBlankAt = (position) => /\s/.test(text[position] ?? '');
    let lower = start;
    while (lower < end && isBlankAt(lower)) {
        lower += 1;
    }
    let upper = end;
    while (upper > lower && isBlankAt(upper - 1)) {
        upper -= 1;
    }
    return { start: lower, end: upper };
}
|
|
273
|
+
/**
 * Normalises a user-supplied similarity threshold.
 *
 * @param value - Requested threshold; may be `undefined`.
 * @param fallback - Returned when `value` is `undefined` or not a finite number.
 * @returns `value` clamped to the range [-1, 1], or `fallback`.
 */
function normalizeSimilarityThreshold(value, fallback) {
    const usable = value !== undefined && Number.isFinite(value);
    if (!usable) {
        return fallback;
    }
    const cappedAbove = Math.min(1, value);
    return Math.max(-1, cappedAbove);
}
|
|
279
|
+
/**
 * Coerces an optional numeric setting to a positive integer.
 *
 * The value is floored before the positivity check, so fractional inputs
 * between 0 and 1 fall back instead of producing 0.
 *
 * @param {number | undefined} value - Requested value.
 * @param {number} fallback - Returned when `value` is `undefined`, not a
 *   finite number, or floors to less than 1.
 * @returns {number} `Math.floor(value)` when that is at least 1, otherwise
 *   `fallback`.
 */
function toPositiveInteger(value, fallback) {
    if (value === undefined || !Number.isFinite(value)) {
        return fallback;
    }
    const floored = Math.floor(value);
    return floored >= 1 ? floored : fallback;
}
|
|
285
|
+
/**
 * Coerces an optional numeric setting to a non-negative integer.
 *
 * @param value - Requested value; may be `undefined`.
 * @param fallback - Returned when `value` is `undefined`, not a finite
 *   number, or negative.
 * @returns `Math.floor(value)` for acceptable input, otherwise `fallback`.
 */
function normalizeNonNegativeInteger(value, fallback) {
    const rejected = value === undefined || !Number.isFinite(value) || value < 0;
    return rejected ? fallback : Math.floor(value);
}
|
|
291
|
+
//# sourceMappingURL=semantic-chunker.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"semantic-chunker.js","sourceRoot":"","sources":["../../../src/rag/chunking/semantic-chunker.ts"],"names":[],"mappings":";;;AACA,8CAGuB;AAKvB,uCAMmB;AAMnB,MAAM,4BAA4B,GAAG,IAAI,CAAC;AAC1C,MAAM,gBAAgB,GAAG,IAAI,GAAG,CAAC,CAAC,GAAG,EAAE,GAAG,EAAE,GAAG,EAAE,GAAG,EAAE,GAAG,CAAC,CAAC,CAAC;AAmB5D,MAAa,eAAe;IACP,QAAQ,CAAW;IACnB,mBAAmB,CAAS;IAC5B,cAAc,CAAS;IACvB,cAAc,CAAS;IACvB,aAAa,CAAS;IAEvC,YAAY,OAA+B;QACvC,IAAI,CAAC,QAAQ,GAAG,OAAO,CAAC,QAAQ,CAAC;QACjC,IAAI,CAAC,mBAAmB,GAAG,4BAA4B,CACnD,OAAO,CAAC,mBAAmB,EAC3B,4BAA4B,CAC/B,CAAC;QACF,IAAI,CAAC,cAAc,GAAG,iBAAiB,CACnC,OAAO,CAAC,cAAc,EACtB,kCAAwB,CAC3B,CAAC;QACF,IAAI,CAAC,cAAc,GAAG,IAAI,CAAC,GAAG,CAC1B,iBAAiB,CAAC,OAAO,CAAC,cAAc,EAAE,kCAAwB,CAAC,EACnE,IAAI,CAAC,cAAc,CACtB,CAAC;QACF,IAAI,CAAC,aAAa,GAAG,IAAI,CAAC,GAAG,CACzB,2BAA2B,CAAC,OAAO,CAAC,aAAa,EAAE,CAAC,CAAC,EACrD,IAAI,CAAC,GAAG,CAAC,IAAI,CAAC,cAAc,GAAG,CAAC,EAAE,CAAC,CAAC,CACvC,CAAC;IACN,CAAC;IAED,KAAK,CAAC,KAAK,CAAC,QAAqB;QAC7B,MAAM,KAAK,GAAG,mBAAmB,CAAC,QAAQ,CAAC,OAAO,EAAE,IAAI,CAAC,cAAc,CAAC,CAAC;QACzE,IAAI,KAAK,CAAC,MAAM,KAAK,CAAC,EAAE,CAAC;YACrB,OAAO,EAAE,CAAC;QACd,CAAC;QAED,MAAM,UAAU,GAAG,MAAM,IAAI,CAAC,QAAQ,CAAC,cAAc,CAAC,KAAK,CAAC,GAAG,CAAC,CAAC,IAAI,EAAE,EAAE,CAAC,IAAI,CAAC,OAAO,CAAC,CAAC,CAAC;QACzF,IAAA,qCAAwB,EAAC,UAAU,EAAE,KAAK,CAAC,MAAM,CAAC,CAAC;QACnD,UAAU,CAAC,OAAO,CAAC,CAAC,SAAS,EAAE,KAAK,EAAE,EAAE;YACpC,IAAA,sCAAyB,EACrB,SAAS,EACT,IAAI,CAAC,QAAQ,CAAC,UAAU,EACxB,iBAAiB,KAAK,YAAY,CACrC,CAAC;QACN,CAAC,CAAC,CAAC;QAEH,MAAM,MAAM,GAAG,oBAAoB,CAAC,KAAK,EAAE,UAAU,EAAE;YACnD,cAAc,EAAE,IAAI,CAAC,cAAc;YACnC,cAAc,EAAE,IAAI,CAAC,cAAc;YACnC,aAAa,EAAE,IAAI,CAAC,aAAa;YACjC,mBAAmB,EAAE,IAAI,CAAC,mBAAmB;SAChD,CAAC,CAAC;QAEH,OAAO,MAAM,CAAC,GAAG,CAAC,CAAC,KAAK,EAAE,KAAK,EAAE,EAAE;YAC/B,MAAM,WAAW,GAAG,KAAK,CAAC,KAAK,CAAC,CAAC,CAAC,EAAE,WAAW,IAAI,CAAC,CAAC;YACrD,MAAM,SAAS,GAAG,KAAK,CAAC,KAAK,CAAC,EAAE,CAAC,CAAC,CAAC,CAAC,EAAE,SAAS,IAAI,WAAW,CAAC;YAE/D,OAAO,IAAA,qBAAW,EAAC;gBACf,QAAQ;gBACR,OAAO,EAAE,QAAQ,CAAC,OAAO,CAAC,KAAK,CAAC,WAAW,EAAE,SAAS,CAAC;gBACvD,I
AAI,EAAE,MAAM;gBACZ,UAAU,EAAE,KAAK;gBACjB,WAAW;gBACX,SAAS;gBACT,KAAK,EAAE,mBAAmB,CAAC;oBACvB,QAAQ,EAAE,IAAI,CAAC,QAAQ;oBACvB,KAAK;oBACL,mBAAmB,EAAE,IAAI,CAAC,mBAAmB;iBAChD,CAAC;aACL,CAAC,CAAC;QACP,CAAC,CAAC,CAAC;IACP,CAAC;IAED,KAAK,CAAC,SAAS,CAAC,SAAwB;QACpC,OAAO,MAAM,IAAA,4BAAkB,EAAC,IAAI,EAAE,SAAS,CAAC,CAAC;IACrD,CAAC;CACJ;AAzED,0CAyEC;AAED,SAAS,mBAAmB,CAAC,IAAY,EAAE,cAAsB;IAC7D,MAAM,KAAK,GAAmB,EAAE,CAAC;IAEjC,KAAK,MAAM,SAAS,IAAI,eAAe,CAAC,IAAI,CAAC,EAAE,CAAC;QAC5C,IAAI,SAAS,CAAC,OAAO,CAAC,MAAM,IAAI,cAAc,EAAE,CAAC;YAC7C,MAAM,SAAS,GAAG,cAAc,CAAC,SAAS,CAAC,OAAO,EAAE,SAAS,CAAC,WAAW,CAAC,CAAC;YAC3E,KAAK,CAAC,IAAI,CAAC,GAAG,SAAS,CAAC,MAAM,GAAG,CAAC,CAAC,CAAC,CAAC,SAAS,CAAC,CAAC,CAAC,CAAC,SAAS,CAAC,CAAC,CAAC;YAC9D,SAAS;QACb,CAAC;QAED,KAAK,MAAM,OAAO,IAAI,IAAA,2BAAiB,EAAC,SAAS,CAAC,OAAO,EAAE;YACvD,cAAc;YACd,cAAc,EAAE,IAAI,CAAC,GAAG,CAAC,kCAAwB,EAAE,cAAc,CAAC;YAClE,aAAa,EAAE,CAAC;SACnB,CAAC,EAAE,CAAC;YACD,KAAK,CAAC,IAAI,CAAC;gBACP,OAAO,EAAE,OAAO,CAAC,OAAO;gBACxB,WAAW,EAAE,SAAS,CAAC,WAAW,GAAG,OAAO,CAAC,WAAW;gBACxD,SAAS,EAAE,SAAS,CAAC,WAAW,GAAG,OAAO,CAAC,SAAS;aACvD,CAAC,CAAC;QACP,CAAC;IACL,CAAC;IAED,OAAO,KAAK,CAAC;AACjB,CAAC;AAED,SAAS,eAAe,CAAC,IAAY;IACjC,MAAM,UAAU,GAAmB,EAAE,CAAC;IACtC,MAAM,OAAO,GAAG,IAAI,CAAC,QAAQ,CAAC,iCAAiC,CAAC,CAAC;IAEjE,KAAK,MAAM,KAAK,IAAI,OAAO,EAAE,CAAC;QAC1B,MAAM,OAAO,GAAG,KAAK,CAAC,CAAC,CAAC,CAAC;QACzB,MAAM,WAAW,GAAG,KAAK,CAAC,KAAK,IAAI,CAAC,CAAC;QACrC,MAAM,kBAAkB,GAAG,WAAW,GAAG,sBAAsB,CAAC,OAAO,CAAC,CAAC;QACzE,MAAM,gBAAgB,GAAG,WAAW,GAAG,OAAO,CAAC,MAAM,GAAG,uBAAuB,CAAC,OAAO,CAAC,CAAC;QAEzF,IAAI,kBAAkB,GAAG,gBAAgB,EAAE,CAAC;YACxC,UAAU,CAAC,IAAI,CAAC;gBACZ,OAAO,EAAE,IAAI,CAAC,KAAK,CAAC,kBAAkB,EAAE,gBAAgB,CAAC;gBACzD,WAAW,EAAE,kBAAkB;gBAC/B,SAAS,EAAE,gBAAgB;aAC9B,CAAC,CAAC;QACP,CAAC;IACL,CAAC;IAED,OAAO,UAAU,CAAC;AACtB,CAAC;AAED,SAAS,cAAc,CAAC,SAAiB,EAAE,oBAA4B;IACnE,MAAM,KAAK,GAAmB,EAAE,CAAC;IACjC,IAAI,KAAK,GAAG,CAAC,CAAC;IAEd,KAAK,IAAI,KAAK,GAAG,CAAC,EAAE,KAAK,GAAG,SAAS,CAAC,MAAM,EAAE,KAAK,IAAI,CAAC,EAAE,CAAC;QACvD,MAAM,SAAS,GAAG,SAAS,CAAC,KAAK,CAAC,
CAAC;QACnC,IAAI,CAAC,gBAAgB,CAAC,SAAS,EAAE,KAAK,EAAE,SAAS,CAAC,EAAE,CAAC;YACjD,SAAS;QACb,CAAC;QAED,MAAM,GAAG,GAAG,KAAK,GAAG,CAAC,CAAC;QACtB,UAAU,CAAC,KAAK,EAAE,SAAS,EAAE,oBAAoB,EAAE,KAAK,EAAE,GAAG,CAAC,CAAC;QAC/D,KAAK,GAAG,cAAc,CAAC,SAAS,EAAE,GAAG,CAAC,CAAC;IAC3C,CAAC;IAED,UAAU,CAAC,KAAK,EAAE,SAAS,EAAE,oBAAoB,EAAE,KAAK,EAAE,SAAS,CAAC,MAAM,CAAC,CAAC;IAE5E,OAAO,KAAK,CAAC;AACjB,CAAC;AAED,SAAS,UAAU,CACf,KAAqB,EACrB,IAAY,EACZ,UAAkB,EAClB,KAAa,EACb,GAAW;IAEX,MAAM,OAAO,GAAG,SAAS,CAAC,IAAI,EAAE,KAAK,EAAE,GAAG,CAAC,CAAC;IAC5C,IAAI,OAAO,CAAC,KAAK,IAAI,OAAO,CAAC,GAAG,EAAE,CAAC;QAC/B,OAAO;IACX,CAAC;IAED,KAAK,CAAC,IAAI,CAAC;QACP,OAAO,EAAE,IAAI,CAAC,KAAK,CAAC,OAAO,CAAC,KAAK,EAAE,OAAO,CAAC,GAAG,CAAC;QAC/C,WAAW,EAAE,UAAU,GAAG,OAAO,CAAC,KAAK;QACvC,SAAS,EAAE,UAAU,GAAG,OAAO,CAAC,GAAG;KACtC,CAAC,CAAC;AACP,CAAC;AAED,SAAS,oBAAoB,CACzB,KAAqB,EACrB,UAAsB,EACtB,OAKC;IAED,MAAM,MAAM,GAAoB,EAAE,CAAC;IACnC,IAAI,OAAO,GAAmB,EAAE,CAAC;IACjC,IAAI,sBAA0C,CAAC;IAE/C,KAAK,MAAM,CAAC,KAAK,EAAE,IAAI,CAAC,IAAI,KAAK,CAAC,OAAO,EAAE,EAAE,CAAC;QAC1C,MAAM,iBAAiB,GAAG,KAAK,GAAG,CAAC,CAAC,CAAC,CAAC,UAAU,CAAC,KAAK,GAAG,CAAC,CAAC,CAAC,CAAC,CAAC,SAAS,CAAC;QACxE,MAAM,gBAAgB,GAAG,UAAU,CAAC,KAAK,CAAC,CAAC;QAC3C,MAAM,UAAU,GAAG,iBAAiB,KAAK,SAAS,IAAI,gBAAgB,KAAK,SAAS;YAChF,CAAC,CAAC,gBAAgB,CAAC,iBAAiB,EAAE,gBAAgB,CAAC;YACvD,CAAC,CAAC,SAAS,CAAC;QAChB,MAAM,aAAa,GAAG,CAClB,UAAU,KAAK,SAAS;eACrB,UAAU,GAAG,OAAO,CAAC,mBAAmB;eACxC,cAAc,CAAC,OAAO,CAAC,IAAI,OAAO,CAAC,cAAc,CACvD,CAAC;QACF,MAAM,WAAW,GAAG,CAChB,OAAO,CAAC,MAAM,GAAG,CAAC;eACf,cAAc,CAAC,OAAO,CAAC,CAAC,CAAC,EAAE,IAAI,CAAC,GAAG,OAAO,CAAC,cAAc;eACzD,cAAc,CAAC,OAAO,CAAC,IAAI,OAAO,CAAC,cAAc,CACvD,CAAC;QAEF,IAAI,OAAO,CAAC,MAAM,GAAG,CAAC,IAAI,CAAC,aAAa,IAAI,WAAW,CAAC,EAAE,CAAC;YACvD,MAAM,CAAC,IAAI,CAAC,WAAW,CAAC,OAAO,EAAE,sBAAsB,CAAC,CAAC,CAAC;YAC1D,OAAO,GAAG,kBAAkB,CAAC,OAAO,EAAE,OAAO,CAAC,aAAa,EAAE,IAAI,EAAE,OAAO,CAAC,cAAc,CAAC,CAAC;YAC3F,sBAAsB,GAAG,UAAU,CAAC;QACxC,CAAC;QAED,OAAO,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;IACvB,CAAC;IAED,IAAI,OAAO,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;QACrB,MAA
M,CAAC,IAAI,CAAC,WAAW,CAAC,OAAO,EAAE,sBAAsB,CAAC,CAAC,CAAC;IAC9D,CAAC;IAED,OAAO,MAAM,CAAC;AAClB,CAAC;AAED,SAAS,WAAW,CAAC,KAAqB,EAAE,eAAmC;IAC3E,MAAM,KAAK,GAAkB;QACzB,KAAK,EAAE,CAAC,GAAG,KAAK,CAAC;KACpB,CAAC;IAEF,IAAI,eAAe,KAAK,SAAS,EAAE,CAAC;QAChC,KAAK,CAAC,eAAe,GAAG,eAAe,CAAC;IAC5C,CAAC;IAED,OAAO,KAAK,CAAC;AACjB,CAAC;AAED,SAAS,kBAAkB,CACvB,KAAqB,EACrB,aAAqB,EACrB,QAAsB,EACtB,cAAsB;IAEtB,IAAI,aAAa,IAAI,CAAC,EAAE,CAAC;QACrB,OAAO,EAAE,CAAC;IACd,CAAC;IAED,MAAM,OAAO,GAAmB,EAAE,CAAC;IACnC,KAAK,IAAI,KAAK,GAAG,KAAK,CAAC,MAAM,GAAG,CAAC,EAAE,KAAK,IAAI,CAAC,EAAE,KAAK,IAAI,CAAC,EAAE,CAAC;QACxD,MAAM,IAAI,GAAG,KAAK,CAAC,KAAK,CAAC,CAAC;QAC1B,IAAI,IAAI,KAAK,SAAS,EAAE,CAAC;YACrB,SAAS;QACb,CAAC;QAED,MAAM,WAAW,GAAG,CAAC,IAAI,EAAE,GAAG,OAAO,CAAC,CAAC;QACvC,IAAI,cAAc,CAAC,WAAW,CAAC,GAAG,aAAa,EAAE,CAAC;YAC9C,MAAM;QACV,CAAC;QACD,IAAI,cAAc,CAAC,WAAW,CAAC,CAAC,CAAC,EAAE,QAAQ,CAAC,GAAG,cAAc,EAAE,CAAC;YAC5D,MAAM;QACV,CAAC;QAED,OAAO,CAAC,OAAO,CAAC,IAAI,CAAC,CAAC;IAC1B,CAAC;IAED,OAAO,OAAO,CAAC;AACnB,CAAC;AAED,SAAS,mBAAmB,CAAC,KAI5B;IACG,MAAM,KAAK,GAA4B;QACnC,QAAQ,EAAE,UAAU;QACpB,YAAY,EAAE,IAAI;QAClB,cAAc,EAAE,KAAK,CAAC,QAAQ,CAAC,KAAK;QACpC,mBAAmB,EAAE,KAAK,CAAC,mBAAmB;QAC9C,SAAS,EAAE,KAAK,CAAC,KAAK,CAAC,KAAK,CAAC,MAAM;KACtC,CAAC;IAEF,IAAI,KAAK,CAAC,KAAK,CAAC,eAAe,KAAK,SAAS,EAAE,CAAC;QAC5C,KAAK,CAAC,eAAe,GAAG,KAAK,CAAC,KAAK,CAAC,eAAe,CAAC;IACxD,CAAC;IAED,OAAO,KAAK,CAAC;AACjB,CAAC;AAED,SAAS,gBAAgB,CAAC,IAAuB,EAAE,KAAwB;IACvE,IAAI,GAAG,GAAG,CAAC,CAAC;IACZ,IAAI,aAAa,GAAG,CAAC,CAAC;IACtB,IAAI,cAAc,GAAG,CAAC,CAAC;IAEvB,KAAK,IAAI,KAAK,GAAG,CAAC,EAAE,KAAK,GAAG,IAAI,CAAC,MAAM,EAAE,KAAK,IAAI,CAAC,EAAE,CAAC;QAClD,MAAM,SAAS,GAAG,IAAI,CAAC,KAAK,CAAC,IAAI,CAAC,CAAC;QACnC,MAAM,UAAU,GAAG,KAAK,CAAC,KAAK,CAAC,IAAI,CAAC,CAAC;QAErC,GAAG,IAAI,SAAS,GAAG,UAAU,CAAC;QAC9B,aAAa,IAAI,SAAS,GAAG,SAAS,CAAC;QACvC,cAAc,IAAI,UAAU,GAAG,UAAU,CAAC;IAC9C,CAAC;IAED,IAAI,aAAa,KAAK,CAAC,IAAI,cAAc,KAAK,CAAC,EAAE,CAAC;QAC9C,OAAO,CAAC,CAAC;IACb,CAAC;IAED,OAAO,GAAG,GAAG,CAAC,IAAI,CAAC,IAAI,CAAC,aAAa,CAAC,GAAG,IAAI,CAAC,IAAI,CAAC,cAAc,CA
AC,CAAC,CAAC;AACxE,CAAC;AAED,SAAS,cAAc,CAAC,KAAqB;IACzC,MAAM,KAAK,GAAG,KAAK,CAAC,CAAC,CAAC,CAAC;IACvB,MAAM,IAAI,GAAG,KAAK,CAAC,EAAE,CAAC,CAAC,CAAC,CAAC,CAAC;IAC1B,IAAI,KAAK,KAAK,SAAS,IAAI,IAAI,KAAK,SAAS,EAAE,CAAC;QAC5C,OAAO,CAAC,CAAC;IACb,CAAC;IAED,OAAO,cAAc,CAAC,KAAK,EAAE,IAAI,CAAC,CAAC;AACvC,CAAC;AAED,SAAS,cAAc,CAAC,KAA+B,EAAE,IAAkB;IACvE,OAAO,KAAK,KAAK,SAAS,CAAC,CAAC,CAAC,IAAI,CAAC,OAAO,CAAC,MAAM,CAAC,CAAC,CAAC,IAAI,CAAC,SAAS,GAAG,KAAK,CAAC,WAAW,CAAC;AAC1F,CAAC;AAED,SAAS,gBAAgB,CACrB,IAAY,EACZ,KAAa,EACb,SAA6B;IAE7B,IAAI,SAAS,KAAK,SAAS,EAAE,CAAC;QAC1B,OAAO,KAAK,CAAC;IACjB,CAAC;IACD,IAAI,gBAAgB,CAAC,GAAG,CAAC,SAAS,CAAC,EAAE,CAAC;QAClC,OAAO,IAAI,CAAC;IAChB,CAAC;IACD,IAAI,SAAS,KAAK,GAAG,EAAE,CAAC;QACpB,OAAO,KAAK,CAAC;IACjB,CAAC;IAED,MAAM,QAAQ,GAAG,IAAI,CAAC,KAAK,GAAG,CAAC,CAAC,CAAC;IACjC,MAAM,IAAI,GAAG,IAAI,CAAC,KAAK,GAAG,CAAC,CAAC,CAAC;IAC7B,IAAI,mBAAmB,CAAC,QAAQ,CAAC,IAAI,mBAAmB,CAAC,IAAI,CAAC,EAAE,CAAC;QAC7D,OAAO,KAAK,CAAC;IACjB,CAAC;IAED,OAAO,IAAI,KAAK,SAAS,IAAI,IAAI,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;AACjD,CAAC;AAED,SAAS,mBAAmB,CAAC,KAAyB;IAClD,OAAO,KAAK,KAAK,SAAS,IAAI,aAAa,CAAC,IAAI,CAAC,KAAK,CAAC,CAAC;AAC5D,CAAC;AAED,SAAS,sBAAsB,CAAC,IAAY;IACxC,MAAM,KAAK,GAAG,IAAI,CAAC,KAAK,CAAC,MAAM,CAAC,CAAC;IAEjC,OAAO,KAAK,EAAE,CAAC,CAAC,CAAC,CAAC,MAAM,IAAI,CAAC,CAAC;AAClC,CAAC;AAED,SAAS,uBAAuB,CAAC,IAAY;IACzC,MAAM,KAAK,GAAG,IAAI,CAAC,KAAK,CAAC,MAAM,CAAC,CAAC;IAEjC,OAAO,KAAK,EAAE,CAAC,CAAC,CAAC,CAAC,MAAM,IAAI,CAAC,CAAC;AAClC,CAAC;AAED,SAAS,cAAc,CAAC,IAAY,EAAE,KAAa;IAC/C,IAAI,KAAK,GAAG,KAAK,CAAC;IAClB,OAAO,KAAK,GAAG,IAAI,CAAC,MAAM,IAAI,IAAI,CAAC,IAAI,CAAC,IAAI,CAAC,KAAK,CAAC,IAAI,EAAE,CAAC,EAAE,CAAC;QACzD,KAAK,IAAI,CAAC,CAAC;IACf,CAAC;IAED,OAAO,KAAK,CAAC;AACjB,CAAC;AAED,SAAS,SAAS,CAAC,IAAY,EAAE,KAAa,EAAE,GAAW;IACvD,IAAI,YAAY,GAAG,KAAK,CAAC;IACzB,IAAI,UAAU,GAAG,GAAG,CAAC;IAErB,OAAO,YAAY,GAAG,UAAU,IAAI,IAAI,CAAC,IAAI,CAAC,IAAI,CAAC,YAAY,CAAC,IAAI,EAAE,CAAC,EAAE,CAAC;QACtE,YAAY,IAAI,CAAC,CAAC;IACtB,CAAC;IACD,OAAO,UAAU,GAAG,YAAY,IAAI,IAAI,CAAC,IAAI,CAAC,IAAI,CAAC,UAAU,GAAG,CAAC,CAAC,
IAAI,EAAE,CAAC,EAAE,CAAC;QACxE,UAAU,IAAI,CAAC,CAAC;IACpB,CAAC;IAED,OAAO;QACH,KAAK,EAAE,YAAY;QACnB,GAAG,EAAE,UAAU;KAClB,CAAC;AACN,CAAC;AAED,SAAS,4BAA4B,CAAC,KAAyB,EAAE,QAAgB;IAC7E,IAAI,KAAK,KAAK,SAAS,IAAI,CAAC,MAAM,CAAC,QAAQ,CAAC,KAAK,CAAC,EAAE,CAAC;QACjD,OAAO,QAAQ,CAAC;IACpB,CAAC;IAED,OAAO,IAAI,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,KAAK,CAAC,CAAC,CAAC;AAC5C,CAAC;AAED,SAAS,iBAAiB,CAAC,KAAyB,EAAE,QAAgB;IAClE,IAAI,KAAK,KAAK,SAAS,IAAI,CAAC,MAAM,CAAC,QAAQ,CAAC,KAAK,CAAC,IAAI,KAAK,IAAI,CAAC,EAAE,CAAC;QAC/D,OAAO,QAAQ,CAAC;IACpB,CAAC;IAED,OAAO,IAAI,CAAC,KAAK,CAAC,KAAK,CAAC,CAAC;AAC7B,CAAC;AAED,SAAS,2BAA2B,CAAC,KAAyB,EAAE,QAAgB;IAC5E,IAAI,KAAK,KAAK,SAAS,IAAI,CAAC,MAAM,CAAC,QAAQ,CAAC,KAAK,CAAC,IAAI,KAAK,GAAG,CAAC,EAAE,CAAC;QAC9D,OAAO,QAAQ,CAAC;IACpB,CAAC;IAED,OAAO,IAAI,CAAC,KAAK,CAAC,KAAK,CAAC,CAAC;AAC7B,CAAC"}
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"embedder.d.ts","sourceRoot":"","sources":["../../../src/rag/embeddings/embedder.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EACR,KAAK,EACL,aAAa,EAChB,MAAM,UAAU,CAAC;AAElB,MAAM,WAAW,QAAQ;IACrB,QAAQ,CAAC,KAAK,EAAE,MAAM,CAAC;IACvB,QAAQ,CAAC,UAAU,EAAE,MAAM,CAAC;IAC5B,cAAc,CAAC,KAAK,EAAE,MAAM,EAAE,GAAG,OAAO,CAAC,MAAM,EAAE,EAAE,CAAC,CAAC;IACrD,UAAU,CAAC,IAAI,EAAE,MAAM,GAAG,OAAO,CAAC,MAAM,EAAE,CAAC,CAAC;CAC/C;AAED,qBAAa,uBAAwB,SAAQ,KAAK;IAC9C,QAAQ,CAAC,kBAAkB,EAAE,MAAM,CAAC;IACpC,QAAQ,CAAC,gBAAgB,EAAE,MAAM,CAAC;gBAEtB,kBAAkB,EAAE,MAAM,EAAE,gBAAgB,EAAE,MAAM,EAAE,KAAK,SAAc;CAQxF;AAED,qBAAa,uBAAwB,SAAQ,KAAK;IAC9C,QAAQ,CAAC,YAAY,EAAE,MAAM,CAAC;IAC9B,QAAQ,CAAC,UAAU,EAAE,MAAM,CAAC;gBAEhB,YAAY,EAAE,MAAM,EAAE,UAAU,EAAE,MAAM;CAMvD;AAED,wBAAsB,WAAW,CAC7B,QAAQ,EAAE,QAAQ,EAClB,MAAM,EAAE,KAAK,EAAE,GAChB,OAAO,CAAC,aAAa,EAAE,CAAC,
|
|
1
|
+
{"version":3,"file":"embedder.d.ts","sourceRoot":"","sources":["../../../src/rag/embeddings/embedder.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EACR,KAAK,EACL,aAAa,EAChB,MAAM,UAAU,CAAC;AAElB,MAAM,WAAW,QAAQ;IACrB,QAAQ,CAAC,KAAK,EAAE,MAAM,CAAC;IACvB,QAAQ,CAAC,UAAU,EAAE,MAAM,CAAC;IAC5B,cAAc,CAAC,KAAK,EAAE,MAAM,EAAE,GAAG,OAAO,CAAC,MAAM,EAAE,EAAE,CAAC,CAAC;IACrD,UAAU,CAAC,IAAI,EAAE,MAAM,GAAG,OAAO,CAAC,MAAM,EAAE,CAAC,CAAC;CAC/C;AAED,qBAAa,uBAAwB,SAAQ,KAAK;IAC9C,QAAQ,CAAC,kBAAkB,EAAE,MAAM,CAAC;IACpC,QAAQ,CAAC,gBAAgB,EAAE,MAAM,CAAC;gBAEtB,kBAAkB,EAAE,MAAM,EAAE,gBAAgB,EAAE,MAAM,EAAE,KAAK,SAAc;CAQxF;AAED,qBAAa,uBAAwB,SAAQ,KAAK;IAC9C,QAAQ,CAAC,YAAY,EAAE,MAAM,CAAC;IAC9B,QAAQ,CAAC,UAAU,EAAE,MAAM,CAAC;gBAEhB,YAAY,EAAE,MAAM,EAAE,UAAU,EAAE,MAAM;CAMvD;AAED,wBAAsB,WAAW,CAC7B,QAAQ,EAAE,QAAQ,EAClB,MAAM,EAAE,KAAK,EAAE,GAChB,OAAO,CAAC,aAAa,EAAE,CAAC,CA2B1B;AAED,wBAAgB,yBAAyB,CACrC,SAAS,EAAE,SAAS,MAAM,EAAE,EAC5B,kBAAkB,EAAE,MAAM,EAC1B,KAAK,CAAC,EAAE,MAAM,GACf,IAAI,CAIN;AAED,wBAAgB,wBAAwB,CACpC,UAAU,EAAE,SAAS,OAAO,EAAE,EAC9B,YAAY,EAAE,MAAM,GACrB,IAAI,CAIN;AAED,wBAAgB,cAAc,CAAC,SAAS,EAAE,SAAS,MAAM,EAAE,GAAG,MAAM,EAAE,CAErE;AAED,wBAAgB,kBAAkB,CAAC,SAAS,EAAE,SAAS,MAAM,EAAE,GAAG,MAAM,EAAE,CAUzE;AAED,wBAAgB,8BAA8B,CAAC,UAAU,EAAE,MAAM,GAAG,MAAM,CAMzE"}
|
|
@@ -30,6 +30,12 @@ class EmbeddingBatchSizeError extends Error {
|
|
|
30
30
|
}
|
|
31
31
|
exports.EmbeddingBatchSizeError = EmbeddingBatchSizeError;
|
|
32
32
|
async function embedChunks(embedder, chunks) {
|
|
33
|
+
// 空批次直接返回:replaceExisting 全部 skip 时没有新 chunk,
|
|
34
|
+
// 不应该对远程 embedding 服务发起一次空请求。
|
|
35
|
+
if (chunks.length === 0) {
|
|
36
|
+
return [];
|
|
37
|
+
}
|
|
38
|
+
// TODO 当前只取 content 去 embed,chunk的metadata里还有 headingPath、title等信息,需考虑是否做处理
|
|
33
39
|
const embeddings = await embedder.embedDocuments(chunks.map((chunk) => chunk.content));
|
|
34
40
|
assertEmbeddingBatchSize(embeddings, chunks.length);
|
|
35
41
|
return chunks.map((chunk, index) => {
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"embedder.js","sourceRoot":"","sources":["../../../src/rag/embeddings/embedder.ts"],"names":[],"mappings":";;;AAsCA,
|
|
1
|
+
{"version":3,"file":"embedder.js","sourceRoot":"","sources":["../../../src/rag/embeddings/embedder.ts"],"names":[],"mappings":";;;AAsCA,kCA8BC;AAED,8DAQC;AAED,4DAOC;AAED,wCAEC;AAED,gDAUC;AAED,wEAMC;AAnGD,MAAa,uBAAwB,SAAQ,KAAK;IACrC,kBAAkB,CAAS;IAC3B,gBAAgB,CAAS;IAElC,YAAY,kBAA0B,EAAE,gBAAwB,EAAE,KAAK,GAAG,WAAW;QACjF,KAAK,CACD,GAAG,KAAK,kCAAkC,kBAAkB,SAAS,gBAAgB,GAAG,CAC3F,CAAC;QACF,IAAI,CAAC,IAAI,GAAG,yBAAyB,CAAC;QACtC,IAAI,CAAC,kBAAkB,GAAG,kBAAkB,CAAC;QAC7C,IAAI,CAAC,gBAAgB,GAAG,gBAAgB,CAAC;IAC7C,CAAC;CACJ;AAZD,0DAYC;AAED,MAAa,uBAAwB,SAAQ,KAAK;IACrC,YAAY,CAAS;IACrB,UAAU,CAAS;IAE5B,YAAY,YAAoB,EAAE,UAAkB;QAChD,KAAK,CAAC,2CAA2C,YAAY,SAAS,UAAU,GAAG,CAAC,CAAC;QACrF,IAAI,CAAC,IAAI,GAAG,yBAAyB,CAAC;QACtC,IAAI,CAAC,YAAY,GAAG,YAAY,CAAC;QACjC,IAAI,CAAC,UAAU,GAAG,UAAU,CAAC;IACjC,CAAC;CACJ;AAVD,0DAUC;AAEM,KAAK,UAAU,WAAW,CAC7B,QAAkB,EAClB,MAAe;IAEf,8CAA8C;IAC9C,8BAA8B;IAC9B,IAAI,MAAM,CAAC,MAAM,KAAK,CAAC,EAAE,CAAC;QACtB,OAAO,EAAE,CAAC;IACd,CAAC;IAED,4EAA4E;IAC5E,MAAM,UAAU,GAAG,MAAM,QAAQ,CAAC,cAAc,CAAC,MAAM,CAAC,GAAG,CAAC,CAAC,KAAK,EAAE,EAAE,CAAC,KAAK,CAAC,OAAO,CAAC,CAAC,CAAC;IACvF,wBAAwB,CAAC,UAAU,EAAE,MAAM,CAAC,MAAM,CAAC,CAAC;IAEpD,OAAO,MAAM,CAAC,GAAG,CAAC,CAAC,KAAK,EAAE,KAAK,EAAE,EAAE;QAC/B,MAAM,SAAS,GAAG,UAAU,CAAC,KAAK,CAAC,CAAC;QACpC,IAAI,SAAS,KAAK,SAAS,EAAE,CAAC;YAC1B,MAAM,IAAI,uBAAuB,CAAC,MAAM,CAAC,MAAM,EAAE,UAAU,CAAC,MAAM,CAAC,CAAC;QACxE,CAAC;QACD,yBAAyB,CACrB,SAAS,EACT,QAAQ,CAAC,UAAU,EACnB,SAAS,KAAK,CAAC,EAAE,YAAY,CAChC,CAAC;QAEF,OAAO;YACH,KAAK;YACL,SAAS,EAAE,cAAc,CAAC,SAAS,CAAC;SACvC,CAAC;IACN,CAAC,CAAC,CAAC;AACP,CAAC;AAED,SAAgB,yBAAyB,CACrC,SAA4B,EAC5B,kBAA0B,EAC1B,KAAc;IAEd,IAAI,SAAS,CAAC,MAAM,KAAK,kBAAkB,EAAE,CAAC;QAC1C,MAAM,IAAI,uBAAuB,CAAC,kBAAkB,EAAE,SAAS,CAAC,MAAM,EAAE,KAAK,CAAC,CAAC;IACnF,CAAC;AACL,CAAC;AAED,SAAgB,wBAAwB,CACpC,UAA8B,EAC9B,YAAoB;IAEpB,IAAI,UAAU,CAAC,MAAM,KAAK,YAAY,EAAE,CAAC;QACrC,MAAM,IAAI,uBAAuB,CAAC,YAAY,EAAE,UAAU,CAAC,MAAM,CAAC,CAAC;IACvE,CAAC;AACL,CAAC;AAED,SAAgB,cAAc,CAAC,SAA4B;IACvD,OAAO,CAAC,GAAG,SAAS,CAAC,CAAC;AAC1B,CAAC;AAED,SAAgB,kBAAkB
,CAAC,SAA4B;IAC3D,MAAM,SAAS,GAAG,IAAI,CAAC,IAAI,CACvB,SAAS,CAAC,MAAM,CAAC,CAAC,GAAG,EAAE,KAAK,EAAE,EAAE,CAAC,GAAG,GAAG,KAAK,GAAG,KAAK,EAAE,CAAC,CAAC,CAC3D,CAAC;IAEF,IAAI,SAAS,KAAK,CAAC,EAAE,CAAC;QAClB,OAAO,CAAC,GAAG,SAAS,CAAC,CAAC;IAC1B,CAAC;IAED,OAAO,SAAS,CAAC,GAAG,CAAC,CAAC,KAAK,EAAE,EAAE,CAAC,KAAK,GAAG,SAAS,CAAC,CAAC;AACvD,CAAC;AAED,SAAgB,8BAA8B,CAAC,UAAkB;IAC7D,IAAI,CAAC,MAAM,CAAC,SAAS,CAAC,UAAU,CAAC,IAAI,UAAU,IAAI,CAAC,EAAE,CAAC;QACnD,MAAM,IAAI,UAAU,CAAC,kDAAkD,CAAC,CAAC;IAC7E,CAAC;IAED,OAAO,UAAU,CAAC;AACtB,CAAC"}
|
|
@@ -6,11 +6,18 @@ export interface DefaultContextBuilderOptions {
|
|
|
6
6
|
maxContextTokens?: number;
|
|
7
7
|
maxChunkCharacters?: number;
|
|
8
8
|
includeScores?: boolean;
|
|
9
|
+
/**
|
|
10
|
+
* 融合分数尺度上的过滤阈值(如 RRF)。不要复用检索的 minScore:
|
|
11
|
+
* 那是 retriever 原始分数尺度(cosine / TF-IDF),量级和融合分完全不同。
|
|
12
|
+
* 默认 undefined,不过滤。
|
|
13
|
+
*/
|
|
14
|
+
minFusedScore?: number;
|
|
9
15
|
}
|
|
10
16
|
export declare class DefaultContextBuilder implements ContextBuilder {
|
|
11
17
|
private readonly maxContextTokens;
|
|
12
18
|
private readonly maxChunkCharacters;
|
|
13
19
|
private readonly includeScores;
|
|
20
|
+
private readonly minFusedScore;
|
|
14
21
|
constructor(options?: DefaultContextBuilderOptions);
|
|
15
22
|
build(query: string, retrieved: RetrievedChunk[], options?: AnswerOptions): Promise<RagContext>;
|
|
16
23
|
}
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"context-builder.d.ts","sourceRoot":"","sources":["../../../src/rag/generation/context-builder.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EACR,aAAa,EAEb,UAAU,EAEV,cAAc,EACjB,MAAM,UAAU,CAAC;AAElB,MAAM,WAAW,cAAc;IAC3B,KAAK,CACD,KAAK,EAAE,MAAM,EACb,SAAS,EAAE,cAAc,EAAE,EAC3B,OAAO,CAAC,EAAE,aAAa,GACxB,OAAO,CAAC,UAAU,CAAC,CAAC;CAC1B;AAED,MAAM,WAAW,4BAA4B;IACzC,gBAAgB,CAAC,EAAE,MAAM,CAAC;IAC1B,kBAAkB,CAAC,EAAE,MAAM,CAAC;IAC5B,aAAa,CAAC,EAAE,OAAO,CAAC;
|
|
1
|
+
{"version":3,"file":"context-builder.d.ts","sourceRoot":"","sources":["../../../src/rag/generation/context-builder.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EACR,aAAa,EAEb,UAAU,EAEV,cAAc,EACjB,MAAM,UAAU,CAAC;AAElB,MAAM,WAAW,cAAc;IAC3B,KAAK,CACD,KAAK,EAAE,MAAM,EACb,SAAS,EAAE,cAAc,EAAE,EAC3B,OAAO,CAAC,EAAE,aAAa,GACxB,OAAO,CAAC,UAAU,CAAC,CAAC;CAC1B;AAED,MAAM,WAAW,4BAA4B;IACzC,gBAAgB,CAAC,EAAE,MAAM,CAAC;IAC1B,kBAAkB,CAAC,EAAE,MAAM,CAAC;IAC5B,aAAa,CAAC,EAAE,OAAO,CAAC;IACxB;;;;OAIG;IACH,aAAa,CAAC,EAAE,MAAM,CAAC;CAC1B;AAED,qBAAa,qBAAsB,YAAW,cAAc;IACxD,OAAO,CAAC,QAAQ,CAAC,gBAAgB,CAAS;IAC1C,OAAO,CAAC,QAAQ,CAAC,kBAAkB,CAAqB;IACxD,OAAO,CAAC,QAAQ,CAAC,aAAa,CAAU;IACxC,OAAO,CAAC,QAAQ,CAAC,aAAa,CAAqB;gBAEvC,OAAO,GAAE,4BAAiC;IAOhD,KAAK,CACP,KAAK,EAAE,MAAM,EACb,SAAS,EAAE,cAAc,EAAE,EAC3B,OAAO,GAAE,aAAkB,GAC5B,OAAO,CAAC,UAAU,CAAC;CAyDzB;AAqHD;;;GAGG;AACH,wBAAgB,cAAc,CAAC,IAAI,EAAE,MAAM,GAAG,MAAM,CAKnD"}
|
|
@@ -6,15 +6,18 @@ class DefaultContextBuilder {
|
|
|
6
6
|
maxContextTokens;
|
|
7
7
|
maxChunkCharacters;
|
|
8
8
|
includeScores;
|
|
9
|
+
minFusedScore;
|
|
9
10
|
constructor(options = {}) {
|
|
10
11
|
this.maxContextTokens = normalizePositiveInteger(options.maxContextTokens, 3000);
|
|
11
12
|
this.maxChunkCharacters = normalizeOptionalPositiveInteger(options.maxChunkCharacters);
|
|
12
13
|
this.includeScores = options.includeScores ?? false;
|
|
14
|
+
this.minFusedScore = options.minFusedScore;
|
|
13
15
|
}
|
|
14
16
|
async build(query, retrieved, options = {}) {
|
|
15
17
|
const maxContextTokens = normalizePositiveInteger(options.maxContextTokens, this.maxContextTokens);
|
|
18
|
+
const minFusedScore = options.minFusedScore ?? this.minFusedScore;
|
|
16
19
|
const candidates = dedupeRetrievedChunks(retrieved)
|
|
17
|
-
.filter((item) =>
|
|
20
|
+
.filter((item) => minFusedScore === undefined || item.score >= minFusedScore);
|
|
18
21
|
const items = [];
|
|
19
22
|
let tokenTotal = 0;
|
|
20
23
|
let citationIndex = 1;
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"context-builder.js","sourceRoot":"","sources":["../../../src/rag/generation/context-builder.ts"],"names":[],"mappings":";;;
|
|
1
|
+
{"version":3,"file":"context-builder.js","sourceRoot":"","sources":["../../../src/rag/generation/context-builder.ts"],"names":[],"mappings":";;;AA+NA,wCAKC;AAxMD,MAAa,qBAAqB;IACb,gBAAgB,CAAS;IACzB,kBAAkB,CAAqB;IACvC,aAAa,CAAU;IACvB,aAAa,CAAqB;IAEnD,YAAY,UAAwC,EAAE;QAClD,IAAI,CAAC,gBAAgB,GAAG,wBAAwB,CAAC,OAAO,CAAC,gBAAgB,EAAE,IAAI,CAAC,CAAC;QACjF,IAAI,CAAC,kBAAkB,GAAG,gCAAgC,CAAC,OAAO,CAAC,kBAAkB,CAAC,CAAC;QACvF,IAAI,CAAC,aAAa,GAAG,OAAO,CAAC,aAAa,IAAI,KAAK,CAAC;QACpD,IAAI,CAAC,aAAa,GAAG,OAAO,CAAC,aAAa,CAAC;IAC/C,CAAC;IAED,KAAK,CAAC,KAAK,CACP,KAAa,EACb,SAA2B,EAC3B,UAAyB,EAAE;QAE3B,MAAM,gBAAgB,GAAG,wBAAwB,CAC7C,OAAO,CAAC,gBAAgB,EACxB,IAAI,CAAC,gBAAgB,CACxB,CAAC;QACF,MAAM,aAAa,GAAG,OAAO,CAAC,aAAa,IAAI,IAAI,CAAC,aAAa,CAAC;QAClE,MAAM,UAAU,GAAG,qBAAqB,CAAC,SAAS,CAAC;aAC9C,MAAM,CAAC,CAAC,IAAI,EAAE,EAAE,CAAC,aAAa,KAAK,SAAS,IAAI,IAAI,CAAC,KAAK,IAAI,aAAa,CAAC,CAAC;QAClF,MAAM,KAAK,GAAqB,EAAE,CAAC;QACnC,IAAI,UAAU,GAAG,CAAC,CAAC;QACnB,IAAI,aAAa,GAAG,CAAC,CAAC;QAEtB,KAAK,MAAM,IAAI,IAAI,UAAU,EAAE,CAAC;YAC5B,MAAM,OAAO,GAAG,oBAAoB,CAAC,IAAI,CAAC,KAAK,CAAC,OAAO,EAAE,IAAI,CAAC,kBAAkB,CAAC,CAAC;YAClF,IAAI,OAAO,CAAC,MAAM,KAAK,CAAC,EAAE,CAAC;gBACvB,SAAS;YACb,CAAC;YAED,MAAM,QAAQ,GAAG,cAAc,CAAC,aAAa,EAAE,IAAI,EAAE,OAAO,CAAC,CAAC;YAC9D,MAAM,QAAQ,GAAG,kBAAkB,CAC/B,QAAQ,EACR,OAAO,EACP,mBAAmB,CAAC,IAAI,CAAC,aAAa,EAAE,IAAI,CAAC,KAAK,CAAC,CACtD,CAAC;YACF,MAAM,aAAa,GAAG,cAAc,CAAC,QAAQ,CAAC,CAAC;YAC/C,IAAI,KAAK,CAAC,MAAM,GAAG,CAAC,IAAI,UAAU,GAAG,aAAa,GAAG,gBAAgB,EAAE,CAAC;gBACpE,MAAM;YACV,CAAC;YAED,KAAK,CAAC,IAAI,CAAC;gBACP,QAAQ;gBACR,KAAK,EAAE,IAAI,CAAC,KAAK;gBACjB,OAAO;gBACP,KAAK,EAAE,IAAI,CAAC,KAAK;gBACjB,MAAM,EAAE,IAAI,CAAC,MAAM;gBACnB,aAAa;aAChB,CAAC,CAAC;YACH,UAAU,IAAI,aAAa,CAAC;YAC5B,aAAa,IAAI,CAAC,CAAC;QACvB,CAAC;QAED,MAAM,IAAI,GAAG,KAAK;aACb,GAAG,CAAC,CAAC,IAAI,EAAE,EAAE,CAAC,kBAAkB,CAC7B,IAAI,CAAC,QAAQ,EACb,IAAI,CAAC,OAAO,EACZ,mBAAmB,CAAC,IAAI,CAAC,aAAa,EAAE,IAAI,CAAC,KAAK,CAAC,CACtD,CAAC;aACD,IAAI,CAAC,MAAM,CAAC,CAAC;QAElB,OAAO;YACH,KAAK;YACL,IAAI;YACJ,KAAK;YACL,SAAS,EAAE,KAAK,CAAC,GAAG,
CAAC,CAAC,IAAI,EAAE,EAAE,CAAC,IAAI,CAAC,QAAQ,CAAC;YAC7C,eAAe,EAAE,UAAU;SAC9B,CAAC;IACN,CAAC;CACJ;AA1ED,sDA0EC;AAED,SAAS,qBAAqB,CAAC,SAA2B;IACtD,MAAM,YAAY,GAAG,IAAI,GAAG,EAAU,CAAC;IACvC,MAAM,eAAe,GAAG,IAAI,GAAG,EAAU,CAAC;IAC1C,MAAM,MAAM,GAAqB,EAAE,CAAC;IAEpC,KAAK,MAAM,IAAI,IAAI,SAAS,EAAE,CAAC;QAC3B,MAAM,UAAU,GAAG,mBAAmB,CAAC,IAAI,CAAC,KAAK,CAAC,OAAO,CAAC,CAAC;QAC3D,IAAI,YAAY,CAAC,GAAG,CAAC,IAAI,CAAC,KAAK,CAAC,EAAE,CAAC,IAAI,eAAe,CAAC,GAAG,CAAC,UAAU,CAAC,EAAE,CAAC;YACrE,SAAS;QACb,CAAC;QAED,YAAY,CAAC,GAAG,CAAC,IAAI,CAAC,KAAK,CAAC,EAAE,CAAC,CAAC;QAChC,eAAe,CAAC,GAAG,CAAC,UAAU,CAAC,CAAC;QAChC,MAAM,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;IACtB,CAAC;IAED,OAAO,MAAM,CAAC;AAClB,CAAC;AAED,SAAS,cAAc,CACnB,KAAa,EACb,SAAyB,EACzB,OAAe;IAEf,MAAM,QAAQ,GAAa;QACvB,KAAK;QACL,OAAO,EAAE,SAAS,CAAC,KAAK,CAAC,EAAE;QAC3B,UAAU,EAAE,SAAS,CAAC,KAAK,CAAC,UAAU;QACtC,MAAM,EAAE,SAAS,CAAC,KAAK,CAAC,QAAQ,CAAC,MAAM;KAC1C,CAAC;IAEF,eAAe,CAAC,QAAQ,EAAE,OAAO,EAAE,SAAS,CAAC,KAAK,CAAC,QAAQ,CAAC,KAAK,CAAC,CAAC;IACnE,eAAe,CAAC,QAAQ,EAAE,MAAM,EAAE,SAAS,CAAC,KAAK,CAAC,QAAQ,CAAC,IAAI,CAAC,CAAC;IAEjE,IAAI,SAAS,CAAC,KAAK,CAAC,QAAQ,CAAC,WAAW,KAAK,SAAS,EAAE,CAAC;QACrD,QAAQ,CAAC,WAAW,GAAG,CAAC,GAAG,SAAS,CAAC,KAAK,CAAC,QAAQ,CAAC,WAAW,CAAC,CAAC;IACrE,CAAC;IAED,QAAQ,CAAC,KAAK,GAAG,WAAW,CAAC,OAAO,CAAC,CAAC;IAEtC,MAAM,QAAQ,GAAG;QACb,eAAe,EAAE,SAAS,CAAC,MAAM;QACjC,KAAK,EAAE,SAAS,CAAC,KAAK;QACtB,GAAG,CAAC,SAAS,CAAC,QAAQ,IAAI,EAAE,CAAC;KAChC,CAAC;IACF,QAAQ,CAAC,QAAQ,GAAG,QAAQ,CAAC;IAE7B,OAAO,QAAQ,CAAC;AACpB,CAAC;AAED,SAAS,kBAAkB,CACvB,QAAkB,EAClB,OAAe,EACf,UAA8B,EAAE;IAEhC,MAAM,UAAU,GAAG;QACf,UAAU,eAAe,CAAC,QAAQ,CAAC,MAAM,CAAC,EAAE;KAC/C,CAAC;IAEF,IAAI,QAAQ,CAAC,KAAK,KAAK,SAAS,EAAE,CAAC;QAC/B,UAAU,CAAC,IAAI,CAAC,SAAS,eAAe,CAAC,QAAQ,CAAC,KAAK,CAAC,EAAE,CAAC,CAAC;IAChE,CAAC;IACD,IAAI,QAAQ,CAAC,WAAW,KAAK,SAAS,IAAI,QAAQ,CAAC,WAAW,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;QACxE,UAAU,CAAC,IAAI,CAAC,WAAW,eAAe,CAAC,QAAQ,CAAC,WAAW,CAAC,IAAI,CAAC,KAAK,CAAC,CAAC,EAAE,CAAC,CAAC;IACpF,CAAC;IACD,IAAI,QAAQ,CAAC,IAAI,KAAK,SAAS,EAAE,CAAC;QAC9B,UAAU,CAAC,IAAI,CAA
C,QAAQ,QAAQ,CAAC,IAAI,EAAE,CAAC,CAAC;IAC7C,CAAC;IACD,IAAI,OAAO,CAAC,KAAK,KAAK,SAAS,EAAE,CAAC;QAC9B,UAAU,CAAC,IAAI,CAAC,SAAS,WAAW,CAAC,OAAO,CAAC,KAAK,CAAC,EAAE,CAAC,CAAC;IAC3D,CAAC;IAED,OAAO,IAAI,QAAQ,CAAC,KAAK,KAAK,UAAU,CAAC,IAAI,CAAC,GAAG,CAAC,KAAK,OAAO,EAAE,CAAC;AACrE,CAAC;AAED,SAAS,mBAAmB,CAAC,aAAsB,EAAE,KAAa;IAC9D,MAAM,OAAO,GAAuB,EAAE,CAAC;IACvC,IAAI,aAAa,EAAE,CAAC;QAChB,OAAO,CAAC,KAAK,GAAG,KAAK,CAAC;IAC1B,CAAC;IAED,OAAO,OAAO,CAAC;AACnB,CAAC;AAED,SAAS,eAAe,CAAC,KAAa;IAClC,IAAI,qBAAqB,CAAC,IAAI,CAAC,KAAK,CAAC,EAAE,CAAC;QACpC,OAAO,KAAK,CAAC;IACjB,CAAC;IAED,OAAO,IAAI,CAAC,SAAS,CAAC,KAAK,CAAC,CAAC;AACjC,CAAC;AAED,SAAS,WAAW,CAAC,KAAa;IAC9B,OAAO,MAAM,CAAC,QAAQ,CAAC,KAAK,CAAC,CAAC,CAAC,CAAC,KAAK,CAAC,OAAO,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,MAAM,CAAC,KAAK,CAAC,CAAC;AACrE,CAAC;AAED,SAAS,oBAAoB,CAAC,OAAe,EAAE,kBAAsC;IACjF,MAAM,UAAU,GAAG,OAAO,CAAC,IAAI,EAAE,CAAC;IAClC,IAAI,kBAAkB,KAAK,SAAS,IAAI,UAAU,CAAC,MAAM,IAAI,kBAAkB,EAAE,CAAC;QAC9E,OAAO,UAAU,CAAC;IACtB,CAAC;IAED,OAAO,UAAU,CAAC,KAAK,CAAC,CAAC,EAAE,kBAAkB,CAAC,CAAC,OAAO,EAAE,CAAC;AAC7D,CAAC;AAED,SAAS,WAAW,CAAC,OAAe;IAChC,MAAM,UAAU,GAAG,OAAO,CAAC,OAAO,CAAC,MAAM,EAAE,GAAG,CAAC,CAAC,IAAI,EAAE,CAAC;IAEvD,OAAO,UAAU,CAAC,MAAM,IAAI,GAAG,CAAC,CAAC,CAAC,UAAU,CAAC,CAAC,CAAC,GAAG,UAAU,CAAC,KAAK,CAAC,CAAC,EAAE,GAAG,CAAC,KAAK,CAAC;AACpF,CAAC;AAED,SAAS,mBAAmB,CAAC,OAAe;IACxC,OAAO,OAAO,CAAC,OAAO,CAAC,MAAM,EAAE,GAAG,CAAC,CAAC,IAAI,EAAE,CAAC,WAAW,EAAE,CAAC;AAC7D,CAAC;AAED;;;GAGG;AACH,SAAgB,cAAc,CAAC,IAAY;IACvC,MAAM,QAAQ,GAAG,IAAI,CAAC,KAAK,CAAC,kBAAkB,CAAC,EAAE,MAAM,IAAI,CAAC,CAAC;IAC7D,MAAM,WAAW,GAAG,IAAI,CAAC,MAAM,GAAG,QAAQ,CAAC;IAE3C,OAAO,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,IAAI,CAAC,IAAI,CAAC,QAAQ,GAAG,WAAW,GAAG,CAAC,CAAC,CAAC,CAAC;AAC9D,CAAC;AAED,SAAS,wBAAwB,CAAC,KAAyB,EAAE,QAAgB;IACzE,IAAI,KAAK,KAAK,SAAS,IAAI,CAAC,MAAM,CAAC,QAAQ,CAAC,KAAK,CAAC,IAAI,KAAK,IAAI,CAAC,EAAE,CAAC;QAC/D,OAAO,QAAQ,CAAC;IACpB,CAAC;IAED,OAAO,IAAI,CAAC,KAAK,CAAC,KAAK,CAAC,CAAC;AAC7B,CAAC;AAED,SAAS,gCAAgC,CAAC,KAAyB;IAC/D,IAAI,KAAK,KAAK,SAAS,IAAI,CAAC,MAAM,CAAC,QAAQ,CAAC
,KAAK,CAAC,IAAI,KAAK,IAAI,CAAC,EAAE,CAAC;QAC/D,OAAO,SAAS,CAAC;IACrB,CAAC;IAED,OAAO,IAAI,CAAC,KAAK,CAAC,KAAK,CAAC,CAAC;AAC7B,CAAC;AAED,SAAS,eAAe,CACpB,MAAS,EACT,GAAM,EACN,KAAuB;IAEvB,IAAI,KAAK,KAAK,SAAS,EAAE,CAAC;QACtB,MAAM,CAAC,GAAG,CAAC,GAAG,KAAK,CAAC;IACxB,CAAC;AACL,CAAC"}
|
|
@@ -21,11 +21,16 @@ export declare class DefaultMetadataResolver implements MetadataResolver {
|
|
|
21
21
|
}
|
|
22
22
|
export interface DocumentIdInput {
|
|
23
23
|
source: string;
|
|
24
|
-
checksum: string;
|
|
25
24
|
tenantId?: string;
|
|
26
25
|
knowledgeBaseId?: string;
|
|
27
26
|
version?: string;
|
|
28
27
|
}
|
|
29
28
|
export declare function createContentChecksum(content: string): string;
|
|
29
|
+
/**
|
|
30
|
+
* documentId 必须是"同一份文档"的稳定标识:只由 [tenantId, knowledgeBaseId, source, version] 派生。
|
|
31
|
+
* 故意不掺入 checksum——否则内容一变 ID 就变,replaceExisting 找不到旧文档,
|
|
32
|
+
* 旧 chunks/vectors/keyword entries 会变成永远检索得到的僵尸数据。
|
|
33
|
+
* 内容指纹保留在 document.metadata.checksum 里,供 pipeline 判断内容是否变化。
|
|
34
|
+
*/
|
|
30
35
|
export declare function createDocumentId(input: DocumentIdInput): string;
|
|
31
36
|
//# sourceMappingURL=metadata.d.ts.map
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"metadata.d.ts","sourceRoot":"","sources":["../../../src/rag/ingestion/metadata.ts"],"names":[],"mappings":"AACA,OAAO,KAAK,EAAE,gBAAgB,EAAE,MAAM,UAAU,CAAC;AAEjD,MAAM,WAAW,uBAAuB;IACpC,OAAO,EAAE,MAAM,CAAC;IAChB,MAAM,CAAC,EAAE,MAAM,CAAC;IAChB,QAAQ,CAAC,EAAE,OAAO,CAAC,gBAAgB,CAAC,CAAC;IACrC,KAAK,CAAC,EAAE,MAAM,CAAC;IACf,QAAQ,CAAC,EAAE,MAAM,CAAC;IAClB,QAAQ,CAAC,EAAE,MAAM,CAAC;IAClB,eAAe,CAAC,EAAE,MAAM,CAAC;IACzB,GAAG,CAAC,EAAE,MAAM,EAAE,CAAC;CAClB;AAED,MAAM,WAAW,wBAAwB;IACrC,EAAE,EAAE,MAAM,CAAC;IACX,QAAQ,EAAE,gBAAgB,CAAC;CAC9B;AAED,MAAM,WAAW,gBAAgB;IAC7B,OAAO,CAAC,KAAK,EAAE,uBAAuB,GAAG,wBAAwB,CAAC;CACrE;AAED,qBAAa,uBAAwB,YAAW,gBAAgB;IAC5D,OAAO,CAAC,KAAK,EAAE,uBAAuB,GAAG,wBAAwB;
|
|
1
|
+
{"version":3,"file":"metadata.d.ts","sourceRoot":"","sources":["../../../src/rag/ingestion/metadata.ts"],"names":[],"mappings":"AACA,OAAO,KAAK,EAAE,gBAAgB,EAAE,MAAM,UAAU,CAAC;AAEjD,MAAM,WAAW,uBAAuB;IACpC,OAAO,EAAE,MAAM,CAAC;IAChB,MAAM,CAAC,EAAE,MAAM,CAAC;IAChB,QAAQ,CAAC,EAAE,OAAO,CAAC,gBAAgB,CAAC,CAAC;IACrC,KAAK,CAAC,EAAE,MAAM,CAAC;IACf,QAAQ,CAAC,EAAE,MAAM,CAAC;IAClB,QAAQ,CAAC,EAAE,MAAM,CAAC;IAClB,eAAe,CAAC,EAAE,MAAM,CAAC;IACzB,GAAG,CAAC,EAAE,MAAM,EAAE,CAAC;CAClB;AAED,MAAM,WAAW,wBAAwB;IACrC,EAAE,EAAE,MAAM,CAAC;IACX,QAAQ,EAAE,gBAAgB,CAAC;CAC9B;AAED,MAAM,WAAW,gBAAgB;IAC7B,OAAO,CAAC,KAAK,EAAE,uBAAuB,GAAG,wBAAwB,CAAC;CACrE;AAED,qBAAa,uBAAwB,YAAW,gBAAgB;IAC5D,OAAO,CAAC,KAAK,EAAE,uBAAuB,GAAG,wBAAwB;CAiDpE;AAED,MAAM,WAAW,eAAe;IAC5B,MAAM,EAAE,MAAM,CAAC;IACf,QAAQ,CAAC,EAAE,MAAM,CAAC;IAClB,eAAe,CAAC,EAAE,MAAM,CAAC;IACzB,OAAO,CAAC,EAAE,MAAM,CAAC;CACpB;AAED,wBAAgB,qBAAqB,CAAC,OAAO,EAAE,MAAM,GAAG,MAAM,CAE7D;AAED;;;;;GAKG;AACH,wBAAgB,gBAAgB,CAAC,KAAK,EAAE,eAAe,GAAG,MAAM,CAS/D"}
|
|
@@ -32,7 +32,6 @@ class DefaultMetadataResolver {
|
|
|
32
32
|
}
|
|
33
33
|
const idInput = {
|
|
34
34
|
source,
|
|
35
|
-
checksum,
|
|
36
35
|
};
|
|
37
36
|
assignIfDefined(idInput, 'tenantId', tenantId);
|
|
38
37
|
assignIfDefined(idInput, 'knowledgeBaseId', knowledgeBaseId);
|
|
@@ -47,13 +46,18 @@ exports.DefaultMetadataResolver = DefaultMetadataResolver;
|
|
|
47
46
|
function createContentChecksum(content) {
|
|
48
47
|
return (0, node_crypto_1.createHash)('sha256').update(content).digest('hex');
|
|
49
48
|
}
|
|
49
|
+
/**
|
|
50
|
+
* documentId 必须是"同一份文档"的稳定标识:只由 [tenantId, knowledgeBaseId, source, version] 派生。
|
|
51
|
+
* 故意不掺入 checksum——否则内容一变 ID 就变,replaceExisting 找不到旧文档,
|
|
52
|
+
* 旧 chunks/vectors/keyword entries 会变成永远检索得到的僵尸数据。
|
|
53
|
+
* 内容指纹保留在 document.metadata.checksum 里,供 pipeline 判断内容是否变化。
|
|
54
|
+
*/
|
|
50
55
|
function createDocumentId(input) {
|
|
51
56
|
const stableKey = [
|
|
52
57
|
input.tenantId ?? '',
|
|
53
58
|
input.knowledgeBaseId ?? '',
|
|
54
59
|
input.source,
|
|
55
60
|
input.version ?? '',
|
|
56
|
-
input.checksum,
|
|
57
61
|
].join('\0');
|
|
58
62
|
return `doc_${createContentChecksum(stableKey).slice(0, 16)}`;
|
|
59
63
|
}
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"metadata.js","sourceRoot":"","sources":["../../../src/rag/ingestion/metadata.ts"],"names":[],"mappings":";;;
|
|
1
|
+
{"version":3,"file":"metadata.js","sourceRoot":"","sources":["../../../src/rag/ingestion/metadata.ts"],"names":[],"mappings":";;;AAkFA,sDAEC;AAQD,4CASC;AArGD,6CAAyC;AAuBzC,MAAa,uBAAuB;IAChC,OAAO,CAAC,KAA8B;QAClC,MAAM,MAAM,GAAG,kBAAkB,CAC7B,KAAK,CAAC,QAAQ,EAAE,MAAM,IAAI,KAAK,CAAC,MAAM,IAAI,QAAQ,CACrD,IAAI,QAAQ,CAAC;QACd,MAAM,QAAQ,GAAG,kBAAkB,CAAC,KAAK,CAAC,QAAQ,EAAE,QAAQ,CAAC;eACtD,qBAAqB,CAAC,KAAK,CAAC,OAAO,CAAC,CAAC;QAC5C,MAAM,QAAQ,GAAG,kBAAkB,CAAC,KAAK,CAAC,QAAQ,IAAI,KAAK,CAAC,QAAQ,EAAE,QAAQ,CAAC,CAAC;QAChF,MAAM,eAAe,GAAG,kBAAkB,CACtC,KAAK,CAAC,eAAe,IAAI,KAAK,CAAC,QAAQ,EAAE,eAAe,CAC3D,CAAC;QACF,MAAM,OAAO,GAAG,kBAAkB,CAAC,KAAK,CAAC,QAAQ,EAAE,OAAO,CAAC,CAAC;QAC5D,MAAM,QAAQ,GAAqB;YAC/B,MAAM;YACN,QAAQ;SACX,CAAC;QAEF,eAAe,CAAC,QAAQ,EAAE,OAAO,EAAE,kBAAkB,CACjD,KAAK,CAAC,QAAQ,EAAE,KAAK,IAAI,KAAK,CAAC,KAAK,IAAI,oBAAoB,CAAC,MAAM,CAAC,CACvE,CAAC,CAAC;QACH,eAAe,CAAC,QAAQ,EAAE,UAAU,EAAE,kBAAkB,CACpD,KAAK,CAAC,QAAQ,EAAE,QAAQ,IAAI,KAAK,CAAC,QAAQ,CAC7C,CAAC,CAAC;QACH,eAAe,CAAC,QAAQ,EAAE,UAAU,EAAE,QAAQ,CAAC,CAAC;QAChD,eAAe,CAAC,QAAQ,EAAE,iBAAiB,EAAE,eAAe,CAAC,CAAC;QAC9D,eAAe,CAAC,QAAQ,EAAE,SAAS,EAAE,OAAO,CAAC,CAAC;QAC9C,eAAe,CAAC,QAAQ,EAAE,WAAW,EAAE,kBAAkB,CAAC,KAAK,CAAC,QAAQ,EAAE,SAAS,CAAC,CAAC,CAAC;QACtF,eAAe,CAAC,QAAQ,EAAE,WAAW,EAAE,kBAAkB,CAAC,KAAK,CAAC,QAAQ,EAAE,SAAS,CAAC,CAAC,CAAC;QAEtF,MAAM,GAAG,GAAG,KAAK,CAAC,GAAG,IAAI,KAAK,CAAC,QAAQ,EAAE,GAAG,CAAC;QAC7C,IAAI,GAAG,KAAK,SAAS,EAAE,CAAC;YACpB,QAAQ,CAAC,GAAG,GAAG,CAAC,GAAG,GAAG,CAAC,CAAC;QAC5B,CAAC;QAED,IAAI,KAAK,CAAC,QAAQ,EAAE,KAAK,KAAK,SAAS,EAAE,CAAC;YACtC,QAAQ,CAAC,KAAK,GAAG,EAAE,GAAG,KAAK,CAAC,QAAQ,CAAC,KAAK,EAAE,CAAC;QACjD,CAAC;QAED,MAAM,OAAO,GAAoB;YAC7B,MAAM;SACT,CAAC;QACF,eAAe,CAAC,OAAO,EAAE,UAAU,EAAE,QAAQ,CAAC,CAAC;QAC/C,eAAe,CAAC,OAAO,EAAE,iBAAiB,EAAE,eAAe,CAAC,CAAC;QAC7D,eAAe,CAAC,OAAO,EAAE,SAAS,EAAE,OAAO,CAAC,CAAC;QAE7C,OAAO;YACH,EAAE,EAAE,gBAAgB,CAAC,OAAO,CAAC;YAC7B,QAAQ;SACX,CAAC;IACN,CAAC;CACJ;AAlDD,0DAkDC;AASD,SAAgB,qBAAqB,CAAC,OAAe;IACjD,OAAO,IAAA,wBAAU,EAAC,QAAQ,CAAC,CAAC,MAAM,CAAC,OAAO,CAAC,CAAC,MAAM,CAAC,KA
AK,CAAC,CAAC;AAC9D,CAAC;AAED;;;;;GAKG;AACH,SAAgB,gBAAgB,CAAC,KAAsB;IACnD,MAAM,SAAS,GAAG;QACd,KAAK,CAAC,QAAQ,IAAI,EAAE;QACpB,KAAK,CAAC,eAAe,IAAI,EAAE;QAC3B,KAAK,CAAC,MAAM;QACZ,KAAK,CAAC,OAAO,IAAI,EAAE;KACtB,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;IAEb,OAAO,OAAO,qBAAqB,CAAC,SAAS,CAAC,CAAC,KAAK,CAAC,CAAC,EAAE,EAAE,CAAC,EAAE,CAAC;AAClE,CAAC;AAED,SAAS,oBAAoB,CAAC,MAAc;IACxC,IAAI,MAAM,KAAK,QAAQ,EAAE,CAAC;QACtB,OAAO,SAAS,CAAC;IACrB,CAAC;IAED,MAAM,YAAY,GAAG,MAAM,CAAC,KAAK,CAAC,MAAM,EAAE,CAAC,CAAC,CAAC,CAAC,CAAC,IAAI,MAAM,CAAC;IAC1D,MAAM,KAAK,GAAG,YAAY,CAAC,KAAK,CAAC,OAAO,CAAC,CAAC,MAAM,CAAC,OAAO,CAAC,CAAC;IAC1D,MAAM,QAAQ,GAAG,KAAK,CAAC,EAAE,CAAC,CAAC,CAAC,CAAC,CAAC;IAC9B,IAAI,QAAQ,KAAK,SAAS,IAAI,QAAQ,CAAC,MAAM,KAAK,CAAC,EAAE,CAAC;QAClD,OAAO,SAAS,CAAC;IACrB,CAAC;IAED,OAAO,QAAQ,CAAC,OAAO,CAAC,UAAU,EAAE,EAAE,CAAC,CAAC;AAC5C,CAAC;AAED,SAAS,kBAAkB,CAAC,KAAyB;IACjD,MAAM,UAAU,GAAG,KAAK,EAAE,IAAI,EAAE,CAAC;IAEjC,OAAO,UAAU,IAAI,UAAU,CAAC,MAAM,GAAG,CAAC,CAAC,CAAC,CAAC,UAAU,CAAC,CAAC,CAAC,SAAS,CAAC;AACxE,CAAC;AAED,SAAS,eAAe,CACpB,MAAS,EACT,GAAM,EACN,KAAuB;IAEvB,IAAI,KAAK,KAAK,SAAS,EAAE,CAAC;QACtB,MAAM,CAAC,GAAG,CAAC,GAAG,KAAK,CAAC;IACxB,CAAC;AACL,CAAC"}
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"pipeline.d.ts","sourceRoot":"","sources":["../../src/rag/pipeline.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EACR,aAAa,EACb,WAAW,EACX,YAAY,EACZ,SAAS,EACT,cAAc,EACd,eAAe,EAClB,MAAM,SAAS,CAAC;AAEjB,OAAO,KAAK,EAAE,QAAQ,EAAE,MAAM,uBAAuB,CAAC;AACtD,OAAO,KAAK,EACR,cAAc,EACd,YAAY,EACZ,WAAW,EACd,MAAM,cAAc,CAAC;AACtB,OAAO,KAAK,EACR,OAAO,EACV,MAAM,YAAY,CAAC;AACpB,OAAO,KAAK,EACR,cAAc,EACd,kBAAkB,EACrB,MAAM,aAAa,CAAC;AACrB,OAAO,KAAK,EACR,aAAa,EACb,YAAY,EACZ,WAAW,EACd,MAAM,UAAU,CAAC;AAClB,OAAO,KAAK,EACR,SAAS,EACZ,MAAM,aAAa,CAAC;AAErB;;;GAGG;AACH,MAAM,WAAW,WAAW;IACxB;;OAEG;IACH,MAAM,CAAC,KAAK,EAAE,WAAW,GAAG,OAAO,CAAC,YAAY,CAAC,CAAC;IAElD;;;OAGG;IACH,QAAQ,CAAC,KAAK,EAAE,MAAM,EAAE,OAAO,CAAC,EAAE,eAAe,GAAG,OAAO,CAAC,cAAc,EAAE,CAAC,CAAC;IAE9E;;OAEG;IACH,MAAM,CAAC,KAAK,EAAE,MAAM,EAAE,OAAO,CAAC,EAAE,aAAa,GAAG,OAAO,CAAC,SAAS,CAAC,CAAC;CACtE;AAED,MAAM,WAAW,yBAAyB;IACtC,MAAM,EAAE,cAAc,CAAC;IACvB,UAAU,EAAE,kBAAkB,CAAC;IAC/B,OAAO,EAAE,OAAO,CAAC;IACjB,QAAQ,EAAE,QAAQ,CAAC;IACnB,aAAa,EAAE,aAAa,CAAC;IAC7B,WAAW,EAAE,WAAW,CAAC;IACzB,YAAY,EAAE,YAAY,CAAC;IAC3B,SAAS,EAAE,SAAS,CAAC;IACrB,cAAc,EAAE,cAAc,CAAC;IAC/B,SAAS,EAAE,YAAY,CAAC;IACxB,QAAQ,EAAE,WAAW,CAAC;CACzB;AAED;;;;GAIG;AACH,qBAAa,kBAAmB,YAAW,WAAW;IAClD,OAAO,CAAC,QAAQ,CAAC,MAAM,CAAiB;IACxC,OAAO,CAAC,QAAQ,CAAC,UAAU,CAAqB;IAChD,OAAO,CAAC,QAAQ,CAAC,OAAO,CAAU;IAClC,OAAO,CAAC,QAAQ,CAAC,QAAQ,CAAW;IACpC,OAAO,CAAC,QAAQ,CAAC,aAAa,CAAgB;IAC9C,OAAO,CAAC,QAAQ,CAAC,WAAW,CAAc;IAC1C,OAAO,CAAC,QAAQ,CAAC,YAAY,CAAe;IAC5C,OAAO,CAAC,QAAQ,CAAC,SAAS,CAAY;IACtC,OAAO,CAAC,QAAQ,CAAC,cAAc,CAAiB;IAChD,OAAO,CAAC,QAAQ,CAAC,SAAS,CAAe;IACzC,OAAO,CAAC,QAAQ,CAAC,QAAQ,CAAc;
|
|
1
|
+
{"version":3,"file":"pipeline.d.ts","sourceRoot":"","sources":["../../src/rag/pipeline.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EACR,aAAa,EACb,WAAW,EACX,YAAY,EACZ,SAAS,EACT,cAAc,EACd,eAAe,EAClB,MAAM,SAAS,CAAC;AAEjB,OAAO,KAAK,EAAE,QAAQ,EAAE,MAAM,uBAAuB,CAAC;AACtD,OAAO,KAAK,EACR,cAAc,EACd,YAAY,EACZ,WAAW,EACd,MAAM,cAAc,CAAC;AACtB,OAAO,KAAK,EACR,OAAO,EACV,MAAM,YAAY,CAAC;AACpB,OAAO,KAAK,EACR,cAAc,EACd,kBAAkB,EACrB,MAAM,aAAa,CAAC;AACrB,OAAO,KAAK,EACR,aAAa,EACb,YAAY,EACZ,WAAW,EACd,MAAM,UAAU,CAAC;AAClB,OAAO,KAAK,EACR,SAAS,EACZ,MAAM,aAAa,CAAC;AAErB;;;GAGG;AACH,MAAM,WAAW,WAAW;IACxB;;OAEG;IACH,MAAM,CAAC,KAAK,EAAE,WAAW,GAAG,OAAO,CAAC,YAAY,CAAC,CAAC;IAElD;;;OAGG;IACH,QAAQ,CAAC,KAAK,EAAE,MAAM,EAAE,OAAO,CAAC,EAAE,eAAe,GAAG,OAAO,CAAC,cAAc,EAAE,CAAC,CAAC;IAE9E;;OAEG;IACH,MAAM,CAAC,KAAK,EAAE,MAAM,EAAE,OAAO,CAAC,EAAE,aAAa,GAAG,OAAO,CAAC,SAAS,CAAC,CAAC;CACtE;AAED,MAAM,WAAW,yBAAyB;IACtC,MAAM,EAAE,cAAc,CAAC;IACvB,UAAU,EAAE,kBAAkB,CAAC;IAC/B,OAAO,EAAE,OAAO,CAAC;IACjB,QAAQ,EAAE,QAAQ,CAAC;IACnB,aAAa,EAAE,aAAa,CAAC;IAC7B,WAAW,EAAE,WAAW,CAAC;IACzB,YAAY,EAAE,YAAY,CAAC;IAC3B,SAAS,EAAE,SAAS,CAAC;IACrB,cAAc,EAAE,cAAc,CAAC;IAC/B,SAAS,EAAE,YAAY,CAAC;IACxB,QAAQ,EAAE,WAAW,CAAC;CACzB;AAED;;;;GAIG;AACH,qBAAa,kBAAmB,YAAW,WAAW;IAClD,OAAO,CAAC,QAAQ,CAAC,MAAM,CAAiB;IACxC,OAAO,CAAC,QAAQ,CAAC,UAAU,CAAqB;IAChD,OAAO,CAAC,QAAQ,CAAC,OAAO,CAAU;IAClC,OAAO,CAAC,QAAQ,CAAC,QAAQ,CAAW;IACpC,OAAO,CAAC,QAAQ,CAAC,aAAa,CAAgB;IAC9C,OAAO,CAAC,QAAQ,CAAC,WAAW,CAAc;IAC1C,OAAO,CAAC,QAAQ,CAAC,YAAY,CAAe;IAC5C,OAAO,CAAC,QAAQ,CAAC,SAAS,CAAY;IACtC,OAAO,CAAC,QAAQ,CAAC,cAAc,CAAiB;IAChD,OAAO,CAAC,QAAQ,CAAC,SAAS,CAAe;IACzC,OAAO,CAAC,QAAQ,CAAC,QAAQ,CAAc;gBAG3B,OAAO,EAAE,yBAAyB;IAoBxC,MAAM,CAAC,KAAK,EAAE,WAAW,GAAG,OAAO,CAAC,YAAY,CAAC;IAoDjD,QAAQ,CACV,KAAK,EAAE,MAAM,EACb,OAAO,CAAC,EAAE,eAAe,GAC1B,OAAO,CAAC,cAAc,EAAE,CAAC;IAItB,MAAM,CAAC,KAAK,EAAE,MAAM,EAAE,OAAO,GAAE,aAAkB,GAAG,OAAO,CAAC,SAAS,CAAC;CAW/E"}
|
package/dist/rag/pipeline.js
CHANGED
|
@@ -19,6 +19,7 @@ class DefaultRagPipeline {
|
|
|
19
19
|
contextBuilder;
|
|
20
20
|
generator;
|
|
21
21
|
verifier;
|
|
22
|
+
// TODO options没传应该要有默认的值
|
|
22
23
|
constructor(options) {
|
|
23
24
|
this.loader = options.loader;
|
|
24
25
|
this.normalizer = options.normalizer;
|
|
@@ -41,24 +42,42 @@ class DefaultRagPipeline {
|
|
|
41
42
|
// 统一换行、裁剪多余空白、移除无效控制字符、清理空 block,并规范 metadata/id/acl 等字段。
|
|
42
43
|
// 这一步不负责解析文件格式,也不重新生成 embedding,只处理文档进入索引前的基础数据卫生。
|
|
43
44
|
const normalizedDocuments = await this.normalizer.normalizeMany(documents);
|
|
44
|
-
const
|
|
45
|
-
|
|
45
|
+
const skippedDocumentIds = [];
|
|
46
|
+
let documentsToIngest = normalizedDocuments;
|
|
46
47
|
if (input.replaceExisting === true) {
|
|
47
|
-
|
|
48
|
-
|
|
49
|
-
await this.
|
|
50
|
-
|
|
51
|
-
|
|
48
|
+
documentsToIngest = [];
|
|
49
|
+
for (const document of normalizedDocuments) {
|
|
50
|
+
const existing = await this.documentStore.getDocument(document.id);
|
|
51
|
+
if (existing !== undefined) {
|
|
52
|
+
// documentId 稳定(不含 checksum),checksum 相同说明内容没变:
|
|
53
|
+
// 直接跳过,不重复 embedding,也不重写任何索引。
|
|
54
|
+
if (existing.metadata.checksum !== undefined
|
|
55
|
+
&& existing.metadata.checksum === document.metadata.checksum) {
|
|
56
|
+
skippedDocumentIds.push(document.id);
|
|
57
|
+
continue;
|
|
58
|
+
}
|
|
59
|
+
// 内容变了:chunk id 由内容哈希派生,upsert 不会覆盖旧 chunk,
|
|
60
|
+
// 且 in-memory 三个 store 之间没有级联删除,必须逐 store 清理旧数据,
|
|
61
|
+
// 否则旧 chunks/vectors/keyword entries 会成为僵尸数据继续被检索到。
|
|
62
|
+
await this.documentStore.deleteDocument(document.id);
|
|
63
|
+
await this.vectorStore.deleteByDocument(document.id);
|
|
64
|
+
await this.keywordStore.deleteByDocument(document.id);
|
|
65
|
+
}
|
|
66
|
+
documentsToIngest.push(document);
|
|
67
|
+
}
|
|
52
68
|
}
|
|
53
|
-
await this.
|
|
69
|
+
const chunks = await this.chunker.chunkMany(documentsToIngest);
|
|
70
|
+
const embeddedChunks = await (0, embedder_1.embedChunks)(this.embedder, chunks);
|
|
71
|
+
await this.documentStore.upsertDocuments(documentsToIngest);
|
|
54
72
|
await this.documentStore.upsertChunks(chunks);
|
|
55
73
|
await this.vectorStore.upsert(embeddedChunks);
|
|
56
74
|
await this.keywordStore.upsert(chunks);
|
|
57
75
|
return {
|
|
58
|
-
documentCount:
|
|
76
|
+
documentCount: documentsToIngest.length,
|
|
59
77
|
chunkCount: chunks.length,
|
|
60
|
-
documentIds:
|
|
78
|
+
documentIds: documentsToIngest.map((document) => document.id),
|
|
61
79
|
chunkIds: chunks.map((chunk) => chunk.id),
|
|
80
|
+
skippedDocumentIds,
|
|
62
81
|
};
|
|
63
82
|
}
|
|
64
83
|
async retrieve(query, options) {
|
|
@@ -66,7 +85,11 @@ class DefaultRagPipeline {
|
|
|
66
85
|
}
|
|
67
86
|
async answer(query, options = {}) {
|
|
68
87
|
const retrieved = await this.retrieve(query, options);
|
|
69
|
-
|
|
88
|
+
// minScore 只在各 retriever 的原始分数尺度(cosine / TF-IDF)上有意义,
|
|
89
|
+
// 融合后的 RRF 分数量级完全不同(~0.016),透传会把结果误伤清空。
|
|
90
|
+
// ContextBuilder 的过滤阈值由独立的 minFusedScore 控制,这里不透传 minScore。
|
|
91
|
+
const { minScore: _minScore, ...contextOptions } = options;
|
|
92
|
+
const context = await this.contextBuilder.build(query, retrieved, contextOptions);
|
|
70
93
|
const answer = await this.generator.generate(query, context, options);
|
|
71
94
|
return await this.verifier.verify(answer, context, options);
|
|
72
95
|
}
|
package/dist/rag/pipeline.js.map
CHANGED
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"pipeline.js","sourceRoot":"","sources":["../../src/rag/pipeline.ts"],"names":[],"mappings":";;;AAQA,oDAAoD;AA2DpD;;;;GAIG;AACH,MAAa,kBAAkB;IACV,MAAM,CAAiB;IACvB,UAAU,CAAqB;IAC/B,OAAO,CAAU;IACjB,QAAQ,CAAW;IACnB,aAAa,CAAgB;IAC7B,WAAW,CAAc;IACzB,YAAY,CAAe;IAC3B,SAAS,CAAY;IACrB,cAAc,CAAiB;IAC/B,SAAS,CAAe;IACxB,QAAQ,CAAc;IAEvC,YAAY,OAAkC;QAC1C,IAAI,CAAC,MAAM,GAAG,OAAO,CAAC,MAAM,CAAC;QAC7B,IAAI,CAAC,UAAU,GAAG,OAAO,CAAC,UAAU,CAAC;QACrC,IAAI,CAAC,OAAO,GAAG,OAAO,CAAC,OAAO,CAAC;QAC/B,IAAI,CAAC,QAAQ,GAAG,OAAO,CAAC,QAAQ,CAAC;QACjC,IAAI,CAAC,aAAa,GAAG,OAAO,CAAC,aAAa,CAAC;QAC3C,IAAI,CAAC,WAAW,GAAG,OAAO,CAAC,WAAW,CAAC;QACvC,IAAI,CAAC,YAAY,GAAG,OAAO,CAAC,YAAY,CAAC;QACzC,IAAI,CAAC,SAAS,GAAG,OAAO,CAAC,SAAS,CAAC;QACnC,IAAI,CAAC,cAAc,GAAG,OAAO,CAAC,cAAc,CAAC;QAC7C,IAAI,CAAC,SAAS,GAAG,OAAO,CAAC,SAAS,CAAC;QACnC,IAAI,CAAC,QAAQ,GAAG,OAAO,CAAC,QAAQ,CAAC;QAEjC,IAAI,IAAI,CAAC,QAAQ,CAAC,UAAU,KAAK,IAAI,CAAC,WAAW,CAAC,UAAU,EAAE,CAAC;YAC3D,MAAM,IAAI,KAAK,CACX,wDAAwD,IAAI,CAAC,QAAQ,CAAC,UAAU,iBAAiB,IAAI,CAAC,WAAW,CAAC,UAAU,GAAG,CAClI,CAAC;QACN,CAAC;IACL,CAAC;IAED,KAAK,CAAC,MAAM,CAAC,KAAkB;QAC3B,MAAM,SAAS,GAAG,MAAM,IAAI,CAAC,MAAM,CAAC,IAAI,CAAC,KAAK,CAAC,CAAC;QAChD,+CAA+C;QAC/C,0DAA0D;QAC1D,mDAAmD;QACnD,MAAM,mBAAmB,GAAG,MAAM,IAAI,CAAC,UAAU,CAAC,aAAa,CAAC,SAAS,CAAC,CAAC;
|
|
1
|
+
{"version":3,"file":"pipeline.js","sourceRoot":"","sources":["../../src/rag/pipeline.ts"],"names":[],"mappings":";;;AAQA,oDAAoD;AA2DpD;;;;GAIG;AACH,MAAa,kBAAkB;IACV,MAAM,CAAiB;IACvB,UAAU,CAAqB;IAC/B,OAAO,CAAU;IACjB,QAAQ,CAAW;IACnB,aAAa,CAAgB;IAC7B,WAAW,CAAc;IACzB,YAAY,CAAe;IAC3B,SAAS,CAAY;IACrB,cAAc,CAAiB;IAC/B,SAAS,CAAe;IACxB,QAAQ,CAAc;IAEvC,yBAAyB;IACzB,YAAY,OAAkC;QAC1C,IAAI,CAAC,MAAM,GAAG,OAAO,CAAC,MAAM,CAAC;QAC7B,IAAI,CAAC,UAAU,GAAG,OAAO,CAAC,UAAU,CAAC;QACrC,IAAI,CAAC,OAAO,GAAG,OAAO,CAAC,OAAO,CAAC;QAC/B,IAAI,CAAC,QAAQ,GAAG,OAAO,CAAC,QAAQ,CAAC;QACjC,IAAI,CAAC,aAAa,GAAG,OAAO,CAAC,aAAa,CAAC;QAC3C,IAAI,CAAC,WAAW,GAAG,OAAO,CAAC,WAAW,CAAC;QACvC,IAAI,CAAC,YAAY,GAAG,OAAO,CAAC,YAAY,CAAC;QACzC,IAAI,CAAC,SAAS,GAAG,OAAO,CAAC,SAAS,CAAC;QACnC,IAAI,CAAC,cAAc,GAAG,OAAO,CAAC,cAAc,CAAC;QAC7C,IAAI,CAAC,SAAS,GAAG,OAAO,CAAC,SAAS,CAAC;QACnC,IAAI,CAAC,QAAQ,GAAG,OAAO,CAAC,QAAQ,CAAC;QAEjC,IAAI,IAAI,CAAC,QAAQ,CAAC,UAAU,KAAK,IAAI,CAAC,WAAW,CAAC,UAAU,EAAE,CAAC;YAC3D,MAAM,IAAI,KAAK,CACX,wDAAwD,IAAI,CAAC,QAAQ,CAAC,UAAU,iBAAiB,IAAI,CAAC,WAAW,CAAC,UAAU,GAAG,CAClI,CAAC;QACN,CAAC;IACL,CAAC;IAED,KAAK,CAAC,MAAM,CAAC,KAAkB;QAC3B,MAAM,SAAS,GAAG,MAAM,IAAI,CAAC,MAAM,CAAC,IAAI,CAAC,KAAK,CAAC,CAAC;QAChD,+CAA+C;QAC/C,0DAA0D;QAC1D,mDAAmD;QACnD,MAAM,mBAAmB,GAAG,MAAM,IAAI,CAAC,UAAU,CAAC,aAAa,CAAC,SAAS,CAAC,CAAC;QAE3E,MAAM,kBAAkB,GAAa,EAAE,CAAC;QACxC,IAAI,iBAAiB,GAAG,mBAAmB,CAAC;QAC5C,IAAI,KAAK,CAAC,eAAe,KAAK,IAAI,EAAE,CAAC;YACjC,iBAAiB,GAAG,EAAE,CAAC;YACvB,KAAK,MAAM,QAAQ,IAAI,mBAAmB,EAAE,CAAC;gBACzC,MAAM,QAAQ,GAAG,MAAM,IAAI,CAAC,aAAa,CAAC,WAAW,CAAC,QAAQ,CAAC,EAAE,CAAC,CAAC;gBACnE,IAAI,QAAQ,KAAK,SAAS,EAAE,CAAC;oBACzB,gDAAgD;oBAChD,+BAA+B;oBAC/B,IACI,QAAQ,CAAC,QAAQ,CAAC,QAAQ,KAAK,SAAS;2BACrC,QAAQ,CAAC,QAAQ,CAAC,QAAQ,KAAK,QAAQ,CAAC,QAAQ,CAAC,QAAQ,EAC9D,CAAC;wBACC,kBAAkB,CAAC,IAAI,CAAC,QAAQ,CAAC,EAAE,CAAC,CAAC;wBACrC,SAAS;oBACb,CAAC;oBAED,4CAA4C;oBAC5C,iDAAiD;oBACjD,oDAAoD;oBACpD,MAAM,IAAI,CAAC,aAAa,CAAC,cAAc,CAAC,QAAQ,CAAC,EAAE,CAAC,CAAC;oBACrD,MAAM,IAAI,CAAC,WAAW,CAAC,gBAAgB,CAAC,QAAQ,CAAC,EAAE,CAAC,CAAC;oBAC
rD,MAAM,IAAI,CAAC,YAAY,CAAC,gBAAgB,CAAC,QAAQ,CAAC,EAAE,CAAC,CAAC;gBAC1D,CAAC;gBACD,iBAAiB,CAAC,IAAI,CAAC,QAAQ,CAAC,CAAC;YACrC,CAAC;QACL,CAAC;QAED,MAAM,MAAM,GAAG,MAAM,IAAI,CAAC,OAAO,CAAC,SAAS,CAAC,iBAAiB,CAAC,CAAC;QAC/D,MAAM,cAAc,GAAG,MAAM,IAAA,sBAAW,EAAC,IAAI,CAAC,QAAQ,EAAE,MAAM,CAAC,CAAC;QAEhE,MAAM,IAAI,CAAC,aAAa,CAAC,eAAe,CAAC,iBAAiB,CAAC,CAAC;QAC5D,MAAM,IAAI,CAAC,aAAa,CAAC,YAAY,CAAC,MAAM,CAAC,CAAC;QAC9C,MAAM,IAAI,CAAC,WAAW,CAAC,MAAM,CAAC,cAAc,CAAC,CAAC;QAC9C,MAAM,IAAI,CAAC,YAAY,CAAC,MAAM,CAAC,MAAM,CAAC,CAAC;QAEvC,OAAO;YACH,aAAa,EAAE,iBAAiB,CAAC,MAAM;YACvC,UAAU,EAAE,MAAM,CAAC,MAAM;YACzB,WAAW,EAAE,iBAAiB,CAAC,GAAG,CAAC,CAAC,QAAQ,EAAE,EAAE,CAAC,QAAQ,CAAC,EAAE,CAAC;YAC7D,QAAQ,EAAE,MAAM,CAAC,GAAG,CAAC,CAAC,KAAK,EAAE,EAAE,CAAC,KAAK,CAAC,EAAE,CAAC;YACzC,kBAAkB;SACrB,CAAC;IACN,CAAC;IAED,KAAK,CAAC,QAAQ,CACV,KAAa,EACb,OAAyB;QAEzB,OAAO,MAAM,IAAI,CAAC,SAAS,CAAC,QAAQ,CAAC,KAAK,EAAE,OAAO,CAAC,CAAC;IACzD,CAAC;IAED,KAAK,CAAC,MAAM,CAAC,KAAa,EAAE,UAAyB,EAAE;QACnD,MAAM,SAAS,GAAG,MAAM,IAAI,CAAC,QAAQ,CAAC,KAAK,EAAE,OAAO,CAAC,CAAC;QACtD,uDAAuD;QACvD,wCAAwC;QACxC,4DAA4D;QAC5D,MAAM,EAAE,QAAQ,EAAE,SAAS,EAAE,GAAG,cAAc,EAAE,GAAG,OAAO,CAAC;QAC3D,MAAM,OAAO,GAAG,MAAM,IAAI,CAAC,cAAc,CAAC,KAAK,CAAC,KAAK,EAAE,SAAS,EAAE,cAAc,CAAC,CAAC;QAClF,MAAM,MAAM,GAAG,MAAM,IAAI,CAAC,SAAS,CAAC,QAAQ,CAAC,KAAK,EAAE,OAAO,EAAE,OAAO,CAAC,CAAC;QAEtE,OAAO,MAAM,IAAI,CAAC,QAAQ,CAAC,MAAM,CAAC,MAAM,EAAE,OAAO,EAAE,OAAO,CAAC,CAAC;IAChE,CAAC;CACJ;AAxGD,gDAwGC"}
|
|
@@ -3,6 +3,7 @@ export * from './dense-retriever';
|
|
|
3
3
|
export * from './fusion';
|
|
4
4
|
export * from './hybrid-retriever';
|
|
5
5
|
export * from './http-rerank-model-client';
|
|
6
|
+
export * from './parent-child-expanding-retriever';
|
|
6
7
|
export * from './reranker';
|
|
7
8
|
export * from './sparse-retriever';
|
|
8
9
|
//# sourceMappingURL=index.d.ts.map
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../../../src/rag/retrieval/index.ts"],"names":[],"mappings":"AAAA,cAAc,SAAS,CAAC;AACxB,cAAc,mBAAmB,CAAC;AAClC,cAAc,UAAU,CAAC;AACzB,cAAc,oBAAoB,CAAC;AACnC,cAAc,4BAA4B,CAAC;AAC3C,cAAc,YAAY,CAAC;AAC3B,cAAc,oBAAoB,CAAC"}
|
|
1
|
+
{"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../../../src/rag/retrieval/index.ts"],"names":[],"mappings":"AAAA,cAAc,SAAS,CAAC;AACxB,cAAc,mBAAmB,CAAC;AAClC,cAAc,UAAU,CAAC;AACzB,cAAc,oBAAoB,CAAC;AACnC,cAAc,4BAA4B,CAAC;AAC3C,cAAc,oCAAoC,CAAC;AACnD,cAAc,YAAY,CAAC;AAC3B,cAAc,oBAAoB,CAAC"}
|
|
@@ -19,6 +19,7 @@ __exportStar(require("./dense-retriever"), exports);
|
|
|
19
19
|
__exportStar(require("./fusion"), exports);
|
|
20
20
|
__exportStar(require("./hybrid-retriever"), exports);
|
|
21
21
|
__exportStar(require("./http-rerank-model-client"), exports);
|
|
22
|
+
__exportStar(require("./parent-child-expanding-retriever"), exports);
|
|
22
23
|
__exportStar(require("./reranker"), exports);
|
|
23
24
|
__exportStar(require("./sparse-retriever"), exports);
|
|
24
25
|
//# sourceMappingURL=index.js.map
|