@vivantel/rag-core 1.1.3 → 2.0.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/bin/rag-update.d.ts +3 -0
- package/dist/bin/rag-update.d.ts.map +1 -0
- package/dist/bin/rag-update.js +116 -0
- package/dist/bin/rag-update.js.map +1 -0
- package/dist/cli/init.d.ts +2 -0
- package/dist/cli/init.d.ts.map +1 -0
- package/dist/cli/init.js +262 -0
- package/dist/cli/init.js.map +1 -0
- package/dist/cli/validate.d.ts +2 -0
- package/dist/cli/validate.d.ts.map +1 -0
- package/dist/cli/validate.js +54 -0
- package/dist/cli/validate.js.map +1 -0
- package/dist/config-loader.d.ts.map +1 -1
- package/dist/config-loader.js +73 -5
- package/dist/config-loader.js.map +1 -1
- package/dist/core/chunk-processor.d.ts +1 -1
- package/dist/core/chunk-processor.d.ts.map +1 -1
- package/dist/core/chunk-processor.js +23 -1
- package/dist/core/chunk-processor.js.map +1 -1
- package/dist/core/embedder.d.ts +5 -1
- package/dist/core/embedder.d.ts.map +1 -1
- package/dist/core/embedder.js +33 -29
- package/dist/core/embedder.js.map +1 -1
- package/dist/core/errors.d.ts +16 -0
- package/dist/core/errors.d.ts.map +1 -0
- package/dist/core/errors.js +17 -0
- package/dist/core/errors.js.map +1 -0
- package/dist/core/orchestrator.d.ts +8 -0
- package/dist/core/orchestrator.d.ts.map +1 -1
- package/dist/core/orchestrator.js +134 -39
- package/dist/core/orchestrator.js.map +1 -1
- package/dist/core/plugin-discovery.d.ts +19 -0
- package/dist/core/plugin-discovery.d.ts.map +1 -0
- package/dist/core/plugin-discovery.js +47 -0
- package/dist/core/plugin-discovery.js.map +1 -0
- package/dist/core/telemetry.d.ts +61 -0
- package/dist/core/telemetry.d.ts.map +1 -0
- package/dist/core/telemetry.js +50 -0
- package/dist/core/telemetry.js.map +1 -0
- package/dist/core/uploader.d.ts +5 -1
- package/dist/core/uploader.d.ts.map +1 -1
- package/dist/core/uploader.js +11 -4
- package/dist/core/uploader.js.map +1 -1
- package/dist/core/utils.d.ts +7 -0
- package/dist/core/utils.d.ts.map +1 -1
- package/dist/core/utils.js +35 -0
- package/dist/core/utils.js.map +1 -1
- package/dist/index.d.ts +14 -1
- package/dist/index.d.ts.map +1 -1
- package/dist/index.js +14 -2
- package/dist/index.js.map +1 -1
- package/dist/interfaces/embedder.d.ts +2 -0
- package/dist/interfaces/embedder.d.ts.map +1 -1
- package/dist/interfaces/vector-store.d.ts +2 -0
- package/dist/interfaces/vector-store.d.ts.map +1 -1
- package/package.json +8 -2
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"chunk-processor.js","sourceRoot":"","sources":["../../src/core/chunk-processor.ts"],"names":[],"mappings":"AACA,OAAO,EAAE,UAAU,EAAE,MAAM,QAAQ,CAAC;AAEpC,SAAS,kBAAkB,CAAC,OAAe;IACzC,OAAO,UAAU,CAAC,QAAQ,CAAC,CAAC,MAAM,CAAC,OAAO,CAAC,CAAC,MAAM,CAAC,KAAK,CAAC,CAAC,KAAK,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC;AACzE,CAAC;AAED,MAAM,OAAO,cAAc;IACjB,QAAQ,CAA2B;IAE3C,YAAY,QAAuB;QACjC,IAAI,CAAC,QAAQ,GAAG,IAAI,GAAG,CAAC,QAAQ,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,CAAC,IAAI,EAAE,CAAC,CAAC,CAAC,CAAC,CAAC;IAC5D,CAAC;IAED,KAAK,CAAC,WAAW,CACf,QAAgB,EAChB,UAAkB,EAClB,OAAoB;QAEpB,MAAM,MAAM,GAAG,MAAM,OAAO,CAAC,KAAK,CAAC,QAAQ,EAAE,UAAU,CAAC,CAAC;QAEzD,KAAK,MAAM,KAAK,IAAI,MAAM,EAAE,CAAC;YAC3B,KAAK,CAAC,WAAW,GAAG,kBAAkB,CAAC,KAAK,CAAC,OAAO,CAAC,CAAC;YACtD,KAAK,CAAC,UAAU,GAAG,QAAQ,CAAC;YAC5B,KAAK,CAAC,UAAU,GAAG,UAAU,CAAC;QAChC,CAAC;QAED,OAAO,MAAM,CAAC;IAChB,CAAC;IAED,KAAK,CAAC,YAAY,CAChB,KAAe,EACf,SAAoE;
|
|
1
|
+
{"version":3,"file":"chunk-processor.js","sourceRoot":"","sources":["../../src/core/chunk-processor.ts"],"names":[],"mappings":"AACA,OAAO,EAAE,UAAU,EAAE,MAAM,QAAQ,CAAC;AAEpC,SAAS,kBAAkB,CAAC,OAAe;IACzC,OAAO,UAAU,CAAC,QAAQ,CAAC,CAAC,MAAM,CAAC,OAAO,CAAC,CAAC,MAAM,CAAC,KAAK,CAAC,CAAC,KAAK,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC;AACzE,CAAC;AAED,MAAM,OAAO,cAAc;IACjB,QAAQ,CAA2B;IAE3C,YAAY,QAAuB;QACjC,IAAI,CAAC,QAAQ,GAAG,IAAI,GAAG,CAAC,QAAQ,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,CAAC,IAAI,EAAE,CAAC,CAAC,CAAC,CAAC,CAAC;IAC5D,CAAC;IAED,KAAK,CAAC,WAAW,CACf,QAAgB,EAChB,UAAkB,EAClB,OAAoB;QAEpB,MAAM,MAAM,GAAG,MAAM,OAAO,CAAC,KAAK,CAAC,QAAQ,EAAE,UAAU,CAAC,CAAC;QAEzD,KAAK,MAAM,KAAK,IAAI,MAAM,EAAE,CAAC;YAC3B,KAAK,CAAC,WAAW,GAAG,kBAAkB,CAAC,KAAK,CAAC,OAAO,CAAC,CAAC;YACtD,KAAK,CAAC,UAAU,GAAG,QAAQ,CAAC;YAC5B,KAAK,CAAC,UAAU,GAAG,UAAU,CAAC;QAChC,CAAC;QAED,OAAO,MAAM,CAAC;IAChB,CAAC;IAED,KAAK,CAAC,YAAY,CAChB,KAAe,EACf,SAAoE,EACpE,iBAA0B,EAAE;QAE5B,MAAM,SAAS,GAAY,EAAE,CAAC;QAC9B,IAAI,UAAU,GAAG,CAAC,CAAC;QAEnB,0DAA0D;QAC1D,MAAM,WAAW,GAAG,IAAI,GAAG,EAGxB,CAAC;QACJ,KAAK,MAAM,KAAK,IAAI,cAAc,EAAE,CAAC;YACnC,MAAM,KAAK,GAAG,WAAW,CAAC,GAAG,CAAC,KAAK,CAAC,UAAU,CAAC,CAAC;YAChD,IAAI,CAAC,KAAK,EAAE,CAAC;gBACX,WAAW,CAAC,GAAG,CAAC,KAAK,CAAC,UAAU,EAAE;oBAChC,UAAU,EAAE,KAAK,CAAC,UAAU;oBAC5B,MAAM,EAAE,CAAC,KAAK,CAAC;iBAChB,CAAC,CAAC;YACL,CAAC;iBAAM,CAAC;gBACN,KAAK,CAAC,MAAM,CAAC,IAAI,CAAC,KAAK,CAAC,CAAC;YAC3B,CAAC;QACH,CAAC;QAED,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,GAAG,KAAK,CAAC,MAAM,EAAE,CAAC,EAAE,EAAE,CAAC;YACtC,MAAM,QAAQ,GAAG,KAAK,CAAC,CAAC,CAAC,CAAC;YAC1B,MAAM,IAAI,GAAG,SAAS,CAAC,GAAG,CAAC,QAAQ,CAAC,CAAC;YAErC,IAAI,CAAC,IAAI,EAAE,CAAC;gBACV,OAAO,CAAC,GAAG,CAAC,wBAAwB,QAAQ,EAAE,CAAC,CAAC;gBAChD,SAAS;YACX,CAAC;YAED,sDAAsD;YACtD,MAAM,MAAM,GAAG,WAAW,CAAC,GAAG,CAAC,QAAQ,CAAC,CAAC;YACzC,IAAI,MAAM,IAAI,MAAM,CAAC,UAAU,KAAK,IAAI,CAAC,UAAU,EAAE,CAAC;gBACpD,OAAO,CAAC,GAAG,CAAC,MAAM,CAAC,GAAG,CAAC,IAAI,KAAK,CAAC,MAAM,KAAK,QAAQ,EAAE,CAAC,CAAC;gBACxD,OAAO,CAAC,GAAG,CAAC,mBAAmB,MAAM,CAAC,MAAM,CAAC,MAAM,YAAY,CAAC,CAAC;
gBACjE,SAAS,CAAC,IAAI,CAAC,GAAG,MAAM,CAAC,MAAM,CAAC,CAAC;gBACjC,SAAS;YACX,CAAC;YAED,OAAO,CAAC,GAAG,CAAC,MAAM,CAAC,GAAG,CAAC,IAAI,KAAK,CAAC,MAAM,KAAK,QAAQ,EAAE,CAAC,CAAC;YAExD,IAAI,CAAC;gBACH,MAAM,MAAM,GAAG,MAAM,IAAI,CAAC,WAAW,CACnC,QAAQ,EACR,IAAI,CAAC,UAAU,EACf,IAAI,CAAC,OAAO,CACb,CAAC;gBAEF,IAAI,MAAM,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;oBACtB,SAAS,CAAC,IAAI,CAAC,GAAG,MAAM,CAAC,CAAC;oBAC1B,OAAO,CAAC,GAAG,CAAC,mBAAmB,MAAM,CAAC,MAAM,WAAW,CAAC,CAAC;gBAC3D,CAAC;qBAAM,CAAC;oBACN,OAAO,CAAC,GAAG,CAAC,sCAAsC,CAAC,CAAC;gBACtD,CAAC;YACH,CAAC;YAAC,OAAO,KAAK,EAAE,CAAC;gBACf,UAAU,EAAE,CAAC;gBACb,OAAO,CAAC,KAAK,CAAC,0BAA0B,QAAQ,KAAK,KAAK,EAAE,CAAC,CAAC;YAChE,CAAC;QACH,CAAC;QAED,IAAI,UAAU,GAAG,CAAC,EAAE,CAAC;YACnB,OAAO,CAAC,IAAI,CAAC,QAAQ,UAAU,kCAAkC,CAAC,CAAC;QACrE,CAAC;QAED,OAAO,SAAS,CAAC;IACnB,CAAC;IAED,KAAK,CAAC,eAAe,CAAC,MAAe,EAAE,UAAkB;QACvD,MAAM,EAAE,OAAO,EAAE,GAAG,MAAM,MAAM,CAAC,MAAM,CAAC,CAAC;QACzC,MAAM,EAAE,KAAK,EAAE,SAAS,EAAE,QAAQ,EAAE,GAAG,MAAM,MAAM,CAAC,aAAa,CAAC,CAAC;QAEnE,MAAM,KAAK,CAAC,OAAO,CAAC,UAAU,CAAC,EAAE,EAAE,SAAS,EAAE,IAAI,EAAE,CAAC,CAAC;QAEtD,IAAI,QAAQ,GAAY,EAAE,CAAC;QAC3B,IAAI,CAAC;YACH,MAAM,OAAO,GAAG,MAAM,QAAQ,CAAC,UAAU,EAAE,OAAO,CAAC,CAAC;YACpD,MAAM,MAAM,GAAY,IAAI,CAAC,KAAK,CAAC,OAAO,CAAC,CAAC;YAC5C,IAAI,KAAK,CAAC,OAAO,CAAC,MAAM,CAAC,EAAE,CAAC;gBAC1B,QAAQ,GAAG,MAAiB,CAAC;YAC/B,CAAC;QACH,CAAC;QAAC,MAAM,CAAC;YACP,wDAAwD;QAC1D,CAAC;QAED,MAAM,cAAc,GAAG,IAAI,GAAG,CAAC,MAAM,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,UAAU,CAAC,CAAC,CAAC;QAChE,MAAM,QAAQ,GAAG,QAAQ,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,cAAc,CAAC,GAAG,CAAC,CAAC,CAAC,UAAU,CAAC,CAAC,CAAC;QAE3E,MAAM,SAAS,GAAG,CAAC,GAAG,QAAQ,EAAE,GAAG,MAAM,CAAC,CAAC;QAE3C,MAAM,SAAS,CAAC,UAAU,EAAE,IAAI,CAAC,SAAS,CAAC,SAAS,EAAE,IAAI,EAAE,CAAC,CAAC,CAAC,CAAC;QAChE,OAAO,CAAC,GAAG,CAAC,cAAc,SAAS,CAAC,MAAM,cAAc,UAAU,EAAE,CAAC,CAAC;IACxE,CAAC;CACF"}
|
package/dist/core/embedder.d.ts
CHANGED
|
@@ -1,13 +1,17 @@
|
|
|
1
1
|
import { EmbeddingProvider, EmbeddedChunk, Chunk } from "../interfaces/index.js";
|
|
2
|
+
import { RetryOptions } from "./utils.js";
|
|
2
3
|
export declare class EmbedderProcessor {
|
|
3
4
|
private provider;
|
|
4
5
|
private rateLimitMs;
|
|
5
6
|
private batchSize;
|
|
7
|
+
private retryOptions;
|
|
8
|
+
private concurrency;
|
|
6
9
|
constructor(provider: EmbeddingProvider, options?: {
|
|
7
10
|
rateLimitMs?: number;
|
|
8
11
|
batchSize?: number;
|
|
12
|
+
retry?: RetryOptions;
|
|
13
|
+
concurrency?: number;
|
|
9
14
|
});
|
|
10
|
-
private sleep;
|
|
11
15
|
embedChunk(chunk: Chunk): Promise<EmbeddedChunk>;
|
|
12
16
|
embedBatch(chunks: Chunk[]): Promise<EmbeddedChunk[]>;
|
|
13
17
|
getChunksToEmbed(chunksFile: string, force?: boolean): Promise<{
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"embedder.d.ts","sourceRoot":"","sources":["../../src/core/embedder.ts"],"names":[],"mappings":"AAAA,OAAO,EACL,iBAAiB,EACjB,aAAa,EACb,KAAK,EACN,MAAM,wBAAwB,CAAC;
|
|
1
|
+
{"version":3,"file":"embedder.d.ts","sourceRoot":"","sources":["../../src/core/embedder.ts"],"names":[],"mappings":"AAAA,OAAO,EACL,iBAAiB,EACjB,aAAa,EACb,KAAK,EACN,MAAM,wBAAwB,CAAC;AAKhC,OAAO,EAAqC,YAAY,EAAE,MAAM,YAAY,CAAC;AAO7E,qBAAa,iBAAiB;IAC5B,OAAO,CAAC,QAAQ,CAAoB;IACpC,OAAO,CAAC,WAAW,CAAS;IAC5B,OAAO,CAAC,SAAS,CAAS;IAC1B,OAAO,CAAC,YAAY,CAAe;IACnC,OAAO,CAAC,WAAW,CAAS;gBAG1B,QAAQ,EAAE,iBAAiB,EAC3B,OAAO,GAAE;QACP,WAAW,CAAC,EAAE,MAAM,CAAC;QACrB,SAAS,CAAC,EAAE,MAAM,CAAC;QACnB,KAAK,CAAC,EAAE,YAAY,CAAC;QACrB,WAAW,CAAC,EAAE,MAAM,CAAC;KACjB;IASF,UAAU,CAAC,KAAK,EAAE,KAAK,GAAG,OAAO,CAAC,aAAa,CAAC;IAahD,UAAU,CAAC,MAAM,EAAE,KAAK,EAAE,GAAG,OAAO,CAAC,aAAa,EAAE,CAAC;IA+CrD,gBAAgB,CACpB,UAAU,EAAE,MAAM,EAClB,KAAK,GAAE,OAAe,GACrB,OAAO,CAAC;QACT,aAAa,EAAE,KAAK,EAAE,CAAC;KACxB,CAAC;IAuDI,cAAc,CAClB,aAAa,EAAE,aAAa,EAAE,EAC9B,UAAU,EAAE,MAAM,EAClB,KAAK,GAAE,OAAe,GACrB,OAAO,CAAC,IAAI,CAAC;IAoCV,GAAG,CACP,UAAU,EAAE,MAAM,EAClB,KAAK,GAAE,OAAe,GACrB,OAAO,CAAC,aAAa,EAAE,CAAC;CAiB5B"}
|
package/dist/core/embedder.js
CHANGED
|
@@ -1,6 +1,8 @@
|
|
|
1
1
|
import { readFile, writeFile, mkdir } from "fs/promises";
|
|
2
2
|
import { dirname } from "path";
|
|
3
3
|
import { createHash } from "crypto";
|
|
4
|
+
import { EmbedError } from "./errors.js";
|
|
5
|
+
import { sleep, withRetry, withConcurrency } from "./utils.js";
|
|
4
6
|
function chunkContentHash(chunk) {
|
|
5
7
|
if (chunk.contentHash)
|
|
6
8
|
return chunk.contentHash;
|
|
@@ -10,16 +12,17 @@ export class EmbedderProcessor {
|
|
|
10
12
|
provider;
|
|
11
13
|
rateLimitMs;
|
|
12
14
|
batchSize;
|
|
15
|
+
retryOptions;
|
|
16
|
+
concurrency;
|
|
13
17
|
constructor(provider, options = {}) {
|
|
14
18
|
this.provider = provider;
|
|
15
19
|
this.rateLimitMs = options.rateLimitMs ?? 500;
|
|
16
20
|
this.batchSize = options.batchSize ?? 10;
|
|
17
|
-
|
|
18
|
-
|
|
19
|
-
return new Promise((resolve) => setTimeout(resolve, ms));
|
|
21
|
+
this.retryOptions = options.retry ?? {};
|
|
22
|
+
this.concurrency = options.concurrency ?? 1;
|
|
20
23
|
}
|
|
21
24
|
async embedChunk(chunk) {
|
|
22
|
-
const embedding = await this.provider.embed(chunk.content);
|
|
25
|
+
const embedding = await withRetry(() => this.provider.embed(chunk.content), this.retryOptions);
|
|
23
26
|
return {
|
|
24
27
|
...chunk,
|
|
25
28
|
embedding,
|
|
@@ -27,37 +30,35 @@ export class EmbedderProcessor {
|
|
|
27
30
|
};
|
|
28
31
|
}
|
|
29
32
|
async embedBatch(chunks) {
|
|
30
|
-
const results = [];
|
|
31
33
|
if (this.provider.embedBatch && chunks.length >= this.batchSize) {
|
|
32
34
|
const texts = chunks.map((c) => c.content);
|
|
33
|
-
const embeddings = await this.provider.embedBatch(texts);
|
|
35
|
+
const embeddings = await withRetry(() => this.provider.embedBatch(texts), this.retryOptions);
|
|
34
36
|
if (embeddings.length !== chunks.length) {
|
|
35
|
-
throw new
|
|
36
|
-
|
|
37
|
-
for (let i = 0; i < chunks.length; i++) {
|
|
38
|
-
results.push({
|
|
39
|
-
...chunks[i],
|
|
40
|
-
embedding: embeddings[i],
|
|
41
|
-
embeddedAt: Date.now() / 1000,
|
|
37
|
+
throw new EmbedError(`embedBatch returned ${embeddings.length} embeddings for ${chunks.length} chunks`, {
|
|
38
|
+
suggestion: "Check that your EmbeddingProvider.embedBatch() returns one vector per input text.",
|
|
42
39
|
});
|
|
43
40
|
}
|
|
41
|
+
return chunks.map((chunk, i) => ({
|
|
42
|
+
...chunk,
|
|
43
|
+
embedding: embeddings[i],
|
|
44
|
+
embeddedAt: Date.now() / 1000,
|
|
45
|
+
}));
|
|
44
46
|
}
|
|
45
|
-
|
|
46
|
-
|
|
47
|
-
|
|
48
|
-
|
|
49
|
-
|
|
50
|
-
|
|
51
|
-
|
|
52
|
-
|
|
53
|
-
|
|
54
|
-
|
|
55
|
-
|
|
56
|
-
await this.sleep(this.rateLimitMs);
|
|
57
|
-
}
|
|
47
|
+
let completed = 0;
|
|
48
|
+
const tasks = chunks.map((chunk) => async () => {
|
|
49
|
+
const label = chunk.metadata.event_type ||
|
|
50
|
+
chunk.metadata.title ||
|
|
51
|
+
chunk.sourceFile.split("/").pop() ||
|
|
52
|
+
"unknown";
|
|
53
|
+
const embedded = await this.embedChunk(chunk);
|
|
54
|
+
completed++;
|
|
55
|
+
console.log(` [${completed}/${chunks.length}] ${label}`);
|
|
56
|
+
if (this.rateLimitMs > 0) {
|
|
57
|
+
await sleep(this.rateLimitMs);
|
|
58
58
|
}
|
|
59
|
-
|
|
60
|
-
|
|
59
|
+
return embedded;
|
|
60
|
+
});
|
|
61
|
+
return withConcurrency(tasks, this.concurrency);
|
|
61
62
|
}
|
|
62
63
|
async getChunksToEmbed(chunksFile, force = false) {
|
|
63
64
|
let chunks;
|
|
@@ -70,7 +71,10 @@ export class EmbedderProcessor {
|
|
|
70
71
|
chunks = parsed;
|
|
71
72
|
}
|
|
72
73
|
catch (err) {
|
|
73
|
-
throw new
|
|
74
|
+
throw new EmbedError(`Failed to load chunks from ${chunksFile}: ${err instanceof Error ? err.message : String(err)}`, {
|
|
75
|
+
suggestion: "Run the pipeline without --skip-upload to regenerate chunks first.",
|
|
76
|
+
cause: err,
|
|
77
|
+
});
|
|
74
78
|
}
|
|
75
79
|
console.log(`📖 Loaded ${chunks.length} chunks from ${chunksFile}`);
|
|
76
80
|
if (force) {
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"embedder.js","sourceRoot":"","sources":["../../src/core/embedder.ts"],"names":[],"mappings":"AAKA,OAAO,EAAE,QAAQ,EAAE,SAAS,EAAE,KAAK,EAAE,MAAM,aAAa,CAAC;AACzD,OAAO,EAAE,OAAO,EAAE,MAAM,MAAM,CAAC;AAC/B,OAAO,EAAE,UAAU,EAAE,MAAM,QAAQ,CAAC;
|
|
1
|
+
{"version":3,"file":"embedder.js","sourceRoot":"","sources":["../../src/core/embedder.ts"],"names":[],"mappings":"AAKA,OAAO,EAAE,QAAQ,EAAE,SAAS,EAAE,KAAK,EAAE,MAAM,aAAa,CAAC;AACzD,OAAO,EAAE,OAAO,EAAE,MAAM,MAAM,CAAC;AAC/B,OAAO,EAAE,UAAU,EAAE,MAAM,QAAQ,CAAC;AACpC,OAAO,EAAE,UAAU,EAAE,MAAM,aAAa,CAAC;AACzC,OAAO,EAAE,KAAK,EAAE,SAAS,EAAE,eAAe,EAAgB,MAAM,YAAY,CAAC;AAE7E,SAAS,gBAAgB,CAAC,KAAY;IACpC,IAAI,KAAK,CAAC,WAAW;QAAE,OAAO,KAAK,CAAC,WAAW,CAAC;IAChD,OAAO,UAAU,CAAC,QAAQ,CAAC,CAAC,MAAM,CAAC,KAAK,CAAC,OAAO,CAAC,CAAC,MAAM,CAAC,KAAK,CAAC,CAAC,KAAK,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC;AAC/E,CAAC;AAED,MAAM,OAAO,iBAAiB;IACpB,QAAQ,CAAoB;IAC5B,WAAW,CAAS;IACpB,SAAS,CAAS;IAClB,YAAY,CAAe;IAC3B,WAAW,CAAS;IAE5B,YACE,QAA2B,EAC3B,UAKI,EAAE;QAEN,IAAI,CAAC,QAAQ,GAAG,QAAQ,CAAC;QACzB,IAAI,CAAC,WAAW,GAAG,OAAO,CAAC,WAAW,IAAI,GAAG,CAAC;QAC9C,IAAI,CAAC,SAAS,GAAG,OAAO,CAAC,SAAS,IAAI,EAAE,CAAC;QACzC,IAAI,CAAC,YAAY,GAAG,OAAO,CAAC,KAAK,IAAI,EAAE,CAAC;QACxC,IAAI,CAAC,WAAW,GAAG,OAAO,CAAC,WAAW,IAAI,CAAC,CAAC;IAC9C,CAAC;IAED,KAAK,CAAC,UAAU,CAAC,KAAY;QAC3B,MAAM,SAAS,GAAG,MAAM,SAAS,CAC/B,GAAG,EAAE,CAAC,IAAI,CAAC,QAAQ,CAAC,KAAK,CAAC,KAAK,CAAC,OAAO,CAAC,EACxC,IAAI,CAAC,YAAY,CAClB,CAAC;QAEF,OAAO;YACL,GAAG,KAAK;YACR,SAAS;YACT,UAAU,EAAE,IAAI,CAAC,GAAG,EAAE,GAAG,IAAI;SAC9B,CAAC;IACJ,CAAC;IAED,KAAK,CAAC,UAAU,CAAC,MAAe;QAC9B,IAAI,IAAI,CAAC,QAAQ,CAAC,UAAU,IAAI,MAAM,CAAC,MAAM,IAAI,IAAI,CAAC,SAAS,EAAE,CAAC;YAChE,MAAM,KAAK,GAAG,MAAM,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,OAAO,CAAC,CAAC;YAC3C,MAAM,UAAU,GAAG,MAAM,SAAS,CAChC,GAAG,EAAE,CAAC,IAAI,CAAC,QAAQ,CAAC,UAAW,CAAC,KAAK,CAAC,EACtC,IAAI,CAAC,YAAY,CAClB,CAAC;YAEF,IAAI,UAAU,CAAC,MAAM,KAAK,MAAM,CAAC,MAAM,EAAE,CAAC;gBACxC,MAAM,IAAI,UAAU,CAClB,uBAAuB,UAAU,CAAC,MAAM,mBAAmB,MAAM,CAAC,MAAM,SAAS,EACjF;oBACE,UAAU,EACR,mFAAmF;iBACtF,CACF,CAAC;YACJ,CAAC;YAED,OAAO,MAAM,CAAC,GAAG,CAAC,CAAC,KAAK,EAAE,CAAC,EAAE,EAAE,CAAC,CAAC;gBAC/B,GAAG,KAAK;gBACR,SAAS,EAAE,UAAU,CAAC,CAAC,CAAC;gBACxB,UAAU,EAAE,IAAI,CAAC,GAAG,EAAE,GAAG,IAAI;aAC9B,CAAC,CAAC,CAAC;QACN,CAAC;QAED,IAAI,SAAS,GAAG,CAAC
,CAAC;QAClB,MAAM,KAAK,GAAG,MAAM,CAAC,GAAG,CAAC,CAAC,KAAK,EAAE,EAAE,CAAC,KAAK,IAA4B,EAAE;YACrE,MAAM,KAAK,GACR,KAAK,CAAC,QAAQ,CAAC,UAAqB;gBACpC,KAAK,CAAC,QAAQ,CAAC,KAAgB;gBAChC,KAAK,CAAC,UAAU,CAAC,KAAK,CAAC,GAAG,CAAC,CAAC,GAAG,EAAE;gBACjC,SAAS,CAAC;YAEZ,MAAM,QAAQ,GAAG,MAAM,IAAI,CAAC,UAAU,CAAC,KAAK,CAAC,CAAC;YAC9C,SAAS,EAAE,CAAC;YACZ,OAAO,CAAC,GAAG,CAAC,MAAM,SAAS,IAAI,MAAM,CAAC,MAAM,KAAK,KAAK,EAAE,CAAC,CAAC;YAE1D,IAAI,IAAI,CAAC,WAAW,GAAG,CAAC,EAAE,CAAC;gBACzB,MAAM,KAAK,CAAC,IAAI,CAAC,WAAW,CAAC,CAAC;YAChC,CAAC;YAED,OAAO,QAAQ,CAAC;QAClB,CAAC,CAAC,CAAC;QAEH,OAAO,eAAe,CAAC,KAAK,EAAE,IAAI,CAAC,WAAW,CAAC,CAAC;IAClD,CAAC;IAED,KAAK,CAAC,gBAAgB,CACpB,UAAkB,EAClB,QAAiB,KAAK;QAItB,IAAI,MAAe,CAAC;QACpB,IAAI,CAAC;YACH,MAAM,OAAO,GAAG,MAAM,QAAQ,CAAC,UAAU,EAAE,OAAO,CAAC,CAAC;YACpD,MAAM,MAAM,GAAY,IAAI,CAAC,KAAK,CAAC,OAAO,CAAC,CAAC;YAC5C,IAAI,CAAC,KAAK,CAAC,OAAO,CAAC,MAAM,CAAC,EAAE,CAAC;gBAC3B,MAAM,IAAI,KAAK,CAAC,2CAA2C,CAAC,CAAC;YAC/D,CAAC;YACD,MAAM,GAAG,MAAiB,CAAC;QAC7B,CAAC;QAAC,OAAO,GAAG,EAAE,CAAC;YACb,MAAM,IAAI,UAAU,CAClB,8BAA8B,UAAU,KAAK,GAAG,YAAY,KAAK,CAAC,CAAC,CAAC,GAAG,CAAC,OAAO,CAAC,CAAC,CAAC,MAAM,CAAC,GAAG,CAAC,EAAE,EAC/F;gBACE,UAAU,EACR,oEAAoE;gBACtE,KAAK,EAAE,GAAG;aACX,CACF,CAAC;QACJ,CAAC;QAED,OAAO,CAAC,GAAG,CAAC,aAAa,MAAM,CAAC,MAAM,gBAAgB,UAAU,EAAE,CAAC,CAAC;QAEpE,IAAI,KAAK,EAAE,CAAC;YACV,OAAO,CAAC,GAAG,CAAC,uCAAuC,CAAC,CAAC;YACrD,OAAO,EAAE,aAAa,EAAE,MAAM,EAAE,CAAC;QACnC,CAAC;QAED,IAAI,kBAAkB,GAAoB,EAAE,CAAC;QAC7C,MAAM,cAAc,GAAG,UAAU,CAAC,OAAO,CAAC,QAAQ,EAAE,YAAY,CAAC,CAAC;QAClE,IAAI,CAAC;YACH,MAAM,OAAO,GAAG,MAAM,QAAQ,CAAC,cAAc,EAAE,OAAO,CAAC,CAAC;YACxD,kBAAkB,GAAG,IAAI,CAAC,KAAK,CAAC,OAAO,CAAC,CAAC;QAC3C,CAAC;QAAC,MAAM,CAAC;YACP,yBAAyB;QAC3B,CAAC;QAED,MAAM,aAAa,GAAG,IAAI,GAAG,EAAyB,CAAC;QACvD,KAAK,MAAM,GAAG,IAAI,kBAAkB,EAAE,CAAC;YACrC,MAAM,IAAI,GAAG,GAAG,CAAC,WAAW,IAAI,gBAAgB,CAAC,GAAG,CAAC,CAAC;YACtD,aAAa,CAAC,GAAG,CAAC,IAAI,EAAE,GAAG,CAAC,CAAC;QAC/B,CAAC;QAED,OAAO,CAAC,GAAG,CAAC,2BAA2B,aAAa,CAAC,IAAI,SAAS,CAAC,CAAC;QAEpE,MAAM,aAAa,GAAY,EAAE,CAAC;QAClC,KAAK,MAAM,KAAK,IAA
I,MAAM,EAAE,CAAC;YAC3B,MAAM,SAAS,GAAG,gBAAgB,CAAC,KAAK,CAAC,CAAC;YAC1C,IAAI,CAAC,aAAa,CAAC,GAAG,CAAC,SAAS,CAAC,EAAE,CAAC;gBAClC,aAAa,CAAC,IAAI,CAAC,KAAK,CAAC,CAAC;YAC5B,CAAC;QACH,CAAC;QAED,OAAO,EAAE,aAAa,EAAE,CAAC;IAC3B,CAAC;IAED,KAAK,CAAC,cAAc,CAClB,aAA8B,EAC9B,UAAkB,EAClB,QAAiB,KAAK;QAEtB,MAAM,cAAc,GAAG,UAAU,CAAC,OAAO,CAAC,QAAQ,EAAE,YAAY,CAAC,CAAC;QAClE,MAAM,KAAK,CAAC,OAAO,CAAC,cAAc,CAAC,EAAE,EAAE,SAAS,EAAE,IAAI,EAAE,CAAC,CAAC;QAE1D,MAAM,SAAS,GAAG,IAAI,GAAG,EAAyB,CAAC;QACnD,KAAK,MAAM,GAAG,IAAI,aAAa,EAAE,CAAC;YAChC,MAAM,IAAI,GAAG,GAAG,CAAC,WAAW,IAAI,gBAAgB,CAAC,GAAG,CAAC,CAAC;YACtD,SAAS,CAAC,GAAG,CAAC,IAAI,EAAE,GAAG,CAAC,CAAC;QAC3B,CAAC;QAED,IAAI,QAAQ,GAAoB,EAAE,CAAC;QACnC,IAAI,CAAC,KAAK,EAAE,CAAC;YACX,IAAI,CAAC;gBACH,MAAM,OAAO,GAAG,MAAM,QAAQ,CAAC,cAAc,EAAE,OAAO,CAAC,CAAC;gBACxD,QAAQ,GAAG,IAAI,CAAC,KAAK,CAAC,OAAO,CAAC,CAAC;YACjC,CAAC;YAAC,MAAM,CAAC;gBACP,yBAAyB;YAC3B,CAAC;QACH,CAAC;QAED,MAAM,KAAK,GAAG,KAAK;YACjB,CAAC,CAAC,EAAE;YACJ,CAAC,CAAC,QAAQ,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,EAAE;gBACpB,MAAM,IAAI,GAAG,CAAC,CAAC,WAAW,IAAI,gBAAgB,CAAC,CAAC,CAAC,CAAC;gBAClD,OAAO,CAAC,SAAS,CAAC,GAAG,CAAC,IAAI,CAAC,CAAC;YAC9B,CAAC,CAAC,CAAC;QAEP,KAAK,CAAC,IAAI,CAAC,GAAG,aAAa,CAAC,CAAC;QAE7B,MAAM,SAAS,CAAC,cAAc,EAAE,IAAI,CAAC,SAAS,CAAC,KAAK,EAAE,IAAI,EAAE,CAAC,CAAC,CAAC,CAAC;QAChE,OAAO,CAAC,GAAG,CAAC,cAAc,KAAK,CAAC,MAAM,kBAAkB,cAAc,EAAE,CAAC,CAAC;QAC1E,OAAO,CAAC,GAAG,CACT,WAAW,aAAa,CAAC,MAAM,eAAe,KAAK,CAAC,MAAM,GAAG,aAAa,CAAC,MAAM,EAAE,CACpF,CAAC;IACJ,CAAC;IAED,KAAK,CAAC,GAAG,CACP,UAAkB,EAClB,QAAiB,KAAK;QAEtB,OAAO,CAAC,GAAG,CAAC,iDAAiD,CAAC,CAAC;QAE/D,MAAM,EAAE,aAAa,EAAE,GAAG,MAAM,IAAI,CAAC,gBAAgB,CAAC,UAAU,EAAE,KAAK,CAAC,CAAC;QAEzE,IAAI,aAAa,CAAC,MAAM,KAAK,CAAC,EAAE,CAAC;YAC/B,OAAO,CAAC,GAAG,CAAC,+BAA+B,CAAC,CAAC;YAC7C,OAAO,EAAE,CAAC;QACZ,CAAC;QAED,OAAO,CAAC,GAAG,CAAC,sBAAsB,aAAa,CAAC,MAAM,SAAS,CAAC,CAAC;QAEjE,MAAM,aAAa,GAAG,MAAM,IAAI,CAAC,UAAU,CAAC,aAAa,CAAC,CAAC;QAC3D,MAAM,IAAI,CAAC,cAAc,CAAC,aAAa,EAAE,UAAU,EAAE,KAAK,CAAC,CAAC;QAE5D,OAAO,aAAa,CAAC;IACvB,CAAC;CACF"}
|
|
@@ -0,0 +1,16 @@
|
|
|
1
|
+
export declare class RagError extends Error {
|
|
2
|
+
suggestion?: string;
|
|
3
|
+
constructor(message: string, options?: {
|
|
4
|
+
suggestion?: string;
|
|
5
|
+
cause?: unknown;
|
|
6
|
+
});
|
|
7
|
+
}
|
|
8
|
+
export declare class ConfigError extends RagError {
|
|
9
|
+
}
|
|
10
|
+
export declare class ChunkError extends RagError {
|
|
11
|
+
}
|
|
12
|
+
export declare class EmbedError extends RagError {
|
|
13
|
+
}
|
|
14
|
+
export declare class UploadError extends RagError {
|
|
15
|
+
}
|
|
16
|
+
//# sourceMappingURL=errors.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"errors.d.ts","sourceRoot":"","sources":["../../src/core/errors.ts"],"names":[],"mappings":"AAAA,qBAAa,QAAS,SAAQ,KAAK;IACjC,UAAU,CAAC,EAAE,MAAM,CAAC;gBAGlB,OAAO,EAAE,MAAM,EACf,OAAO,CAAC,EAAE;QAAE,UAAU,CAAC,EAAE,MAAM,CAAC;QAAC,KAAK,CAAC,EAAE,OAAO,CAAA;KAAE;CASrD;AAED,qBAAa,WAAY,SAAQ,QAAQ;CAAG;AAC5C,qBAAa,UAAW,SAAQ,QAAQ;CAAG;AAC3C,qBAAa,UAAW,SAAQ,QAAQ;CAAG;AAC3C,qBAAa,WAAY,SAAQ,QAAQ;CAAG"}
|
|
@@ -0,0 +1,17 @@
|
|
|
1
|
+
export class RagError extends Error {
|
|
2
|
+
suggestion;
|
|
3
|
+
constructor(message, options) {
|
|
4
|
+
super(message, options?.cause !== undefined ? { cause: options.cause } : undefined);
|
|
5
|
+
this.name = this.constructor.name;
|
|
6
|
+
this.suggestion = options?.suggestion;
|
|
7
|
+
}
|
|
8
|
+
}
|
|
9
|
+
export class ConfigError extends RagError {
|
|
10
|
+
}
|
|
11
|
+
export class ChunkError extends RagError {
|
|
12
|
+
}
|
|
13
|
+
export class EmbedError extends RagError {
|
|
14
|
+
}
|
|
15
|
+
export class UploadError extends RagError {
|
|
16
|
+
}
|
|
17
|
+
//# sourceMappingURL=errors.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"errors.js","sourceRoot":"","sources":["../../src/core/errors.ts"],"names":[],"mappings":"AAAA,MAAM,OAAO,QAAS,SAAQ,KAAK;IACjC,UAAU,CAAU;IAEpB,YACE,OAAe,EACf,OAAkD;QAElD,KAAK,CACH,OAAO,EACP,OAAO,EAAE,KAAK,KAAK,SAAS,CAAC,CAAC,CAAC,EAAE,KAAK,EAAE,OAAO,CAAC,KAAK,EAAE,CAAC,CAAC,CAAC,SAAS,CACpE,CAAC;QACF,IAAI,CAAC,IAAI,GAAG,IAAI,CAAC,WAAW,CAAC,IAAI,CAAC;QAClC,IAAI,CAAC,UAAU,GAAG,OAAO,EAAE,UAAU,CAAC;IACxC,CAAC;CACF;AAED,MAAM,OAAO,WAAY,SAAQ,QAAQ;CAAG;AAC5C,MAAM,OAAO,UAAW,SAAQ,QAAQ;CAAG;AAC3C,MAAM,OAAO,UAAW,SAAQ,QAAQ;CAAG;AAC3C,MAAM,OAAO,WAAY,SAAQ,QAAQ;CAAG"}
|
|
@@ -1,4 +1,5 @@
|
|
|
1
1
|
import { FileChunker, EmbeddingProvider, VectorStore } from "../interfaces/index.js";
|
|
2
|
+
import { RetryOptions } from "./utils.js";
|
|
2
3
|
export interface RAGPipelineConfig {
|
|
3
4
|
chunkers: FileChunker[];
|
|
4
5
|
embedder: EmbeddingProvider;
|
|
@@ -8,8 +9,15 @@ export interface RAGPipelineConfig {
|
|
|
8
9
|
embeddingsFile?: string;
|
|
9
10
|
force?: boolean;
|
|
10
11
|
skipUpload?: boolean;
|
|
12
|
+
dryRun?: boolean;
|
|
11
13
|
rateLimitMs?: number;
|
|
12
14
|
batchSize?: number;
|
|
15
|
+
retry?: RetryOptions;
|
|
16
|
+
concurrency?: number;
|
|
17
|
+
telemetry?: boolean;
|
|
18
|
+
notifications?: {
|
|
19
|
+
webhookUrl?: string;
|
|
20
|
+
};
|
|
13
21
|
};
|
|
14
22
|
}
|
|
15
23
|
export declare class Orchestrator {
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"orchestrator.d.ts","sourceRoot":"","sources":["../../src/core/orchestrator.ts"],"names":[],"mappings":"
|
|
1
|
+
{"version":3,"file":"orchestrator.d.ts","sourceRoot":"","sources":["../../src/core/orchestrator.ts"],"names":[],"mappings":"AAKA,OAAO,EACL,WAAW,EACX,iBAAiB,EACjB,WAAW,EAEZ,MAAM,wBAAwB,CAAC;AAEhC,OAAO,EAAE,YAAY,EAAE,MAAM,YAAY,CAAC;AAE1C,MAAM,WAAW,iBAAiB;IAChC,QAAQ,EAAE,WAAW,EAAE,CAAC;IACxB,QAAQ,EAAE,iBAAiB,CAAC;IAC5B,WAAW,EAAE,WAAW,CAAC;IACzB,OAAO,CAAC,EAAE;QACR,UAAU,CAAC,EAAE,MAAM,CAAC;QACpB,cAAc,CAAC,EAAE,MAAM,CAAC;QACxB,KAAK,CAAC,EAAE,OAAO,CAAC;QAChB,UAAU,CAAC,EAAE,OAAO,CAAC;QACrB,MAAM,CAAC,EAAE,OAAO,CAAC;QACjB,WAAW,CAAC,EAAE,MAAM,CAAC;QACrB,SAAS,CAAC,EAAE,MAAM,CAAC;QACnB,KAAK,CAAC,EAAE,YAAY,CAAC;QACrB,WAAW,CAAC,EAAE,MAAM,CAAC;QACrB,SAAS,CAAC,EAAE,OAAO,CAAC;QACpB,aAAa,CAAC,EAAE;YAAE,UAAU,CAAC,EAAE,MAAM,CAAA;SAAE,CAAC;KACzC,CAAC;CACH;AA+CD,qBAAa,YAAY;IACvB,OAAO,CAAC,MAAM,CAAoB;IAClC,OAAO,CAAC,UAAU,CAAS;IAC3B,OAAO,CAAC,cAAc,CAAS;gBAEnB,MAAM,EAAE,iBAAiB;IAO/B,GAAG,IAAI,OAAO,CAAC,IAAI,CAAC;CA+J3B"}
|
|
@@ -2,6 +2,7 @@ import { GitTracker } from "./git-tracker.js";
|
|
|
2
2
|
import { ChunkProcessor } from "./chunk-processor.js";
|
|
3
3
|
import { EmbedderProcessor } from "./embedder.js";
|
|
4
4
|
import { Uploader } from "./uploader.js";
|
|
5
|
+
import { TelemetryCollector } from "./telemetry.js";
|
|
5
6
|
import { readFile } from "fs/promises";
|
|
6
7
|
async function loadPreviousState(chunksFile) {
|
|
7
8
|
try {
|
|
@@ -21,6 +22,28 @@ async function loadPreviousState(chunksFile) {
|
|
|
21
22
|
return new Map();
|
|
22
23
|
}
|
|
23
24
|
}
|
|
25
|
+
async function loadExistingChunks(chunksFile) {
|
|
26
|
+
try {
|
|
27
|
+
const content = await readFile(chunksFile, "utf-8");
|
|
28
|
+
const parsed = JSON.parse(content);
|
|
29
|
+
return Array.isArray(parsed) ? parsed : [];
|
|
30
|
+
}
|
|
31
|
+
catch {
|
|
32
|
+
return [];
|
|
33
|
+
}
|
|
34
|
+
}
|
|
35
|
+
async function notifyWebhook(url, status, payload) {
|
|
36
|
+
try {
|
|
37
|
+
await fetch(url, {
|
|
38
|
+
method: "POST",
|
|
39
|
+
headers: { "Content-Type": "application/json" },
|
|
40
|
+
body: JSON.stringify({ status, ...payload }),
|
|
41
|
+
});
|
|
42
|
+
}
|
|
43
|
+
catch {
|
|
44
|
+
// Notification failures are non-fatal
|
|
45
|
+
}
|
|
46
|
+
}
|
|
24
47
|
export class Orchestrator {
|
|
25
48
|
config;
|
|
26
49
|
chunksFile;
|
|
@@ -32,47 +55,119 @@ export class Orchestrator {
|
|
|
32
55
|
config.options?.embeddingsFile || "./docs/rag/embeddings.json";
|
|
33
56
|
}
|
|
34
57
|
async run() {
|
|
35
|
-
|
|
36
|
-
|
|
37
|
-
|
|
38
|
-
|
|
39
|
-
|
|
40
|
-
|
|
41
|
-
:
|
|
42
|
-
|
|
43
|
-
|
|
44
|
-
|
|
45
|
-
|
|
46
|
-
|
|
47
|
-
|
|
48
|
-
|
|
49
|
-
|
|
50
|
-
|
|
51
|
-
|
|
52
|
-
|
|
53
|
-
|
|
54
|
-
|
|
55
|
-
|
|
56
|
-
|
|
57
|
-
|
|
58
|
-
|
|
59
|
-
|
|
60
|
-
|
|
61
|
-
|
|
62
|
-
|
|
58
|
+
const opts = this.config.options ?? {};
|
|
59
|
+
const telemetry = opts.telemetry ? new TelemetryCollector() : null;
|
|
60
|
+
telemetry?.start();
|
|
61
|
+
let uploadStats = { uploaded: 0, deleted: 0 };
|
|
62
|
+
try {
|
|
63
|
+
console.log("🚀 Starting RAG pipeline...\n");
|
|
64
|
+
// Step 1: Scan for changes
|
|
65
|
+
console.log("📂 Step 1: Scanning for changes...");
|
|
66
|
+
const t1 = Date.now();
|
|
67
|
+
const gitTracker = new GitTracker(this.config.chunkers);
|
|
68
|
+
const currentState = await gitTracker.getCurrentState();
|
|
69
|
+
const previousState = opts.force
|
|
70
|
+
? new Map()
|
|
71
|
+
: await loadPreviousState(this.chunksFile);
|
|
72
|
+
const { toProcess, toDelete } = await gitTracker.getChangedFiles(previousState);
|
|
73
|
+
telemetry?.recordGitTracking({
|
|
74
|
+
durationMs: Date.now() - t1,
|
|
75
|
+
filesScanned: currentState.size,
|
|
76
|
+
toProcess: toProcess.length,
|
|
77
|
+
toDelete: toDelete.length,
|
|
78
|
+
});
|
|
79
|
+
if (toProcess.length === 0 && toDelete.length === 0 && !opts.force) {
|
|
80
|
+
console.log("\n✨ No changes detected.");
|
|
81
|
+
return;
|
|
82
|
+
}
|
|
83
|
+
console.log(`\n📊 Changes: ${toProcess.length} to process, ${toDelete.length} to delete\n`);
|
|
84
|
+
// Step 2: Generate chunks (with resume)
|
|
85
|
+
console.log("🔪 Step 2: Generating chunks...");
|
|
86
|
+
const t2 = Date.now();
|
|
87
|
+
const chunkProcessor = new ChunkProcessor(this.config.chunkers);
|
|
88
|
+
const fileState = new Map();
|
|
89
|
+
for (const file of toProcess) {
|
|
90
|
+
const info = currentState.get(file);
|
|
91
|
+
if (info)
|
|
92
|
+
fileState.set(file, info);
|
|
93
|
+
}
|
|
94
|
+
const existingChunks = opts.force
|
|
95
|
+
? []
|
|
96
|
+
: await loadExistingChunks(this.chunksFile);
|
|
97
|
+
const chunks = await chunkProcessor.processFiles(toProcess, fileState, existingChunks);
|
|
98
|
+
await chunkProcessor.saveChunksLocal(chunks, this.chunksFile);
|
|
99
|
+
telemetry?.recordChunking({
|
|
100
|
+
durationMs: Date.now() - t2,
|
|
101
|
+
filesProcessed: toProcess.length,
|
|
102
|
+
chunksGenerated: chunks.length,
|
|
103
|
+
errors: 0,
|
|
104
|
+
});
|
|
105
|
+
if (chunks.length === 0) {
|
|
106
|
+
console.log("\n⚠️ No chunks generated. Exiting.");
|
|
107
|
+
return;
|
|
108
|
+
}
|
|
109
|
+
// Step 3: Generate embeddings
|
|
110
|
+
console.log("\n🔢 Step 3: Generating embeddings...");
|
|
111
|
+
const t3 = Date.now();
|
|
112
|
+
const embedder = new EmbedderProcessor(this.config.embedder, {
|
|
113
|
+
rateLimitMs: opts.rateLimitMs,
|
|
114
|
+
batchSize: opts.batchSize,
|
|
115
|
+
retry: opts.retry,
|
|
116
|
+
concurrency: opts.concurrency,
|
|
117
|
+
});
|
|
118
|
+
const newEmbeddings = await embedder.run(this.chunksFile, opts.force || false);
|
|
119
|
+
telemetry?.recordEmbedding({
|
|
120
|
+
durationMs: Date.now() - t3,
|
|
121
|
+
chunksEmbedded: newEmbeddings.length,
|
|
122
|
+
chunksSkipped: chunks.length - newEmbeddings.length,
|
|
123
|
+
});
|
|
124
|
+
// Step 4: Upload
|
|
125
|
+
if (opts.dryRun) {
|
|
126
|
+
const uploader = new Uploader(this.config.vectorStore);
|
|
127
|
+
const { toUpload: dryUpload, toDelete: dryDelete } = await uploader.getItemsToUpload(this.embeddingsFile, opts.force || false);
|
|
128
|
+
console.log("\n📤 Step 4: Upload (dry-run — no changes written)");
|
|
129
|
+
console.log(` Would upload: ${dryUpload.length} document(s)`);
|
|
130
|
+
console.log(` Would delete: ${dryDelete.length} source file(s)`);
|
|
131
|
+
}
|
|
132
|
+
else if (!opts.skipUpload) {
|
|
133
|
+
console.log("\n📤 Step 4: Uploading to vector store...");
|
|
134
|
+
const t4 = Date.now();
|
|
135
|
+
const uploader = new Uploader(this.config.vectorStore, {
|
|
136
|
+
retry: opts.retry,
|
|
137
|
+
});
|
|
138
|
+
uploadStats = await uploader.sync(this.embeddingsFile, opts.force || false);
|
|
139
|
+
telemetry?.recordUpload({
|
|
140
|
+
durationMs: Date.now() - t4,
|
|
141
|
+
uploaded: uploadStats.uploaded,
|
|
142
|
+
deleted: uploadStats.deleted,
|
|
143
|
+
});
|
|
144
|
+
}
|
|
145
|
+
console.log("\n✨ RAG pipeline complete!");
|
|
146
|
+
if (telemetry) {
|
|
147
|
+
telemetry.finish();
|
|
148
|
+
telemetry.printSummary();
|
|
149
|
+
const telemetryFile = this.chunksFile.replace("chunks.json", "telemetry.json");
|
|
150
|
+
await telemetry.save(telemetryFile);
|
|
151
|
+
}
|
|
152
|
+
if (opts.notifications?.webhookUrl) {
|
|
153
|
+
await notifyWebhook(opts.notifications.webhookUrl, "success", {
|
|
154
|
+
durationMs: telemetry?.getData().durationMs,
|
|
155
|
+
stages: telemetry?.getData().stages,
|
|
156
|
+
uploaded: uploadStats.uploaded,
|
|
157
|
+
deleted: uploadStats.deleted,
|
|
158
|
+
});
|
|
159
|
+
}
|
|
63
160
|
}
|
|
64
|
-
|
|
65
|
-
|
|
66
|
-
|
|
67
|
-
|
|
68
|
-
|
|
69
|
-
|
|
70
|
-
|
|
71
|
-
|
|
72
|
-
|
|
73
|
-
await uploader.sync(this.embeddingsFile, this.config.options?.force || false);
|
|
161
|
+
catch (err) {
|
|
162
|
+
telemetry?.finish();
|
|
163
|
+
if (opts.notifications?.webhookUrl) {
|
|
164
|
+
await notifyWebhook(opts.notifications.webhookUrl, "error", {
|
|
165
|
+
error: err instanceof Error ? err.message : String(err),
|
|
166
|
+
durationMs: telemetry?.getData().durationMs,
|
|
167
|
+
});
|
|
168
|
+
}
|
|
169
|
+
throw err;
|
|
74
170
|
}
|
|
75
|
-
console.log("\n✨ RAG pipeline complete!");
|
|
76
171
|
}
|
|
77
172
|
}
|
|
78
173
|
//# sourceMappingURL=orchestrator.js.map
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"orchestrator.js","sourceRoot":"","sources":["../../src/core/orchestrator.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,UAAU,EAAE,MAAM,kBAAkB,CAAC;AAC9C,OAAO,EAAE,cAAc,EAAE,MAAM,sBAAsB,CAAC;AACtD,OAAO,EAAE,iBAAiB,EAAE,MAAM,eAAe,CAAC;AAClD,OAAO,EAAE,QAAQ,EAAE,MAAM,eAAe,CAAC;
|
|
1
|
+
{"version":3,"file":"orchestrator.js","sourceRoot":"","sources":["../../src/core/orchestrator.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,UAAU,EAAE,MAAM,kBAAkB,CAAC;AAC9C,OAAO,EAAE,cAAc,EAAE,MAAM,sBAAsB,CAAC;AACtD,OAAO,EAAE,iBAAiB,EAAE,MAAM,eAAe,CAAC;AAClD,OAAO,EAAE,QAAQ,EAAE,MAAM,eAAe,CAAC;AACzC,OAAO,EAAE,kBAAkB,EAAE,MAAM,gBAAgB,CAAC;AAOpD,OAAO,EAAE,QAAQ,EAAE,MAAM,aAAa,CAAC;AAsBvC,KAAK,UAAU,iBAAiB,CAC9B,UAAkB;IAElB,IAAI,CAAC;QACH,MAAM,OAAO,GAAG,MAAM,QAAQ,CAAC,UAAU,EAAE,OAAO,CAAC,CAAC;QACpD,MAAM,MAAM,GAAG,IAAI,CAAC,KAAK,CAAC,OAAO,CAAC,CAAC;QACnC,IAAI,CAAC,KAAK,CAAC,OAAO,CAAC,MAAM,CAAC;YAAE,OAAO,IAAI,GAAG,EAAE,CAAC;QAC7C,MAAM,KAAK,GAAG,IAAI,GAAG,EAAkB,CAAC;QACxC,KAAK,MAAM,KAAK,IAAI,MAAiB,EAAE,CAAC;YACtC,IAAI,KAAK,CAAC,UAAU,IAAI,KAAK,CAAC,UAAU,EAAE,CAAC;gBACzC,KAAK,CAAC,GAAG,CAAC,KAAK,CAAC,UAAU,EAAE,KAAK,CAAC,UAAU,CAAC,CAAC;YAChD,CAAC;QACH,CAAC;QACD,OAAO,KAAK,CAAC;IACf,CAAC;IAAC,MAAM,CAAC;QACP,OAAO,IAAI,GAAG,EAAE,CAAC;IACnB,CAAC;AACH,CAAC;AAED,KAAK,UAAU,kBAAkB,CAAC,UAAkB;IAClD,IAAI,CAAC;QACH,MAAM,OAAO,GAAG,MAAM,QAAQ,CAAC,UAAU,EAAE,OAAO,CAAC,CAAC;QACpD,MAAM,MAAM,GAAY,IAAI,CAAC,KAAK,CAAC,OAAO,CAAC,CAAC;QAC5C,OAAO,KAAK,CAAC,OAAO,CAAC,MAAM,CAAC,CAAC,CAAC,CAAE,MAAkB,CAAC,CAAC,CAAC,EAAE,CAAC;IAC1D,CAAC;IAAC,MAAM,CAAC;QACP,OAAO,EAAE,CAAC;IACZ,CAAC;AACH,CAAC;AAED,KAAK,UAAU,aAAa,CAC1B,GAAW,EACX,MAA2B,EAC3B,OAAgC;IAEhC,IAAI,CAAC;QACH,MAAM,KAAK,CAAC,GAAG,EAAE;YACf,MAAM,EAAE,MAAM;YACd,OAAO,EAAE,EAAE,cAAc,EAAE,kBAAkB,EAAE;YAC/C,IAAI,EAAE,IAAI,CAAC,SAAS,CAAC,EAAE,MAAM,EAAE,GAAG,OAAO,EAAE,CAAC;SAC7C,CAAC,CAAC;IACL,CAAC;IAAC,MAAM,CAAC;QACP,sCAAsC;IACxC,CAAC;AACH,CAAC;AAED,MAAM,OAAO,YAAY;IACf,MAAM,CAAoB;IAC1B,UAAU,CAAS;IACnB,cAAc,CAAS;IAE/B,YAAY,MAAyB;QACnC,IAAI,CAAC,MAAM,GAAG,MAAM,CAAC;QACrB,IAAI,CAAC,UAAU,GAAG,MAAM,CAAC,OAAO,EAAE,UAAU,IAAI,wBAAwB,CAAC;QACzE,IAAI,CAAC,cAAc;YACjB,MAAM,CAAC,OAAO,EAAE,cAAc,IAAI,4BAA4B,CAAC;IACnE,CAAC;IAED,KAAK,CAAC,GAAG;QACP,MAAM,IAAI,GAAG,IAAI,CAAC,MAAM,CAAC,OAAO,IAAI,EAAE,CAAC;QACvC,MAAM,SAAS,GAAG,IAAI,CAAC,SAAS,CAAC,CAAC,CAAC,IAAI,kBAAkB,EAAE,CAAC,CAA
C,CAAC,IAAI,CAAC;QACnE,SAAS,EAAE,KAAK,EAAE,CAAC;QAEnB,IAAI,WAAW,GAAG,EAAE,QAAQ,EAAE,CAAC,EAAE,OAAO,EAAE,CAAC,EAAE,CAAC;QAE9C,IAAI,CAAC;YACH,OAAO,CAAC,GAAG,CAAC,+BAA+B,CAAC,CAAC;YAE7C,2BAA2B;YAC3B,OAAO,CAAC,GAAG,CAAC,oCAAoC,CAAC,CAAC;YAClD,MAAM,EAAE,GAAG,IAAI,CAAC,GAAG,EAAE,CAAC;YACtB,MAAM,UAAU,GAAG,IAAI,UAAU,CAAC,IAAI,CAAC,MAAM,CAAC,QAAQ,CAAC,CAAC;YACxD,MAAM,YAAY,GAAG,MAAM,UAAU,CAAC,eAAe,EAAE,CAAC;YAExD,MAAM,aAAa,GAAG,IAAI,CAAC,KAAK;gBAC9B,CAAC,CAAC,IAAI,GAAG,EAAkB;gBAC3B,CAAC,CAAC,MAAM,iBAAiB,CAAC,IAAI,CAAC,UAAU,CAAC,CAAC;YAE7C,MAAM,EAAE,SAAS,EAAE,QAAQ,EAAE,GAC3B,MAAM,UAAU,CAAC,eAAe,CAAC,aAAa,CAAC,CAAC;YAElD,SAAS,EAAE,iBAAiB,CAAC;gBAC3B,UAAU,EAAE,IAAI,CAAC,GAAG,EAAE,GAAG,EAAE;gBAC3B,YAAY,EAAE,YAAY,CAAC,IAAI;gBAC/B,SAAS,EAAE,SAAS,CAAC,MAAM;gBAC3B,QAAQ,EAAE,QAAQ,CAAC,MAAM;aAC1B,CAAC,CAAC;YAEH,IAAI,SAAS,CAAC,MAAM,KAAK,CAAC,IAAI,QAAQ,CAAC,MAAM,KAAK,CAAC,IAAI,CAAC,IAAI,CAAC,KAAK,EAAE,CAAC;gBACnE,OAAO,CAAC,GAAG,CAAC,0BAA0B,CAAC,CAAC;gBACxC,OAAO;YACT,CAAC;YAED,OAAO,CAAC,GAAG,CACT,iBAAiB,SAAS,CAAC,MAAM,gBAAgB,QAAQ,CAAC,MAAM,cAAc,CAC/E,CAAC;YAEF,wCAAwC;YACxC,OAAO,CAAC,GAAG,CAAC,iCAAiC,CAAC,CAAC;YAC/C,MAAM,EAAE,GAAG,IAAI,CAAC,GAAG,EAAE,CAAC;YACtB,MAAM,cAAc,GAAG,IAAI,cAAc,CAAC,IAAI,CAAC,MAAM,CAAC,QAAQ,CAAC,CAAC;YAEhE,MAAM,SAAS,GAAG,IAAI,GAAG,EAGtB,CAAC;YACJ,KAAK,MAAM,IAAI,IAAI,SAAS,EAAE,CAAC;gBAC7B,MAAM,IAAI,GAAG,YAAY,CAAC,GAAG,CAAC,IAAI,CAAC,CAAC;gBACpC,IAAI,IAAI;oBAAE,SAAS,CAAC,GAAG,CAAC,IAAI,EAAE,IAAI,CAAC,CAAC;YACtC,CAAC;YAED,MAAM,cAAc,GAAG,IAAI,CAAC,KAAK;gBAC/B,CAAC,CAAC,EAAE;gBACJ,CAAC,CAAC,MAAM,kBAAkB,CAAC,IAAI,CAAC,UAAU,CAAC,CAAC;YAE9C,MAAM,MAAM,GAAG,MAAM,cAAc,CAAC,YAAY,CAC9C,SAAS,EACT,SAAS,EACT,cAAc,CACf,CAAC;YACF,MAAM,cAAc,CAAC,eAAe,CAAC,MAAM,EAAE,IAAI,CAAC,UAAU,CAAC,CAAC;YAE9D,SAAS,EAAE,cAAc,CAAC;gBACxB,UAAU,EAAE,IAAI,CAAC,GAAG,EAAE,GAAG,EAAE;gBAC3B,cAAc,EAAE,SAAS,CAAC,MAAM;gBAChC,eAAe,EAAE,MAAM,CAAC,MAAM;gBAC9B,MAAM,EAAE,CAAC;aACV,CAAC,CAAC;YAEH,IAAI,MAAM,CAAC,MAAM,KAAK,CAAC,EAAE,CAAC;gBACxB,OAAO,CAAC,GAAG,CAAC,oCAAoC,CAAC,CAAC;gBAClD,OAAO;YACT,CAAC;YAED,8BAA8B;YA
C9B,OAAO,CAAC,GAAG,CAAC,uCAAuC,CAAC,CAAC;YACrD,MAAM,EAAE,GAAG,IAAI,CAAC,GAAG,EAAE,CAAC;YACtB,MAAM,QAAQ,GAAG,IAAI,iBAAiB,CAAC,IAAI,CAAC,MAAM,CAAC,QAAQ,EAAE;gBAC3D,WAAW,EAAE,IAAI,CAAC,WAAW;gBAC7B,SAAS,EAAE,IAAI,CAAC,SAAS;gBACzB,KAAK,EAAE,IAAI,CAAC,KAAK;gBACjB,WAAW,EAAE,IAAI,CAAC,WAAW;aAC9B,CAAC,CAAC;YAEH,MAAM,aAAa,GAAG,MAAM,QAAQ,CAAC,GAAG,CACtC,IAAI,CAAC,UAAU,EACf,IAAI,CAAC,KAAK,IAAI,KAAK,CACpB,CAAC;YAEF,SAAS,EAAE,eAAe,CAAC;gBACzB,UAAU,EAAE,IAAI,CAAC,GAAG,EAAE,GAAG,EAAE;gBAC3B,cAAc,EAAE,aAAa,CAAC,MAAM;gBACpC,aAAa,EAAE,MAAM,CAAC,MAAM,GAAG,aAAa,CAAC,MAAM;aACpD,CAAC,CAAC;YAEH,iBAAiB;YACjB,IAAI,IAAI,CAAC,MAAM,EAAE,CAAC;gBAChB,MAAM,QAAQ,GAAG,IAAI,QAAQ,CAAC,IAAI,CAAC,MAAM,CAAC,WAAW,CAAC,CAAC;gBACvD,MAAM,EAAE,QAAQ,EAAE,SAAS,EAAE,QAAQ,EAAE,SAAS,EAAE,GAChD,MAAM,QAAQ,CAAC,gBAAgB,CAC7B,IAAI,CAAC,cAAc,EACnB,IAAI,CAAC,KAAK,IAAI,KAAK,CACpB,CAAC;gBACJ,OAAO,CAAC,GAAG,CAAC,oDAAoD,CAAC,CAAC;gBAClE,OAAO,CAAC,GAAG,CAAC,oBAAoB,SAAS,CAAC,MAAM,cAAc,CAAC,CAAC;gBAChE,OAAO,CAAC,GAAG,CAAC,oBAAoB,SAAS,CAAC,MAAM,iBAAiB,CAAC,CAAC;YACrE,CAAC;iBAAM,IAAI,CAAC,IAAI,CAAC,UAAU,EAAE,CAAC;gBAC5B,OAAO,CAAC,GAAG,CAAC,2CAA2C,CAAC,CAAC;gBACzD,MAAM,EAAE,GAAG,IAAI,CAAC,GAAG,EAAE,CAAC;gBACtB,MAAM,QAAQ,GAAG,IAAI,QAAQ,CAAC,IAAI,CAAC,MAAM,CAAC,WAAW,EAAE;oBACrD,KAAK,EAAE,IAAI,CAAC,KAAK;iBAClB,CAAC,CAAC;gBACH,WAAW,GAAG,MAAM,QAAQ,CAAC,IAAI,CAC/B,IAAI,CAAC,cAAc,EACnB,IAAI,CAAC,KAAK,IAAI,KAAK,CACpB,CAAC;gBAEF,SAAS,EAAE,YAAY,CAAC;oBACtB,UAAU,EAAE,IAAI,CAAC,GAAG,EAAE,GAAG,EAAE;oBAC3B,QAAQ,EAAE,WAAW,CAAC,QAAQ;oBAC9B,OAAO,EAAE,WAAW,CAAC,OAAO;iBAC7B,CAAC,CAAC;YACL,CAAC;YAED,OAAO,CAAC,GAAG,CAAC,4BAA4B,CAAC,CAAC;YAE1C,IAAI,SAAS,EAAE,CAAC;gBACd,SAAS,CAAC,MAAM,EAAE,CAAC;gBACnB,SAAS,CAAC,YAAY,EAAE,CAAC;gBACzB,MAAM,aAAa,GAAG,IAAI,CAAC,UAAU,CAAC,OAAO,CAC3C,aAAa,EACb,gBAAgB,CACjB,CAAC;gBACF,MAAM,SAAS,CAAC,IAAI,CAAC,aAAa,CAAC,CAAC;YACtC,CAAC;YAED,IAAI,IAAI,CAAC,aAAa,EAAE,UAAU,EAAE,CAAC;gBACnC,MAAM,aAAa,CAAC,IAAI,CAAC,aAAa,CAAC,UAAU,EAAE,SAAS,EAAE;oBAC5D,UAAU,EAAE,SAAS,EAAE,OAAO,EAAE,CAAC,UAAU;oBAC3C,MAAM,EAAE,SAAS,EAAE,OAAO,EAAE,CAAC
,MAAM;oBACnC,QAAQ,EAAE,WAAW,CAAC,QAAQ;oBAC9B,OAAO,EAAE,WAAW,CAAC,OAAO;iBAC7B,CAAC,CAAC;YACL,CAAC;QACH,CAAC;QAAC,OAAO,GAAG,EAAE,CAAC;YACb,SAAS,EAAE,MAAM,EAAE,CAAC;YAEpB,IAAI,IAAI,CAAC,aAAa,EAAE,UAAU,EAAE,CAAC;gBACnC,MAAM,aAAa,CAAC,IAAI,CAAC,aAAa,CAAC,UAAU,EAAE,OAAO,EAAE;oBAC1D,KAAK,EAAE,GAAG,YAAY,KAAK,CAAC,CAAC,CAAC,GAAG,CAAC,OAAO,CAAC,CAAC,CAAC,MAAM,CAAC,GAAG,CAAC;oBACvD,UAAU,EAAE,SAAS,EAAE,OAAO,EAAE,CAAC,UAAU;iBAC5C,CAAC,CAAC;YACL,CAAC;YAED,MAAM,GAAG,CAAC;QACZ,CAAC;IACH,CAAC;CACF"}
|
|
@@ -0,0 +1,19 @@
|
|
|
1
|
+
/**
 * Descriptor that a plugin package exports so it can be picked up by
 * `discoverPlugins`.
 */
export interface RagPlugin {
    /** Identifier of the plugin. */
    name: string;

    /** Extension point the plugin targets. */
    type: "embedder" | "store" | "chunker";

    /**
     * Zero-argument function producing the plugin's implementation.
     * The result is typed `unknown`, so callers must narrow it themselves.
     */
    factory: () => unknown;
}
|
|
6
|
+
/**
 * Discover RAG plugins from installed npm packages.
 *
 * Each listed package is expected to export one of:
 *   - `ragPlugin: RagPlugin`     (a single plugin)
 *   - `ragPlugins: RagPlugin[]`  (several plugins)
 *
 * Suggested (but not enforced) package naming:
 *   - rag-embedder-*  EmbeddingProvider implementations
 *   - rag-store-*     VectorStore implementations
 *   - rag-chunker-*   FileChunker / ChunkStrategy implementations
 *
 * @param packageNames - names of the packages to inspect.
 * @returns a promise resolving to the plugins that were found.
 */
export declare function discoverPlugins(
    packageNames: string[],
): Promise<RagPlugin[]>;
|
|
19
|
+
//# sourceMappingURL=plugin-discovery.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"plugin-discovery.d.ts","sourceRoot":"","sources":["../../src/core/plugin-discovery.ts"],"names":[],"mappings":"AAAA,MAAM,WAAW,SAAS;IACxB,IAAI,EAAE,MAAM,CAAC;IACb,IAAI,EAAE,UAAU,GAAG,OAAO,GAAG,SAAS,CAAC;IACvC,OAAO,EAAE,MAAM,OAAO,CAAC;CACxB;AAED;;;;;;;;;;;GAWG;AACH,wBAAsB,eAAe,CACnC,YAAY,EAAE,MAAM,EAAE,GACrB,OAAO,CAAC,SAAS,EAAE,CAAC,CA0BtB"}
|
|
@@ -0,0 +1,47 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Discover RAG plugins from installed npm packages.
|
|
3
|
+
*
|
|
4
|
+
* A plugin package must export either:
|
|
5
|
+
* `ragPlugin: RagPlugin` — single plugin
|
|
6
|
+
* `ragPlugins: RagPlugin[]` — multiple plugins
|
|
7
|
+
*
|
|
8
|
+
* Naming convention (not enforced):
|
|
9
|
+
* rag-embedder-* EmbeddingProvider implementations
|
|
10
|
+
* rag-store-* VectorStore implementations
|
|
11
|
+
* rag-chunker-* FileChunker / ChunkStrategy implementations
|
|
12
|
+
*/
|
|
13
|
+
export async function discoverPlugins(packageNames) {
|
|
14
|
+
const discovered = [];
|
|
15
|
+
for (const pkg of packageNames) {
|
|
16
|
+
let mod;
|
|
17
|
+
try {
|
|
18
|
+
mod = (await import(pkg));
|
|
19
|
+
}
|
|
20
|
+
catch {
|
|
21
|
+
console.warn(` ⚠️ Could not load plugin package: ${pkg}`);
|
|
22
|
+
continue;
|
|
23
|
+
}
|
|
24
|
+
if (isRagPlugin(mod.ragPlugin)) {
|
|
25
|
+
discovered.push(mod.ragPlugin);
|
|
26
|
+
}
|
|
27
|
+
else if (Array.isArray(mod.ragPlugins)) {
|
|
28
|
+
for (const p of mod.ragPlugins) {
|
|
29
|
+
if (isRagPlugin(p))
|
|
30
|
+
discovered.push(p);
|
|
31
|
+
}
|
|
32
|
+
}
|
|
33
|
+
else {
|
|
34
|
+
console.warn(` ⚠️ Package "${pkg}" has no ragPlugin or ragPlugins export — skipping`);
|
|
35
|
+
}
|
|
36
|
+
}
|
|
37
|
+
return discovered;
|
|
38
|
+
}
|
|
39
|
+
function isRagPlugin(value) {
|
|
40
|
+
if (!value || typeof value !== "object")
|
|
41
|
+
return false;
|
|
42
|
+
const p = value;
|
|
43
|
+
return (typeof p.name === "string" &&
|
|
44
|
+
(p.type === "embedder" || p.type === "store" || p.type === "chunker") &&
|
|
45
|
+
typeof p.factory === "function");
|
|
46
|
+
}
|
|
47
|
+
//# sourceMappingURL=plugin-discovery.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"plugin-discovery.js","sourceRoot":"","sources":["../../src/core/plugin-discovery.ts"],"names":[],"mappings":"AAMA;;;;;;;;;;;GAWG;AACH,MAAM,CAAC,KAAK,UAAU,eAAe,CACnC,YAAsB;IAEtB,MAAM,UAAU,GAAgB,EAAE,CAAC;IAEnC,KAAK,MAAM,GAAG,IAAI,YAAY,EAAE,CAAC;QAC/B,IAAI,GAA4B,CAAC;QACjC,IAAI,CAAC;YACH,GAAG,GAAG,CAAC,MAAM,MAAM,CAAC,GAAG,CAAC,CAA4B,CAAC;QACvD,CAAC;QAAC,MAAM,CAAC;YACP,OAAO,CAAC,IAAI,CAAC,uCAAuC,GAAG,EAAE,CAAC,CAAC;YAC3D,SAAS;QACX,CAAC;QAED,IAAI,WAAW,CAAC,GAAG,CAAC,SAAS,CAAC,EAAE,CAAC;YAC/B,UAAU,CAAC,IAAI,CAAC,GAAG,CAAC,SAAS,CAAC,CAAC;QACjC,CAAC;aAAM,IAAI,KAAK,CAAC,OAAO,CAAC,GAAG,CAAC,UAAU,CAAC,EAAE,CAAC;YACzC,KAAK,MAAM,CAAC,IAAI,GAAG,CAAC,UAAU,EAAE,CAAC;gBAC/B,IAAI,WAAW,CAAC,CAAC,CAAC;oBAAE,UAAU,CAAC,IAAI,CAAC,CAAC,CAAC,CAAC;YACzC,CAAC;QACH,CAAC;aAAM,CAAC;YACN,OAAO,CAAC,IAAI,CACV,iBAAiB,GAAG,oDAAoD,CACzE,CAAC;QACJ,CAAC;IACH,CAAC;IAED,OAAO,UAAU,CAAC;AACpB,CAAC;AAED,SAAS,WAAW,CAAC,KAAc;IACjC,IAAI,CAAC,KAAK,IAAI,OAAO,KAAK,KAAK,QAAQ;QAAE,OAAO,KAAK,CAAC;IACtD,MAAM,CAAC,GAAG,KAAgC,CAAC;IAC3C,OAAO,CACL,OAAO,CAAC,CAAC,IAAI,KAAK,QAAQ;QAC1B,CAAC,CAAC,CAAC,IAAI,KAAK,UAAU,IAAI,CAAC,CAAC,IAAI,KAAK,OAAO,IAAI,CAAC,CAAC,IAAI,KAAK,SAAS,CAAC;QACrE,OAAO,CAAC,CAAC,OAAO,KAAK,UAAU,CAChC,CAAC;AACJ,CAAC"}
|
|
@@ -0,0 +1,61 @@
|
|
|
1
|
+
/**
 * Base shape shared by every per-stage statistics record.
 */
interface StageStats {
    /** Duration of the stage (the field name indicates milliseconds). */
    durationMs: number;

    /** Any further stage-specific values; callers must narrow before use. */
    [key: string]: unknown;
}
|
|
5
|
+
/**
 * Snapshot returned by `TelemetryCollector.getData()`: run-level fields plus
 * one optional record per pipeline stage.
 */
interface TelemetryData {
    /** When the run happened. NOTE(review): string format is not visible here — confirm (presumably ISO-8601). */
    runAt: string;

    /** Duration of the whole run (the field name indicates milliseconds). */
    durationMs: number;

    /** Per-stage records; a stage key is absent when nothing was recorded for it. */
    stages: {
        gitTracking?: StageStats & {
            filesScanned: number;
            toProcess: number;
            toDelete: number;
        };
        chunking?: StageStats & {
            filesProcessed: number;
            chunksGenerated: number;
            errors: number;
        };
        embedding?: StageStats & {
            chunksEmbedded: number;
            chunksSkipped: number;
        };
        upload?: StageStats & {
            uploaded: number;
            deleted: number;
        };
    };
}
|
|
29
|
+
/**
 * Accumulates statistics for a run and exposes them as `TelemetryData`.
 *
 * NOTE(review): only the declared surface is visible in this file; the
 * per-method notes below describe the signatures, and anything about
 * behaviour should be confirmed against the implementation in telemetry.js.
 */
export declare class TelemetryCollector {
    private startedAt;
    private data;

    /** Presumably marks the beginning of a run — confirm in the implementation. */
    start(): void;

    /** Accepts the statistics of the git-tracking stage. */
    recordGitTracking(stats: {
        filesScanned: number;
        toProcess: number;
        toDelete: number;
        durationMs: number;
    }): void;

    /** Accepts the statistics of the chunking stage. */
    recordChunking(stats: {
        filesProcessed: number;
        chunksGenerated: number;
        errors: number;
        durationMs: number;
    }): void;

    /** Accepts the statistics of the embedding stage. */
    recordEmbedding(stats: {
        chunksEmbedded: number;
        chunksSkipped: number;
        durationMs: number;
    }): void;

    /** Accepts the statistics of the upload stage. */
    recordUpload(stats: {
        uploaded: number;
        deleted: number;
        durationMs: number;
    }): void;

    /** Presumably marks the end of a run — confirm in the implementation. */
    finish(): void;

    /** Returns the collected telemetry. */
    getData(): TelemetryData;

    /** Presumably prints a human-readable summary — output target not visible here. */
    printSummary(): void;

    /**
     * Asynchronous; takes a destination path.
     * NOTE(review): presumably writes the collected data to `outputPath` — confirm format and error behaviour.
     */
    save(outputPath: string): Promise<void>;
}
|
|
60
|
+
export {};
|
|
61
|
+
//# sourceMappingURL=telemetry.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"telemetry.d.ts","sourceRoot":"","sources":["../../src/core/telemetry.ts"],"names":[],"mappings":"AAGA,UAAU,UAAU;IAClB,UAAU,EAAE,MAAM,CAAC;IACnB,CAAC,GAAG,EAAE,MAAM,GAAG,OAAO,CAAC;CACxB;AAED,UAAU,aAAa;IACrB,KAAK,EAAE,MAAM,CAAC;IACd,UAAU,EAAE,MAAM,CAAC;IACnB,MAAM,EAAE;QACN,WAAW,CAAC,EAAE,UAAU,GAAG;YACzB,YAAY,EAAE,MAAM,CAAC;YACrB,SAAS,EAAE,MAAM,CAAC;YAClB,QAAQ,EAAE,MAAM,CAAC;SAClB,CAAC;QACF,QAAQ,CAAC,EAAE,UAAU,GAAG;YACtB,cAAc,EAAE,MAAM,CAAC;YACvB,eAAe,EAAE,MAAM,CAAC;YACxB,MAAM,EAAE,MAAM,CAAC;SAChB,CAAC;QACF,SAAS,CAAC,EAAE,UAAU,GAAG;YACvB,cAAc,EAAE,MAAM,CAAC;YACvB,aAAa,EAAE,MAAM,CAAC;SACvB,CAAC;QACF,MAAM,CAAC,EAAE,UAAU,GAAG;YACpB,QAAQ,EAAE,MAAM,CAAC;YACjB,OAAO,EAAE,MAAM,CAAC;SACjB,CAAC;KACH,CAAC;CACH;AAED,qBAAa,kBAAkB;IAC7B,OAAO,CAAC,SAAS,CAAK;IACtB,OAAO,CAAC,IAAI,CAIV;IAEF,KAAK,IAAI,IAAI;IAKb,iBAAiB,CAAC,KAAK,EAAE;QACvB,YAAY,EAAE,MAAM,CAAC;QACrB,SAAS,EAAE,MAAM,CAAC;QAClB,QAAQ,EAAE,MAAM,CAAC;QACjB,UAAU,EAAE,MAAM,CAAC;KACpB,GAAG,IAAI;IAIR,cAAc,CAAC,KAAK,EAAE;QACpB,cAAc,EAAE,MAAM,CAAC;QACvB,eAAe,EAAE,MAAM,CAAC;QACxB,MAAM,EAAE,MAAM,CAAC;QACf,UAAU,EAAE,MAAM,CAAC;KACpB,GAAG,IAAI;IAIR,eAAe,CAAC,KAAK,EAAE;QACrB,cAAc,EAAE,MAAM,CAAC;QACvB,aAAa,EAAE,MAAM,CAAC;QACtB,UAAU,EAAE,MAAM,CAAC;KACpB,GAAG,IAAI;IAIR,YAAY,CAAC,KAAK,EAAE;QAClB,QAAQ,EAAE,MAAM,CAAC;QACjB,OAAO,EAAE,MAAM,CAAC;QAChB,UAAU,EAAE,MAAM,CAAC;KACpB,GAAG,IAAI;IAIR,MAAM,IAAI,IAAI;IAId,OAAO,IAAI,aAAa;IAIxB,YAAY,IAAI,IAAI;IAYd,IAAI,CAAC,UAAU,EAAE,MAAM,GAAG,OAAO,CAAC,IAAI,CAAC;CAK9C"}
|